// Serialization.h
#pragma once

#include <utility>

#include "common.h"
#include "Tensor.h"

class BufferMMap : public Buffer {
public:
    BufferMMap(void *ptr, size_t size, std::shared_ptr<void> parent) : parent(parent) {
Muyang Li's avatar
Muyang Li committed
9
        this->size        = size;
Zhekai Zhang's avatar
Zhekai Zhang committed
10
        this->device.type = Device::CPU;
Muyang Li's avatar
Muyang Li committed
11
        this->ptr         = ptr;
fengzch-das's avatar
fengzch-das committed
12
13
        // auto ret = cudaHostRegister(ptr, size, cudaHostRegisterPortable | cudaHostRegisterReadOnly);
        // if (ret == cudaSuccess) {
Zhekai Zhang's avatar
Zhekai Zhang committed
14
15
        //     this->registered = true;
        // } else {
fengzch-das's avatar
fengzch-das committed
16
17
        //     log(std::format("cudaHostRegister failed at {:p} (size={}): {}", ptr, size,
        //     cudaGetErrorString(cudaGetLastError()))); this->registered = false;
Zhekai Zhang's avatar
Zhekai Zhang committed
18
19
20
21
        // }
    }
    virtual ~BufferMMap() {
        // if (registered) {
fengzch-das's avatar
fengzch-das committed
22
        //     checkCUDA(cudaHostUnregister(ptr));
Zhekai Zhang's avatar
Zhekai Zhang committed
23
24
        // }
    }
Muyang Li's avatar
Muyang Li committed
25

Zhekai Zhang's avatar
Zhekai Zhang committed
26
27
28
29
30
31
32
public:
    std::shared_ptr<void> parent;
    // bool registered;
};

class SafeTensors : public TensorsProvider, public std::enable_shared_from_this<SafeTensors> {
public:
33
    SafeTensors(const std::string &filename);
Zhekai Zhang's avatar
Zhekai Zhang committed
34
35
    ~SafeTensors();

Muyang Li's avatar
Muyang Li committed
36
    virtual bool contains(const std::string &key) const override {
Zhekai Zhang's avatar
Zhekai Zhang committed
37
38
39
40
41
42
43
44
        return tensors.contains(key);
    }
    virtual Tensor getTensor(const std::string &key) override;

private:
    void parseHeader();

private:
45
46
47
    class MMapImpl;
    class MMapImplMio;
    class MMapImplPrivate;
muyangli's avatar
muyangli committed
48
    class MMapImplRead;
49

Zhekai Zhang's avatar
Zhekai Zhang committed
50
51
52
53
54
55
56
57
    struct TensorInfo {
        TensorShape shape;
        Tensor::ScalarType type;
        size_t offset;
        size_t length;
        std::weak_ptr<BufferMMap> buffer;
    };
    std::map<std::string, TensorInfo> tensors;
58
    std::unique_ptr<MMapImpl> mapped;
muyangli's avatar
muyangli committed
59
60

    bool hostRegistered, memoryPinned;
Muyang Li's avatar
Muyang Li committed
61
};