tensor.cpp 11 KB
Newer Older
PanZezhong's avatar
init  
PanZezhong committed
1
2
#include "../tensor.hpp"
#include "../utils.hpp"
3
#include <algorithm>
PanZezhong's avatar
init  
PanZezhong committed
4
5
#include <fstream>
#include <iostream>
6
#include <mutex>
PanZezhong's avatar
init  
PanZezhong committed
7
#include <numeric>
PanZezhong's avatar
PanZezhong committed
8
#include <sstream>
PanZezhong's avatar
init  
PanZezhong committed
9
10
11
12

std::shared_ptr<TensorDesc>
TensorDesc::create(infiniDtype_t dtype, const std::vector<size_t> &shape,
                   const std::vector<ptrdiff_t> &strides) {
PanZezhong's avatar
PanZezhong committed
13
    return std::shared_ptr<TensorDesc>(new TensorDesc(dtype, shape, strides));
PanZezhong's avatar
init  
PanZezhong committed
14
15
}

16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
std::shared_ptr<TensorDesc>
TensorDesc::create(infiniDtype_t dtype, const std::vector<size_t> &shape) {
    auto ndim = shape.size();
    auto strides = std::vector<ptrdiff_t>(ndim);
    if (ndim > 0) {
        strides[ndim - 1] = 1;
        for (int i = ndim - 2; i >= 0; i--) {
            strides[i] = strides[i + 1] * shape[i + 1];
        }
    }
    return create(dtype, shape, strides);
}

std::shared_ptr<TensorDesc>
TensorDesc::createWithOrder(infiniDtype_t dtype, const std::vector<size_t> &shape,
                            const std::vector<size_t> &order) {
    ASSERT_EQ(shape.size(), order.size());
    auto ndim = shape.size();
    if (ndim == 0) {
        return create(dtype, shape);
    }
    auto strides = std::vector<ptrdiff_t>(order.size());
    auto idx = std::find(order.begin(), order.end(), size_t(ndim - 1));
    strides[std::distance(order.begin(), idx)] = 1;
    for (int i = ndim - 2; i >= 0; i--) {
        auto prev_dim = shape[std::distance(order.begin(), idx)];
        auto prev_stride = strides[std::distance(order.begin(), idx)];
        idx = std::find(order.begin(), order.end(), size_t(i));
        strides[std::distance(order.begin(), idx)] = prev_stride * prev_dim;
    }
    return create(dtype, shape, strides);
}

PanZezhong's avatar
PanZezhong committed
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
infiniopTensorDescriptor_t TensorDesc::desc() const {
    if (_desc == nullptr) {
        RUN_INFINI(infiniopCreateTensorDescriptor(
            (infiniopTensorDescriptor_t *)(&_desc), _shape.size(), _shape.data(),
            _strides.data(), _dtype));
    }
    return _desc;
};

void TensorDesc::resetDesc() {
    if (this->_desc != nullptr) {
        infiniopDestroyTensorDescriptor(this->_desc);
        this->_desc = nullptr;
    }
}

bool TensorDesc::isContigous() const {
    auto ndim = this->ndim();
    auto shape = this->shape();
    auto strides = std::vector<ptrdiff_t>(ndim);
    strides[ndim - 1] = 1;
    for (int i = ndim - 2; i >= 0; i--) {
        strides[i] = strides[i + 1] * shape[i + 1];
    }
    ASSERT_EQ(strides.size(), this->_strides.size());
    return std::equal(strides.begin(), strides.end(), this->_strides.begin());
}

std::string TensorDesc::info() const {
    std::stringstream ss;

    ss << "Tensor: "
       << "shape[ ";
    for (auto s : this->shape()) {
        ss << s << " ";
    }
    ss << "] strides[ ";
    for (auto s : this->strides()) {
        ss << s << " ";
    }
    ss << "] dtype=" << this->dtype();

    return ss.str();
}

PanZezhong's avatar
init  
PanZezhong committed
94
TensorDesc::~TensorDesc() {
PanZezhong's avatar
PanZezhong committed
95
    this->resetDesc();
PanZezhong's avatar
init  
PanZezhong committed
96
97
}

PanZezhong's avatar
PanZezhong committed
98
99
100
101
102
103
const std::vector<size_t> &Tensor::shape() const { return this->_desc->shape(); }
const std::vector<ptrdiff_t> &Tensor::strides() const { return this->_desc->strides(); }
size_t Tensor::ndim() const { return this->_desc->ndim(); }
infiniDtype_t Tensor::dtype() const { return this->_desc->dtype(); }
infiniDevice_t Tensor::deviceType() const { return this->_storage->deviceType(); }
int Tensor::deviceId() const { return this->_storage->deviceId(); }
PanZezhong's avatar
init  
PanZezhong committed
104
105
Tensor::~Tensor() {}

PanZezhong's avatar
PanZezhong committed
106
ptrdiff_t Tensor::dataOffset() const {
PanZezhong's avatar
PanZezhong committed
107
    return _offset;
PanZezhong's avatar
init  
PanZezhong committed
108
109
}

PanZezhong's avatar
PanZezhong committed
110
infiniopTensorDescriptor_t Tensor::desc() const { return _desc->desc(); }
wooway777's avatar
wooway777 committed
111
std::shared_ptr<TensorDesc> Tensor::tdesc() const { return _desc; }
PanZezhong's avatar
init  
PanZezhong committed
112
113
114

std::shared_ptr<Tensor> Tensor::buffer(infiniDtype_t dtype,
                                       const std::vector<size_t> &shape,
thatPepe's avatar
thatPepe committed
115
                                       std::shared_ptr<MemoryPool> pool) {
PanZezhong's avatar
init  
PanZezhong committed
116
117
    std::shared_ptr<Tensor> tensor = std::make_shared<Tensor>();
    auto ndim = shape.size();
PanZezhong's avatar
PanZezhong committed
118

PanZezhong's avatar
init  
PanZezhong committed
119
120
    size_t size = std::accumulate(shape.begin(), shape.end(), dsize(dtype), std::multiplies<size_t>());
    auto strides = std::vector<ptrdiff_t>(ndim);
PanZezhong's avatar
PanZezhong committed
121
122
123
124
125
    if (ndim > 0) {
        strides[ndim - 1] = 1;
        for (int i = ndim - 2; i >= 0; i--) {
            strides[i] = strides[i + 1] * shape[i + 1];
        }
PanZezhong's avatar
init  
PanZezhong committed
126
    }
thatPepe's avatar
thatPepe committed
127
    tensor->_storage = Storage::createFromPool(size, pool);
PanZezhong's avatar
PanZezhong committed
128
    tensor->_desc = TensorDesc::create(dtype, shape, strides);
PanZezhong's avatar
init  
PanZezhong committed
129
130
131
132
133
134
135
136
137
138
    tensor->_offset = 0;
    return tensor;
}

std::shared_ptr<Tensor> Tensor::weight(void *data, infiniDtype_t dtype,
                                       const std::vector<size_t> &shape) {
    std::shared_ptr<Tensor> tensor = std::make_shared<Tensor>();
    auto ndim = shape.size();
    size_t size = std::accumulate(shape.begin(), shape.end(), dsize(dtype), std::multiplies<size_t>());
    auto strides = std::vector<ptrdiff_t>(ndim);
PanZezhong's avatar
PanZezhong committed
139
140
141
142
143
    if (ndim > 0) {
        strides[ndim - 1] = 1;
        for (int i = ndim - 2; i >= 0; i--) {
            strides[i] = strides[i + 1] * shape[i + 1];
        }
PanZezhong's avatar
init  
PanZezhong committed
144
    }
PanZezhong's avatar
PanZezhong committed
145

PanZezhong's avatar
PanZezhong committed
146
    tensor->_storage = Storage::create(size);
PanZezhong's avatar
PanZezhong committed
147
    tensor->_desc = TensorDesc::create(dtype, shape, strides);
148
149
150
151
152
153
154
    // NOTE: 为兼容部分平台(沐曦)多线程并发对同一host数据执行memcpy卡死问题
    static std::mutex mutex;
    {
        std::lock_guard<std::mutex> lock(mutex);
        RUN_INFINI(infinirtMemcpy(tensor->_storage->memory(),
                                  data, size, INFINIRT_MEMCPY_H2D));
    }
PanZezhong's avatar
PanZezhong committed
155

PanZezhong's avatar
init  
PanZezhong committed
156
157
158
159
    tensor->_offset = 0;
    return tensor;
}

PanZezhong's avatar
PanZezhong committed
160
161
std::shared_ptr<Tensor> Tensor::memShare(const std::vector<size_t> &shape, infiniDtype_t dtype_) const {
    auto dtype = dtype_ == INFINI_DTYPE_INVALID ? this->dtype() : dtype_;
162
    size_t size = std::accumulate(shape.begin(), shape.end(), dsize(dtype), std::multiplies<size_t>());
PanZezhong's avatar
PanZezhong committed
163
    ASSERT(size <= this->_storage->size());
164
165
166
167
168
169
170
171
172
173
174
175

    std::shared_ptr<Tensor> tensor = std::make_shared<Tensor>();
    auto ndim = shape.size();
    auto strides = std::vector<ptrdiff_t>(ndim);
    if (ndim > 0) {
        strides[ndim - 1] = 1;
        for (int i = ndim - 2; i >= 0; i--) {
            strides[i] = strides[i + 1] * shape[i + 1];
        }
    }
    tensor->_storage = this->_storage;
    tensor->_offset = 0;
PanZezhong's avatar
PanZezhong committed
176
    tensor->_desc = TensorDesc::create(dtype, shape, strides);
177
178
179
    return tensor;
}

PanZezhong's avatar
PanZezhong committed
180
void *Tensor::dataImpl(ptrdiff_t offset) const {
PanZezhong's avatar
PanZezhong committed
181
    return (char *)(this->_storage->memory()) + this->_offset + offset * dsize(this->dtype());
PanZezhong's avatar
init  
PanZezhong committed
182
183
184
}

void *Tensor::data(ptrdiff_t offset) {
PanZezhong's avatar
PanZezhong committed
185
    return this->dataImpl(offset);
PanZezhong's avatar
init  
PanZezhong committed
186
187
188
}

const void *Tensor::data(ptrdiff_t offset) const {
PanZezhong's avatar
PanZezhong committed
189
    return this->dataImpl(offset);
PanZezhong's avatar
init  
PanZezhong committed
190
191
}

PanZezhong's avatar
PanZezhong committed
192
193
void Tensor::copyFrom(std::shared_ptr<Tensor const> src,
                      infiniopHandle_t handle, infinirtStream_t stream) {
PanZezhong's avatar
init  
PanZezhong committed
194
195
196
197
    ASSERT_EQ(this->shape(), src->shape());
    ASSERT_EQ(this->dtype(), src->dtype());
    infiniopRearrangeDescriptor_t desc;
    RUN_INFINI(infiniopCreateRearrangeDescriptor(
PanZezhong's avatar
PanZezhong committed
198
        handle, &desc, this->desc(), src->desc()));
PanZezhong's avatar
init  
PanZezhong committed
199
200
201
202
203
    RUN_INFINI(infiniopRearrange(desc, this->data(), src->data(),
                                 stream));
    RUN_INFINI(infiniopDestroyRearrangeDescriptor(desc));
}

PanZezhong's avatar
PanZezhong committed
204
205
bool Tensor::isContigous() const {
    return this->_desc->isContigous();
PanZezhong's avatar
init  
PanZezhong committed
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
}

template <typename T>
void print_data(T *data, const std::vector<size_t> &shape,
                const std::vector<ptrdiff_t> &strides, size_t dim) {
    if (dim == shape.size() - 1) {
        for (size_t i = 0; i < shape[dim]; i++) {
            std::cout << data[i] << " ";
        }
        std::cout << std::endl;
    } else if (dim < shape.size() - 1) {
        for (size_t i = 0; i < shape[dim]; i++) {
            print_data(data + i * strides[dim], shape, strides, dim + 1);
        }
    }
}

template <>
void print_data(uint16_t const *data, const std::vector<size_t> &shape,
                const std::vector<ptrdiff_t> &strides, size_t dim) {
    if (dim == shape.size() - 1) {
        for (size_t i = 0; i < shape[dim]; i++) {
            std::cout << f16_to_f32(data[i * strides[dim]]) << " ";
        }
PanZezhong's avatar
PanZezhong committed
230
        std::cout << std::endl;
PanZezhong's avatar
init  
PanZezhong committed
231
232
233
234
235
236
237
    } else if (dim < shape.size() - 1) {
        for (size_t i = 0; i < shape[dim]; i++) {
            print_data(data + i * strides[dim], shape, strides, dim + 1);
        }
    }
}

PanZezhong's avatar
PanZezhong committed
238
239
240
241
242
243
244
245
246
247
248
249
250
251
void print_data_bf16(uint16_t const *data, const std::vector<size_t> &shape,
                     const std::vector<ptrdiff_t> &strides, size_t dim) {
    if (dim == shape.size() - 1) {
        for (size_t i = 0; i < shape[dim]; i++) {
            std::cout << bf16_to_f32(data[i * strides[dim]]) << " ";
        }
        std::cout << std::endl;
    } else if (dim < shape.size() - 1) {
        for (size_t i = 0; i < shape[dim]; i++) {
            print_data(data + i * strides[dim], shape, strides, dim + 1);
        }
    }
}

PanZezhong's avatar
PanZezhong committed
252
253
254
255
std::string Tensor::info() const {
    std::stringstream ss;

    ss << "Tensor: "
PanZezhong's avatar
PanZezhong committed
256
       << this->_desc->info()
PanZezhong's avatar
PanZezhong committed
257
258
       << " device=" << this->deviceType()
       << " device_id=" << this->deviceId();
PanZezhong's avatar
PanZezhong committed
259
    return this->_desc->info();
PanZezhong's avatar
PanZezhong committed
260
261
262
}

void Tensor::debug(const std::string &filename) const {
PanZezhong's avatar
PanZezhong committed
263
264
    RUN_INFINI(infinirtDeviceSynchronize());

PanZezhong's avatar
PanZezhong committed
265
    std::cout << info() << std::endl;
PanZezhong's avatar
PanZezhong committed
266

PanZezhong's avatar
init  
PanZezhong committed
267
    void const *cpu_data;
PanZezhong's avatar
PanZezhong committed
268
    if (this->deviceType() != INFINI_DEVICE_CPU) {
PanZezhong's avatar
PanZezhong committed
269
270
271
        void *cpu_memory = std::malloc(this->_storage->size());
        RUN_INFINI(infinirtMemcpy(cpu_memory, this->_storage->memory(),
                                  this->_storage->size(), INFINIRT_MEMCPY_D2H));
PanZezhong's avatar
init  
PanZezhong committed
272
273
        cpu_data = cpu_memory;
    } else {
PanZezhong's avatar
PanZezhong committed
274
        cpu_data = this->_storage->memory();
PanZezhong's avatar
init  
PanZezhong committed
275
276
277
278
279
280
281
282
    }

    if (!filename.empty()) {
        std::ofstream outFile(filename, std::ios::binary);
        if (!outFile) {
            std::cerr << "Error opening file for writing: " << filename << "\n";
            return;
        }
PanZezhong's avatar
PanZezhong committed
283
        outFile.write(reinterpret_cast<const char *>(cpu_data), this->_storage->size());
PanZezhong's avatar
init  
PanZezhong committed
284
285
286
287
288
        outFile.close();
        std::cout << "Data written to file: " << filename << "\n";
        return;
    }

PanZezhong's avatar
PanZezhong committed
289
    switch (this->dtype()) {
PanZezhong's avatar
init  
PanZezhong committed
290
    case INFINI_DTYPE_F16:
PanZezhong's avatar
PanZezhong committed
291
        print_data((uint16_t const *)((char const *)cpu_data + dataOffset()),
PanZezhong's avatar
init  
PanZezhong committed
292
293
294
                   this->shape(), this->strides(), 0);
        break;
    case INFINI_DTYPE_F32:
PanZezhong's avatar
PanZezhong committed
295
        print_data((float const *)((char const *)cpu_data + dataOffset()),
PanZezhong's avatar
init  
PanZezhong committed
296
297
298
                   this->shape(), this->strides(), 0);
        break;
    case INFINI_DTYPE_U64:
PanZezhong's avatar
PanZezhong committed
299
        print_data((uint64_t const *)((char const *)cpu_data + dataOffset()),
PanZezhong's avatar
init  
PanZezhong committed
300
301
302
                   this->shape(), this->strides(), 0);
        break;
    case INFINI_DTYPE_I64:
PanZezhong's avatar
PanZezhong committed
303
        print_data((int64_t const *)((char const *)cpu_data + dataOffset()),
PanZezhong's avatar
init  
PanZezhong committed
304
305
306
                   this->shape(), this->strides(), 0);
        break;
    case INFINI_DTYPE_U32:
PanZezhong's avatar
PanZezhong committed
307
        print_data((uint32_t const *)((char const *)cpu_data + dataOffset()),
PanZezhong's avatar
init  
PanZezhong committed
308
309
310
                   this->shape(), this->strides(), 0);
        break;
    case INFINI_DTYPE_I32:
PanZezhong's avatar
PanZezhong committed
311
        print_data((int32_t const *)((char const *)cpu_data + dataOffset()),
PanZezhong's avatar
init  
PanZezhong committed
312
313
                   this->shape(), this->strides(), 0);
        break;
PanZezhong's avatar
PanZezhong committed
314
315
316
317
    case INFINI_DTYPE_BF16:
        print_data_bf16((uint16_t const *)((char const *)cpu_data + dataOffset()),
                        this->shape(), this->strides(), 0);
        break;
PanZezhong's avatar
init  
PanZezhong committed
318
319
320
321
322
323
    default:
        PANIC("Unsupported data type");
    }
}

void Tensor::debug() const { this->debug(""); }