// utils.hpp
#ifndef __INFINIOPTEST_UTILS_HPP__
#define __INFINIOPTEST_UTILS_HPP__
#include "../../utils.h"
#include "gguf.hpp"
#include <cstddef>
#include <cstdint>
#include <cstring>
#include <iostream>
#include <stdexcept>

#define CHECK_OR(cmd, action) CHECK_API_OR(cmd, INFINI_STATUS_SUCCESS, action)

inline double getVal(void *ptr, GGML_TYPE ggml_type) {
    switch (ggml_type) {
12
13
    case GGML_TYPE_BF16:
        return utils::cast<float>(*(bf16_t *)ptr);
14
    case GGML_TYPE_F16:
15
        return utils::cast<float>(*(fp16_t *)ptr);
16
17
18
19
    case GGML_TYPE_F32:
        return *(float *)ptr;
    case GGML_TYPE_F64:
        return *(double *)ptr;
20
21
    case GGML_TYPE_Q8_K:
        return *(bool *)ptr;
22
23
24
25
26
27
28
29
30
31
32
33
34
    case GGML_TYPE_I8:
        return *(int8_t *)ptr;
    case GGML_TYPE_I16:
        return *(int16_t *)ptr;
    case GGML_TYPE_I32:
        return *(int32_t *)ptr;
    case GGML_TYPE_I64:
        return (double)(*(int64_t *)ptr);
    default:
        throw std::runtime_error("Unsupported data type");
    }
}

35
36
inline size_t ggmlSizeOf(GGML_TYPE ggml_type) {
    switch (ggml_type) {
37
38
    case GGML_TYPE_BF16:
        return sizeof(bf16_t);
39
40
41
42
43
44
    case GGML_TYPE_F16:
        return sizeof(fp16_t);
    case GGML_TYPE_F32:
        return sizeof(float);
    case GGML_TYPE_F64:
        return sizeof(double);
45
46
    case GGML_TYPE_Q8_K:
        return sizeof(bool);
47
48
49
50
51
52
53
54
55
56
57
58
59
    case GGML_TYPE_I8:
        return sizeof(int8_t);
    case GGML_TYPE_I16:
        return sizeof(int16_t);
    case GGML_TYPE_I32:
        return sizeof(int32_t);
    case GGML_TYPE_I64:
        return sizeof(int64_t);
    default:
        throw std::runtime_error("Unsupported data type");
    }
}

#endif // __INFINIOPTEST_UTILS_HPP__