// reduce.cc
#include "reduce.h"

#include <limits>

namespace op::common_cpu::reduce_op {

// Adds up `len` fp16_t elements, converting each one to float with
// utils::cast<float> and accumulating the total in a float.
//
// data:   pointer to the first element that is read.
// len:    number of elements to visit; when 0, nothing is read and 0 is returned.
// stride: step between consecutive visited elements, measured in elements
//         (it is applied as an index on `data`), and may be negative.
//
// Returns data[0] + data[stride] + ... + data[(len - 1) * stride] as a float.
float sum(const fp16_t *data, size_t len, ptrdiff_t stride) {
    float result = 0;
    for (size_t i = 0; i < len; i++) {
        // Compute the offset in signed arithmetic. Writing `i * stride`
        // directly mixes size_t with ptrdiff_t, which on typical platforms
        // converts a negative stride to a huge unsigned value before it is
        // used as a pointer offset.
        const ptrdiff_t offset = static_cast<ptrdiff_t>(i) * stride;
        result += utils::cast<float>(data[offset]);
    }

    return result;
}

// Finds the largest of `len` fp16_t elements, comparing them as floats
// after conversion with utils::cast<float>.
//
// data:   pointer to the first element that is read.
// len:    number of elements to visit.
// stride: step between consecutive visited elements, measured in elements
//         (it is applied as an index on `data`), and may be negative.
//
// Returns the maximum of data[0], data[stride], ..., data[(len - 1) * stride].
// For len == 0 no element is read and negative infinity (the identity of
// the max reduction) is returned.
float max(const fp16_t *data, size_t len, ptrdiff_t stride) {
    // Guard the seed read below: with no elements, data[0] must not be touched.
    if (len == 0) {
        return -std::numeric_limits<float>::infinity();
    }

    float result = utils::cast<float>(data[0]);
    for (size_t i = 1; i < len; i++) {
        // Compute the offset in signed arithmetic. Writing `i * stride`
        // directly mixes size_t with ptrdiff_t, which on typical platforms
        // converts a negative stride to a huge unsigned value before it is
        // used as a pointer offset.
        const ptrdiff_t offset = static_cast<ptrdiff_t>(i) * stride;
        result = std::max(result, utils::cast<float>(data[offset]));
    }

    return result;
}

// Adds up the squares of `len` fp16_t elements. Each element is converted
// to float with utils::cast<float> first, so both the squaring and the
// accumulation are done in float.
//
// data:   pointer to the first element that is read.
// len:    number of elements to visit; when 0, nothing is read and 0 is returned.
// stride: step between consecutive visited elements, measured in elements
//         (it is applied as an index on `data`), and may be negative.
//
// Returns the float sum of v * v over data[0], data[stride], ...,
// data[(len - 1) * stride].
float sumSquared(const fp16_t *data, size_t len, ptrdiff_t stride) {
    float result = 0;
    for (size_t i = 0; i < len; i++) {
        // Compute the offset in signed arithmetic. Writing `i * stride`
        // directly mixes size_t with ptrdiff_t, which on typical platforms
        // converts a negative stride to a huge unsigned value before it is
        // used as a pointer offset.
        const ptrdiff_t offset = static_cast<ptrdiff_t>(i) * stride;
        const float val = utils::cast<float>(data[offset]);
        result += val * val;
    }

    return result;
}

} // namespace op::common_cpu::reduce_op