"git@developer.sourcefind.cn:orangecat/ollama.git" did not exist on "e592e8fccb390073a51c61a529d4a52529c44aa2"
device.hpp 1.18 KB
Newer Older
Chao Liu's avatar
Chao Liu committed
1
2
#ifndef DEVICE_HPP
#define DEVICE_HPP
3

Chao Liu's avatar
Chao Liu committed
4
#include <memory>
#include <stdexcept>

#include "config.hpp"
6

Chao Liu's avatar
Chao Liu committed
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
// Handle for a raw device-side buffer together with its size.
//
// Every member function is only declared here; the definitions live outside
// this header. The per-member notes below are therefore assumptions drawn from
// the declarations -- TODO confirm against the implementation file.
struct DeviceMem
{
    // A buffer without a size is not allowed.
    DeviceMem() = delete;

    // mem_size: presumably the buffer size in bytes -- confirm.
    DeviceMem(std::size_t mem_size);

    // The struct declares its own destructor and stores a raw buffer pointer,
    // so a member-wise copy would leave two objects holding the same
    // mpDeviceBuf. Copying is disabled to rule that out; declaring these also
    // means no implicit move operations are generated.
    DeviceMem(const DeviceMem&) = delete;
    DeviceMem& operator=(const DeviceMem&) = delete;

    ~DeviceMem();

    // Returns a pointer to the buffer (presumably mpDeviceBuf -- confirm).
    void* GetDeviceBuffer();

    // p: source pointer; presumably mMemSize bytes are transferred from p into
    // the device buffer -- confirm.
    void ToDevice(const void* p);

    // p: destination pointer; presumably mMemSize bytes are transferred from
    // the device buffer into p -- confirm.
    void FromDevice(void* p);

    void* mpDeviceBuf;
    std::size_t mMemSize;
};

// Timer state type. Only forward-declared in this header, so its definition
// has to come from the file that implements KernelTimer.
struct KernelTimerImpl;

// Timer with a Start()/End() bracket and an elapsed-time query.
//
// The constructor and destructor are declared here and defined elsewhere,
// which lets `impl` point at a type that is still incomplete in this header.
struct KernelTimer
{
    KernelTimer();

    // Opens the timed region.
    void Start();

    // Closes the timed region.
    void End();

    // Reports the time measured between Start() and End().
    // NOTE(review): the unit is not visible from this header -- confirm.
    float GetElapsedTime() const;

    ~KernelTimer();

    std::unique_ptr<KernelTimerImpl> impl;
};

Chao Liu's avatar
Chao Liu committed
33
template <typename... Args, typename F>
Chao Liu's avatar
Chao Liu committed
34
float launch_kernel(F kernel, dim3 grid_dim, dim3 block_dim, std::size_t lds_byte, Args... args)
Chao Liu's avatar
Chao Liu committed
35
36
37
{
    KernelTimer timer;

Chao Liu's avatar
Chao Liu committed
38
#if CK_DEVICE_BACKEND_AMD
Chao Liu's avatar
Chao Liu committed
39
40
    timer.Start();

Chao Liu's avatar
Chao Liu committed
41
    hipLaunchKernelGGL(kernel, grid_dim, block_dim, lds_byte, 0, args...);
Chao Liu's avatar
Chao Liu committed
42
43
44
45

    timer.End();

    hipGetErrorString(hipGetLastError());
Chao Liu's avatar
Chao Liu committed
46
#elif CK_DEVICE_BACKEND_NVIDIA
47
48
    const void* f  = reinterpret_cast<const void*>(kernel);
    void* p_args[] = {&args...};
Chao Liu's avatar
Chao Liu committed
49
50
51

    timer.Start();

Chao Liu's avatar
Chao Liu committed
52
    cudaError_t error = cudaLaunchKernel(f, grid_dim, block_dim, p_args, lds_byte, 0);
Chao Liu's avatar
Chao Liu committed
53
54
55
56
57
58
59
60

    timer.End();

    checkCudaErrors(error);
#endif

    return timer.GetElapsedTime();
}
61
62

#endif