sampling_ext.cpp 1.47 KB
Newer Older
1
2
3
4
// TODO: this is a temporary wrapper to allow calling C++ code from CGo
#include "sampling.h"
#include "sampling_ext.h"

5
6
struct gpt_sampler *gpt_sampler_cinit(
    const struct llama_model *model, struct gpt_sampler_cparams *params)
7
{
8
    gpt_sampler_params sparams;
9
10
11
12
    sparams.top_k = params->top_k;
    sparams.top_p = params->top_p;
    sparams.min_p = params->min_p;
    sparams.tfs_z = params->tfs_z;
13
    sparams.typ_p = params->typical_p;
14
15
16
17
18
19
20
21
22
23
24
    sparams.temp = params->temp;
    sparams.penalty_last_n = params->penalty_last_n;
    sparams.penalty_repeat = params->penalty_repeat;
    sparams.penalty_freq = params->penalty_freq;
    sparams.penalty_present = params->penalty_present;
    sparams.mirostat = params->mirostat;
    sparams.mirostat_tau = params->mirostat_tau;
    sparams.mirostat_eta = params->mirostat_eta;
    sparams.penalize_nl = params->penalize_nl;
    sparams.seed = params->seed;
    sparams.grammar = params->grammar;
25
    return gpt_sampler_init(model, sparams);
26
27
}

28
void gpt_sampler_cfree(struct gpt_sampler *sampler)
29
{
30
    gpt_sampler_free(sampler);
31
32
}

33
void gpt_sampler_creset(struct gpt_sampler *sampler)
34
{
35
    gpt_sampler_reset(sampler);
36
37
}

38
39
llama_token gpt_sampler_csample(
    struct gpt_sampler *sampler,
40
41
42
    struct llama_context *ctx_main,
    int idx)
{
43
    return gpt_sampler_sample(sampler, ctx_main, idx);
44
45
}

46
47
void gpt_sampler_caccept(
    struct gpt_sampler *sampler,
48
49
50
    llama_token id,
    bool apply_grammar)
{
51
    gpt_sampler_accept(sampler, id, apply_grammar);
52
}