sampling_ext.cpp 2.2 KB
Newer Older
1
2
3
// TODO: this is a temporary wrapper to allow calling C++ code from CGo
#include "sampling.h"
#include "sampling_ext.h"
4
#include "json-schema-to-grammar.h"
5

6
7
struct gpt_sampler *gpt_sampler_cinit(
    const struct llama_model *model, struct gpt_sampler_cparams *params)
8
{
9
10
    try
    {
Jesse Gross's avatar
Jesse Gross committed
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
        gpt_sampler_params sparams;
        sparams.top_k = params->top_k;
        sparams.top_p = params->top_p;
        sparams.min_p = params->min_p;
        sparams.tfs_z = params->tfs_z;
        sparams.typ_p = params->typical_p;
        sparams.temp = params->temp;
        sparams.penalty_last_n = params->penalty_last_n;
        sparams.penalty_repeat = params->penalty_repeat;
        sparams.penalty_freq = params->penalty_freq;
        sparams.penalty_present = params->penalty_present;
        sparams.mirostat = params->mirostat;
        sparams.mirostat_tau = params->mirostat_tau;
        sparams.mirostat_eta = params->mirostat_eta;
        sparams.penalize_nl = params->penalize_nl;
        sparams.seed = params->seed;
        sparams.grammar = params->grammar;
        return gpt_sampler_init(model, sparams);
29
30
31
    }
    catch (const std::exception &err)
    {
Jesse Gross's avatar
Jesse Gross committed
32
33
        return nullptr;
    }
34
35
}

36
void gpt_sampler_cfree(struct gpt_sampler *sampler)
37
{
38
    gpt_sampler_free(sampler);
39
40
}

41
void gpt_sampler_creset(struct gpt_sampler *sampler)
42
{
43
    gpt_sampler_reset(sampler);
44
45
}

46
47
llama_token gpt_sampler_csample(
    struct gpt_sampler *sampler,
48
49
50
    struct llama_context *ctx_main,
    int idx)
{
51
    return gpt_sampler_sample(sampler, ctx_main, idx);
52
53
}

54
55
void gpt_sampler_caccept(
    struct gpt_sampler *sampler,
56
57
58
    llama_token id,
    bool apply_grammar)
{
59
    gpt_sampler_accept(sampler, id, apply_grammar);
60
}
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81

int schema_to_grammar(const char *json_schema, char *grammar, size_t max_len)
{
    try
    {
        nlohmann::json schema = nlohmann::json::parse(json_schema);
        std::string grammar_str = json_schema_to_grammar(schema);
        size_t len = grammar_str.length();
        if (len >= max_len)
        {
            len = max_len - 1;
        }
        strncpy(grammar, grammar_str.c_str(), len);
        return len;
    }
    catch (const std::exception &e)
    {
        strncpy(grammar, "", max_len - 1);
        return 0;
    }
}