// llama_params.h
// Copyright (c) OpenMMLab. All rights reserved.

#pragma once

namespace turbomind {

/// Plain aggregate bundling the attention settings named below.
///
/// Members are declared without default initializers, so a default-initialized
/// instance (`LlamaAttentionParams p;`) holds indeterminate values. Callers
/// must either value-initialize (`LlamaAttentionParams p{};`) or assign every
/// field before reading it. Member order is part of the interface: positional
/// aggregate initialization depends on it.
struct LlamaAttentionParams {
    /// NOTE(review): presumably the number of head dimensions that rotary
    /// position embedding is applied to -- confirm against the consumers.
    int   rotary_embedding_dim;

    /// NOTE(review): presumably the frequency base used by the rotary
    /// embedding -- confirm against the consumers.
    float rotary_embedding_base;

    /// NOTE(review): presumably the maximum position count the model was
    /// configured for -- confirm against the consumers.
    int   max_position_embeddings;

    /// NOTE(review): presumably a scaling factor applied to rotary positions
    /// or frequencies; the exact scheme is not visible here -- confirm.
    float rope_scaling_factor;

    // bool  use_dynamic_ntk;

    /// NOTE(review): presumably toggles log-n attention scaling -- confirm
    /// against the consumers.
    bool  use_logn_attn;
};

}  // namespace turbomind