// llama_params.h
// Copyright (c) OpenMMLab. All rights reserved.

#pragma once

namespace turbomind {

/// Plain aggregate bundling the attention-related configuration values for a
/// LLaMA-style model.
///
/// The struct declares no constructors and no default member initializers, so
/// a default-initialized instance has indeterminate member values; callers are
/// expected to assign every field (or use aggregate initialization) before
/// reading them.
///
/// NOTE(review): the per-field descriptions below are inferred from the member
/// names only -- confirm against the code that consumes this struct.
struct LlamaAttentionParams {
    /// Presumably the number of per-head dimensions that receive rotary
    /// position embedding. The identifier is misspelled ("rotray"); the
    /// spelling is kept as-is because renaming would break existing users.
    int rotray_embedding_dim;

    /// Presumably the frequency base used for the rotary embedding.
    float rotary_embedding_base;

    /// Presumably the maximum sequence length (in positions) the model was
    /// configured for.
    int max_position_embeddings;

    /// Presumably toggles dynamic NTK scaling of the rotary embedding.
    bool use_dynamic_ntk;

    /// Presumably toggles log-n scaling of attention.
    bool use_logn_attn;
};

}  // namespace turbomind