llama_params.h 262 Bytes
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
// Copyright (c) OpenMMLab. All rights reserved.

#pragma once

namespace turbomind {

/// Attention configuration values bundled into a single plain aggregate.
///
/// Every member carries a default initializer so that a default-initialized
/// instance (`LlamaAttentionParams p;`) holds well-defined values instead of
/// indeterminate ones. The type remains an aggregate (C++14 and later), so
/// positional brace-initialization in declaration order keeps working.
struct LlamaAttentionParams {
    // NOTE(review): "rotray" looks like a misspelling of "rotary"; the name is
    // kept as-is because renaming it would break existing users of this field.
    // Presumably the rotary-embedding dimension -- TODO confirm against readers.
    int  rotray_embedding_dim    = 0;
    // Presumably the maximum number of positions supported -- TODO confirm.
    int  max_position_embeddings = 0;
    // Feature flag; presumably toggles dynamic NTK scaling -- TODO confirm.
    bool use_dynamic_ntk         = false;
    // Feature flag; presumably toggles log-n attention scaling -- TODO confirm.
    bool use_logn_attn           = false;
};

}  // namespace turbomind