parameters.json 426 Bytes
Newer Older
Rayyyyy's avatar
Rayyyyy committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
{
    "MAX_NEW_TOKENS" : 256,
    "CONCURRENT_LEVELS" : [1, 2, 4, 8, 16, 32, 64, 128, 256],
    "MODEL_PATH" : "meta-llama/Meta-Llama-3-70B-Instruct",
    "MODEL_HEADERS" : {"Content-Type": "application/json"},
    "SAFE_CHECK" : true,
    "THRESHOLD_TPS" : 7,
    "RANDOM_PROMPT_LENGTH" : 1000,
    "TEMPERATURE" : 0.6,
    "TOP_P" : 0.9,
    "MODEL_ENDPOINTS" : [
        "http://localhost:8000/v1/chat/completions"
    ]
}