generate_gemm_config.py 566 Bytes
Newer Older
Li Zhang's avatar
Li Zhang committed
1
2
3
4
5
6
# Copyright (c) OpenMMLab. All rights reserved.

import subprocess
import fire


Li Zhang's avatar
Li Zhang committed
7
def main(head_num: int = 32,
         size_per_head: int = 128,
         vocab_size: int = 32000,
         inter_size: int = 11008,
         tensor_para_size: int = 1,
         max_batch_size: int = 64):
    """Run ``bin/llama_gemm`` once for every batch size up to a maximum.

    The executable is looked up relative to the current working directory
    and is invoked for each batch size ``1, 2, ..., max_batch_size`` with
    the positional arguments::

        <bsz> 1 1 <head_num> <size_per_head> <inter_size> <vocab_size>
        1 <tensor_para_size> <flag>

    where ``<flag>`` is ``0`` for the first batch size and ``1`` afterwards.

    The command is passed as an argument list (no shell), so each value
    reaches the tool as exactly one argument even if it contains spaces or
    shell metacharacters. A non-zero exit status is reported on stderr and
    the sweep continues with the next batch size.

    Args:
        head_num: Forwarded to ``llama_gemm`` as the 4th argument.
        size_per_head: Forwarded to ``llama_gemm`` as the 5th argument.
        vocab_size: Forwarded to ``llama_gemm`` as the 7th argument.
        inter_size: Forwarded to ``llama_gemm`` as the 6th argument.
        tensor_para_size: Forwarded to ``llama_gemm`` as the 9th argument.
        max_batch_size: Largest batch size to run (inclusive). Values below
            1 result in no invocations.

    Raises:
        OSError: If ``bin/llama_gemm`` cannot be started (for example it is
            missing or not executable).
    """
    # Local import: only needed for the failure report below.
    import sys

    for bsz in range(1, max_batch_size + 1):
        # 0 only on the first call, 1 on every later one.
        # NOTE(review): presumably tells llama_gemm whether to append to an
        # existing result file -- confirm against the tool's usage text.
        flag = 0 if bsz == 1 else 1
        argv = ['bin/llama_gemm'] + [
            str(arg) for arg in (bsz, 1, 1, head_num, size_per_head,
                                 inter_size, vocab_size, 1,
                                 tensor_para_size, flag)
        ]
        returncode = subprocess.call(argv)
        if returncode != 0:
            # Surface the failure instead of dropping it silently, but keep
            # going so the remaining batch sizes are still processed.
            print(
                f'bin/llama_gemm exited with status {returncode} '
                f'for batch size {bsz}',
                file=sys.stderr)


# Script entry point: hand `main` to Fire so it can be invoked from the
# command line; nothing runs when this module is merely imported.
if __name__ == '__main__':
    fire.Fire(main)