test_tokenizer.py 334 Bytes
Newer Older
q.yao's avatar
q.yao committed
1
from lmdeploy.turbomind.tokenizer import Tokenizer
2

q.yao's avatar
q.yao committed
3
4
5
6
7

def main():
    """Round-trip sample prompts through the tokenizer and print the results.

    Builds a ``Tokenizer`` for ``'huggyllama/llama-7b'``, encodes each sample
    prompt, decodes the resulting tokens, and prints the decoded output so the
    round trip can be inspected by eye. Nothing is asserted or returned.
    """
    tokenizer = Tokenizer('huggyllama/llama-7b')

    # One Latin-script prompt and one CJK prompt.
    prompts = ['cest la vie', '上帝已死']
    for prompt in prompts:
        tokens = tokenizer.encode(prompt)
        output = tokenizer.decode(tokens)
        print(output)
q.yao's avatar
q.yao committed
12

13

q.yao's avatar
q.yao committed
14
15
# Run the demo only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()