Add new file

5534ac8e · zhaoying1 · 7a88fd0a · 5534ac8e
Commit 5534ac8e authored Aug 14, 2023 by zhaoying1
Hide whitespace changes
Inline Side-by-side

Showing with 10 additions and 0 deletions

chatglm-6b testing/test_latency.py chatglm-6b testing/test_latency.py +10 -0

No files found.
--- a/chatglm-6b testing/test_latency.py
+++ b/chatglm-6b testing/test_latency.py
+from transformers import AutoModel, AutoTokenizer
+import os
+tokenizer = AutoTokenizer.from_pretrained("/zhaoy/chatglm-6b-moel", trust_remote_code=True)
+model = AutoModel.from_pretrained("/zhaoy/chatglm-6b-moel", trust_remote_code=True).half().cuda()
+model = model.eval()
+text = "你好"
+response, history = model.measure_latency(tokenizer, text, history=[])
+print(response)