Commit bad62d59 authored by wangsen
Browse files

Update model/infer_util.py

parent 3fe98be6
...@@ -25,7 +25,7 @@ def get_infer_setting(gpu_device=0, quant=None): ...@@ -25,7 +25,7 @@ def get_infer_setting(gpu_device=0, quant=None):
quantize(model.transformer, quant) quantize(model.transformer, quant)
model.eval() model.eval()
model = model.cuda() model = model.cuda()
tokenizer = AutoTokenizer.from_pretrained("/data", trust_remote_code=True) tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)
return model, tokenizer return model, tokenizer
def is_chinese(text): def is_chinese(text):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment