"vscode:/vscode.git/clone" did not exist on "30fe765e9facf8892bc0261a6ae234c286b7d802"
Commit 9f7f976c authored by zhuwenwen
Browse files

修改 triton 量化 w8a8 config 的命名方式

add deps of pd-pp
parent 81eaff62
...@@ -24,6 +24,9 @@ numa ...@@ -24,6 +24,9 @@ numa
pytrie pytrie
setuptools_scm>=8 setuptools_scm>=8
cmake==3.29 cmake==3.29
quart
fastrlock==0.8.3
cupy==12.3.0
torch == 2.5.1 torch == 2.5.1
triton == 3.1 triton == 3.1
......
...@@ -2309,9 +2309,10 @@ class W8a8GetCacheJSON: ...@@ -2309,9 +2309,10 @@ class W8a8GetCacheJSON:
self.triton_json_list=[] self.triton_json_list=[]
self.weight_shapes=[] self.weight_shapes=[]
self.moe_weight_shapes=[] self.moe_weight_shapes=[]
device_name = current_platform.get_device_name().replace(" ", "_") arch_name = torch.cuda.get_device_properties("cuda").gcnArchName.split(':')[0]
if 'K100_AI' in device_name and torch.cuda.get_device_properties(torch.cuda.current_device()).multi_processor_count == 120: arch_cu = torch.cuda.get_device_properties(torch.cuda.current_device()).multi_processor_count
device_name='K100_AI_120'
device_name =arch_name+'_'+str(arch_cu)+'cu'
self.device_name=device_name self.device_name=device_name
self.topk=1 self.topk=1
self.quant_method=None self.quant_method=None
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment