"vscode:/vscode.git/clone" did not exist on "03fa4d3fb3ddfc9ced960d527d075213f32ecf07"
Commit 5bd9b304 authored by zhuwenwen
Browse files

解决w8a8 pp16开启marlin的oom问题

parent 6a8fd297
......@@ -128,6 +128,7 @@ class CompressedTensorsW8A8Int8MarlinMoEMethod(CompressedTensorsMarlinMoEMethod)
w1_marlin_list.append(w1_marlin_in)
w1_marlin = torch.stack(w1_marlin_list, dim=0)
del w1_marlin_list
w2_marlin_list = []
for ii in range(layer.w2_weight.shape[0]):
w2_marlin_in = get_w8a8_int8_marlin_weights(layer.w2_weight[ii])
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment