"tests/vscode:/vscode.git/clone" did not exist on "16422ea76f213f5b1035513b441245b19ca5bdce"
Commit fca7ef19 authored by zhuwenwen's avatar zhuwenwen
Browse files

Merge branch 'vllm-v0.3.3-dtk24.04'

parents be0a159d 5c4471ef
......@@ -76,6 +76,9 @@ def get_model(model_config: ModelConfig, device_config: DeviceConfig,
f"{supported_dtypes}")
linear_method = quant_config.get_linear_method()
if linear_method != None:
os.environ['LLAMA_NN'] = '0'
with _set_default_torch_dtype(model_config.dtype):
# Create a model instance.
# The weights will be initialized as empty tensors.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment