"vllm/vscode:/vscode.git/clone" did not exist on "ff36139ffc66294c19b503c1e52dc42c2cd265f6"
Unverified commit 1b962e24, authored by dolpm and committed by GitHub
Browse files

[fix] lora benchmarks pass no_lora_flag_cpu (#23774)


Signed-off-by: Dylan Maloy <34420038+dolpm@users.noreply.github.com>
Co-authored-by: Jee Jee Li <pandaleefree@gmail.com>
parent bfe93801
...@@ -464,7 +464,11 @@ class BenchmarkTensors: ...@@ -464,7 +464,11 @@ class BenchmarkTensors:
for field_name in LoRAKernelMeta.__dataclass_fields__: for field_name in LoRAKernelMeta.__dataclass_fields__:
field = getattr(self.lora_kernel_meta, field_name) field = getattr(self.lora_kernel_meta, field_name)
assert isinstance(field, torch.Tensor) assert isinstance(field, torch.Tensor)
setattr(self.lora_kernel_meta, field_name, to_device(field)) setattr(
self.lora_kernel_meta,
field_name,
to_device(field) if field_name != "no_lora_flag_cpu" else field,
)
def metadata(self) -> tuple[int, int, int]: def metadata(self) -> tuple[int, int, int]:
""" """
...@@ -512,6 +516,7 @@ class BenchmarkTensors: ...@@ -512,6 +516,7 @@ class BenchmarkTensors:
"lora_token_start_loc": self.lora_kernel_meta.lora_token_start_loc, "lora_token_start_loc": self.lora_kernel_meta.lora_token_start_loc,
"lora_ids": self.lora_kernel_meta.active_lora_ids, "lora_ids": self.lora_kernel_meta.active_lora_ids,
"scaling": 1.0, "scaling": 1.0,
"no_lora_flag_cpu": self.lora_kernel_meta.no_lora_flag_cpu,
} }
def as_lora_expand_kwargs(self, add_inputs: bool) -> dict[str, Any]: def as_lora_expand_kwargs(self, add_inputs: bool) -> dict[str, Any]:
...@@ -552,6 +557,7 @@ class BenchmarkTensors: ...@@ -552,6 +557,7 @@ class BenchmarkTensors:
"lora_ids": self.lora_kernel_meta.active_lora_ids, "lora_ids": self.lora_kernel_meta.active_lora_ids,
"offset_start": 0, "offset_start": 0,
"add_inputs": add_inputs, "add_inputs": add_inputs,
"no_lora_flag_cpu": self.lora_kernel_meta.no_lora_flag_cpu,
} }
def bench_fn_kwargs( def bench_fn_kwargs(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment