[Feature] Initial support for multi-LoRA serving (#1307)

71221692 · Ying Sheng · GitHub · c33d82a2 · 71221692
Unverified commit 71221692, authored Sep 12, 2024 by Ying Sheng; committed by GitHub on Sep 12, 2024
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 0 deletions

test/srt/run_suite.py test/srt/run_suite.py +1 -0

No files found.
--- a/test/srt/run_suite.py
+++ b/test/srt/run_suite.py
@@ -7,6 +7,7 @@ suites = {
    "minimal": [
        "models/test_embedding_models.py",
        "models/test_generation_models.py",
+        "models/test_lora.py",
        "sampling/penaltylib",
        "test_chunked_prefill.py",
        "test_embedding_openai_server.py",