Update kv_cache.py

eb188324 · xuxzh1 · aa6b01c6 · eb188324
Commit eb188324 authored Feb 26, 2025 by xuxzh1 🎱
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 1 deletion

server/text_generation_server/layers/attention/kv_cache.py +1 -1

No files found.
--- a/server/text_generation_server/layers/attention/kv_cache.py
+++ b/server/text_generation_server/layers/attention/kv_cache.py
@@ -215,7 +215,7 @@ def paged_reshape_and_cache(
            raise ImportError(
                f"Could not import vllm paged attention. Make sure your installation is correct. Complete error: {e}"
            )
-        ops.reshape_and_cache(key, value, key_cache, value_cache, slots, "auto", 1.0)
+        ops.reshape_and_cache(key, value, key_cache, value_cache, slots, "auto", 1.0, 1.0)
    elif SYSTEM == "ipex":
        import intel_extension_for_pytorch as ipex