Unverified commit b361750a, authored by huangtingwei, committed by GitHub
Browse files

Mooncake store get zero copy meta optimization (#9857)

parent 16e56ea6
...@@ -467,6 +467,7 @@ class MHATokenToKVPoolHost(HostKVCache): ...@@ -467,6 +467,7 @@ class MHATokenToKVPoolHost(HostKVCache):
ptr_list = [] ptr_list = []
key_list = [] key_list = []
kv_buffer_data_ptr = self.kv_buffer.data_ptr() kv_buffer_data_ptr = self.kv_buffer.data_ptr()
indices = indices.tolist()
v_offset = ( v_offset = (
self.layer_num self.layer_num
* self.size * self.size
...@@ -706,6 +707,7 @@ class MLATokenToKVPoolHost(HostKVCache): ...@@ -706,6 +707,7 @@ class MLATokenToKVPoolHost(HostKVCache):
ptr_list = [] ptr_list = []
key_list = [] key_list = []
kv_buffer_data_ptr = self.kv_buffer.data_ptr() kv_buffer_data_ptr = self.kv_buffer.data_ptr()
indices = indices.tolist()
for index in range(0, len(indices), self.page_size): for index in range(0, len(indices), self.page_size):
k_ptr = ( k_ptr = (
kv_buffer_data_ptr kv_buffer_data_ptr
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment