# Message stating that MLA models need the global metadata server, with a
# link to the multi-node deployment guide. It is a plain string: the text has
# no placeholders, so an f-string prefix would do nothing.
mla_unsupported_msg = (
    "MLA model is not supported without global metadata server, "
    "please refer to "
    "https://github.com/sgl-project/sglang/blob/main/python/sglang/srt/"
    "mem_cache/storage/hf3fs/docs/deploy_sglang_3fs_multinode.md"
)
...
@@ -213,6 +219,7 @@ class HiCacheHF3FS(HiCacheStorage):
...
@@ -213,6 +219,7 @@ class HiCacheHF3FS(HiCacheStorage):
entries=8,
entries=8,
dtype=dtype,
dtype=dtype,
metadata_client=Hf3fsLocalMetadataClient(),
metadata_client=Hf3fsLocalMetadataClient(),
is_page_first_layout=is_page_first_layout,
)
)
try:
try:
...
@@ -261,6 +268,7 @@ class HiCacheHF3FS(HiCacheStorage):
...
@@ -261,6 +268,7 @@ class HiCacheHF3FS(HiCacheStorage):
dtype=dtype,
dtype=dtype,
metadata_client=metadata_client,
metadata_client=metadata_client,
is_mla_model=is_mla_model,
is_mla_model=is_mla_model,
is_page_first_layout=is_page_first_layout,
)
)
defget(
defget(
...
@@ -407,12 +415,22 @@ class HiCacheHF3FS(HiCacheStorage):
...
@@ -407,12 +415,22 @@ class HiCacheHF3FS(HiCacheStorage):