init

98957dd7 · luopl · 98957dd7 · 98957dd7 · 98957dd7 · 98957dd7
Commit 98957dd7 authored Aug 28, 2024 by luopl
14 changed files
--- a/mamba_ssm/ops/triton/ssd_combined.py
+++ b/mamba_ssm/ops/triton/ssd_combined.py
--- a/mamba_ssm/ops/triton/ssd_state_passing.py
+++ b/mamba_ssm/ops/triton/ssd_state_passing.py
--- a/mamba_ssm/utils/__init__.py
+++ b/mamba_ssm/utils/__init__.py
--- a/mamba_ssm/utils/generation.py
+++ b/mamba_ssm/utils/generation.py
--- a/mamba_ssm/utils/hf.py
+++ b/mamba_ssm/utils/hf.py
+import json
+import torch
+from transformers.utils import WEIGHTS_NAME, CONFIG_NAME
+from transformers.utils.hub import cached_file
+def load_config_hf(model_name):
+    """Resolve and parse the JSON configuration file for ``model_name``.
+
+    Args:
+        model_name: Identifier handed to ``cached_file`` to locate the file
+            named by ``CONFIG_NAME``.
+
+    Returns:
+        The object produced by parsing the resolved file as JSON.
+    """
+    resolved_archive_file = cached_file(model_name, CONFIG_NAME, _raise_exceptions_for_missing_entries=False)
+    # NOTE(review): with _raise_exceptions_for_missing_entries=False the lookup
+    # presumably yields None for a missing file, in which case open() below
+    # raises -- confirm against the transformers documentation.
+    # The context manager closes the handle deterministically instead of
+    # leaving it to the garbage collector; JSON text is read as UTF-8 rather
+    # than the platform default encoding.
+    with open(resolved_archive_file, encoding="utf-8") as config_file:
+        return json.load(config_file)
+def load_state_dict_hf(model_name, device=None, dtype=None):
+    """Load the weights file for ``model_name`` and cast/move its tensors.
+
+    Args:
+        model_name: Identifier handed to ``cached_file`` to locate the file
+            named by ``WEIGHTS_NAME``.
+        device: Device every tensor is moved to before returning. ``None``
+            leaves tensors where ``torch.load`` placed them.
+        dtype: Dtype every tensor is converted to. ``None`` keeps the stored
+            dtypes.
+
+    Returns:
+        A new dict with the same keys as the loaded checkpoint and the
+        converted tensors as values (assumes the checkpoint is a flat mapping
+        whose values support ``.to`` -- TODO confirm for all checkpoints).
+    """
+    # If not fp32, then we don't want to load directly to the GPU
+    mapped_device = "cpu" if dtype not in [torch.float32, None] else device
+    resolved_archive_file = cached_file(model_name, WEIGHTS_NAME, _raise_exceptions_for_missing_entries=False)
+    # NOTE(security): torch.load unpickles the file; only use checkpoints from
+    # sources you trust.
+    # Bind the result instead of returning it right away: the early return
+    # previously made the dtype/device conversion below unreachable.
+    state_dict = torch.load(resolved_archive_file, map_location=mapped_device)
+    # Convert dtype before moving to GPU to save memory
+    if dtype is not None:
+        state_dict = {k: v.to(dtype=dtype) for k, v in state_dict.items()}
+    state_dict = {k: v.to(device=device) for k, v in state_dict.items()}
+    return state_dict
--- a/model.properties
+++ b/model.properties
+# Unique model identifier
+modelCode=943
+# Model name
+modelName=mamba2_pytorch
+# Model description
+modelDescription=Transformers are SSMs: Generalized Models and Efficient Algorithms Through Structured State Space Duality
+# Application scenarios
+appScenario=推理,科研,制造,医疗,家居,教育
+# Framework type
+frameType=pytorch
--- a/pyproject.toml
+++ b/pyproject.toml
--- a/rocm_patch/rocm6_0.patch
+++ b/rocm_patch/rocm6_0.patch
--- a/setup.py
+++ b/setup.py
--- a/tests/ops/test_selective_scan.py
+++ b/tests/ops/test_selective_scan.py
--- a/tests/ops/triton/test_layernorm_gated.py
+++ b/tests/ops/triton/test_layernorm_gated.py
--- a/tests/ops/triton/test_selective_state_update.py
+++ b/tests/ops/triton/test_selective_state_update.py
--- a/tests/ops/triton/test_ssd.py
+++ b/tests/ops/triton/test_ssd.py
--- a/tests/test_generation.py
+++ b/tests/test_generation.py