Unverified commit 15a0b9e5, authored by lukec, committed by GitHub
Browse files

Fix spelling errors (#33978)

parent c490d8cc
...@@ -139,7 +139,7 @@ def prepare_inputs( ...@@ -139,7 +139,7 @@ def prepare_inputs(
masked_m.append(mask.sum()) masked_m.append(mask.sum())
masked_m = torch.tensor(masked_m, dtype=torch.int32) masked_m = torch.tensor(masked_m, dtype=torch.int32)
# Intialize the hidden_states_3d with ones instead of empty to avoid nan # Initialize the hidden_states_3d with ones instead of empty to avoid nan
# issue. # issue.
hidden_states_3d = torch.ones( hidden_states_3d = torch.ones(
(num_experts, max(masked_m), hidden_states.shape[1]), dtype=hidden_states.dtype (num_experts, max(masked_m), hidden_states.shape[1]), dtype=hidden_states.dtype
......
...@@ -334,7 +334,7 @@ def test_batched_moe_align_block_size( ...@@ -334,7 +334,7 @@ def test_batched_moe_align_block_size(
ref_expert_ids = torch.empty((Msum // block_size,), dtype=torch.int32) ref_expert_ids = torch.empty((Msum // block_size,), dtype=torch.int32)
ref_num_tokens_post_pad = torch.empty((1,), dtype=torch.int32) ref_num_tokens_post_pad = torch.empty((1,), dtype=torch.int32)
# Intialize # Initialize
sentinel = E * max_tokens_per_batch sentinel = E * max_tokens_per_batch
ref_sorted_ids.fill_(sentinel) ref_sorted_ids.fill_(sentinel)
ref_expert_ids.fill_(-1) ref_expert_ids.fill_(-1)
......
...@@ -12,7 +12,7 @@ START_REASONING = "<think>\n" ...@@ -12,7 +12,7 @@ START_REASONING = "<think>\n"
START_RESPONSE = "\n</think>\n<answer>\n" START_RESPONSE = "\n</think>\n<answer>\n"
END_RESPONSE = "\n</answer>" END_RESPONSE = "\n</answer>"
NO_REASONING_QUICK_THROUGHT = { NO_REASONING_QUICK_THOUGHT = {
"output": f"{START_REASONING}{START_RESPONSE}This is the rest{END_RESPONSE}", # noqa: E501 "output": f"{START_REASONING}{START_RESPONSE}This is the rest{END_RESPONSE}", # noqa: E501
"reasoning": None, "reasoning": None,
"content": "This is the rest", "content": "This is the rest",
...@@ -81,7 +81,7 @@ TEST_CASES = [ ...@@ -81,7 +81,7 @@ TEST_CASES = [
NO_REASONING, NO_REASONING,
id="no_reasoning", id="no_reasoning",
), ),
pytest.param(False, NO_REASONING_QUICK_THROUGHT, id="no_reasoning_quick"), pytest.param(False, NO_REASONING_QUICK_THOUGHT, id="no_reasoning_quick"),
pytest.param( pytest.param(
False, False,
MULTIPLE_LINES, MULTIPLE_LINES,
...@@ -117,7 +117,7 @@ TEST_CASES = [ ...@@ -117,7 +117,7 @@ TEST_CASES = [
NO_REASONING, NO_REASONING,
id="no_reasoning_streaming", id="no_reasoning_streaming",
), ),
pytest.param(True, NO_REASONING_QUICK_THROUGHT, id="no_reasoning_quick_stream"), pytest.param(True, NO_REASONING_QUICK_THOUGHT, id="no_reasoning_quick_stream"),
pytest.param( pytest.param(
True, True,
MULTIPLE_LINES, MULTIPLE_LINES,
......
...@@ -333,7 +333,7 @@ def select_fp8_moe_backend( ...@@ -333,7 +333,7 @@ def select_fp8_moe_backend(
# TODO(rob): per discussion with TPU team, we need a way to register # TODO(rob): per discussion with TPU team, we need a way to register
# MoE backends by OOT plugins, rather than having an explicit list # MoE backends by OOT plugins, rather than having an explicit list
# of AVAILBLE_BACKENDS. Enabling returning `Fp8MoeBackend.NONE` is # of AVAILABLE_BACKENDS. Enabling returning `Fp8MoeBackend.NONE` is
# a temporary measure until these register APIs are complete. # a temporary measure until these register APIs are complete.
if current_platform.is_cuda() or current_platform.is_rocm(): if current_platform.is_cuda() or current_platform.is_rocm():
raise NotImplementedError( raise NotImplementedError(
......
...@@ -52,8 +52,8 @@ def is_flashmla_dense_supported() -> tuple[bool, str | None]: ...@@ -52,8 +52,8 @@ def is_flashmla_dense_supported() -> tuple[bool, str | None]:
""" """
Return: is_supported_flag, unsupported_reason (optional). Return: is_supported_flag, unsupported_reason (optional).
""" """
is_availble, maybe_reason = _is_flashmla_available() is_available, maybe_reason = _is_flashmla_available()
if not is_availble: if not is_available:
return False, maybe_reason return False, maybe_reason
if not current_platform.is_device_capability_family(90): if not current_platform.is_device_capability_family(90):
return False, "FlashMLA Dense is only supported on Hopper devices." return False, "FlashMLA Dense is only supported on Hopper devices."
...@@ -64,8 +64,8 @@ def is_flashmla_sparse_supported() -> tuple[bool, str | None]: ...@@ -64,8 +64,8 @@ def is_flashmla_sparse_supported() -> tuple[bool, str | None]:
""" """
Return: is_supported_flag, unsupported_reason (optional). Return: is_supported_flag, unsupported_reason (optional).
""" """
is_availble, maybe_reason = _is_flashmla_available() is_available, maybe_reason = _is_flashmla_available()
if not is_availble: if not is_available:
return False, maybe_reason return False, maybe_reason
if not ( if not (
current_platform.is_device_capability_family(90) current_platform.is_device_capability_family(90)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment