[Doc] Fix typo (#11666)

Signed-off-by: Kazuhiro Serizawa <nserihiro@gmail.com>

[Doc] Fix typo (#11666)
Signed-off-by: Kazuhiro Serizawa <nserihiro@gmail.com>
6d70198b · Kazuhiro Serizawa · GitHub · f962f426 · 6d70198b · 6d70198b
Unverified commit 6d70198b, authored Jan 01, 2025 by Kazuhiro Serizawa; committed by GitHub on Jan 01, 2025.
Showing 2 changed files with 2 additions and 2 deletions

vllm/model_executor/layers/rejection_sampler.py (+1 -1)

vllm/v1/sample/ops/topk_topp_sampler.py (+1 -1)

No files found.
--- a/vllm/model_executor/layers/rejection_sampler.py
+++ b/vllm/model_executor/layers/rejection_sampler.py
@@ -39,7 +39,7 @@ class RejectionSampler(SpecDecodeStochasticBaseSampler):
            strict_mode: Whether or not to perform shape/device/dtype checks
            during sampling. This catches correctness issues but adds
            nontrivial latency.
-            use_falshinfer: We will use this parameter to determine whether
+            use_flashinfer: We will use this parameter to determine whether
            to use the FlashInfer rejection sampling kernel or not. If it's
            None, we will use the default value from the environment variable.
            This parameter is only used for testing purposes.

--- a/vllm/v1/sample/ops/topk_topp_sampler.py
+++ b/vllm/v1/sample/ops/topk_topp_sampler.py
@@ -44,7 +44,7 @@ class TopKTopPSampler(nn.Module):
                logger.warning(
                    "FlashInfer is not available. Falling back to the PyTorch-"
                    "native implementation of top-p & top-k sampling. For the "
-                    "best performance, please install FalshInfer.")
+                    "best performance, please install FlashInfer.")
                self.forward = self.forward_native
        else:
            self.forward = self.forward_native