Update huggingface.py

4c062d44 · Hailey Schoelkopf · GitHub · 436edcc9 · 4c062d44
Unverified commit 4c062d44, authored Aug 23, 2023 by Hailey Schoelkopf; committed by GitHub on Aug 23, 2023
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 2 deletions

lm_eval/models/huggingface.py (+2 -2)

No files found.
--- a/lm_eval/models/huggingface.py
+++ b/lm_eval/models/huggingface.py
@@ -162,7 +162,7 @@ class HuggingFaceAutoLM(BaseLM):
            gptq_use_triton (bool, optional, defaults to False):
                Use Triton for GPTQ inference.
            inject_fused_attention (bool, optional, defaults to True):
-                Inject fused attention.
+                Inject fused attention into GPTQ model.
            bnb_4bit_quant_type (str, optional, defaults to None):
                The quantization type to use for BnB 4bit quantization. See:
                https://github.com/huggingface/transformers/blob/main/src/transformers/utils/quantization_config.py#L77
@@ -781,4 +781,4 @@ def stop_sequences_criteria(
                for sequence in stop_sequences
            ],
        ]
    )
\ No newline at end of file