"...git@developer.sourcefind.cn:wangsen/paddle_dbnet.git" did not exist on "2c2918f27af33aa57eb125f9932ac651f3f5f415"
Unverified Commit 02300273 authored by Ella Charlaix's avatar Ella Charlaix Committed by GitHub
Browse files

🚨 Remove dataset with restrictive license (#31452)

remove dataset with restrictive license
parent a14b055b
...@@ -543,7 +543,7 @@ class GPTQConfig(QuantizationConfigMixin): ...@@ -543,7 +543,7 @@ class GPTQConfig(QuantizationConfigMixin):
using the [`~PreTrainedTokenizer.save_pretrained`] method, e.g., `./my_model_directory/`. using the [`~PreTrainedTokenizer.save_pretrained`] method, e.g., `./my_model_directory/`.
dataset (`Union[List[str]]`, *optional*): dataset (`Union[List[str]]`, *optional*):
The dataset used for quantization. You can provide your own dataset in a list of string or just use the The dataset used for quantization. You can provide your own dataset in a list of string or just use the
original datasets used in GPTQ paper ['wikitext2','c4','c4-new','ptb','ptb-new'] original datasets used in GPTQ paper ['wikitext2','c4','c4-new']
group_size (`int`, *optional*, defaults to 128): group_size (`int`, *optional*, defaults to 128):
The group size to use for quantization. Recommended value is 128 and -1 uses per-column quantization. The group size to use for quantization. Recommended value is 128 and -1 uses per-column quantization.
damp_percent (`float`, *optional*, defaults to 0.1): damp_percent (`float`, *optional*, defaults to 0.1):
...@@ -652,15 +652,20 @@ class GPTQConfig(QuantizationConfigMixin): ...@@ -652,15 +652,20 @@ class GPTQConfig(QuantizationConfigMixin):
raise ValueError("damp_percent must between 0 and 1.") raise ValueError("damp_percent must between 0 and 1.")
if self.dataset is not None: if self.dataset is not None:
if isinstance(self.dataset, str): if isinstance(self.dataset, str):
if self.dataset not in ["wikitext2", "c4", "c4-new", "ptb", "ptb-new"]: if self.dataset in ["ptb", "ptb-new"]:
raise ValueError(
f"""{self.dataset} dataset was deprecated. You can only choose between
['wikitext2','c4','c4-new']"""
)
if self.dataset not in ["wikitext2", "c4", "c4-new"]:
raise ValueError( raise ValueError(
f"""You have entered a string value for dataset. You can only choose between f"""You have entered a string value for dataset. You can only choose between
['wikitext2','c4','c4-new','ptb','ptb-new'], but we found {self.dataset}""" ['wikitext2','c4','c4-new'], but we found {self.dataset}"""
) )
elif not isinstance(self.dataset, list): elif not isinstance(self.dataset, list):
raise ValueError( raise ValueError(
f"""dataset needs to be either a list of string or a value in f"""dataset needs to be either a list of string or a value in
['wikitext2','c4','c4-new','ptb','ptb-new'], but we found {self.dataset}""" ['wikitext2','c4','c4-new'], but we found {self.dataset}"""
) )
if self.disable_exllama is None and self.use_exllama is None: if self.disable_exllama is None and self.use_exllama is None:
......
...@@ -46,7 +46,6 @@ class GPTQConfigTest(unittest.TestCase): ...@@ -46,7 +46,6 @@ class GPTQConfigTest(unittest.TestCase):
with self.assertRaises(ValueError): with self.assertRaises(ValueError):
GPTQConfig(bits=2, dataset="auto_gpt") GPTQConfig(bits=2, dataset="auto_gpt")
GPTQConfig(bits=2, dataset="c4") GPTQConfig(bits=2, dataset="c4")
GPTQConfig(bits=2, dataset="ptb-new")
def test_damp_percent(self): def test_damp_percent(self):
with self.assertRaises(ValueError): with self.assertRaises(ValueError):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment