Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
AutoAWQ
Commits
c58ec73b
Commit
c58ec73b
authored
Sep 09, 2023
by
Casper Hansen
Browse files
Remove warnings about GEMM
parent
ebbbc3a5
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
0 additions
and
9 deletions
+0
-9
awq/models/base.py
awq/models/base.py
+0
-9
No files found.
awq/models/base.py
View file @
c58ec73b
...
...
@@ -44,10 +44,6 @@ class BaseAWQForCausalLM(nn.Module):
calib_data
=
"pileval"
):
self
.
quant_config
=
quant_config
quant_config
[
"version"
]
=
"GEMM"
if
'version'
not
in
quant_config
.
keys
()
else
quant_config
[
"version"
]
if
quant_config
[
"version"
]
==
"GEMM"
:
logging
.
warning
(
'Deprecated model weight format. Re-quantize '
'your weights again with version="GEMV" for a speedup. '
'In the next AutoAWQ version, GEMM will be deprecated.'
)
if
run_search
:
self
.
search_result
=
self
.
_awq_search
(
tokenizer
,
quant_config
,
n_samples
=
n_samples
,
seqlen
=
seqlen
,
...
...
@@ -351,11 +347,6 @@ class BaseAWQForCausalLM(nn.Module):
def
_load_quantized_modules
(
self
,
model
,
quant_config
,
version
):
# Real quantization of weights
assert
quant_config
[
"zero_point"
],
"We only support zero_point quantization now."
if
version
==
'GEMM'
:
logging
.
warning
(
'Deprecated model weight format. Re-quantize '
'your weights again with version="GEMV" for a speedup. '
'In the next AutoAWQ version, GEMM will be deprecated.'
)
# Get blocks of model
layers
=
self
.
get_model_layers
(
model
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment