Unverified commit 8d4b48cf, authored by MPU王荣胜, committed by GitHub
Browse files

Fix QLoRA inference error

parent 8306539e
......@@ -40,8 +40,8 @@ def main():
if args.quant:
quantize(model.transformer, args.quant)
if torch.cuda.is_available():
model = model.cuda()
#if torch.cuda.is_available():
# model = model.cuda()
model.add_mixin('auto-regressive', CachedAutoregressiveMixin())
......@@ -101,4 +101,4 @@ def main():
if __name__ == "__main__":
main()
\ No newline at end of file
main()
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment