Unverified Commit 8d4b48cf authored by MPU王荣胜's avatar MPU王荣胜 Committed by GitHub
Browse files

Fix QLoRA inference error

parent 8306539e
...@@ -40,8 +40,8 @@ def main(): ...@@ -40,8 +40,8 @@ def main():
if args.quant: if args.quant:
quantize(model.transformer, args.quant) quantize(model.transformer, args.quant)
if torch.cuda.is_available(): #if torch.cuda.is_available():
model = model.cuda() # model = model.cuda()
model.add_mixin('auto-regressive', CachedAutoregressiveMixin()) model.add_mixin('auto-regressive', CachedAutoregressiveMixin())
...@@ -101,4 +101,4 @@ def main(): ...@@ -101,4 +101,4 @@ def main():
if __name__ == "__main__": if __name__ == "__main__":
main() main()
\ No newline at end of file
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment