[chat] fix train_prompts.py gemini strategy bug (#3666)

* fix gemini strategy bug
* add comment
* add comment
* better solution

[chat] fix train_prompts.py gemini strategy bug (#3666)
* fix gemini strategy bug
* add comment
* add comment
* better solution
2da5d81d · zhang-yi-chi · GitHub · d5566488 · 2da5d81d
Unverified commit 2da5d81d, authored May 06, 2023 by zhang-yi-chi; committed by GitHub on May 06, 2023.
Show whitespace changes
Inline Side-by-side

Showing with 35 additions and 35 deletions

applications/Chat/examples/train_prompts.py applications/Chat/examples/train_prompts.py +35 -35

No files found.
--- a/applications/Chat/examples/train_prompts.py
+++ b/applications/Chat/examples/train_prompts.py
@@ -36,6 +36,7 @@ def main(args):
    if args.rm_path is not None:
        state_dict = torch.load(args.rm_path, map_location='cpu')
+    with strategy.model_init_context():
        # configure model
        if args.model == 'gpt2':
            initial_model = GPTActor(pretrained=args.pretrain)
@@ -74,7 +75,6 @@ def main(args):
        initial_model.to(torch.float16).to(torch.cuda.current_device())
        reward_model.to(torch.float16).to(torch.cuda.current_device())
-    with strategy.model_init_context():
        if args.model == 'gpt2':
            actor = GPTActor(pretrained=args.pretrain, lora_rank=args.lora_rank)
        elif args.model == 'bloom':