[chat] fix train_prompts.py gemini strategy bug (#3666)

* fix gemini strategy bug
* add comment
* add comment
* better solution
2023-05-06 16:46:38 +08:00 · 2023-05-06 16:46:38 +08:00 · 2da5d81dec
parent d556648885
commit 2da5d81dec
1 changed file with 38 additions and 38 deletions
--- a/applications/Chat/examples/train_prompts.py
+++ b/applications/Chat/examples/train_prompts.py
@@ -36,6 +36,7 @@ def main(args):
    if args.rm_path is not None:
        state_dict = torch.load(args.rm_path, map_location='cpu')
    with strategy.model_init_context():
        # configure model
        if args.model == 'gpt2':
            initial_model = GPTActor(pretrained=args.pretrain)
@@ -74,7 +75,6 @@ def main(args):
        initial_model.to(torch.float16).to(torch.cuda.current_device())
        reward_model.to(torch.float16).to(torch.cuda.current_device())
    with strategy.model_init_context():
        if args.model == 'gpt2':
            actor = GPTActor(pretrained=args.pretrain, lora_rank=args.lora_rank)
        elif args.model == 'bloom':