Merge branch 'main' of github.com:THUDM/ChatGLM-6B

pull/558/merge
duzx16 2023-04-12 09:49:20 +08:00
commit 57e9da3822
2 changed files with 2 additions and 3 deletions

View File

@@ -126,8 +126,8 @@ gradient_accumulation_steps=1
``` ```
learning_rate=5e-4 learning_rate=5e-4
per_device_train_batch_size=1 per_device_train_batch_size=16
gradient_accumulation_steps=16 gradient_accumulation_steps=1
``` ```

View File

@@ -2,7 +2,6 @@
LR=1e-4 LR=1e-4
MASTER_PORT=$(shuf -n 1 -i 10000-65535) MASTER_PORT=$(shuf -n 1 -i 10000-65535)
MASTER_PORT=50003
deepspeed --num_gpus=4 --master_port $MASTER_PORT main.py \ deepspeed --num_gpus=4 --master_port $MASTER_PORT main.py \
--deepspeed deepspeed.json \ --deepspeed deepspeed.json \