mirror of https://github.com/THUDM/ChatGLM-6B
parent
08d880141d
commit
73f4fe1ffe
|
@ -4,6 +4,7 @@ STEP=3000
|
|||
|
||||
CUDA_VISIBLE_DEVICES=0 python3 main.py \
|
||||
--do_predict \
|
||||
--validation_file AdvertiseGen/dev.json \
|
||||
--test_file AdvertiseGen/dev.json \
|
||||
--overwrite_cache \
|
||||
--prompt_column content \
|
||||
|
@ -15,6 +16,5 @@ CUDA_VISIBLE_DEVICES=0 python3 main.py \
|
|||
--max_target_length 64 \
|
||||
--per_device_eval_batch_size 1 \
|
||||
--predict_with_generate \
|
||||
--max_predict_samples 10 \
|
||||
--pre_seq_len $PRE_SEQ_LEN \
|
||||
--quantization_bit 4
|
||||
|
|
|
@ -9,7 +9,7 @@ CUDA_VISIBLE_DEVICES=0 python3 main.py \
|
|||
--response_column summary \
|
||||
--overwrite_cache \
|
||||
--model_name_or_path THUDM/chatglm-6b \
|
||||
--output_dir output/adgen-chatglm-6b-pt-$PRE_SEQ_LEN-$LR-dev \
|
||||
--output_dir output/adgen-chatglm-6b-pt-$PRE_SEQ_LEN-$LR \
|
||||
--overwrite_output_dir \
|
||||
--max_source_length 64 \
|
||||
--max_target_length 64 \
|
||||
|
|
Loading…
Reference in New Issue