From 73f4fe1ffe6af778796a2ed88882af5655062eb0 Mon Sep 17 00:00:00 2001
From: duzx16
Date: Fri, 31 Mar 2023 20:15:35 +0800
Subject: [PATCH] Add validation file name Use full prediction

---
 ptuning/evaluate.sh | 2 +-
 ptuning/train.sh    | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/ptuning/evaluate.sh b/ptuning/evaluate.sh
index db2a8c1..1217ceb 100644
--- a/ptuning/evaluate.sh
+++ b/ptuning/evaluate.sh
@@ -4,6 +4,7 @@ STEP=3000
 
 CUDA_VISIBLE_DEVICES=0 python3 main.py \
     --do_predict \
+    --validation_file AdvertiseGen/dev.json \
     --test_file AdvertiseGen/dev.json \
     --overwrite_cache \
     --prompt_column content \
@@ -15,6 +16,5 @@ CUDA_VISIBLE_DEVICES=0 python3 main.py \
     --max_target_length 64 \
     --per_device_eval_batch_size 1 \
     --predict_with_generate \
-    --max_predict_samples 10 \
     --pre_seq_len $PRE_SEQ_LEN \
     --quantization_bit 4
diff --git a/ptuning/train.sh b/ptuning/train.sh
index 1d03a25..3189829 100644
--- a/ptuning/train.sh
+++ b/ptuning/train.sh
@@ -9,7 +9,7 @@ CUDA_VISIBLE_DEVICES=0 python3 main.py \
     --response_column summary \
     --overwrite_cache \
     --model_name_or_path THUDM/chatglm-6b \
-    --output_dir output/adgen-chatglm-6b-pt-$PRE_SEQ_LEN-$LR-dev \
+    --output_dir output/adgen-chatglm-6b-pt-$PRE_SEQ_LEN-$LR \
     --overwrite_output_dir \
     --max_source_length 64 \
     --max_target_length 64 \