mirror of https://github.com/THUDM/ChatGLM-6B
Update train script
parent
08d880141d
commit
893706a82d
|
@@ -203,8 +203,8 @@ class DataTrainingArguments:
|
|||
|
||||
|
||||
def __post_init__(self):
|
||||
- if self.dataset_name is None and self.train_file is None and self.validation_file is None:
|
||||
- raise ValueError("Need either a dataset name or a training/validation file.")
|
||||
+ if self.dataset_name is None and self.train_file is None and self.validation_file is None and self.test_file is None:
|
||||
+ raise ValueError("Need either a dataset name or a training/validation/test file.")
|
||||
else:
|
||||
if self.train_file is not None:
|
||||
extension = self.train_file.split(".")[-1]
|
||||
|
|
|
@@ -9,7 +9,7 @@ CUDA_VISIBLE_DEVICES=0 python3 main.py \
|
|||
--response_column summary \
|
||||
--overwrite_cache \
|
||||
--model_name_or_path THUDM/chatglm-6b \
|
||||
- --output_dir output/adgen-chatglm-6b-pt-$PRE_SEQ_LEN-$LR-dev \
|
||||
+ --output_dir output/adgen-chatglm-6b-pt-$PRE_SEQ_LEN-$LR \
|
||||
--overwrite_output_dir \
|
||||
--max_source_length 64 \
|
||||
--max_target_length 64 \
|
||||
|
|
Loading…
Reference in New Issue