diff --git a/running.sh b/running.sh index a7a1dd0..6b53697 100644 --- a/running.sh +++ b/running.sh @@ -1,9 +1,11 @@ ## 변경사항: 법률 데이터 미포함, 데이터셋 비율 50%, 정리를 위한 wandb project 변경 + +## Train ## 시도해볼 부분: epoch 수정해보기 ## 변경 필요한 arguments: output_dir python train.py \ --do_train \ ---output_dir model/kobart_bV1 \ +--output_dir model/baseV1.0_Kobart \ --dataset_name paper,news,magazine \ --num_train_epochs 3 \ --learning_rate 3e-05 \ @@ -14,17 +16,23 @@ python train.py \ --es_patience 3 \ --load_best_model_at_end True \ --relative_sample_ratio 0.5 \ ---project_name Kobart_bV1.0 \ +--project_name baseV1.0_Kobart \ --wandb_unique_tag kobartV1_ep2_lr3e05_len1024_R50 +## Eval # ## 시도해볼 부분: num_beams # ## 변경 필요한 model_name_or_path: output_dir # python train.py \ # --do_eval \ -# --model_name_or_path model/kobart_bV1 \ +# --model_name_or_path model/baseV1.0_Kobart \ # --dataset_name paper,news,magazine \ # --output_dir evaluation/kobart_eval \ # --num_beams 3 \ # --relative_sample_ratio 1 \ -# --project_name Kobart_bV1.0 \ -# --wandb_unique_tag Eval_kobartV1_ep2_lr3e05_len1024_R50 \ No newline at end of file +# --project_name baseV1.0_Kobart \ +# --wandb_unique_tag Eval_kobartV1_ep2_lr3e05_len1024_R50 + +# ## Predict +# python predict.py \ +# --model_name_or_path baseV1.0_Kobart \ +# --num_beams 3 diff --git a/train.py b/train.py index ce90db1..897c3e1 100644 --- a/train.py +++ b/train.py @@ -86,7 +86,7 @@ def main(): train_dataset = train_dataset.shuffle(training_args.seed) valid_dataset = valid_dataset.shuffle(training_args.seed) - print('** Dataset example', train_dataset[0]['title'], train_dataset[0]['title'], sep = '\n') + print('** Dataset example', train_dataset[0]['title'], train_dataset[1]['title'], sep = '\n') column_names = train_dataset.column_names if data_args.relative_eval_steps :