|
export MODEL_DIR="$(pwd)" |
|
export DATA_PATH=/home/$USER/dataset |
|
|
|
python3 run_summarization_flax.py \ |
|
--output_dir ${MODEL_DIR} \ |
|
--model_name_or_path ${MODEL_DIR}/flax_model.msgpack \ |
|
--config_name ${MODEL_DIR} \ |
|
--tokenizer_name ${MODEL_DIR} \ |
|
--train_file ${DATA_PATH}/train_sen_jsonlines.json \ |
|
--validation_file ${DATA_PATH}/val_sen_jsonlines.json \ |
|
--test_file ${DATA_PATH}/test_sen_jsonlines.json \ |
|
--do_train --do_eval --do_predict --predict_with_generate \ |
|
--num_train_epochs 3 \ |
|
--learning_rate 5e-5 --warmup_steps 0 \ |
|
--per_device_train_batch_size 8 \ |
|
--per_device_eval_batch_size 8 \ |
|
--overwrite_output_dir \ |
|
--max_source_length 256 \ |
|
--max_target_length 64 \ |
|
--text_column src \ |
|
--summary_column tgt \ |
|
--hub_model_id alvinwatner/bart-qg-alpha-interro \ |
|
--push_to_hub |
|
|
|
|
|
|