File size: 802 Bytes
1d7fe78
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
# Launch script for run_summarization_flax.py.
#
# Run from the model directory: MODEL_DIR is taken from the current working
# directory and is used as the output dir, the config/tokenizer location, and
# the location of flax_model.msgpack (the starting weights).
#
# Exported environment:
#   MODEL_DIR  - current working directory at launch time
#   DATA_PATH  - /home/$USER/dataset; must contain train_sen_jsonlines.json,
#                val_sen_jsonlines.json and test_sen_jsonlines.json
#
# The run trains for 3 epochs, evaluates, predicts with generation, reads the
# "src" column as input text and "tgt" as the target, and passes
# --push_to_hub with hub id alvinwatner/bart-qg-alpha-interro.
# NOTE(review): pushing presumably requires Hugging Face credentials to be
# configured beforehand - confirm.
#
# Assignment and export are separate so a failing `pwd` is not masked, and all
# expansions are quoted so paths with spaces or glob characters stay intact.
MODEL_DIR="$(pwd)"
export MODEL_DIR
DATA_PATH="/home/${USER}/dataset"
export DATA_PATH

python3 run_summarization_flax.py \
	--output_dir "${MODEL_DIR}" \
	--model_name_or_path "${MODEL_DIR}/flax_model.msgpack" \
	--config_name "${MODEL_DIR}" \
	--tokenizer_name "${MODEL_DIR}" \
	--train_file "${DATA_PATH}/train_sen_jsonlines.json" \
	--validation_file "${DATA_PATH}/val_sen_jsonlines.json" \
	--test_file "${DATA_PATH}/test_sen_jsonlines.json" \
	--do_train --do_eval --do_predict --predict_with_generate \
	--num_train_epochs 3 \
	--learning_rate 5e-5 --warmup_steps 0 \
	--per_device_train_batch_size 8 \
	--per_device_eval_batch_size 8 \
	--overwrite_output_dir \
	--max_source_length 256 \
	--max_target_length 64 \
	--text_column src \
	--summary_column tgt \
	--hub_model_id alvinwatner/bart-qg-alpha-interro \
	--push_to_hub