#!/usr/bin/env bash
#
# Launches run_translation_t5_flax.py (expected in the current directory) with
# train, eval and predict all enabled in a single run.
#
#   model / tokenizer : NbAiLab/nb-t5-base
#   train file        : nb_nn_nb.json
#   validation file   : parallel_src_tgt_dev.json
#   test file         : parallel_src_tgt_test.json
#   output directory  : "." (the current directory)
#
# NOTE(review): --overwrite_output_dir is passed together with --output_dir ".";
# how the script treats existing files there depends on
# run_translation_t5_flax.py, which is not shown here -- confirm before running
# in a directory that holds anything you want to keep.
#
# Each continued line must end with a backslash immediately followed by the
# newline; any character after the backslash (even a space) breaks the
# continuation and splits the command.
python run_translation_t5_flax.py \
  --output_dir "." \
  --model_name_or_path NbAiLab/nb-t5-base \
  --tokenizer_name NbAiLab/nb-t5-base \
  --train_file nb_nn_nb.json \
  --validation_file parallel_src_tgt_dev.json \
  --test_file parallel_src_tgt_test.json \
  --do_train --do_eval --do_predict \
  --predict_with_generate \
  --num_train_epochs 10 \
  --learning_rate 7e-4 \
  --warmup_steps 3000 \
  --per_device_train_batch_size 8 \
  --per_device_eval_batch_size 8 \
  --overwrite_output_dir \
  --max_source_length 512 \
  --max_target_length 512 \
  --adafactor