#!/usr/bin/env bash
# Launches run_translation_t5_flax.py with the train, eval and predict phases
# all enabled (--do_train --do_eval --do_predict).
#
# Inputs are the JSON files named below, resolved relative to the current
# working directory; results go to "." and --overwrite_output_dir is passed.
# The model and tokenizer paths point at a local disk mount and must exist on
# the machine running this script.
#
# NOTE: each backslash must be the very last character on its line, otherwise
# the line continuation is lost and the command is cut short.
python run_translation_t5_flax.py \
  --output_dir "." \
  --model_name_or_path /mnt/disks/flaxdisk/norwegian-t5-base-NCC-fast \
  --tokenizer_name /mnt/disks/flaxdisk/norwegian-t5-base-NCC \
  --train_file src_tgt_nb-nn.json \
  --validation_file parallel_src_tgt_dev.json \
  --test_file parallel_src_tgt_test.json \
  --do_train --do_eval --do_predict \
  --predict_with_generate \
  --num_train_epochs 100 \
  --learning_rate 5e-5 \
  --warmup_steps 0 \
  --per_device_train_batch_size 64 \
  --per_device_eval_batch_size 64 \
  --overwrite_output_dir \
  --max_source_length 128 \
  --max_target_length 128 \
  --adafactor