#!/usr/bin/env bash
#
# Launches run_translation_t5_flax.py with training, evaluation and
# prediction all enabled (--do_train --do_eval --do_predict).
#
# NOTE(review): judging by the file and model names this presumably
# fine-tunes a Norwegian T5 checkpoint on nb -> nn translation pairs;
# confirm against run_translation_t5_flax.py.
#
# Expected in the working directory (relative paths are used below):
#   run_translation_t5_flax.py
#   src_tgt_nb-nn.json, parallel_src_tgt_dev.json, parallel_src_tgt_test.json
# The model and tokenizer are read from absolute paths under
# /mnt/disks/flaxdisk.
#
# Output goes to the current directory (--output_dir ".") and
# --overwrite_output_dir is passed, so run this from a directory where that
# is acceptable.
#
# Formatting rule: every backslash below must be the LAST character on its
# line. A backslash followed by a space escapes the space instead of
# continuing the line, which turns the next option into a single word with a
# leading blank (e.g. " --output_dir") that the argument parser rejects.
python run_translation_t5_flax.py \
  --output_dir "." \
  --model_name_or_path /mnt/disks/flaxdisk/norwegian-t5-base-NCC-fast \
  --tokenizer_name /mnt/disks/flaxdisk/norwegian-t5-base-NCC \
  --train_file src_tgt_nb-nn.json \
  --validation_file parallel_src_tgt_dev.json \
  --test_file parallel_src_tgt_test.json \
  --do_train --do_eval --do_predict \
  --predict_with_generate \
  --num_train_epochs 100 \
  --learning_rate 5e-5 \
  --warmup_steps 0 \
  --per_device_train_batch_size 64 \
  --per_device_eval_batch_size 64 \
  --overwrite_output_dir \
  --max_source_length 128 \
  --max_target_length 128 \
  --adafactor