Training in progress, step 2500

0094a2a verified about 2 months ago

460 Bytes

	{
		"train_batch_size": "auto",
		"train_micro_batch_size_per_gpu": "auto",
		"gradient_accumulation_steps": "auto",
		"gradient_clipping": "auto",
		"zero_allow_untested_optimizer": true,
		"bf16": {
			"enabled": true
		},
		"zero_optimization": {
			"stage": 2,
			"allgather_partitions": true,
			"allgather_bucket_size": 5e8,
			"reduce_scatter": true,
			"reduce_bucket_size": 5e8,
			"overlap_comm": false,
			"contiguous_gradients": true
		}
	}