File size: 347 Bytes
d845ecf |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 |
# Root-level selector read by the consuming tool; presumably picks the mBART
# task whose settings live in [task] — confirm against the consumer's schema.
type = "mbart"
# Task-specific settings.
# NOTE(review): the per-key notes below are inferred from the key names and
# the usual mBART denoising setup — confirm against the consumer's docs.
[task]
# Presumably the fraction of input tokens that are noised.
change_ratio = 0.3
# Empty list: no languages are listed for denoising in this configuration.
denoise_langs = []
# Presumably the Poisson mean used when sampling the length of noised spans.
poisson_lambda = 3.0
# Language codes for the source and target sides; "br" and "fr" look like
# ISO 639-1 codes (Breton, French) — TODO confirm the expected code format.
source_langs = ["br"]
target_langs = ["fr"]
# Optimization hyperparameters.
[tuning]
batch_size = 16
# betas/epsilon look like Adam-style optimizer parameters — confirm which
# optimizer the consumer actually builds from them.
betas = [0.9, 0.999]
epsilon = 1e-8
learning_rate = 5e-5
gradient_clipping = 1.0
# Learning-rate schedule settings. These two keys are active as written.
# NOTE(review): -1 looks like a sentinel rather than a literal step count —
# confirm its meaning in the consumer before changing it.
lr_decay_steps = -1
warmup_steps = 1024
# Optional: uncomment the next line to also set weight decay.
# weight_decay = 1e-5
|