tmm1 committed on
Commit
9f99104
·
1 Parent(s): 36fefcf

update comment for group_by_length

Browse files
Files changed (1) hide show
  1. README.md +2 -1
README.md CHANGED
@@ -426,7 +426,8 @@ save_safetensors:
426
 
427
  # whether to mask out or include the human's prompt from the training labels
428
  train_on_inputs: false
429
- # don't use this, leads to wonky training (according to someone on the internet)
 
430
  group_by_length: false
431
 
432
  # Whether to use gradient checkpointing https://huggingface.co/docs/transformers/v4.18.0/en/performance#gradient-checkpointing
 
426
 
427
  # whether to mask out or include the human's prompt from the training labels
428
  train_on_inputs: false
429
+ # group similarly sized data to minimize padding
430
+ # may be slower to start as it must download and sort the entire dataset
431
  group_by_length: false
432
 
433
  # Whether to use gradient checkpointing https://huggingface.co/docs/transformers/v4.18.0/en/performance#gradient-checkpointing