Spaces:

Dovakiins
/

qwerrwe

Build error

tmm1 committed on Aug 7, 2023

Commit

b4d1d22

1 Parent(s): 9f99104

note pattern when using groups

Files changed (1) hide show

README.md CHANGED Viewed

@@ -427,7 +427,8 @@ save_safetensors:
 # whether to mask out or include the human's prompt from the training labels
 train_on_inputs: false
 # group similarly sized data to minimize padding
-# may be slower to start as it must download and sort the entire dataset
 group_by_length: false
 # Whether to use gradient checkpointing https://huggingface.co/docs/transformers/v4.18.0/en/performance#gradient-checkpointing

 # whether to mask out or include the human's prompt from the training labels
 train_on_inputs: false
 # group similarly sized data to minimize padding
+# may be slower to start, as it must download and sort the entire dataset
+# note that training loss may have an oscillating pattern with this enabled
 group_by_length: false
 # Whether to use gradient checkpointing https://huggingface.co/docs/transformers/v4.18.0/en/performance#gradient-checkpointing