Update README.md on pretraining_dataset (#360)

* Update README.md on pretraining_dataset

* Fix message
This commit is contained in:
NanoCode012
2023-08-11 12:17:07 +09:00
committed by GitHub
parent 94d03c8402
commit fae6ed8092

View File

@@ -505,6 +505,9 @@ torchdistx_path:
# Set padding for data collator to 'longest'
collator_pad_to_longest:
# Set to an HF dataset (for type: 'completion') to stream it instead of pre-tokenizing it
pretraining_dataset:
# Debug mode
debug: