feat(doc): add more info on train_on_split (#855)

This commit is contained in:
NanoCode012
2023-11-15 23:42:26 +09:00
committed by GitHub
parent 614cff4107
commit 306fe19c54

View File

@@ -491,6 +491,7 @@ datasets:
data_files: # Optional[str] path to source data files
shards: # Optional[int] number of shards to split data into
name: # Optional[str] name of dataset configuration to load
train_on_split: train # Optional[str] name of dataset split to load from
# Optional[str] FastChat conversation type; only used with type: sharegpt
conversation: # Options (see Conversation 'name'): https://github.com/lm-sys/FastChat/blob/main/fastchat/conversation.py