Fix shard config
This commit is contained in:
@@ -199,8 +199,7 @@ datasets:
|
|||||||
# The type of prompt to use for training. [alpaca, sharegpt, gpteacher, oasst, reflection]
|
# The type of prompt to use for training. [alpaca, sharegpt, gpteacher, oasst, reflection]
|
||||||
type: alpaca # format OR format:prompt_style (chat/instruct)
|
type: alpaca # format OR format:prompt_style (chat/instruct)
|
||||||
data_files: # path to source data files
|
data_files: # path to source data files
|
||||||
shards: # true if use subset data. make sure to set `shards` param also
|
shards: # number of shards to split data into
|
||||||
shards: # number of shards to split dataset into
|
|
||||||
|
|
||||||
# axolotl attempts to save the dataset as an arrow after packing the data together so
|
# axolotl attempts to save the dataset as an arrow after packing the data together so
|
||||||
# subsequent training attempts load faster, relative path
|
# subsequent training attempts load faster, relative path
|
||||||
|
|||||||
Reference in New Issue
Block a user