Include temperature in the dataset hash too

This commit is contained in:
Wing Lian
2024-12-24 15:48:35 -05:00
parent 8b0104fa7c
commit 8d77dc385e

View File

@@ -176,10 +176,11 @@ def load_tokenized_prepared_datasets(
+ "@"
+ str(cfg.group_by_length)
+ "@"
+ str(cfg.kd_temperature or 1.0)
+ "|".join(
sorted(
[
f"{d.path}:{d.type}:{d.shards}:{d.conversation}{d.split}"
f"{d.path}:{d.type}:{d.shards}:{d.conversation}:{d.split}:{d.temperature or 1.0}"
for d in cfg_datasets
]
)