add support for include_tokens_per_second in training args (#2269)

* add support for include_tokens_per_second in training args

* Update docs/config.qmd

Co-authored-by: NanoCode012 <nano@axolotl.ai>

* Update src/axolotl/core/trainer_builder.py

Co-authored-by: NanoCode012 <nano@axolotl.ai>

---------

Co-authored-by: NanoCode012 <nano@axolotl.ai>
This commit is contained in:
Wing Lian
2025-02-13 17:39:19 -05:00
committed by GitHub
parent 2e57391bf8
commit a98526ef78
3 changed files with 10 additions and 0 deletions

View File

@@ -330,6 +330,12 @@ class HFCausalTrainerBuilder(TrainerBuilderBase):
)
training_arguments_kwargs = {}
if self.cfg.include_tokens_per_second is not None:
training_arguments_kwargs[
"include_tokens_per_second"
] = self.cfg.include_tokens_per_second
if self.cfg.bf16 == "full":
training_arguments_kwargs["bf16_full_eval"] = True
else:

View File

@@ -844,6 +844,7 @@ class AxolotlInputConfig(
save_only_model: Optional[bool] = False
use_tensorboard: Optional[bool] = None
profiler_steps: Optional[int] = None
include_tokens_per_second: Optional[bool] = None
neftune_noise_alpha: Optional[float] = None