diff --git a/src/axolotl/core/trainer_builder.py b/src/axolotl/core/trainer_builder.py index 35318b836..f552ea7cb 100644 --- a/src/axolotl/core/trainer_builder.py +++ b/src/axolotl/core/trainer_builder.py @@ -1058,6 +1058,9 @@ class HFCausalTrainerBuilder(TrainerBuilderBase): if self.cfg.save_safetensors is not None: training_arguments_kwargs["save_safetensors"] = self.cfg.save_safetensors + if self.cfg.save_only_model is not None: + training_arguments_kwargs["save_only_model"] = self.cfg.save_only_model + if self.cfg.sample_packing_eff_est: training_arguments_kwargs[ "sample_packing_efficiency" diff --git a/src/axolotl/utils/config/models/input/v0_4_1/__init__.py b/src/axolotl/utils/config/models/input/v0_4_1/__init__.py index 20887dccf..48a35ea11 100644 --- a/src/axolotl/utils/config/models/input/v0_4_1/__init__.py +++ b/src/axolotl/utils/config/models/input/v0_4_1/__init__.py @@ -355,6 +355,7 @@ class ModelOutputConfig(BaseModel): hub_model_id: Optional[str] = None hub_strategy: Optional[str] = None save_safetensors: Optional[bool] = None + save_only_model: Optional[bool] = None class MLFlowConfig(BaseModel):