diff --git a/src/axolotl/core/trainer_builder.py b/src/axolotl/core/trainer_builder.py index 411496ac5..b151be8fa 100755 --- a/src/axolotl/core/trainer_builder.py +++ b/src/axolotl/core/trainer_builder.py @@ -758,13 +758,13 @@ class HFCausalTrainerBuilder(TrainerBuilderBase): self.cfg.kd_zscore_base_temp ) if self.cfg.kd_top_k_before_softmax is not None: - training_arguments_kwargs[ - "kd_top_k_before_softmax" - ] = self.cfg.kd_top_k_before_softmax + training_arguments_kwargs["kd_top_k_before_softmax"] = ( + self.cfg.kd_top_k_before_softmax + ) - training_arguments_kwargs[ - "sequence_parallel_degree" - ] = self.cfg.sequence_parallel_degree + training_arguments_kwargs["sequence_parallel_degree"] = ( + self.cfg.sequence_parallel_degree + ) if self.cfg.reward_model: training_args_cls = AxolotlRewardConfig diff --git a/src/axolotl/core/trainers/__init__.py b/src/axolotl/core/trainers/__init__.py index 1080c5f6c..32a889af9 100644 --- a/src/axolotl/core/trainers/__init__.py +++ b/src/axolotl/core/trainers/__init__.py @@ -1,4 +1,5 @@ """Init for axolotl.core.trainers""" + # pylint: disable=unused-import # flake8: noqa diff --git a/src/axolotl/core/trainers/base.py b/src/axolotl/core/trainers/base.py index 3b94ed282..9267dd040 100644 --- a/src/axolotl/core/trainers/base.py +++ b/src/axolotl/core/trainers/base.py @@ -1,4 +1,5 @@ """Module for customized trainers""" + # pylint: disable=too-many-lines from __future__ import annotations @@ -114,7 +115,6 @@ class AxolotlTrainer(SchedulerMixin, OptimizerMixin, SequenceParallelMixin, Trai drop_last=True, ) - @override def _get_train_sampler(self) -> Sampler | None: """ Helper method to get the sampler for training. Handles cases for sequence @@ -146,7 +146,6 @@ class AxolotlTrainer(SchedulerMixin, OptimizerMixin, SequenceParallelMixin, Trai return base_sampler - @override def _get_eval_sampler(self, eval_dataset: Dataset | None = None) -> Sampler | None: """ Helper method to get the sampler for evaluation. Handles sequence parallelism @@ -591,7 +590,6 @@ class AxolotlTrainer(SchedulerMixin, OptimizerMixin, SequenceParallelMixin, Trai os.makedirs(output_dir, exist_ok=True) return super()._save_checkpoint(model, trial, **kwargs) - @override def training_step( self, model: nn.Module, diff --git a/src/axolotl/core/trainers/mixins/__init__.py b/src/axolotl/core/trainers/mixins/__init__.py index a4b8fb1e2..12c8277fc 100644 --- a/src/axolotl/core/trainers/mixins/__init__.py +++ b/src/axolotl/core/trainers/mixins/__init__.py @@ -1,4 +1,5 @@ """Init for axolotl.core.trainers.mixins""" + # pylint: disable=unused-import # flake8: noqa diff --git a/src/axolotl/utils/schemas/config.py b/src/axolotl/utils/schemas/config.py index 463e957ce..7992e6559 100644 --- a/src/axolotl/utils/schemas/config.py +++ b/src/axolotl/utils/schemas/config.py @@ -1,4 +1,5 @@ """Module with Pydantic models for configuration.""" + # pylint: disable=too-many-lines import logging diff --git a/tests/e2e/patched/test_sp.py b/tests/e2e/patched/test_sp.py index 7dd0e152d..58251b5e3 100644 --- a/tests/e2e/patched/test_sp.py +++ b/tests/e2e/patched/test_sp.py @@ -1,4 +1,5 @@ """Tests for sequence parallelism functionality.""" + # pylint: disable=redefined-outer-name,unused-argument from unittest.mock import MagicMock, patch