diff --git a/src/axolotl/utils/schemas/config.py b/src/axolotl/utils/schemas/config.py index 20698d920..b2ff154f3 100644 --- a/src/axolotl/utils/schemas/config.py +++ b/src/axolotl/utils/schemas/config.py @@ -106,12 +106,6 @@ class AxolotlInputConfig( "description": "Don't upcast the embeddings to float32 when using PEFT. Useful for low-VRAM GPUs" }, ) - moe_kernels: bool = Field( - default=False, - json_schema_extra={ - "description": "Enable Axolotl's vendored MoE kernels when supported (e.g., DeepSeek V3)" - }, - ) reinit_weights: bool | None = Field( default=None, json_schema_extra={ @@ -119,6 +113,13 @@ class AxolotlInputConfig( }, ) + moe_kernels: bool | None = Field( + default=None, + json_schema_extra={ + "description": "Enable Axolotl's vendored MoE kernels when supported (e.g., DeepSeek V3)" + }, + ) + trainer_cls: str | None = Field( default=None, json_schema_extra={