diff --git a/examples/llama-4/scout-qlora-single-h100-flex.yaml b/examples/llama-4/scout-qlora-single-h100-flex.yaml index c7a3b28d0..20352f81e 100644 --- a/examples/llama-4/scout-qlora-single-h100-flex.yaml +++ b/examples/llama-4/scout-qlora-single-h100-flex.yaml @@ -10,7 +10,6 @@ plugins: liger_glu_activation: true liger_rms_norm: true liger_layer_norm: true -cut_cross_entropy: true llama4_linearized_experts: true # needed with custom linearized experts model load_in_4bit: true diff --git a/src/axolotl/integrations/cut_cross_entropy/README.md b/src/axolotl/integrations/cut_cross_entropy/README.md index 724e0688d..462bcbedc 100644 --- a/src/axolotl/integrations/cut_cross_entropy/README.md +++ b/src/axolotl/integrations/cut_cross_entropy/README.md @@ -27,8 +27,6 @@ pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transform ```yaml plugins: - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin - -cut_cross_entropy: true ``` ## Supported Models diff --git a/src/axolotl/integrations/cut_cross_entropy/args.py b/src/axolotl/integrations/cut_cross_entropy/args.py index c16d91ede..da1db7397 100644 --- a/src/axolotl/integrations/cut_cross_entropy/args.py +++ b/src/axolotl/integrations/cut_cross_entropy/args.py @@ -28,7 +28,7 @@ class CutCrossEntropyArgs(BaseModel): Input args for Cut Cross Entropy. """ - cut_cross_entropy: Optional[bool] = None + cut_cross_entropy: Optional[bool] = True @model_validator(mode="before") @classmethod