From 35e6a7e228d3978d310afbcfe69e5f1178e1a7eb Mon Sep 17 00:00:00 2001 From: Quarto GHA Workflow Runner Date: Tue, 3 Mar 2026 14:34:09 +0000 Subject: [PATCH] Built site for gh-pages --- .nojekyll | 2 +- docs/models/qwen3-next.html | 27 +-- search.json | 2 +- sitemap.xml | 472 ++++++++++++++++++------------------ 4 files changed, 244 insertions(+), 259 deletions(-) diff --git a/.nojekyll b/.nojekyll index c73b28016..d717f3928 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -ec7962f3 \ No newline at end of file +590c8a6b \ No newline at end of file diff --git a/docs/models/qwen3-next.html b/docs/models/qwen3-next.html index 890a1d492..4916ede73 100644 --- a/docs/models/qwen3-next.html +++ b/docs/models/qwen3-next.html @@ -784,31 +784,16 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});

Getting started

    -
  1. Install Axolotl following the installation guide. You need to install from main as Qwen3-Next is only on nightly or use our latest Docker images.

    -

    Here is an example of how to install from main for pip:

  2. +
  3. Install Axolotl following the installation guide.

  4. +
  5. Install Cut Cross Entropy to reduce training VRAM usage.

  6. +
  7. Install FLA for improved performance

-
# Ensure you have Pytorch installed (Pytorch 2.6.0 min)
-git clone https://github.com/axolotl-ai-cloud/axolotl.git
-cd axolotl
-
-pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja
-pip3 install --no-build-isolation -e '.[flash-attn]'
-
-# Install CCE https://docs.axolotl.ai/docs/custom_integrations.html#cut-cross-entropy
-python scripts/cutcrossentropy_install.py | sh
-
    -
  1. Install Qwen3-Next transformers commit
  2. -
-
pip3 uninstall -y transformers && pip3 install "git+https://github.com/huggingface/transformers.git@b9282355bea846b54ed850a066901496b19da654"
-
    -
  1. Install FLA for improved performance
  2. -
-
pip3 uninstall -y causal-conv1d && pip3 install flash-linear-attention==0.3.2
+
pip3 uninstall -y causal-conv1d && pip3 install flash-linear-attention==0.4.1
  1. Run the finetuning example:
-
axolotl train examples/qwen3-next/qwen3-next-80b-a3b-qlora.yaml
-

This config uses about 45.62 GiB VRAM.

+
axolotl train examples/qwen3-next/qwen3-next-80b-a3b-qlora.yaml
+

This config uses about ~47 GiB (no target experts) and ~71GiB (target experts) VRAM.

Let us know how it goes. Happy finetuning! 🚀

TIPS

diff --git a/search.json b/search.json index 93c849e42..021b35870 100644 --- a/search.json +++ b/search.json @@ -5572,7 +5572,7 @@ "href": "docs/models/qwen3-next.html#getting-started", "title": "Qwen 3 Next", "section": "Getting started", - "text": "Getting started\n\nInstall Axolotl following the installation guide. You need to install from main as Qwen3-Next is only on nightly or use our latest Docker images.\nHere is an example of how to install from main for pip:\n\n# Ensure you have Pytorch installed (Pytorch 2.6.0 min)\ngit clone https://github.com/axolotl-ai-cloud/axolotl.git\ncd axolotl\n\npip3 install packaging==26.0 setuptools==75.8.0 wheel ninja\npip3 install --no-build-isolation -e '.[flash-attn]'\n\n# Install CCE https://docs.axolotl.ai/docs/custom_integrations.html#cut-cross-entropy\npython scripts/cutcrossentropy_install.py | sh\n\nInstall Qwen3-Next transformers commit\n\npip3 uninstall -y transformers && pip3 install \"git+https://github.com/huggingface/transformers.git@b9282355bea846b54ed850a066901496b19da654\"\n\nInstall FLA for improved performance\n\npip3 uninstall -y causal-conv1d && pip3 install flash-linear-attention==0.3.2\n\nRun the finetuning example:\n\naxolotl train examples/qwen3-next/qwen3-next-80b-a3b-qlora.yaml\nThis config uses about 45.62 GiB VRAM.\nLet us know how it goes. Happy finetuning! 🚀\n\nTIPS\n\nFor inference, you can experiment with temperature: 0.7, top_p: 0.8, top_k: 20, and min_p: 0.\nYou can run a full finetuning by removing the adapter: qlora and load_in_4bit: true from the config. See Multi-GPU section below.\nRead more on how to load your own dataset at docs.\nThe dataset format follows the OpenAI Messages format as seen here.", + "text": "Getting started\n\nInstall Axolotl following the installation guide.\nInstall Cut Cross Entropy to reduce training VRAM usage.\nInstall FLA for improved performance\n\npip3 uninstall -y causal-conv1d && pip3 install flash-linear-attention==0.4.1\n\nRun the finetuning example:\n\naxolotl train examples/qwen3-next/qwen3-next-80b-a3b-qlora.yaml\nThis config uses about ~47 GiB (no target experts) and ~71GiB (target experts) VRAM.\nLet us know how it goes. Happy finetuning! 🚀\n\nTIPS\n\nFor inference, you can experiment with temperature: 0.7, top_p: 0.8, top_k: 20, and min_p: 0.\nYou can run a full finetuning by removing the adapter: qlora and load_in_4bit: true from the config. See Multi-GPU section below.\nRead more on how to load your own dataset at docs.\nThe dataset format follows the OpenAI Messages format as seen here.", "crumbs": [ "Getting Started", "Model Guides", diff --git a/sitemap.xml b/sitemap.xml index 7a3b0a69f..87cc2676e 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,946 +2,946 @@ https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html - 2026-03-02T21:40:48.654Z + 2026-03-03T14:27:57.076Z https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html - 2026-03-02T21:40:48.676Z + 2026-03-03T14:27:57.103Z https://docs.axolotl.ai/docs/inference.html - 2026-03-02T21:40:48.647Z + 2026-03-03T14:27:57.066Z https://docs.axolotl.ai/docs/debugging.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/models/ministral3/vision.html - 2026-03-02T21:44:45.694Z + 2026-03-03T14:31:49.671Z https://docs.axolotl.ai/docs/models/ministral.html - 2026-03-02T21:44:45.696Z + 2026-03-03T14:31:49.672Z https://docs.axolotl.ai/docs/models/qwen3.html - 2026-03-02T21:44:45.702Z + 2026-03-03T14:31:49.675Z https://docs.axolotl.ai/docs/models/magistral.html - 2026-03-02T21:44:45.695Z + 2026-03-03T14:31:49.672Z https://docs.axolotl.ai/docs/models/voxtral.html - 2026-03-02T21:44:45.697Z + 2026-03-03T14:31:49.673Z https://docs.axolotl.ai/docs/models/llama-4.html - 2026-03-02T21:44:45.701Z + 2026-03-03T14:31:49.674Z https://docs.axolotl.ai/docs/models/magistral/think.html - 2026-03-02T21:44:45.695Z + 2026-03-03T14:31:49.672Z https://docs.axolotl.ai/docs/models/ministral3.html - 2026-03-02T21:44:45.694Z + 2026-03-03T14:31:49.670Z https://docs.axolotl.ai/docs/models/arcee.html - 2026-03-02T21:44:45.693Z + 2026-03-03T14:31:49.669Z https://docs.axolotl.ai/docs/models/gemma3n.html - 2026-03-02T21:44:45.703Z + 2026-03-03T14:31:49.676Z https://docs.axolotl.ai/docs/models/plano.html - 2026-03-02T21:44:45.690Z + 2026-03-03T14:31:49.667Z https://docs.axolotl.ai/docs/models/apertus.html - 2026-03-02T21:44:45.703Z + 2026-03-03T14:31:49.676Z https://docs.axolotl.ai/docs/models/phi.html - 2026-03-02T21:44:45.705Z + 2026-03-03T14:31:49.677Z https://docs.axolotl.ai/docs/models/hunyuan.html - 2026-03-02T21:44:45.706Z + 2026-03-03T14:31:49.679Z https://docs.axolotl.ai/docs/models/trinity.html - 2026-03-02T21:44:45.692Z + 2026-03-03T14:31:49.669Z https://docs.axolotl.ai/docs/models/mistral.html - 2026-03-02T21:44:45.699Z + 2026-03-03T14:31:49.674Z https://docs.axolotl.ai/docs/models/LiquidAI.html - 2026-03-02T21:44:45.706Z + 2026-03-03T14:31:49.678Z https://docs.axolotl.ai/docs/multimodal.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/batch_vs_grad.html - 2026-03-02T21:40:48.644Z + 2026-03-03T14:27:57.061Z https://docs.axolotl.ai/docs/multi-gpu.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/nccl.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/reward_modelling.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.068Z https://docs.axolotl.ai/docs/torchao.html - 2026-03-02T21:40:48.649Z + 2026-03-03T14:27:57.069Z https://docs.axolotl.ai/docs/multipack.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html - 2026-03-02T21:44:05.507Z + 2026-03-03T14:31:27.479Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html - 2026-03-02T21:44:05.381Z + 2026-03-03T14:31:27.352Z https://docs.axolotl.ai/docs/api/utils.chat_templates.html - 2026-03-02T21:44:05.856Z + 2026-03-03T14:31:27.831Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html - 2026-03-02T21:44:05.505Z + 2026-03-03T14:31:27.477Z https://docs.axolotl.ai/docs/api/cli.inference.html - 2026-03-02T21:44:05.022Z + 2026-03-03T14:31:26.990Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html - 2026-03-02T21:44:05.277Z + 2026-03-03T14:31:27.247Z https://docs.axolotl.ai/docs/api/kernels.swiglu.html - 2026-03-02T21:44:05.696Z + 2026-03-03T14:31:27.668Z https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html - 2026-03-02T21:44:05.981Z + 2026-03-03T14:31:27.958Z https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html - 2026-03-02T21:44:06.462Z + 2026-03-03T14:31:28.443Z https://docs.axolotl.ai/docs/api/utils.schemas.utils.html - 2026-03-02T21:44:06.132Z + 2026-03-03T14:31:28.109Z https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html - 2026-03-02T21:44:05.807Z + 2026-03-03T14:31:27.781Z https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html - 2026-03-02T21:44:05.870Z + 2026-03-03T14:31:27.845Z https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html - 2026-03-02T21:44:05.047Z + 2026-03-03T14:31:27.015Z https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html - 2026-03-02T21:44:05.005Z + 2026-03-03T14:31:26.972Z https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html - 2026-03-02T21:44:06.306Z + 2026-03-03T14:31:28.286Z https://docs.axolotl.ai/docs/api/utils.dict.html - 2026-03-02T21:44:05.971Z + 2026-03-03T14:31:27.948Z https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html - 2026-03-02T21:44:05.719Z + 2026-03-03T14:31:27.692Z https://docs.axolotl.ai/docs/api/utils.schemas.config.html - 2026-03-02T21:44:06.032Z + 2026-03-03T14:31:28.008Z https://docs.axolotl.ai/docs/api/cli.cloud.base.html - 2026-03-02T21:44:05.076Z + 2026-03-03T14:31:27.044Z https://docs.axolotl.ai/docs/api/utils.collators.batching.html - 2026-03-02T21:44:06.378Z + 2026-03-03T14:31:28.359Z https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html - 2026-03-02T21:44:05.443Z + 2026-03-03T14:31:27.415Z https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html - 2026-03-02T21:44:06.329Z + 2026-03-03T14:31:28.309Z https://docs.axolotl.ai/docs/api/cli.config.html - 2026-03-02T21:44:04.999Z + 2026-03-03T14:31:26.966Z https://docs.axolotl.ai/docs/api/evaluate.html - 2026-03-02T21:44:04.702Z + 2026-03-03T14:31:26.667Z https://docs.axolotl.ai/docs/api/utils.schemas.training.html - 2026-03-02T21:44:06.049Z + 2026-03-03T14:31:28.026Z https://docs.axolotl.ai/docs/api/core.trainers.base.html - 2026-03-02T21:44:05.153Z + 2026-03-03T14:31:27.122Z https://docs.axolotl.ai/docs/api/cli.utils.args.html - 2026-03-02T21:44:05.100Z + 2026-03-03T14:31:27.068Z https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html - 2026-03-02T21:44:04.858Z + 2026-03-03T14:31:26.825Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html - 2026-03-02T21:44:05.510Z + 2026-03-03T14:31:27.483Z https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html - 2026-03-02T21:44:05.470Z + 2026-03-03T14:31:27.442Z https://docs.axolotl.ai/docs/api/monkeypatch.relora.html - 2026-03-02T21:44:05.724Z + 2026-03-03T14:31:27.697Z https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html - 2026-03-02T21:44:06.470Z + 2026-03-03T14:31:28.452Z https://docs.axolotl.ai/docs/api/cli.art.html - 2026-03-02T21:44:04.969Z + 2026-03-03T14:31:26.936Z https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html - 2026-03-02T21:44:06.307Z + 2026-03-03T14:31:28.287Z https://docs.axolotl.ai/docs/api/datasets.html - 2026-03-02T21:44:04.710Z + 2026-03-03T14:31:26.675Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html - 2026-03-02T21:44:05.521Z + 2026-03-03T14:31:27.493Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html - 2026-03-02T21:44:05.531Z + 2026-03-03T14:31:27.504Z https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html - 2026-03-02T21:44:05.318Z + 2026-03-03T14:31:27.288Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html - 2026-03-02T21:44:05.201Z + 2026-03-03T14:31:27.170Z https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html - 2026-03-02T21:44:06.438Z + 2026-03-03T14:31:28.419Z https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html - 2026-03-02T21:44:05.187Z + 2026-03-03T14:31:27.156Z https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html - 2026-03-02T21:44:05.809Z + 2026-03-03T14:31:27.783Z https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html - 2026-03-02T21:44:06.094Z + 2026-03-03T14:31:28.071Z https://docs.axolotl.ai/docs/api/utils.lora.html - 2026-03-02T21:44:05.863Z + 2026-03-03T14:31:27.837Z https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html - 2026-03-02T21:44:04.860Z + 2026-03-03T14:31:26.827Z https://docs.axolotl.ai/docs/api/cli.train.html - 2026-03-02T21:44:04.930Z + 2026-03-03T14:31:26.897Z https://docs.axolotl.ai/docs/api/utils.trainer.html - 2026-03-02T21:44:05.906Z + 2026-03-03T14:31:27.881Z https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html - 2026-03-02T21:44:05.717Z + 2026-03-03T14:31:27.690Z https://docs.axolotl.ai/docs/api/core.builders.base.html - 2026-03-02T21:44:04.799Z + 2026-03-03T14:31:26.765Z https://docs.axolotl.ai/docs/api/cli.utils.fetch.html - 2026-03-02T21:44:05.106Z + 2026-03-03T14:31:27.075Z https://docs.axolotl.ai/docs/api/utils.tokenization.html - 2026-03-02T21:44:05.855Z + 2026-03-03T14:31:27.829Z https://docs.axolotl.ai/docs/api/core.trainers.trl.html - 2026-03-02T21:44:05.172Z + 2026-03-03T14:31:27.141Z https://docs.axolotl.ai/docs/api/cli.checks.html - 2026-03-02T21:44:04.977Z + 2026-03-03T14:31:26.944Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html - 2026-03-02T21:44:05.533Z + 2026-03-03T14:31:27.506Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html - 2026-03-02T21:44:05.714Z + 2026-03-03T14:31:27.687Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html - 2026-03-02T21:44:05.726Z + 2026-03-03T14:31:27.699Z https://docs.axolotl.ai/docs/api/cli.utils.html - 2026-03-02T21:44:05.086Z + 2026-03-03T14:31:27.054Z https://docs.axolotl.ai/docs/api/common.architectures.html - 2026-03-02T21:44:06.331Z + 2026-03-03T14:31:28.311Z https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html - 2026-03-02T21:44:05.464Z + 2026-03-03T14:31:27.437Z https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html - 2026-03-02T21:44:05.786Z + 2026-03-03T14:31:27.759Z https://docs.axolotl.ai/docs/api/kernels.geglu.html - 2026-03-02T21:44:05.683Z + 2026-03-03T14:31:27.656Z https://docs.axolotl.ai/docs/api/utils.schedulers.html - 2026-03-02T21:44:05.939Z + 2026-03-03T14:31:27.915Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html - 2026-03-02T21:44:05.813Z + 2026-03-03T14:31:27.787Z https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html - 2026-03-02T21:44:06.325Z + 2026-03-03T14:31:28.305Z https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html - 2026-03-02T21:44:05.406Z + 2026-03-03T14:31:27.378Z https://docs.axolotl.ai/docs/api/cli.quantize.html - 2026-03-02T21:44:05.063Z + 2026-03-03T14:31:27.031Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html - 2026-03-02T21:44:05.509Z + 2026-03-03T14:31:27.481Z https://docs.axolotl.ai/docs/api/monkeypatch.utils.html - 2026-03-02T21:44:05.771Z + 2026-03-03T14:31:27.744Z https://docs.axolotl.ai/docs/api/utils.quantization.html - 2026-03-02T21:44:06.015Z + 2026-03-03T14:31:27.991Z https://docs.axolotl.ai/docs/api/loaders.patch_manager.html - 2026-03-02T21:44:05.268Z + 2026-03-03T14:31:27.238Z https://docs.axolotl.ai/docs/api/cli.utils.load.html - 2026-03-02T21:44:05.113Z + 2026-03-03T14:31:27.082Z https://docs.axolotl.ai/docs/api/common.const.html - 2026-03-02T21:44:06.333Z + 2026-03-03T14:31:28.313Z https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html - 2026-03-02T21:44:04.878Z + 2026-03-03T14:31:26.844Z https://docs.axolotl.ai/docs/api/utils.schemas.trl.html - 2026-03-02T21:44:06.087Z + 2026-03-03T14:31:28.064Z https://docs.axolotl.ai/docs/api/cli.main.html - 2026-03-02T21:44:04.920Z + 2026-03-03T14:31:26.886Z https://docs.axolotl.ai/docs/dataset-formats/pretraining.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/dataset-formats/tokenized.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/dataset-formats/conversation.html - 2026-03-02T21:40:48.644Z + 2026-03-03T14:27:57.061Z https://docs.axolotl.ai/docs/checkpoint_saving.html - 2026-03-02T21:40:48.644Z + 2026-03-03T14:27:57.061Z https://docs.axolotl.ai/docs/qat.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/custom_integrations.html - 2026-03-02T21:40:48.644Z + 2026-03-03T14:27:57.061Z https://docs.axolotl.ai/docs/rlhf.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.068Z https://docs.axolotl.ai/docs/quantize.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/dataset_loading.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/nd_parallelism.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/input_output.html - 2026-03-02T21:40:48.647Z + 2026-03-03T14:27:57.066Z https://docs.axolotl.ai/docs/multi-node.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/getting-started.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/optimizers.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/index.html - 2026-03-02T21:40:48.670Z + 2026-03-03T14:27:57.096Z https://docs.axolotl.ai/docs/mac.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.066Z https://docs.axolotl.ai/docs/optimizations.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/lr_groups.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.066Z https://docs.axolotl.ai/docs/amd_hpc.html - 2026-03-02T21:40:48.644Z + 2026-03-03T14:27:57.061Z https://docs.axolotl.ai/docs/mixed_precision.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.066Z https://docs.axolotl.ai/docs/unsloth.html - 2026-03-02T21:40:48.649Z + 2026-03-03T14:27:57.069Z https://docs.axolotl.ai/docs/sequence_parallelism.html - 2026-03-02T21:40:48.649Z + 2026-03-03T14:27:57.069Z https://docs.axolotl.ai/docs/streaming.html - 2026-03-02T21:40:48.649Z + 2026-03-03T14:27:57.069Z https://docs.axolotl.ai/docs/ray-integration.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.067Z https://docs.axolotl.ai/docs/config-reference.html - 2026-03-02T21:44:44.809Z + 2026-03-03T14:31:48.842Z https://docs.axolotl.ai/docs/telemetry.html - 2026-03-02T21:40:48.649Z + 2026-03-03T14:27:57.069Z https://docs.axolotl.ai/docs/dataset-formats/index.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/dataset-formats/template_free.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/fsdp_qlora.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/api/index.html - 2026-03-02T21:44:04.613Z + 2026-03-03T14:31:26.578Z https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html - 2026-03-02T21:44:05.564Z + 2026-03-03T14:31:27.537Z https://docs.axolotl.ai/docs/api/core.chat.format.shared.html - 2026-03-02T21:44:04.862Z + 2026-03-03T14:31:26.829Z https://docs.axolotl.ai/docs/api/cli.args.html - 2026-03-02T21:44:04.965Z + 2026-03-03T14:31:26.932Z https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html - 2026-03-02T21:44:06.353Z + 2026-03-03T14:31:28.334Z https://docs.axolotl.ai/docs/api/convert.html - 2026-03-02T21:44:04.727Z + 2026-03-03T14:31:26.692Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html - 2026-03-02T21:44:05.290Z + 2026-03-03T14:31:27.260Z https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html - 2026-03-02T21:44:05.084Z + 2026-03-03T14:31:27.052Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html - 2026-03-02T21:44:05.282Z + 2026-03-03T14:31:27.251Z https://docs.axolotl.ai/docs/api/prompt_tokenizers.html - 2026-03-02T21:44:04.780Z + 2026-03-03T14:31:26.745Z https://docs.axolotl.ai/docs/api/utils.data.streaming.html - 2026-03-02T21:44:05.983Z + 2026-03-03T14:31:27.960Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html - 2026-03-02T21:44:05.846Z + 2026-03-03T14:31:27.820Z https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html - 2026-03-02T21:44:06.317Z + 2026-03-03T14:31:28.297Z https://docs.axolotl.ai/docs/api/utils.freeze.html - 2026-03-02T21:44:05.884Z + 2026-03-03T14:31:27.859Z https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html - 2026-03-02T21:44:06.457Z + 2026-03-03T14:31:28.439Z https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html - 2026-03-02T21:44:06.451Z + 2026-03-03T14:31:28.432Z https://docs.axolotl.ai/docs/api/kernels.lora.html - 2026-03-02T21:44:05.671Z + 2026-03-03T14:31:27.643Z https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html - 2026-03-02T21:44:05.794Z + 2026-03-03T14:31:27.767Z https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html - 2026-03-02T21:44:05.456Z + 2026-03-03T14:31:27.428Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html - 2026-03-02T21:44:05.379Z + 2026-03-03T14:31:27.350Z https://docs.axolotl.ai/docs/api/core.datasets.chat.html - 2026-03-02T21:44:04.869Z + 2026-03-03T14:31:26.835Z https://docs.axolotl.ai/docs/api/cli.evaluate.html - 2026-03-02T21:44:04.940Z + 2026-03-03T14:31:26.907Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html - 2026-03-02T21:44:05.395Z + 2026-03-03T14:31:27.367Z https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html - 2026-03-02T21:44:05.559Z + 2026-03-03T14:31:27.532Z https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html - 2026-03-02T21:44:06.114Z + 2026-03-03T14:31:28.091Z https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html - 2026-03-02T21:44:06.388Z + 2026-03-03T14:31:28.369Z https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html - 2026-03-02T21:44:06.446Z + 2026-03-03T14:31:28.427Z https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html - 2026-03-02T21:44:05.362Z + 2026-03-03T14:31:27.333Z https://docs.axolotl.ai/docs/api/kernels.utils.html - 2026-03-02T21:44:05.707Z + 2026-03-03T14:31:27.679Z https://docs.axolotl.ai/docs/api/cli.vllm_serve.html - 2026-03-02T21:44:05.072Z + 2026-03-03T14:31:27.040Z https://docs.axolotl.ai/docs/api/core.trainers.mamba.html - 2026-03-02T21:44:05.179Z + 2026-03-03T14:31:27.148Z https://docs.axolotl.ai/docs/api/utils.bench.html - 2026-03-02T21:44:05.874Z + 2026-03-03T14:31:27.849Z https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html - 2026-03-02T21:44:05.120Z + 2026-03-03T14:31:27.089Z https://docs.axolotl.ai/docs/api/cli.merge_lora.html - 2026-03-02T21:44:05.033Z + 2026-03-03T14:31:27.000Z https://docs.axolotl.ai/docs/api/loaders.model.html - 2026-03-02T21:44:05.229Z + 2026-03-03T14:31:27.198Z https://docs.axolotl.ai/docs/api/cli.preprocess.html - 2026-03-02T21:44:05.057Z + 2026-03-03T14:31:27.025Z https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html - 2026-03-02T21:44:06.453Z + 2026-03-03T14:31:28.434Z https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html - 2026-03-02T21:44:05.451Z + 2026-03-03T14:31:27.424Z https://docs.axolotl.ai/docs/api/utils.schemas.enums.html - 2026-03-02T21:44:06.125Z + 2026-03-03T14:31:28.102Z https://docs.axolotl.ai/docs/api/kernels.quantize.html - 2026-03-02T21:44:05.705Z + 2026-03-03T14:31:27.678Z https://docs.axolotl.ai/docs/api/utils.schemas.model.html - 2026-03-02T21:44:06.040Z + 2026-03-03T14:31:28.017Z https://docs.axolotl.ai/docs/api/utils.collators.core.html - 2026-03-02T21:44:06.355Z + 2026-03-03T14:31:28.335Z https://docs.axolotl.ai/docs/api/core.builders.rl.html - 2026-03-02T21:44:04.811Z + 2026-03-03T14:31:26.777Z https://docs.axolotl.ai/docs/api/core.builders.causal.html - 2026-03-02T21:44:04.805Z + 2026-03-03T14:31:26.771Z https://docs.axolotl.ai/docs/api/utils.distributed.html - 2026-03-02T21:44:05.965Z + 2026-03-03T14:31:27.941Z https://docs.axolotl.ai/docs/api/train.html - 2026-03-02T21:44:04.690Z + 2026-03-03T14:31:26.654Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html - 2026-03-02T21:44:05.478Z + 2026-03-03T14:31:27.450Z https://docs.axolotl.ai/docs/api/integrations.base.html - 2026-03-02T21:44:06.302Z + 2026-03-03T14:31:28.282Z https://docs.axolotl.ai/docs/api/core.chat.messages.html - 2026-03-02T21:44:04.857Z + 2026-03-03T14:31:26.823Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html - 2026-03-02T21:44:05.215Z + 2026-03-03T14:31:27.185Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html - 2026-03-02T21:44:05.491Z + 2026-03-03T14:31:27.464Z https://docs.axolotl.ai/docs/api/integrations.liger.args.html - 2026-03-02T21:44:06.321Z + 2026-03-03T14:31:28.301Z https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html - 2026-03-02T21:44:05.795Z + 2026-03-03T14:31:27.769Z https://docs.axolotl.ai/docs/api/logging_config.html - 2026-03-02T21:44:04.792Z + 2026-03-03T14:31:26.757Z https://docs.axolotl.ai/docs/api/common.datasets.html - 2026-03-02T21:44:06.352Z + 2026-03-03T14:31:28.332Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html - 2026-03-02T21:44:05.716Z + 2026-03-03T14:31:27.688Z https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html - 2026-03-02T21:44:05.422Z + 2026-03-03T14:31:27.394Z https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html - 2026-03-02T21:44:06.072Z + 2026-03-03T14:31:28.049Z https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html - 2026-03-02T21:44:05.782Z + 2026-03-03T14:31:27.755Z https://docs.axolotl.ai/docs/api/cli.utils.train.html - 2026-03-02T21:44:05.135Z + 2026-03-03T14:31:27.104Z https://docs.axolotl.ai/docs/api/loaders.constants.html - 2026-03-02T21:44:05.270Z + 2026-03-03T14:31:27.240Z https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html - 2026-03-02T21:44:05.429Z + 2026-03-03T14:31:27.402Z https://docs.axolotl.ai/docs/api/loaders.tokenizer.html - 2026-03-02T21:44:05.240Z + 2026-03-03T14:31:27.209Z https://docs.axolotl.ai/docs/api/core.training_args.html - 2026-03-02T21:44:04.827Z + 2026-03-03T14:31:26.793Z https://docs.axolotl.ai/docs/api/loaders.processor.html - 2026-03-02T21:44:05.242Z + 2026-03-03T14:31:27.211Z https://docs.axolotl.ai/docs/api/prompt_strategies.base.html - 2026-03-02T21:44:05.320Z + 2026-03-03T14:31:27.290Z https://docs.axolotl.ai/docs/api/utils.collators.mamba.html - 2026-03-02T21:44:06.382Z + 2026-03-03T14:31:28.363Z https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html - 2026-03-02T21:44:05.760Z + 2026-03-03T14:31:27.734Z https://docs.axolotl.ai/docs/api/utils.schemas.peft.html - 2026-03-02T21:44:06.083Z + 2026-03-03T14:31:28.060Z https://docs.axolotl.ai/docs/api/utils.data.sft.html - 2026-03-02T21:44:05.991Z + 2026-03-03T14:31:27.967Z https://docs.axolotl.ai/docs/api/core.trainers.utils.html - 2026-03-02T21:44:05.217Z + 2026-03-03T14:31:27.186Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html - 2026-03-02T21:44:05.774Z + 2026-03-03T14:31:27.748Z https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html - 2026-03-02T21:44:05.772Z + 2026-03-03T14:31:27.746Z https://docs.axolotl.ai/docs/api/loaders.adapter.html - 2026-03-02T21:44:05.249Z + 2026-03-03T14:31:27.218Z https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html - 2026-03-02T21:44:05.437Z + 2026-03-03T14:31:27.409Z https://docs.axolotl.ai/docs/attention.html - 2026-03-02T21:40:48.644Z + 2026-03-03T14:27:57.061Z https://docs.axolotl.ai/docs/docker.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/dataset_preprocessing.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/gradient_checkpointing.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/docs/cli.html - 2026-03-02T21:40:48.644Z + 2026-03-03T14:27:57.061Z https://docs.axolotl.ai/docs/lora_optims.html - 2026-03-02T21:40:48.648Z + 2026-03-03T14:27:57.066Z https://docs.axolotl.ai/docs/models/index.html - 2026-03-02T21:44:45.709Z + 2026-03-03T14:31:49.679Z https://docs.axolotl.ai/docs/models/devstral.html - 2026-03-02T21:44:45.698Z + 2026-03-03T14:31:49.673Z https://docs.axolotl.ai/docs/models/mistral-small.html - 2026-03-02T21:44:45.697Z + 2026-03-03T14:31:49.673Z https://docs.axolotl.ai/docs/models/jamba.html - 2026-03-02T21:44:45.707Z + 2026-03-03T14:31:49.679Z https://docs.axolotl.ai/docs/models/olmo3.html - 2026-03-02T21:44:45.692Z + 2026-03-03T14:31:49.669Z https://docs.axolotl.ai/docs/models/smolvlm2.html - 2026-03-02T21:44:45.705Z + 2026-03-03T14:31:49.677Z https://docs.axolotl.ai/docs/models/kimi-linear.html - 2026-03-02T21:44:45.689Z + 2026-03-03T14:31:49.667Z https://docs.axolotl.ai/docs/models/llama-2.html - 2026-03-02T21:44:45.701Z + 2026-03-03T14:31:49.675Z https://docs.axolotl.ai/docs/models/qwen3-next.html - 2026-03-02T21:44:45.702Z + 2026-03-03T14:31:49.675Z https://docs.axolotl.ai/docs/models/gpt-oss.html - 2026-03-02T21:44:45.704Z + 2026-03-03T14:31:49.676Z https://docs.axolotl.ai/docs/models/mimo.html - 2026-03-02T21:44:45.691Z + 2026-03-03T14:31:49.668Z https://docs.axolotl.ai/docs/models/magistral/vision.html - 2026-03-02T21:44:45.696Z + 2026-03-03T14:31:49.672Z https://docs.axolotl.ai/docs/models/internvl3_5.html - 2026-03-02T21:44:45.692Z + 2026-03-03T14:31:49.668Z https://docs.axolotl.ai/docs/models/orpheus.html - 2026-03-02T21:44:45.709Z + 2026-03-03T14:31:49.679Z https://docs.axolotl.ai/docs/models/seed-oss.html - 2026-03-02T21:44:45.704Z + 2026-03-03T14:31:49.677Z https://docs.axolotl.ai/docs/models/granite4.html - 2026-03-02T21:44:45.706Z + 2026-03-03T14:31:49.678Z https://docs.axolotl.ai/docs/models/ministral3/think.html - 2026-03-02T21:44:45.694Z + 2026-03-03T14:31:49.670Z https://docs.axolotl.ai/docs/installation.html - 2026-03-02T21:40:48.647Z + 2026-03-03T14:27:57.066Z https://docs.axolotl.ai/docs/faq.html - 2026-03-02T21:40:48.645Z + 2026-03-03T14:27:57.062Z https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html - 2026-03-02T21:40:48.676Z + 2026-03-03T14:27:57.102Z https://docs.axolotl.ai/FAQS.html - 2026-03-02T21:40:48.642Z + 2026-03-03T14:27:57.058Z