diff --git a/.nojekyll b/.nojekyll
index 6651e5108..0843099f8 100644
--- a/.nojekyll
+++ b/.nojekyll
@@ -1 +1 @@
-8569c582
\ No newline at end of file
+394adab2
\ No newline at end of file
diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html
index 3c6557fdf..dfde3cbc5 100644
--- a/docs/custom_integrations.html
+++ b/docs/custom_integrations.html
@@ -611,7 +611,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
If you are installing from pip
-pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c564afc"
+pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c5aa3ef"
Usage
@@ -655,6 +655,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
qwen2_5_vl
qwen3
qwen3_moe
+qwen3_next
smollm3
seed_oss
voxtral
diff --git a/examples/colab-notebooks/colab-axolotl-example.html b/examples/colab-notebooks/colab-axolotl-example.html
index 27e6e4f27..9a6ac5ed7 100644
--- a/examples/colab-notebooks/colab-axolotl-example.html
+++ b/examples/colab-notebooks/colab-axolotl-example.html
@@ -559,7 +559,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
%% capture
# This step can take ~5-10 minutes to install dependencies
! pip install -- no- build- isolation axolotl[flash- attn]>= 0.9.1
-! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c564afc"
+! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c5aa3ef"
Demo: Talk Like a Pirate
diff --git a/search.json b/search.json
index 31022a961..470ccb577 100644
--- a/search.json
+++ b/search.json
@@ -285,7 +285,7 @@
"href": "docs/custom_integrations.html#cut-cross-entropy",
"title": "Custom Integrations",
"section": "Cut Cross Entropy",
- "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c564afc\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\ngpt_oss\ngranite\ngranitemoe\nhunyuan_v1_dense\nhunyuan_v1_moe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
+ "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c5aa3ef\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\ngpt_oss\ngranite\ngranitemoe\nhunyuan_v1_dense\nhunyuan_v1_moe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nqwen3_next\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
"crumbs": [
"Advanced Features",
"Custom Integrations"
diff --git a/sitemap.xml b/sitemap.xml
index db6f35b92..b01ea6639 100644
--- a/sitemap.xml
+++ b/sitemap.xml
@@ -2,794 +2,794 @@
https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html
- 2025-09-19T10:34:36.740Z
+ 2025-09-23T04:31:24.847Z
https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html
- 2025-09-19T10:34:36.757Z
+ 2025-09-23T04:31:24.864Z
https://docs.axolotl.ai/FAQS.html
- 2025-09-19T10:34:36.729Z
+ 2025-09-23T04:31:24.837Z
https://docs.axolotl.ai/docs/unsloth.html
- 2025-09-19T10:34:36.736Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/docs/reward_modelling.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/docs/docker.html
- 2025-09-19T10:34:36.732Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/batch_vs_grad.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.838Z
https://docs.axolotl.ai/docs/streaming.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/docs/nccl.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/quantize.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/docs/nd_parallelism.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/custom_integrations.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/debugging.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/gradient_checkpointing.html
- 2025-09-19T10:34:36.732Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/multimodal.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/dataset_loading.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html
- 2025-09-19T10:38:05.774Z
+ 2025-09-23T04:34:52.953Z
https://docs.axolotl.ai/docs/api/loaders.adapter.html
- 2025-09-19T10:38:04.915Z
+ 2025-09-23T04:34:52.101Z
https://docs.axolotl.ai/docs/api/core.builders.base.html
- 2025-09-19T10:38:04.547Z
+ 2025-09-23T04:34:51.738Z
https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html
- 2025-09-19T10:38:04.751Z
+ 2025-09-23T04:34:51.938Z
https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html
- 2025-09-19T10:38:04.781Z
+ 2025-09-23T04:34:51.967Z
https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html
- 2025-09-19T10:38:05.336Z
+ 2025-09-23T04:34:52.518Z
https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html
- 2025-09-19T10:38:05.764Z
+ 2025-09-23T04:34:52.943Z
https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html
- 2025-09-19T10:38:04.715Z
+ 2025-09-23T04:34:51.903Z
https://docs.axolotl.ai/docs/api/cli.evaluate.html
- 2025-09-19T10:38:04.662Z
+ 2025-09-23T04:34:51.851Z
https://docs.axolotl.ai/docs/api/utils.schemas.model.html
- 2025-09-19T10:38:05.546Z
+ 2025-09-23T04:34:52.725Z
https://docs.axolotl.ai/docs/api/cli.art.html
- 2025-09-19T10:38:04.686Z
+ 2025-09-23T04:34:51.874Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html
- 2025-09-19T10:38:05.100Z
+ 2025-09-23T04:34:52.284Z
https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html
- 2025-09-19T10:38:04.595Z
+ 2025-09-23T04:34:51.786Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html
- 2025-09-19T10:38:05.131Z
+ 2025-09-23T04:34:52.315Z
https://docs.axolotl.ai/docs/api/cli.args.html
- 2025-09-19T10:38:04.683Z
+ 2025-09-23T04:34:51.871Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html
- 2025-09-19T10:38:05.361Z
+ 2025-09-23T04:34:52.543Z
https://docs.axolotl.ai/docs/api/evaluate.html
- 2025-09-19T10:38:04.469Z
+ 2025-09-23T04:34:51.661Z
https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html
- 2025-09-19T10:38:05.062Z
+ 2025-09-23T04:34:52.246Z
https://docs.axolotl.ai/docs/api/cli.vllm_serve.html
- 2025-09-19T10:38:04.771Z
+ 2025-09-23T04:34:51.958Z
https://docs.axolotl.ai/docs/api/cli.quantize.html
- 2025-09-19T10:38:04.764Z
+ 2025-09-23T04:34:51.951Z
https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html
- 2025-09-19T10:38:04.811Z
+ 2025-09-23T04:34:51.998Z
https://docs.axolotl.ai/docs/api/core.builders.rl.html
- 2025-09-19T10:38:04.556Z
+ 2025-09-23T04:34:51.748Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html
- 2025-09-19T10:38:05.110Z
+ 2025-09-23T04:34:52.294Z
https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html
- 2025-09-19T10:38:05.073Z
+ 2025-09-23T04:34:52.257Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html
- 2025-09-19T10:38:05.114Z
+ 2025-09-23T04:34:52.298Z
https://docs.axolotl.ai/docs/api/core.datasets.chat.html
- 2025-09-19T10:38:04.602Z
+ 2025-09-23T04:34:51.793Z
https://docs.axolotl.ai/docs/api/utils.distributed.html
- 2025-09-19T10:38:05.483Z
+ 2025-09-23T04:34:52.664Z
https://docs.axolotl.ai/docs/api/integrations.base.html
- 2025-09-19T10:38:05.752Z
+ 2025-09-23T04:34:52.931Z
https://docs.axolotl.ai/docs/api/index.html
- 2025-09-19T10:38:04.400Z
+ 2025-09-23T04:34:51.593Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html
- 2025-09-19T10:38:05.387Z
+ 2025-09-23T04:34:52.569Z
https://docs.axolotl.ai/docs/api/utils.quantization.html
- 2025-09-19T10:38:05.524Z
+ 2025-09-23T04:34:52.704Z
https://docs.axolotl.ai/docs/api/utils.dict.html
- 2025-09-19T10:38:05.489Z
+ 2025-09-23T04:34:52.669Z
https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html
- 2025-09-19T10:38:04.865Z
+ 2025-09-23T04:34:52.051Z
https://docs.axolotl.ai/docs/api/utils.schemas.config.html
- 2025-09-19T10:38:05.538Z
+ 2025-09-23T04:34:52.718Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html
- 2025-09-19T10:38:05.077Z
+ 2025-09-23T04:34:52.261Z
https://docs.axolotl.ai/docs/api/utils.collators.mamba.html
- 2025-09-19T10:38:05.817Z
+ 2025-09-23T04:34:52.996Z
https://docs.axolotl.ai/docs/api/datasets.html
- 2025-09-19T10:38:04.476Z
+ 2025-09-23T04:34:51.668Z
https://docs.axolotl.ai/docs/api/convert.html
- 2025-09-19T10:38:04.489Z
+ 2025-09-23T04:34:51.681Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html
- 2025-09-19T10:38:05.123Z
+ 2025-09-23T04:34:52.307Z
https://docs.axolotl.ai/docs/api/utils.tokenization.html
- 2025-09-19T10:38:05.394Z
+ 2025-09-23T04:34:52.576Z
https://docs.axolotl.ai/docs/api/core.trainers.base.html
- 2025-09-19T10:38:04.837Z
+ 2025-09-23T04:34:52.024Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html
- 2025-09-19T10:38:05.291Z
+ 2025-09-23T04:34:52.473Z
https://docs.axolotl.ai/docs/api/loaders.model.html
- 2025-09-19T10:38:04.899Z
+ 2025-09-23T04:34:52.086Z
https://docs.axolotl.ai/docs/api/logging_config.html
- 2025-09-19T10:38:04.541Z
+ 2025-09-23T04:34:51.732Z
https://docs.axolotl.ai/docs/api/core.chat.format.shared.html
- 2025-09-19T10:38:04.597Z
+ 2025-09-23T04:34:51.788Z
https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html
- 2025-09-19T10:38:05.793Z
+ 2025-09-23T04:34:52.972Z
https://docs.axolotl.ai/docs/api/utils.schemas.enums.html
- 2025-09-19T10:38:05.609Z
+ 2025-09-23T04:34:52.788Z
https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html
- 2025-09-19T10:38:05.874Z
+ 2025-09-23T04:34:53.052Z
https://docs.axolotl.ai/docs/api/utils.bench.html
- 2025-09-19T10:38:05.410Z
+ 2025-09-23T04:34:52.592Z
https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html
- 2025-09-19T10:38:05.863Z
+ 2025-09-23T04:34:53.042Z
https://docs.axolotl.ai/docs/api/core.trainers.mamba.html
- 2025-09-19T10:38:04.858Z
+ 2025-09-23T04:34:52.044Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html
- 2025-09-19T10:38:05.015Z
+ 2025-09-23T04:34:52.200Z
https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html
- 2025-09-19T10:38:05.329Z
+ 2025-09-23T04:34:52.511Z
https://docs.axolotl.ai/docs/api/core.chat.messages.html
- 2025-09-19T10:38:04.592Z
+ 2025-09-23T04:34:51.783Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html
- 2025-09-19T10:38:05.330Z
+ 2025-09-23T04:34:52.513Z
https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html
- 2025-09-19T10:38:05.358Z
+ 2025-09-23T04:34:52.540Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html
- 2025-09-19T10:38:04.942Z
+ 2025-09-23T04:34:52.128Z
https://docs.axolotl.ai/docs/api/loaders.patch_manager.html
- 2025-09-19T10:38:04.925Z
+ 2025-09-23T04:34:52.111Z
https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html
- 2025-09-19T10:38:05.496Z
+ 2025-09-23T04:34:52.677Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html
- 2025-09-19T10:38:05.283Z
+ 2025-09-23T04:34:52.465Z
https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html
- 2025-09-19T10:38:05.870Z
+ 2025-09-23T04:34:53.048Z
https://docs.axolotl.ai/docs/api/loaders.tokenizer.html
- 2025-09-19T10:38:04.908Z
+ 2025-09-23T04:34:52.094Z
https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html
- 2025-09-19T10:38:05.084Z
+ 2025-09-23T04:34:52.268Z
https://docs.axolotl.ai/docs/api/utils.lora.html
- 2025-09-19T10:38:05.401Z
+ 2025-09-23T04:34:52.583Z
https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html
- 2025-09-19T10:38:05.037Z
+ 2025-09-23T04:34:52.221Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html
- 2025-09-19T10:38:04.935Z
+ 2025-09-23T04:34:52.121Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html
- 2025-09-19T10:38:05.113Z
+ 2025-09-23T04:34:52.297Z
https://docs.axolotl.ai/docs/api/kernels.swiglu.html
- 2025-09-19T10:38:05.266Z
+ 2025-09-23T04:34:52.449Z
https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html
- 2025-09-19T10:38:05.588Z
+ 2025-09-23T04:34:52.767Z
https://docs.axolotl.ai/docs/api/cli.main.html
- 2025-09-19T10:38:04.645Z
+ 2025-09-23T04:34:51.835Z
https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html
- 2025-09-19T10:38:04.966Z
+ 2025-09-23T04:34:52.152Z
https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html
- 2025-09-19T10:38:05.286Z
+ 2025-09-23T04:34:52.468Z
https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html
- 2025-09-19T10:38:04.594Z
+ 2025-09-23T04:34:51.785Z
https://docs.axolotl.ai/docs/api/cli.cloud.base.html
- 2025-09-19T10:38:04.775Z
+ 2025-09-23T04:34:51.961Z
https://docs.axolotl.ai/docs/api/core.trainers.trl.html
- 2025-09-19T10:38:04.852Z
+ 2025-09-23T04:34:52.039Z
https://docs.axolotl.ai/docs/mixed_precision.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/installation.html
- 2025-09-19T10:34:36.734Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/mac.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/sequence_parallelism.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/docs/faq.html
- 2025-09-19T10:34:36.732Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/dataset-formats/tokenized.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/dataset-formats/pretraining.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/dataset-formats/template_free.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/dataset-formats/index.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/dataset-formats/conversation.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/lr_groups.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/inference.html
- 2025-09-19T10:34:36.734Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/lora_optims.html
- 2025-09-19T10:34:36.734Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/multipack.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/amd_hpc.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.838Z
https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html
- 2025-09-19T10:38:05.339Z
+ 2025-09-23T04:34:52.521Z
https://docs.axolotl.ai/docs/api/cli.inference.html
- 2025-09-19T10:38:04.730Z
+ 2025-09-23T04:34:51.917Z
https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html
- 2025-09-19T10:38:05.822Z
+ 2025-09-23T04:34:53.001Z
https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html
- 2025-09-19T10:38:05.406Z
+ 2025-09-23T04:34:52.588Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html
- 2025-09-19T10:38:05.281Z
+ 2025-09-23T04:34:52.463Z
https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html
- 2025-09-19T10:38:05.756Z
+ 2025-09-23T04:34:52.935Z
https://docs.axolotl.ai/docs/api/utils.schemas.training.html
- 2025-09-19T10:38:05.552Z
+ 2025-09-23T04:34:52.732Z
https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html
- 2025-09-19T10:38:05.600Z
+ 2025-09-23T04:34:52.779Z
https://docs.axolotl.ai/docs/api/utils.schemas.utils.html
- 2025-09-19T10:38:05.615Z
+ 2025-09-23T04:34:52.794Z
https://docs.axolotl.ai/docs/api/cli.checks.html
- 2025-09-19T10:38:04.692Z
+ 2025-09-23T04:34:51.880Z
https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html
- 2025-09-19T10:38:05.890Z
+ 2025-09-23T04:34:53.068Z
https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html
- 2025-09-19T10:38:05.284Z
+ 2025-09-23T04:34:52.466Z
https://docs.axolotl.ai/docs/api/utils.data.sft.html
- 2025-09-19T10:38:05.504Z
+ 2025-09-23T04:34:52.685Z
https://docs.axolotl.ai/docs/api/utils.chat_templates.html
- 2025-09-19T10:38:05.396Z
+ 2025-09-23T04:34:52.578Z
https://docs.axolotl.ai/docs/api/monkeypatch.utils.html
- 2025-09-19T10:38:05.327Z
+ 2025-09-23T04:34:52.510Z
https://docs.axolotl.ai/docs/api/cli.utils.fetch.html
- 2025-09-19T10:38:04.799Z
+ 2025-09-23T04:34:51.986Z
https://docs.axolotl.ai/docs/api/core.builders.causal.html
- 2025-09-19T10:38:04.552Z
+ 2025-09-23T04:34:51.743Z
https://docs.axolotl.ai/docs/api/utils.schemas.trl.html
- 2025-09-19T10:38:05.583Z
+ 2025-09-23T04:34:52.762Z
https://docs.axolotl.ai/docs/api/utils.data.streaming.html
- 2025-09-19T10:38:05.498Z
+ 2025-09-23T04:34:52.678Z
https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html
- 2025-09-19T10:38:05.347Z
+ 2025-09-23T04:34:52.529Z
https://docs.axolotl.ai/docs/api/prompt_strategies.base.html
- 2025-09-19T10:38:04.968Z
+ 2025-09-23T04:34:52.153Z
https://docs.axolotl.ai/docs/api/cli.merge_lora.html
- 2025-09-19T10:38:04.739Z
+ 2025-09-23T04:34:51.926Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html
- 2025-09-19T10:38:05.017Z
+ 2025-09-23T04:34:52.201Z
https://docs.axolotl.ai/docs/api/loaders.constants.html
- 2025-09-19T10:38:04.926Z
+ 2025-09-23T04:34:52.112Z
https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html
- 2025-09-19T10:38:05.346Z
+ 2025-09-23T04:34:52.528Z
https://docs.axolotl.ai/docs/api/monkeypatch.relora.html
- 2025-09-19T10:38:05.289Z
+ 2025-09-23T04:34:52.471Z
https://docs.axolotl.ai/docs/api/utils.schedulers.html
- 2025-09-19T10:38:05.463Z
+ 2025-09-23T04:34:52.644Z
https://docs.axolotl.ai/docs/api/kernels.lora.html
- 2025-09-19T10:38:05.245Z
+ 2025-09-23T04:34:52.428Z
https://docs.axolotl.ai/docs/api/utils.collators.batching.html
- 2025-09-19T10:38:05.814Z
+ 2025-09-23T04:34:52.992Z
https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html
- 2025-09-19T10:38:05.056Z
+ 2025-09-23T04:34:52.240Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html
- 2025-09-19T10:38:04.876Z
+ 2025-09-23T04:34:52.062Z
https://docs.axolotl.ai/docs/api/common.architectures.html
- 2025-09-19T10:38:05.775Z
+ 2025-09-23T04:34:52.954Z
https://docs.axolotl.ai/docs/api/cli.utils.html
- 2025-09-19T10:38:04.782Z
+ 2025-09-23T04:34:51.969Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html
- 2025-09-19T10:38:05.153Z
+ 2025-09-23T04:34:52.337Z
https://docs.axolotl.ai/docs/api/core.training_args.html
- 2025-09-19T10:38:04.569Z
+ 2025-09-23T04:34:51.760Z
https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html
- 2025-09-19T10:38:05.571Z
+ 2025-09-23T04:34:52.750Z
https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html
- 2025-09-19T10:38:05.001Z
+ 2025-09-23T04:34:52.186Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html
- 2025-09-19T10:38:05.029Z
+ 2025-09-23T04:34:52.213Z
https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html
- 2025-09-19T10:38:05.755Z
+ 2025-09-23T04:34:52.934Z
https://docs.axolotl.ai/docs/api/common.const.html
- 2025-09-19T10:38:05.777Z
+ 2025-09-23T04:34:52.956Z
https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html
- 2025-09-19T10:38:05.319Z
+ 2025-09-23T04:34:52.502Z
https://docs.axolotl.ai/docs/api/kernels.quantize.html
- 2025-09-19T10:38:05.274Z
+ 2025-09-23T04:34:52.456Z
https://docs.axolotl.ai/docs/api/cli.config.html
- 2025-09-19T10:38:04.711Z
+ 2025-09-23T04:34:51.898Z
https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html
- 2025-09-19T10:38:05.050Z
+ 2025-09-23T04:34:52.234Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html
- 2025-09-19T10:38:05.112Z
+ 2025-09-23T04:34:52.295Z
https://docs.axolotl.ai/docs/api/kernels.geglu.html
- 2025-09-19T10:38:05.256Z
+ 2025-09-23T04:34:52.439Z
https://docs.axolotl.ai/docs/api/utils.freeze.html
- 2025-09-19T10:38:05.418Z
+ 2025-09-23T04:34:52.599Z
https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html
- 2025-09-19T10:38:05.879Z
+ 2025-09-23T04:34:53.057Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html
- 2025-09-19T10:38:04.888Z
+ 2025-09-23T04:34:52.074Z
https://docs.axolotl.ai/docs/api/cli.utils.train.html
- 2025-09-19T10:38:04.823Z
+ 2025-09-23T04:34:52.009Z
https://docs.axolotl.ai/docs/api/cli.utils.load.html
- 2025-09-19T10:38:04.805Z
+ 2025-09-23T04:34:51.991Z
https://docs.axolotl.ai/docs/api/utils.collators.core.html
- 2025-09-19T10:38:05.794Z
+ 2025-09-23T04:34:52.973Z
https://docs.axolotl.ai/docs/api/integrations.liger.args.html
- 2025-09-19T10:38:05.767Z
+ 2025-09-23T04:34:52.946Z
https://docs.axolotl.ai/docs/api/cli.preprocess.html
- 2025-09-19T10:38:04.759Z
+ 2025-09-23T04:34:51.946Z
https://docs.axolotl.ai/docs/api/kernels.utils.html
- 2025-09-19T10:38:05.276Z
+ 2025-09-23T04:34:52.458Z
https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html
- 2025-09-19T10:38:05.875Z
+ 2025-09-23T04:34:53.053Z
https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html
- 2025-09-19T10:38:05.356Z
+ 2025-09-23T04:34:52.538Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html
- 2025-09-19T10:38:04.932Z
+ 2025-09-23T04:34:52.118Z
https://docs.axolotl.ai/docs/api/loaders.processor.html
- 2025-09-19T10:38:04.909Z
+ 2025-09-23T04:34:52.095Z
https://docs.axolotl.ai/docs/api/core.trainers.utils.html
- 2025-09-19T10:38:04.890Z
+ 2025-09-23T04:34:52.076Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html
- 2025-09-19T10:38:05.090Z
+ 2025-09-23T04:34:52.273Z
https://docs.axolotl.ai/docs/api/prompt_tokenizers.html
- 2025-09-19T10:38:04.531Z
+ 2025-09-23T04:34:51.723Z
https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html
- 2025-09-19T10:38:05.883Z
+ 2025-09-23T04:34:53.061Z
https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html
- 2025-09-19T10:38:04.610Z
+ 2025-09-23T04:34:51.801Z
https://docs.axolotl.ai/docs/api/utils.trainer.html
- 2025-09-19T10:38:05.435Z
+ 2025-09-23T04:34:52.616Z
https://docs.axolotl.ai/docs/api/cli.train.html
- 2025-09-19T10:38:04.654Z
+ 2025-09-23T04:34:51.843Z
https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html
- 2025-09-19T10:38:05.770Z
+ 2025-09-23T04:34:52.950Z
https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html
- 2025-09-19T10:38:05.088Z
+ 2025-09-23T04:34:52.272Z
https://docs.axolotl.ai/docs/api/utils.schemas.peft.html
- 2025-09-19T10:38:05.579Z
+ 2025-09-23T04:34:52.759Z
https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html
- 2025-09-19T10:38:05.156Z
+ 2025-09-23T04:34:52.341Z
https://docs.axolotl.ai/docs/api/cli.utils.args.html
- 2025-09-19T10:38:04.794Z
+ 2025-09-23T04:34:51.980Z
https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html
- 2025-09-19T10:38:05.066Z
+ 2025-09-23T04:34:52.250Z
https://docs.axolotl.ai/docs/api/common.datasets.html
- 2025-09-19T10:38:05.792Z
+ 2025-09-23T04:34:52.971Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html
- 2025-09-19T10:38:05.132Z
+ 2025-09-23T04:34:52.316Z
https://docs.axolotl.ai/docs/api/train.html
- 2025-09-19T10:38:04.459Z
+ 2025-09-23T04:34:51.651Z
https://docs.axolotl.ai/docs/multi-node.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/input_output.html
- 2025-09-19T10:34:36.734Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/ray-integration.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/docs/getting-started.html
- 2025-09-19T10:34:36.732Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/optimizers.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/docs/multi-gpu.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.842Z
https://docs.axolotl.ai/docs/dataset_preprocessing.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/torchao.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/docs/config-reference.html
- 2025-09-19T10:38:21.431Z
+ 2025-09-23T04:35:08.477Z
https://docs.axolotl.ai/docs/rlhf.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/docs/cli.html
- 2025-09-19T10:34:36.731Z
+ 2025-09-23T04:31:24.838Z
https://docs.axolotl.ai/docs/fsdp_qlora.html
- 2025-09-19T10:34:36.732Z
+ 2025-09-23T04:31:24.839Z
https://docs.axolotl.ai/docs/qat.html
- 2025-09-19T10:34:36.735Z
+ 2025-09-23T04:31:24.843Z
https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html
- 2025-09-19T10:34:36.757Z
+ 2025-09-23T04:31:24.864Z
https://docs.axolotl.ai/index.html
- 2025-09-19T10:34:36.752Z
+ 2025-09-23T04:31:24.859Z