diff --git a/.nojekyll b/.nojekyll
index 9b61f7a3f..5eaebcec7 100644
--- a/.nojekyll
+++ b/.nojekyll
@@ -1 +1 @@
-e6ac6d19
\ No newline at end of file
+d96239da
\ No newline at end of file
diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html
index b2a92abbd..cedfcd757 100644
--- a/docs/custom_integrations.html
+++ b/docs/custom_integrations.html
@@ -617,7 +617,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
If you are installing from pip
-pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@147ea28"
+pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@49f3308"
Usage
@@ -650,9 +650,13 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
granitemoehybrid
hunyuan_v1_dense
hunyuan_v1_moe
+lfm2
+lfm2_moe
+lfm2_vl
llama
llama4
llama4_text
+llava
mistral
mistral3
mixtral
diff --git a/examples/colab-notebooks/colab-axolotl-example.html b/examples/colab-notebooks/colab-axolotl-example.html
index 29e39ec4e..5d76178b4 100644
--- a/examples/colab-notebooks/colab-axolotl-example.html
+++ b/examples/colab-notebooks/colab-axolotl-example.html
@@ -565,7 +565,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
%% capture
# This step can take ~5-10 minutes to install dependencies
! pip install -- no- build- isolation axolotl[flash- attn]>= 0.9.1
-! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@147ea28"
+! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@49f3308"
Demo: Talk Like a Pirate
diff --git a/search.json b/search.json
index 3419dc1d6..002f8999c 100644
--- a/search.json
+++ b/search.json
@@ -2283,7 +2283,7 @@
"href": "docs/custom_integrations.html#cut-cross-entropy",
"title": "Custom Integrations",
"section": "Cut Cross Entropy",
- "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@147ea28\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\napertus\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\nglm4v\nglm4v_moe\ngpt_oss\ngranite\ngranitemoe\ngranitemoeshared\ngranitemoehybrid\nhunyuan_v1_dense\nhunyuan_v1_moe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nqwen3_vl\nqwen3_vl_moe\nqwen3_next\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
+ "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@49f3308\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\napertus\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\nglm4v\nglm4v_moe\ngpt_oss\ngranite\ngranitemoe\ngranitemoeshared\ngranitemoehybrid\nhunyuan_v1_dense\nhunyuan_v1_moe\nlfm2\nlfm2_moe\nlfm2_vl\nllama\nllama4\nllama4_text\nllava\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nqwen3_vl\nqwen3_vl_moe\nqwen3_next\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
"crumbs": [
"Advanced Features",
"Custom Integrations"
diff --git a/sitemap.xml b/sitemap.xml
index 8a7c202ca..76aa2b525 100644
--- a/sitemap.xml
+++ b/sitemap.xml
@@ -2,798 +2,798 @@
https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html
- 2025-10-08T14:43:50.007Z
+ 2025-10-09T15:50:46.514Z
https://docs.axolotl.ai/docs/mac.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/cli.html
- 2025-10-08T14:43:49.980Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/nccl.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/getting-started.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/lr_groups.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/qat.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/multipack.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/streaming.html
- 2025-10-08T14:43:49.985Z
+ 2025-10-09T15:50:46.493Z
https://docs.axolotl.ai/docs/lora_optims.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/amd_hpc.html
- 2025-10-08T14:43:49.980Z
+ 2025-10-09T15:50:46.487Z
https://docs.axolotl.ai/docs/debugging.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/dataset-formats/conversation.html
- 2025-10-08T14:43:49.980Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/dataset-formats/index.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/config-reference.html
- 2025-10-08T14:47:29.858Z
+ 2025-10-09T15:54:27.221Z
https://docs.axolotl.ai/docs/multimodal.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/ray-integration.html
- 2025-10-08T14:43:49.985Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/faq.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/dataset_preprocessing.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/torchao.html
- 2025-10-08T14:43:49.985Z
+ 2025-10-09T15:50:46.493Z
https://docs.axolotl.ai/docs/optimizers.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/api/utils.schedulers.html
- 2025-10-08T14:47:14.552Z
+ 2025-10-09T15:54:11.136Z
https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html
- 2025-10-08T14:47:13.756Z
+ 2025-10-09T15:54:10.381Z
https://docs.axolotl.ai/docs/api/datasets.html
- 2025-10-08T14:47:13.354Z
+ 2025-10-09T15:54:10.000Z
https://docs.axolotl.ai/docs/api/utils.tokenization.html
- 2025-10-08T14:47:14.470Z
+ 2025-10-09T15:54:11.056Z
https://docs.axolotl.ai/docs/api/loaders.tokenizer.html
- 2025-10-08T14:47:13.874Z
+ 2025-10-09T15:54:10.493Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html
- 2025-10-08T14:47:14.338Z
+ 2025-10-09T15:54:10.934Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html
- 2025-10-08T14:47:14.427Z
+ 2025-10-09T15:54:11.015Z
https://docs.axolotl.ai/docs/api/utils.data.sft.html
- 2025-10-08T14:47:14.604Z
+ 2025-10-09T15:54:11.184Z
https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html
- 2025-10-08T14:47:14.408Z
+ 2025-10-09T15:54:10.997Z
https://docs.axolotl.ai/docs/api/loaders.patch_manager.html
- 2025-10-08T14:47:13.895Z
+ 2025-10-09T15:54:10.513Z
https://docs.axolotl.ai/docs/api/integrations.liger.args.html
- 2025-10-08T14:47:14.928Z
+ 2025-10-09T15:54:11.500Z
https://docs.axolotl.ai/docs/api/utils.schemas.peft.html
- 2025-10-08T14:47:14.695Z
+ 2025-10-09T15:54:11.277Z
https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html
- 2025-10-08T14:47:14.086Z
+ 2025-10-09T15:54:10.695Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html
- 2025-10-08T14:47:14.005Z
+ 2025-10-09T15:54:10.618Z
https://docs.axolotl.ai/docs/api/cli.cloud.base.html
- 2025-10-08T14:47:13.712Z
+ 2025-10-09T15:54:10.339Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html
- 2025-10-08T14:47:14.459Z
+ 2025-10-09T15:54:11.045Z
https://docs.axolotl.ai/docs/api/kernels.swiglu.html
- 2025-10-08T14:47:14.309Z
+ 2025-10-09T15:54:10.906Z
https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html
- 2025-10-08T14:47:14.913Z
+ 2025-10-09T15:54:11.486Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html
- 2025-10-08T14:47:14.146Z
+ 2025-10-09T15:54:10.753Z
https://docs.axolotl.ai/docs/api/monkeypatch.utils.html
- 2025-10-08T14:47:14.385Z
+ 2025-10-09T15:54:10.976Z
https://docs.axolotl.ai/docs/api/core.builders.rl.html
- 2025-10-08T14:47:13.452Z
+ 2025-10-09T15:54:10.092Z
https://docs.axolotl.ai/docs/api/loaders.processor.html
- 2025-10-08T14:47:13.876Z
+ 2025-10-09T15:54:10.495Z
https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html
- 2025-10-08T14:47:15.059Z
+ 2025-10-09T15:54:11.622Z
https://docs.axolotl.ai/docs/api/core.training_args.html
- 2025-10-08T14:47:13.468Z
+ 2025-10-09T15:54:10.106Z
https://docs.axolotl.ai/docs/api/loaders.adapter.html
- 2025-10-08T14:47:13.882Z
+ 2025-10-09T15:54:10.501Z
https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html
- 2025-10-08T14:47:13.684Z
+ 2025-10-09T15:54:10.312Z
https://docs.axolotl.ai/docs/api/cli.train.html
- 2025-10-08T14:47:13.568Z
+ 2025-10-09T15:54:10.201Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html
- 2025-10-08T14:47:13.907Z
+ 2025-10-09T15:54:10.525Z
https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html
- 2025-10-08T14:47:14.052Z
+ 2025-10-09T15:54:10.663Z
https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html
- 2025-10-08T14:47:14.065Z
+ 2025-10-09T15:54:10.675Z
https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html
- 2025-10-08T14:47:14.375Z
+ 2025-10-09T15:54:10.966Z
https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html
- 2025-10-08T14:47:14.091Z
+ 2025-10-09T15:54:10.700Z
https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html
- 2025-10-08T14:47:14.029Z
+ 2025-10-09T15:54:10.641Z
https://docs.axolotl.ai/docs/api/core.chat.messages.html
- 2025-10-08T14:47:13.497Z
+ 2025-10-09T15:54:10.132Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html
- 2025-10-08T14:47:13.916Z
+ 2025-10-09T15:54:10.533Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html
- 2025-10-08T14:47:14.122Z
+ 2025-10-09T15:54:10.730Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html
- 2025-10-08T14:47:14.134Z
+ 2025-10-09T15:54:10.741Z
https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html
- 2025-10-08T14:47:14.721Z
+ 2025-10-09T15:54:11.302Z
https://docs.axolotl.ai/docs/api/convert.html
- 2025-10-08T14:47:13.371Z
+ 2025-10-09T15:54:10.015Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html
- 2025-10-08T14:47:14.124Z
+ 2025-10-09T15:54:10.732Z
https://docs.axolotl.ai/docs/api/utils.schemas.config.html
- 2025-10-08T14:47:14.643Z
+ 2025-10-09T15:54:11.222Z
https://docs.axolotl.ai/docs/api/utils.schemas.enums.html
- 2025-10-08T14:47:14.732Z
+ 2025-10-09T15:54:11.312Z
https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html
- 2025-10-08T14:47:14.387Z
+ 2025-10-09T15:54:10.977Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html
- 2025-10-08T14:47:14.093Z
+ 2025-10-09T15:54:10.702Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html
- 2025-10-08T14:47:13.834Z
+ 2025-10-09T15:54:10.456Z
https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html
- 2025-10-08T14:47:14.932Z
+ 2025-10-09T15:54:11.503Z
https://docs.axolotl.ai/docs/api/utils.collators.core.html
- 2025-10-08T14:47:14.961Z
+ 2025-10-09T15:54:11.531Z
https://docs.axolotl.ai/docs/api/core.chat.format.shared.html
- 2025-10-08T14:47:13.502Z
+ 2025-10-09T15:54:10.137Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html
- 2025-10-08T14:47:14.172Z
+ 2025-10-09T15:54:10.777Z
https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html
- 2025-10-08T14:47:15.045Z
+ 2025-10-09T15:54:11.609Z
https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html
- 2025-10-08T14:47:15.079Z
+ 2025-10-09T15:54:11.638Z
https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html
- 2025-10-08T14:47:13.987Z
+ 2025-10-09T15:54:10.600Z
https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html
- 2025-10-08T14:47:14.706Z
+ 2025-10-09T15:54:11.287Z
https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html
- 2025-10-08T14:47:15.071Z
+ 2025-10-09T15:54:11.630Z
https://docs.axolotl.ai/docs/api/prompt_strategies.base.html
- 2025-10-08T14:47:13.946Z
+ 2025-10-09T15:54:10.562Z
https://docs.axolotl.ai/docs/api/kernels.utils.html
- 2025-10-08T14:47:14.320Z
+ 2025-10-09T15:54:10.917Z
https://docs.axolotl.ai/docs/api/cli.merge_lora.html
- 2025-10-08T14:47:13.669Z
+ 2025-10-09T15:54:10.298Z
https://docs.axolotl.ai/docs/api/cli.utils.html
- 2025-10-08T14:47:13.722Z
+ 2025-10-09T15:54:10.349Z
https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html
- 2025-10-08T14:47:13.945Z
+ 2025-10-09T15:54:10.560Z
https://docs.axolotl.ai/docs/api/index.html
- 2025-10-08T14:47:13.254Z
+ 2025-10-09T15:54:09.906Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html
- 2025-10-08T14:47:14.106Z
+ 2025-10-09T15:54:10.714Z
https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html
- 2025-10-08T14:47:14.423Z
+ 2025-10-09T15:54:11.011Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html
- 2025-10-08T14:47:14.078Z
+ 2025-10-09T15:54:10.687Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html
- 2025-10-08T14:47:13.849Z
+ 2025-10-09T15:54:10.470Z
https://docs.axolotl.ai/docs/api/utils.lora.html
- 2025-10-08T14:47:14.477Z
+ 2025-10-09T15:54:11.064Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html
- 2025-10-08T14:47:13.903Z
+ 2025-10-09T15:54:10.521Z
https://docs.axolotl.ai/docs/api/cli.config.html
- 2025-10-08T14:47:13.635Z
+ 2025-10-09T15:54:10.266Z
https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html
- 2025-10-08T14:47:14.332Z
+ 2025-10-09T15:54:10.928Z
https://docs.axolotl.ai/docs/api/utils.collators.batching.html
- 2025-10-08T14:47:14.986Z
+ 2025-10-09T15:54:11.553Z
https://docs.axolotl.ai/docs/api/utils.quantization.html
- 2025-10-08T14:47:14.628Z
+ 2025-10-09T15:54:11.206Z
https://docs.axolotl.ai/docs/api/utils.dict.html
- 2025-10-08T14:47:14.586Z
+ 2025-10-09T15:54:11.166Z
https://docs.axolotl.ai/docs/api/kernels.quantize.html
- 2025-10-08T14:47:14.318Z
+ 2025-10-09T15:54:10.915Z
https://docs.axolotl.ai/docs/api/utils.schemas.training.html
- 2025-10-08T14:47:14.660Z
+ 2025-10-09T15:54:11.240Z
https://docs.axolotl.ai/docs/api/train.html
- 2025-10-08T14:47:13.334Z
+ 2025-10-09T15:54:09.979Z
https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html
- 2025-10-08T14:47:13.518Z
+ 2025-10-09T15:54:10.153Z
https://docs.axolotl.ai/docs/inference.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.491Z
https://docs.axolotl.ai/FAQS.html
- 2025-10-08T14:43:49.979Z
+ 2025-10-09T15:50:46.486Z
https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html
- 2025-10-08T14:43:49.989Z
+ 2025-10-09T15:50:46.497Z
https://docs.axolotl.ai/index.html
- 2025-10-08T14:43:50.002Z
+ 2025-10-09T15:50:46.510Z
https://docs.axolotl.ai/docs/custom_integrations.html
- 2025-10-08T14:43:49.980Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/api/utils.schemas.utils.html
- 2025-10-08T14:47:14.738Z
+ 2025-10-09T15:54:11.319Z
https://docs.axolotl.ai/docs/api/kernels.geglu.html
- 2025-10-08T14:47:14.297Z
+ 2025-10-09T15:54:10.894Z
https://docs.axolotl.ai/docs/api/core.builders.causal.html
- 2025-10-08T14:47:13.447Z
+ 2025-10-09T15:54:10.086Z
https://docs.axolotl.ai/docs/api/core.trainers.mamba.html
- 2025-10-08T14:47:13.813Z
+ 2025-10-09T15:54:10.436Z
https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html
- 2025-10-08T14:47:14.176Z
+ 2025-10-09T15:54:10.781Z
https://docs.axolotl.ai/docs/api/core.datasets.chat.html
- 2025-10-08T14:47:13.508Z
+ 2025-10-09T15:54:10.143Z
https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html
- 2025-10-08T14:47:14.996Z
+ 2025-10-09T15:54:11.562Z
https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html
- 2025-10-08T14:47:14.045Z
+ 2025-10-09T15:54:10.656Z
https://docs.axolotl.ai/docs/api/common.const.html
- 2025-10-08T14:47:14.940Z
+ 2025-10-09T15:54:11.511Z
https://docs.axolotl.ai/docs/api/cli.quantize.html
- 2025-10-08T14:47:13.700Z
+ 2025-10-09T15:54:10.327Z
https://docs.axolotl.ai/docs/api/utils.trainer.html
- 2025-10-08T14:47:14.519Z
+ 2025-10-09T15:54:11.103Z
https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html
- 2025-10-08T14:47:13.641Z
+ 2025-10-09T15:54:10.272Z
https://docs.axolotl.ai/docs/api/evaluate.html
- 2025-10-08T14:47:13.346Z
+ 2025-10-09T15:54:09.992Z
https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html
- 2025-10-08T14:47:14.330Z
+ 2025-10-09T15:54:10.926Z
https://docs.axolotl.ai/docs/api/loaders.model.html
- 2025-10-08T14:47:13.864Z
+ 2025-10-09T15:54:10.483Z
https://docs.axolotl.ai/docs/api/utils.distributed.html
- 2025-10-08T14:47:14.579Z
+ 2025-10-09T15:54:11.158Z
https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html
- 2025-10-08T14:47:14.484Z
+ 2025-10-09T15:54:11.070Z
https://docs.axolotl.ai/docs/api/kernels.lora.html
- 2025-10-08T14:47:14.284Z
+ 2025-10-09T15:54:10.882Z
https://docs.axolotl.ai/docs/api/cli.main.html
- 2025-10-08T14:47:13.558Z
+ 2025-10-09T15:54:10.191Z
https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html
- 2025-10-08T14:47:14.936Z
+ 2025-10-09T15:54:11.507Z
https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html
- 2025-10-08T14:47:14.595Z
+ 2025-10-09T15:54:11.174Z
https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html
- 2025-10-08T14:47:13.720Z
+ 2025-10-09T15:54:10.347Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html
- 2025-10-08T14:47:14.327Z
+ 2025-10-09T15:54:10.923Z
https://docs.axolotl.ai/docs/api/core.builders.base.html
- 2025-10-08T14:47:13.441Z
+ 2025-10-09T15:54:10.081Z
https://docs.axolotl.ai/docs/api/utils.schemas.trl.html
- 2025-10-08T14:47:14.699Z
+ 2025-10-09T15:54:11.281Z
https://docs.axolotl.ai/docs/api/cli.utils.args.html
- 2025-10-08T14:47:13.736Z
+ 2025-10-09T15:54:10.362Z
https://docs.axolotl.ai/docs/api/core.trainers.base.html
- 2025-10-08T14:47:13.788Z
+ 2025-10-09T15:54:10.412Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html
- 2025-10-08T14:47:14.389Z
+ 2025-10-09T15:54:10.979Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html
- 2025-10-08T14:47:14.328Z
+ 2025-10-09T15:54:10.925Z
https://docs.axolotl.ai/docs/api/utils.schemas.model.html
- 2025-10-08T14:47:14.652Z
+ 2025-10-09T15:54:11.230Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html
- 2025-10-08T14:47:14.144Z
+ 2025-10-09T15:54:10.751Z
https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html
- 2025-10-08T14:47:15.065Z
+ 2025-10-09T15:54:11.626Z
https://docs.axolotl.ai/docs/api/common.datasets.html
- 2025-10-08T14:47:14.958Z
+ 2025-10-09T15:54:11.528Z
https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html
- 2025-10-08T14:47:14.685Z
+ 2025-10-09T15:54:11.264Z
https://docs.axolotl.ai/docs/api/cli.utils.fetch.html
- 2025-10-08T14:47:13.742Z
+ 2025-10-09T15:54:10.368Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html
- 2025-10-08T14:47:14.119Z
+ 2025-10-09T15:54:10.726Z
https://docs.axolotl.ai/docs/api/monkeypatch.relora.html
- 2025-10-08T14:47:14.336Z
+ 2025-10-09T15:54:10.932Z
https://docs.axolotl.ai/docs/api/cli.evaluate.html
- 2025-10-08T14:47:13.578Z
+ 2025-10-09T15:54:10.211Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html
- 2025-10-08T14:47:14.121Z
+ 2025-10-09T15:54:10.728Z
https://docs.axolotl.ai/docs/api/core.trainers.utils.html
- 2025-10-08T14:47:13.851Z
+ 2025-10-09T15:54:10.472Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html
- 2025-10-08T14:47:14.020Z
+ 2025-10-09T15:54:10.631Z
https://docs.axolotl.ai/docs/api/utils.chat_templates.html
- 2025-10-08T14:47:14.471Z
+ 2025-10-09T15:54:11.058Z
https://docs.axolotl.ai/docs/api/utils.data.streaming.html
- 2025-10-08T14:47:14.597Z
+ 2025-10-09T15:54:11.177Z
https://docs.axolotl.ai/docs/api/utils.bench.html
- 2025-10-08T14:47:14.488Z
+ 2025-10-09T15:54:11.075Z
https://docs.axolotl.ai/docs/api/common.architectures.html
- 2025-10-08T14:47:14.938Z
+ 2025-10-09T15:54:11.509Z
https://docs.axolotl.ai/docs/api/cli.checks.html
- 2025-10-08T14:47:13.614Z
+ 2025-10-09T15:54:10.245Z
https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html
- 2025-10-08T14:47:13.821Z
+ 2025-10-09T15:54:10.444Z
https://docs.axolotl.ai/docs/api/integrations.base.html
- 2025-10-08T14:47:14.909Z
+ 2025-10-09T15:54:11.482Z
https://docs.axolotl.ai/docs/api/cli.utils.train.html
- 2025-10-08T14:47:13.771Z
+ 2025-10-09T15:54:10.395Z
https://docs.axolotl.ai/docs/api/utils.collators.mamba.html
- 2025-10-08T14:47:14.991Z
+ 2025-10-09T15:54:11.557Z
https://docs.axolotl.ai/docs/api/cli.art.html
- 2025-10-08T14:47:13.606Z
+ 2025-10-09T15:54:10.238Z
https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html
- 2025-10-08T14:47:14.400Z
+ 2025-10-09T15:54:10.990Z
https://docs.axolotl.ai/docs/api/logging_config.html
- 2025-10-08T14:47:13.433Z
+ 2025-10-09T15:54:10.074Z
https://docs.axolotl.ai/docs/api/utils.freeze.html
- 2025-10-08T14:47:14.498Z
+ 2025-10-09T15:54:11.084Z
https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html
- 2025-10-08T14:47:14.074Z
+ 2025-10-09T15:54:10.683Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html
- 2025-10-08T14:47:14.003Z
+ 2025-10-09T15:54:10.616Z
https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html
- 2025-10-08T14:47:14.396Z
+ 2025-10-09T15:54:10.986Z
https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html
- 2025-10-08T14:47:14.959Z
+ 2025-10-09T15:54:11.529Z
https://docs.axolotl.ai/docs/api/core.trainers.trl.html
- 2025-10-08T14:47:13.806Z
+ 2025-10-09T15:54:10.429Z
https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html
- 2025-10-08T14:47:14.060Z
+ 2025-10-09T15:54:10.670Z
https://docs.axolotl.ai/docs/api/loaders.constants.html
- 2025-10-08T14:47:13.896Z
+ 2025-10-09T15:54:10.514Z
https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html
- 2025-10-08T14:47:14.421Z
+ 2025-10-09T15:54:11.009Z
https://docs.axolotl.ai/docs/api/cli.vllm_serve.html
- 2025-10-08T14:47:13.708Z
+ 2025-10-09T15:54:10.335Z
https://docs.axolotl.ai/docs/api/prompt_tokenizers.html
- 2025-10-08T14:47:13.421Z
+ 2025-10-09T15:54:10.063Z
https://docs.axolotl.ai/docs/api/cli.args.html
- 2025-10-08T14:47:13.602Z
+ 2025-10-09T15:54:10.234Z
https://docs.axolotl.ai/docs/api/cli.inference.html
- 2025-10-08T14:47:13.658Z
+ 2025-10-09T15:54:10.288Z
https://docs.axolotl.ai/docs/api/cli.utils.load.html
- 2025-10-08T14:47:13.749Z
+ 2025-10-09T15:54:10.375Z
https://docs.axolotl.ai/docs/api/cli.preprocess.html
- 2025-10-08T14:47:13.694Z
+ 2025-10-09T15:54:10.321Z
https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html
- 2025-10-08T14:47:15.058Z
+ 2025-10-09T15:54:11.620Z
https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html
- 2025-10-08T14:47:15.053Z
+ 2025-10-09T15:54:11.616Z
https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html
- 2025-10-08T14:47:13.498Z
+ 2025-10-09T15:54:10.134Z
https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html
- 2025-10-08T14:47:14.915Z
+ 2025-10-09T15:54:11.487Z
https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html
- 2025-10-08T14:47:14.924Z
+ 2025-10-09T15:54:11.496Z
https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html
- 2025-10-08T14:47:14.410Z
+ 2025-10-09T15:54:10.999Z
https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html
- 2025-10-08T14:47:13.500Z
+ 2025-10-09T15:54:10.136Z
https://docs.axolotl.ai/docs/reward_modelling.html
- 2025-10-08T14:43:49.985Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/quantize.html
- 2025-10-08T14:43:49.985Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/fsdp_qlora.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/nd_parallelism.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/batch_vs_grad.html
- 2025-10-08T14:43:49.980Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/multi-node.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/rlhf.html
- 2025-10-08T14:43:49.985Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/dataset-formats/pretraining.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/dataset-formats/tokenized.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/dataset-formats/template_free.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/multi-gpu.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/input_output.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.491Z
https://docs.axolotl.ai/docs/docker.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/gradient_checkpointing.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.489Z
https://docs.axolotl.ai/docs/optimizations.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/sequence_parallelism.html
- 2025-10-08T14:43:49.985Z
+ 2025-10-09T15:50:46.493Z
https://docs.axolotl.ai/docs/dataset_loading.html
- 2025-10-08T14:43:49.981Z
+ 2025-10-09T15:50:46.488Z
https://docs.axolotl.ai/docs/installation.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.491Z
https://docs.axolotl.ai/docs/mixed_precision.html
- 2025-10-08T14:43:49.984Z
+ 2025-10-09T15:50:46.492Z
https://docs.axolotl.ai/docs/unsloth.html
- 2025-10-08T14:43:49.985Z
+ 2025-10-09T15:50:46.493Z
https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html
- 2025-10-08T14:43:50.006Z
+ 2025-10-09T15:50:46.514Z