diff --git a/.nojekyll b/.nojekyll
index b1c52659c..eb21b11d5 100644
--- a/.nojekyll
+++ b/.nojekyll
@@ -1 +1 @@
-7a5d1929
\ No newline at end of file
+a66039f8
\ No newline at end of file
diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html
index b4e0ca3b3..2ad385d7a 100644
--- a/docs/custom_integrations.html
+++ b/docs/custom_integrations.html
@@ -617,7 +617,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
If you are installing from pip
-pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c5aa3ef"
+pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@147ea28"
Usage
@@ -627,6 +627,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
Supported Models
+apertus
arcee
cohere
cohere2
@@ -640,9 +641,13 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
glm
glm4
glm4_moe
+glm4v
+glm4v_moe
gpt_oss
granite
granitemoe
+granitemoeshared
+granitemoehybrid
hunyuan_v1_dense
hunyuan_v1_moe
llama
@@ -661,6 +666,8 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
qwen2_5_vl
qwen3
qwen3_moe
+qwen3_vl
+qwen3_vl_moe
qwen3_next
smollm3
seed_oss
diff --git a/examples/colab-notebooks/colab-axolotl-example.html b/examples/colab-notebooks/colab-axolotl-example.html
index 414777538..42306179f 100644
--- a/examples/colab-notebooks/colab-axolotl-example.html
+++ b/examples/colab-notebooks/colab-axolotl-example.html
@@ -565,7 +565,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
%%capture
# This step can take ~5-10 minutes to install dependencies
! pip install --no-build-isolation axolotl[flash-attn]>=0.9.1
-! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c5aa3ef"
+! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@147ea28"
Demo: Talk Like a Pirate
diff --git a/search.json b/search.json
index 267129c55..847b536b3 100644
--- a/search.json
+++ b/search.json
@@ -2283,7 +2283,7 @@
"href": "docs/custom_integrations.html#cut-cross-entropy",
"title": "Custom Integrations",
"section": "Cut Cross Entropy",
- "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c5aa3ef\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\ngpt_oss\ngranite\ngranitemoe\nhunyuan_v1_dense\nhunyuan_v1_moe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nqwen3_next\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
+ "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@147ea28\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\napertus\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\nglm4v\nglm4v_moe\ngpt_oss\ngranite\ngranitemoe\ngranitemoeshared\ngranitemoehybrid\nhunyuan_v1_dense\nhunyuan_v1_moe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nqwen3_vl\nqwen3_vl_moe\nqwen3_next\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
"crumbs": [
"Advanced Features",
"Custom Integrations"
diff --git a/sitemap.xml b/sitemap.xml
index c9c19858b..f3bd5ab8a 100644
--- a/sitemap.xml
+++ b/sitemap.xml
@@ -2,798 +2,798 @@
https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html
- 2025-09-25T16:03:59.059Z
+ 2025-09-26T05:11:39.160Z
https://docs.axolotl.ai/docs/mac.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/cli.html
- 2025-09-25T16:03:59.033Z
+ 2025-09-26T05:11:39.134Z
https://docs.axolotl.ai/docs/nccl.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/getting-started.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/lr_groups.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/qat.html
- 2025-09-25T16:03:59.038Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/multipack.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/streaming.html
- 2025-09-25T16:03:59.038Z
+ 2025-09-26T05:11:39.139Z
https://docs.axolotl.ai/docs/lora_optims.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/amd_hpc.html
- 2025-09-25T16:03:59.033Z
+ 2025-09-26T05:11:39.134Z
https://docs.axolotl.ai/docs/debugging.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/dataset-formats/conversation.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.134Z
https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.134Z
https://docs.axolotl.ai/docs/dataset-formats/index.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.134Z
https://docs.axolotl.ai/docs/config-reference.html
- 2025-09-25T16:07:41.262Z
+ 2025-09-26T05:15:28.531Z
https://docs.axolotl.ai/docs/multimodal.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/ray-integration.html
- 2025-09-25T16:03:59.038Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/faq.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/dataset_preprocessing.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/torchao.html
- 2025-09-25T16:03:59.038Z
+ 2025-09-26T05:11:39.139Z
https://docs.axolotl.ai/docs/optimizers.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/api/utils.schedulers.html
- 2025-09-25T16:07:25.684Z
+ 2025-09-26T05:15:12.695Z
https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html
- 2025-09-25T16:07:25.045Z
+ 2025-09-26T05:15:12.045Z
https://docs.axolotl.ai/docs/api/datasets.html
- 2025-09-25T16:07:24.718Z
+ 2025-09-26T05:15:11.713Z
https://docs.axolotl.ai/docs/api/utils.tokenization.html
- 2025-09-25T16:07:25.617Z
+ 2025-09-26T05:15:12.626Z
https://docs.axolotl.ai/docs/api/loaders.tokenizer.html
- 2025-09-25T16:07:25.140Z
+ 2025-09-26T05:15:12.142Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html
- 2025-09-25T16:07:25.515Z
+ 2025-09-26T05:15:12.523Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html
- 2025-09-25T16:07:25.585Z
+ 2025-09-26T05:15:12.593Z
https://docs.axolotl.ai/docs/api/utils.data.sft.html
- 2025-09-25T16:07:25.725Z
+ 2025-09-26T05:15:12.736Z
https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html
- 2025-09-25T16:07:25.569Z
+ 2025-09-26T05:15:12.578Z
https://docs.axolotl.ai/docs/api/loaders.patch_manager.html
- 2025-09-25T16:07:25.157Z
+ 2025-09-26T05:15:12.159Z
https://docs.axolotl.ai/docs/api/integrations.liger.args.html
- 2025-09-25T16:07:25.986Z
+ 2025-09-26T05:15:13.004Z
https://docs.axolotl.ai/docs/api/utils.schemas.peft.html
- 2025-09-25T16:07:25.799Z
+ 2025-09-26T05:15:12.813Z
https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html
- 2025-09-25T16:07:25.313Z
+ 2025-09-26T05:15:12.317Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html
- 2025-09-25T16:07:25.247Z
+ 2025-09-26T05:15:12.250Z
https://docs.axolotl.ai/docs/api/cli.cloud.base.html
- 2025-09-25T16:07:25.009Z
+ 2025-09-26T05:15:12.009Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html
- 2025-09-25T16:07:25.610Z
+ 2025-09-26T05:15:12.619Z
https://docs.axolotl.ai/docs/api/kernels.swiglu.html
- 2025-09-25T16:07:25.491Z
+ 2025-09-26T05:15:12.499Z
https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html
- 2025-09-25T16:07:25.974Z
+ 2025-09-26T05:15:12.992Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html
- 2025-09-25T16:07:25.361Z
+ 2025-09-26T05:15:12.366Z
https://docs.axolotl.ai/docs/api/monkeypatch.utils.html
- 2025-09-25T16:07:25.551Z
+ 2025-09-26T05:15:12.559Z
https://docs.axolotl.ai/docs/api/core.builders.rl.html
- 2025-09-25T16:07:24.797Z
+ 2025-09-26T05:15:11.794Z
https://docs.axolotl.ai/docs/api/loaders.processor.html
- 2025-09-25T16:07:25.142Z
+ 2025-09-26T05:15:12.144Z
https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html
- 2025-09-25T16:07:26.092Z
+ 2025-09-26T05:15:13.112Z
https://docs.axolotl.ai/docs/api/core.training_args.html
- 2025-09-25T16:07:24.810Z
+ 2025-09-26T05:15:11.807Z
https://docs.axolotl.ai/docs/api/loaders.adapter.html
- 2025-09-25T16:07:25.147Z
+ 2025-09-26T05:15:12.149Z
https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html
- 2025-09-25T16:07:24.986Z
+ 2025-09-26T05:15:11.986Z
https://docs.axolotl.ai/docs/api/cli.train.html
- 2025-09-25T16:07:24.892Z
+ 2025-09-26T05:15:11.890Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html
- 2025-09-25T16:07:25.167Z
+ 2025-09-26T05:15:12.170Z
https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html
- 2025-09-25T16:07:25.285Z
+ 2025-09-26T05:15:12.289Z
https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html
- 2025-09-25T16:07:25.296Z
+ 2025-09-26T05:15:12.300Z
https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html
- 2025-09-25T16:07:25.543Z
+ 2025-09-26T05:15:12.551Z
https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html
- 2025-09-25T16:07:25.317Z
+ 2025-09-26T05:15:12.322Z
https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html
- 2025-09-25T16:07:25.267Z
+ 2025-09-26T05:15:12.270Z
https://docs.axolotl.ai/docs/api/core.chat.messages.html
- 2025-09-25T16:07:24.833Z
+ 2025-09-26T05:15:11.830Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html
- 2025-09-25T16:07:25.174Z
+ 2025-09-26T05:15:12.176Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html
- 2025-09-25T16:07:25.342Z
+ 2025-09-26T05:15:12.347Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html
- 2025-09-25T16:07:25.351Z
+ 2025-09-26T05:15:12.357Z
https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html
- 2025-09-25T16:07:25.820Z
+ 2025-09-26T05:15:12.834Z
https://docs.axolotl.ai/docs/api/convert.html
- 2025-09-25T16:07:24.731Z
+ 2025-09-26T05:15:11.727Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html
- 2025-09-25T16:07:25.343Z
+ 2025-09-26T05:15:12.348Z
https://docs.axolotl.ai/docs/api/utils.schemas.config.html
- 2025-09-25T16:07:25.759Z
+ 2025-09-26T05:15:12.772Z
https://docs.axolotl.ai/docs/api/utils.schemas.enums.html
- 2025-09-25T16:07:25.829Z
+ 2025-09-26T05:15:12.843Z
https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html
- 2025-09-25T16:07:25.553Z
+ 2025-09-26T05:15:12.561Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html
- 2025-09-25T16:07:25.318Z
+ 2025-09-26T05:15:12.323Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html
- 2025-09-25T16:07:25.109Z
+ 2025-09-26T05:15:12.110Z
https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html
- 2025-09-25T16:07:25.989Z
+ 2025-09-26T05:15:13.007Z
https://docs.axolotl.ai/docs/api/utils.collators.core.html
- 2025-09-25T16:07:26.013Z
+ 2025-09-26T05:15:13.032Z
https://docs.axolotl.ai/docs/api/core.chat.format.shared.html
- 2025-09-25T16:07:24.837Z
+ 2025-09-26T05:15:11.834Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html
- 2025-09-25T16:07:25.381Z
+ 2025-09-26T05:15:12.387Z
https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html
- 2025-09-25T16:07:26.080Z
+ 2025-09-26T05:15:13.100Z
https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html
- 2025-09-25T16:07:26.105Z
+ 2025-09-26T05:15:13.126Z
https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html
- 2025-09-25T16:07:25.232Z
+ 2025-09-26T05:15:12.235Z
https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html
- 2025-09-25T16:07:25.808Z
+ 2025-09-26T05:15:12.822Z
https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html
- 2025-09-25T16:07:26.099Z
+ 2025-09-26T05:15:13.119Z
https://docs.axolotl.ai/docs/api/prompt_strategies.base.html
- 2025-09-25T16:07:25.199Z
+ 2025-09-26T05:15:12.202Z
https://docs.axolotl.ai/docs/api/kernels.utils.html
- 2025-09-25T16:07:25.500Z
+ 2025-09-26T05:15:12.508Z
https://docs.axolotl.ai/docs/api/cli.merge_lora.html
- 2025-09-25T16:07:24.974Z
+ 2025-09-26T05:15:11.973Z
https://docs.axolotl.ai/docs/api/cli.utils.html
- 2025-09-25T16:07:25.017Z
+ 2025-09-26T05:15:12.017Z
https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html
- 2025-09-25T16:07:25.197Z
+ 2025-09-26T05:15:12.200Z
https://docs.axolotl.ai/docs/api/index.html
- 2025-09-25T16:07:24.643Z
+ 2025-09-26T05:15:11.638Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html
- 2025-09-25T16:07:25.329Z
+ 2025-09-26T05:15:12.334Z
https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html
- 2025-09-25T16:07:25.581Z
+ 2025-09-26T05:15:12.590Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html
- 2025-09-25T16:07:25.306Z
+ 2025-09-26T05:15:12.311Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html
- 2025-09-25T16:07:25.121Z
+ 2025-09-26T05:15:12.122Z
https://docs.axolotl.ai/docs/api/utils.lora.html
- 2025-09-25T16:07:25.623Z
+ 2025-09-26T05:15:12.633Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html
- 2025-09-25T16:07:25.164Z
+ 2025-09-26T05:15:12.166Z
https://docs.axolotl.ai/docs/api/cli.config.html
- 2025-09-25T16:07:24.947Z
+ 2025-09-26T05:15:11.945Z
https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html
- 2025-09-25T16:07:25.510Z
+ 2025-09-26T05:15:12.518Z
https://docs.axolotl.ai/docs/api/utils.collators.batching.html
- 2025-09-25T16:07:26.032Z
+ 2025-09-26T05:15:13.051Z
https://docs.axolotl.ai/docs/api/utils.quantization.html
- 2025-09-25T16:07:25.744Z
+ 2025-09-26T05:15:12.756Z
https://docs.axolotl.ai/docs/api/utils.dict.html
- 2025-09-25T16:07:25.709Z
+ 2025-09-26T05:15:12.721Z
https://docs.axolotl.ai/docs/api/kernels.quantize.html
- 2025-09-25T16:07:25.499Z
+ 2025-09-26T05:15:12.506Z
https://docs.axolotl.ai/docs/api/utils.schemas.training.html
- 2025-09-25T16:07:25.773Z
+ 2025-09-26T05:15:12.786Z
https://docs.axolotl.ai/docs/api/train.html
- 2025-09-25T16:07:24.701Z
+ 2025-09-26T05:15:11.697Z
https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html
- 2025-09-25T16:07:24.850Z
+ 2025-09-26T05:15:11.847Z
https://docs.axolotl.ai/docs/inference.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/FAQS.html
- 2025-09-25T16:03:59.032Z
+ 2025-09-26T05:11:39.133Z
https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html
- 2025-09-25T16:03:59.042Z
+ 2025-09-26T05:11:39.143Z
https://docs.axolotl.ai/index.html
- 2025-09-25T16:03:59.055Z
+ 2025-09-26T05:11:39.156Z
https://docs.axolotl.ai/docs/custom_integrations.html
- 2025-09-25T16:03:59.033Z
+ 2025-09-26T05:11:39.134Z
https://docs.axolotl.ai/docs/api/utils.schemas.utils.html
- 2025-09-25T16:07:25.834Z
+ 2025-09-26T05:15:12.849Z
https://docs.axolotl.ai/docs/api/kernels.geglu.html
- 2025-09-25T16:07:25.481Z
+ 2025-09-26T05:15:12.489Z
https://docs.axolotl.ai/docs/api/core.builders.causal.html
- 2025-09-25T16:07:24.793Z
+ 2025-09-26T05:15:11.789Z
https://docs.axolotl.ai/docs/api/core.trainers.mamba.html
- 2025-09-25T16:07:25.091Z
+ 2025-09-26T05:15:12.092Z
https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html
- 2025-09-25T16:07:25.384Z
+ 2025-09-26T05:15:12.390Z
https://docs.axolotl.ai/docs/api/core.datasets.chat.html
- 2025-09-25T16:07:24.842Z
+ 2025-09-26T05:15:11.839Z
https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html
- 2025-09-25T16:07:26.040Z
+ 2025-09-26T05:15:13.059Z
https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html
- 2025-09-25T16:07:25.280Z
+ 2025-09-26T05:15:12.283Z
https://docs.axolotl.ai/docs/api/common.const.html
- 2025-09-25T16:07:25.995Z
+ 2025-09-26T05:15:13.014Z
https://docs.axolotl.ai/docs/api/cli.quantize.html
- 2025-09-25T16:07:24.999Z
+ 2025-09-26T05:15:11.999Z
https://docs.axolotl.ai/docs/api/utils.trainer.html
- 2025-09-25T16:07:25.657Z
+ 2025-09-26T05:15:12.668Z
https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html
- 2025-09-25T16:07:24.952Z
+ 2025-09-26T05:15:11.950Z
https://docs.axolotl.ai/docs/api/evaluate.html
- 2025-09-25T16:07:24.711Z
+ 2025-09-26T05:15:11.707Z
https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html
- 2025-09-25T16:07:25.509Z
+ 2025-09-26T05:15:12.516Z
https://docs.axolotl.ai/docs/api/loaders.model.html
- 2025-09-25T16:07:25.132Z
+ 2025-09-26T05:15:12.134Z
https://docs.axolotl.ai/docs/api/utils.distributed.html
- 2025-09-25T16:07:25.704Z
+ 2025-09-26T05:15:12.715Z
https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html
- 2025-09-25T16:07:25.629Z
+ 2025-09-26T05:15:12.638Z
https://docs.axolotl.ai/docs/api/kernels.lora.html
- 2025-09-25T16:07:25.471Z
+ 2025-09-26T05:15:12.478Z
https://docs.axolotl.ai/docs/api/cli.main.html
- 2025-09-25T16:07:24.883Z
+ 2025-09-26T05:15:11.882Z
https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html
- 2025-09-25T16:07:25.992Z
+ 2025-09-26T05:15:13.011Z
https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html
- 2025-09-25T16:07:25.717Z
+ 2025-09-26T05:15:12.728Z
https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html
- 2025-09-25T16:07:25.015Z
+ 2025-09-26T05:15:12.016Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html
- 2025-09-25T16:07:25.506Z
+ 2025-09-26T05:15:12.513Z
https://docs.axolotl.ai/docs/api/core.builders.base.html
- 2025-09-25T16:07:24.788Z
+ 2025-09-26T05:15:11.784Z
https://docs.axolotl.ai/docs/api/utils.schemas.trl.html
- 2025-09-25T16:07:25.803Z
+ 2025-09-26T05:15:12.817Z
https://docs.axolotl.ai/docs/api/cli.utils.args.html
- 2025-09-25T16:07:25.028Z
+ 2025-09-26T05:15:12.029Z
https://docs.axolotl.ai/docs/api/core.trainers.base.html
- 2025-09-25T16:07:25.071Z
+ 2025-09-26T05:15:12.072Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html
- 2025-09-25T16:07:25.554Z
+ 2025-09-26T05:15:12.562Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html
- 2025-09-25T16:07:25.507Z
+ 2025-09-26T05:15:12.515Z
https://docs.axolotl.ai/docs/api/utils.schemas.model.html
- 2025-09-25T16:07:25.766Z
+ 2025-09-26T05:15:12.779Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html
- 2025-09-25T16:07:25.359Z
+ 2025-09-26T05:15:12.365Z
https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html
- 2025-09-25T16:07:26.095Z
+ 2025-09-26T05:15:13.115Z
https://docs.axolotl.ai/docs/api/common.datasets.html
- 2025-09-25T16:07:26.010Z
+ 2025-09-26T05:15:13.029Z
https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html
- 2025-09-25T16:07:25.791Z
+ 2025-09-26T05:15:12.804Z
https://docs.axolotl.ai/docs/api/cli.utils.fetch.html
- 2025-09-25T16:07:25.033Z
+ 2025-09-26T05:15:12.034Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html
- 2025-09-25T16:07:25.339Z
+ 2025-09-26T05:15:12.344Z
https://docs.axolotl.ai/docs/api/monkeypatch.relora.html
- 2025-09-25T16:07:25.514Z
+ 2025-09-26T05:15:12.521Z
https://docs.axolotl.ai/docs/api/cli.evaluate.html
- 2025-09-25T16:07:24.900Z
+ 2025-09-26T05:15:11.898Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html
- 2025-09-25T16:07:25.340Z
+ 2025-09-26T05:15:12.345Z
https://docs.axolotl.ai/docs/api/core.trainers.utils.html
- 2025-09-25T16:07:25.122Z
+ 2025-09-26T05:15:12.124Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html
- 2025-09-25T16:07:25.259Z
+ 2025-09-26T05:15:12.262Z
https://docs.axolotl.ai/docs/api/utils.chat_templates.html
- 2025-09-25T16:07:25.619Z
+ 2025-09-26T05:15:12.628Z
https://docs.axolotl.ai/docs/api/utils.data.streaming.html
- 2025-09-25T16:07:25.719Z
+ 2025-09-26T05:15:12.730Z
https://docs.axolotl.ai/docs/api/utils.bench.html
- 2025-09-25T16:07:25.633Z
+ 2025-09-26T05:15:12.642Z
https://docs.axolotl.ai/docs/api/common.architectures.html
- 2025-09-25T16:07:25.994Z
+ 2025-09-26T05:15:13.012Z
https://docs.axolotl.ai/docs/api/cli.checks.html
- 2025-09-25T16:07:24.929Z
+ 2025-09-26T05:15:11.928Z
https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html
- 2025-09-25T16:07:25.098Z
+ 2025-09-26T05:15:12.099Z
https://docs.axolotl.ai/docs/api/integrations.base.html
- 2025-09-25T16:07:25.970Z
+ 2025-09-26T05:15:12.988Z
https://docs.axolotl.ai/docs/api/cli.utils.train.html
- 2025-09-25T16:07:25.057Z
+ 2025-09-26T05:15:12.057Z
https://docs.axolotl.ai/docs/api/utils.collators.mamba.html
- 2025-09-25T16:07:26.035Z
+ 2025-09-26T05:15:13.054Z
https://docs.axolotl.ai/docs/api/cli.art.html
- 2025-09-25T16:07:24.923Z
+ 2025-09-26T05:15:11.921Z
https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html
- 2025-09-25T16:07:25.563Z
+ 2025-09-26T05:15:12.571Z
https://docs.axolotl.ai/docs/api/logging_config.html
- 2025-09-25T16:07:24.782Z
+ 2025-09-26T05:15:11.778Z
https://docs.axolotl.ai/docs/api/utils.freeze.html
- 2025-09-25T16:07:25.640Z
+ 2025-09-26T05:15:12.650Z
https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html
- 2025-09-25T16:07:25.302Z
+ 2025-09-26T05:15:12.307Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html
- 2025-09-25T16:07:25.246Z
+ 2025-09-26T05:15:12.248Z
https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html
- 2025-09-25T16:07:25.560Z
+ 2025-09-26T05:15:12.568Z
https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html
- 2025-09-25T16:07:26.011Z
+ 2025-09-26T05:15:13.030Z
https://docs.axolotl.ai/docs/api/core.trainers.trl.html
- 2025-09-25T16:07:25.086Z
+ 2025-09-26T05:15:12.087Z
https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html
- 2025-09-25T16:07:25.291Z
+ 2025-09-26T05:15:12.296Z
https://docs.axolotl.ai/docs/api/loaders.constants.html
- 2025-09-25T16:07:25.158Z
+ 2025-09-26T05:15:12.161Z
https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html
- 2025-09-25T16:07:25.580Z
+ 2025-09-26T05:15:12.588Z
https://docs.axolotl.ai/docs/api/cli.vllm_serve.html
- 2025-09-25T16:07:25.006Z
+ 2025-09-26T05:15:12.006Z
https://docs.axolotl.ai/docs/api/prompt_tokenizers.html
- 2025-09-25T16:07:24.772Z
+ 2025-09-26T05:15:11.769Z
https://docs.axolotl.ai/docs/api/cli.args.html
- 2025-09-25T16:07:24.919Z
+ 2025-09-26T05:15:11.918Z
https://docs.axolotl.ai/docs/api/cli.inference.html
- 2025-09-25T16:07:24.966Z
+ 2025-09-26T05:15:11.965Z
https://docs.axolotl.ai/docs/api/cli.utils.load.html
- 2025-09-25T16:07:25.039Z
+ 2025-09-26T05:15:12.040Z
https://docs.axolotl.ai/docs/api/cli.preprocess.html
- 2025-09-25T16:07:24.994Z
+ 2025-09-26T05:15:11.994Z
https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html
- 2025-09-25T16:07:26.090Z
+ 2025-09-26T05:15:13.110Z
https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html
- 2025-09-25T16:07:26.086Z
+ 2025-09-26T05:15:13.106Z
https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html
- 2025-09-25T16:07:24.834Z
+ 2025-09-26T05:15:11.831Z
https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html
- 2025-09-25T16:07:25.975Z
+ 2025-09-26T05:15:12.993Z
https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html
- 2025-09-25T16:07:25.982Z
+ 2025-09-26T05:15:13.001Z
https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html
- 2025-09-25T16:07:25.571Z
+ 2025-09-26T05:15:12.579Z
https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html
- 2025-09-25T16:07:24.836Z
+ 2025-09-26T05:15:11.833Z
https://docs.axolotl.ai/docs/reward_modelling.html
- 2025-09-25T16:03:59.038Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/quantize.html
- 2025-09-25T16:03:59.038Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/fsdp_qlora.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/nd_parallelism.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/batch_vs_grad.html
- 2025-09-25T16:03:59.033Z
+ 2025-09-26T05:11:39.134Z
https://docs.axolotl.ai/docs/multi-node.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/rlhf.html
- 2025-09-25T16:03:59.038Z
+ 2025-09-26T05:11:39.139Z
https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/dataset-formats/pretraining.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/dataset-formats/tokenized.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/dataset-formats/template_free.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/multi-gpu.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/input_output.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/docker.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/gradient_checkpointing.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/optimizations.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/sequence_parallelism.html
- 2025-09-25T16:03:59.038Z
+ 2025-09-26T05:11:39.139Z
https://docs.axolotl.ai/docs/dataset_loading.html
- 2025-09-25T16:03:59.034Z
+ 2025-09-26T05:11:39.135Z
https://docs.axolotl.ai/docs/installation.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/mixed_precision.html
- 2025-09-25T16:03:59.037Z
+ 2025-09-26T05:11:39.138Z
https://docs.axolotl.ai/docs/unsloth.html
- 2025-09-25T16:03:59.038Z
+ 2025-09-26T05:11:39.139Z
https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html
- 2025-09-25T16:03:59.059Z
+ 2025-09-26T05:11:39.160Z