diff --git a/.nojekyll b/.nojekyll
index 5e356bf8e..fbce3de79 100644
--- a/.nojekyll
+++ b/.nojekyll
@@ -1 +1 @@
-5f2282be
\ No newline at end of file
+b3ac09e6
\ No newline at end of file
diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html
index 2c480d38e..0bbd82a78 100644
--- a/docs/custom_integrations.html
+++ b/docs/custom_integrations.html
@@ -574,7 +574,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
If you are installing from pip
-pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@010c3ac3f1e725098961832830303eeb4142dd88"
+pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@849c3c5"
Usage
@@ -594,6 +594,8 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
gemma3n_text
glm
glm4
+granite
+granitemoe
llama
llama4
llama4_text
@@ -609,6 +611,8 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
qwen2_5_vl
qwen3
qwen3_moe
+smollm3
+voxtral
diff --git a/examples/colab-notebooks/colab-axolotl-example.html b/examples/colab-notebooks/colab-axolotl-example.html
index 5f4329b66..f51f72662 100644
--- a/examples/colab-notebooks/colab-axolotl-example.html
+++ b/examples/colab-notebooks/colab-axolotl-example.html
@@ -538,7 +538,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
%% capture
# This step can take ~5-10 minutes to install dependencies
! pip install -- no- build- isolation axolotl[flash- attn]>= 0.9.1
-! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@010c3ac3f1e725098961832830303eeb4142dd88"
+! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@849c3c5"
Demo: Talk Like a Pirate
diff --git a/search.json b/search.json
index 2d7f1faaa..022bb2a7e 100644
--- a/search.json
+++ b/search.json
@@ -2841,7 +2841,7 @@
"href": "docs/custom_integrations.html#cut-cross-entropy",
"title": "Custom Integrations",
"section": "Cut Cross Entropy",
- "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@010c3ac3f1e725098961832830303eeb4142dd88\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\ncohere\ncohere2\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
+ "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@849c3c5\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\ncohere\ncohere2\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\ngranite\ngranitemoe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nsmollm3\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
"crumbs": [
"Advanced Features",
"Custom Integrations"
diff --git a/sitemap.xml b/sitemap.xml
index 12fc59674..c0e27cb89 100644
--- a/sitemap.xml
+++ b/sitemap.xml
@@ -2,786 +2,786 @@
https://docs.axolotl.ai/TODO.html
- 2025-07-31T19:25:10.800Z
+ 2025-07-31T22:18:52.245Z
https://docs.axolotl.ai/index.html
- 2025-07-31T19:25:10.821Z
+ 2025-07-31T22:18:52.265Z
https://docs.axolotl.ai/docs/debugging.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.247Z
https://docs.axolotl.ai/docs/amd_hpc.html
- 2025-07-31T19:25:10.801Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html
- 2025-07-31T19:28:28.464Z
+ 2025-07-31T22:22:20.582Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html
- 2025-07-31T19:28:27.881Z
+ 2025-07-31T22:22:20.009Z
https://docs.axolotl.ai/docs/api/loaders.patch_manager.html
- 2025-07-31T19:28:27.487Z
+ 2025-07-31T22:22:19.620Z
https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html
- 2025-07-31T19:28:27.167Z
+ 2025-07-31T22:22:19.305Z
https://docs.axolotl.ai/docs/api/cli.train.html
- 2025-07-31T19:28:27.224Z
+ 2025-07-31T22:22:19.361Z
https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html
- 2025-07-31T19:28:28.455Z
+ 2025-07-31T22:22:20.574Z
https://docs.axolotl.ai/docs/api/core.chat.messages.html
- 2025-07-31T19:28:27.164Z
+ 2025-07-31T22:22:19.302Z
https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html
- 2025-07-31T19:28:28.460Z
+ 2025-07-31T22:22:20.579Z
https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html
- 2025-07-31T19:28:27.320Z
+ 2025-07-31T22:22:19.454Z
https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html
- 2025-07-31T19:28:27.941Z
+ 2025-07-31T22:22:20.068Z
https://docs.axolotl.ai/docs/api/utils.chat_templates.html
- 2025-07-31T19:28:27.979Z
+ 2025-07-31T22:22:20.105Z
https://docs.axolotl.ai/docs/api/core.chat.format.shared.html
- 2025-07-31T19:28:27.169Z
+ 2025-07-31T22:22:19.306Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html
- 2025-07-31T19:28:27.494Z
+ 2025-07-31T22:22:19.627Z
https://docs.axolotl.ai/docs/api/utils.collators.mamba.html
- 2025-07-31T19:28:28.403Z
+ 2025-07-31T22:22:20.522Z
https://docs.axolotl.ai/docs/api/logging_config.html
- 2025-07-31T19:28:27.113Z
+ 2025-07-31T22:22:19.251Z
https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html
- 2025-07-31T19:28:28.408Z
+ 2025-07-31T22:22:20.527Z
https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html
- 2025-07-31T19:28:27.617Z
+ 2025-07-31T22:22:19.748Z
https://docs.axolotl.ai/docs/api/kernels.utils.html
- 2025-07-31T19:28:27.833Z
+ 2025-07-31T22:22:19.961Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html
- 2025-07-31T19:28:27.651Z
+ 2025-07-31T22:22:19.782Z
https://docs.axolotl.ai/docs/api/kernels.swiglu.html
- 2025-07-31T19:28:27.824Z
+ 2025-07-31T22:22:19.952Z
https://docs.axolotl.ai/docs/api/common.const.html
- 2025-07-31T19:28:28.363Z
+ 2025-07-31T22:22:20.483Z
https://docs.axolotl.ai/docs/api/cli.cloud.base.html
- 2025-07-31T19:28:27.343Z
+ 2025-07-31T22:22:19.477Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html
- 2025-07-31T19:28:27.714Z
+ 2025-07-31T22:22:19.845Z
https://docs.axolotl.ai/docs/api/core.builders.rl.html
- 2025-07-31T19:28:27.129Z
+ 2025-07-31T22:22:19.266Z
https://docs.axolotl.ai/docs/api/utils.dict.html
- 2025-07-31T19:28:28.072Z
+ 2025-07-31T22:22:20.196Z
https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html
- 2025-07-31T19:28:28.186Z
+ 2025-07-31T22:22:20.307Z
https://docs.axolotl.ai/docs/api/core.trainers.utils.html
- 2025-07-31T19:28:27.452Z
+ 2025-07-31T22:22:19.585Z
https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html
- 2025-07-31T19:28:27.930Z
+ 2025-07-31T22:22:20.057Z
https://docs.axolotl.ai/docs/api/cli.evaluate.html
- 2025-07-31T19:28:27.232Z
+ 2025-07-31T22:22:19.369Z
https://docs.axolotl.ai/docs/api/core.builders.causal.html
- 2025-07-31T19:28:27.124Z
+ 2025-07-31T22:22:19.262Z
https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html
- 2025-07-31T19:28:27.876Z
+ 2025-07-31T22:22:20.004Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html
- 2025-07-31T19:28:27.921Z
+ 2025-07-31T22:22:20.048Z
https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html
- 2025-07-31T19:28:27.285Z
+ 2025-07-31T22:22:19.420Z
https://docs.axolotl.ai/docs/api/utils.schemas.trl.html
- 2025-07-31T19:28:28.168Z
+ 2025-07-31T22:22:20.290Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html
- 2025-07-31T19:28:27.673Z
+ 2025-07-31T22:22:19.804Z
https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html
- 2025-07-31T19:28:28.350Z
+ 2025-07-31T22:22:20.470Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html
- 2025-07-31T19:28:27.971Z
+ 2025-07-31T22:22:20.097Z
https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html
- 2025-07-31T19:28:28.080Z
+ 2025-07-31T22:22:20.204Z
https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html
- 2025-07-31T19:28:27.940Z
+ 2025-07-31T22:22:20.066Z
https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html
- 2025-07-31T19:28:27.349Z
+ 2025-07-31T22:22:19.483Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html
- 2025-07-31T19:28:27.577Z
+ 2025-07-31T22:22:19.708Z
https://docs.axolotl.ai/docs/api/utils.freeze.html
- 2025-07-31T19:28:28.001Z
+ 2025-07-31T22:22:20.127Z
https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html
- 2025-07-31T19:28:27.718Z
+ 2025-07-31T22:22:19.848Z
https://docs.axolotl.ai/docs/api/integrations.base.html
- 2025-07-31T19:28:28.338Z
+ 2025-07-31T22:22:20.458Z
https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html
- 2025-07-31T19:28:27.938Z
+ 2025-07-31T22:22:20.065Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html
- 2025-07-31T19:28:27.692Z
+ 2025-07-31T22:22:19.823Z
https://docs.axolotl.ai/docs/api/cli.main.html
- 2025-07-31T19:28:27.215Z
+ 2025-07-31T22:22:19.352Z
https://docs.axolotl.ai/docs/api/common.datasets.html
- 2025-07-31T19:28:28.378Z
+ 2025-07-31T22:22:20.497Z
https://docs.axolotl.ai/docs/api/train.html
- 2025-07-31T19:28:27.026Z
+ 2025-07-31T22:22:19.166Z
https://docs.axolotl.ai/docs/api/utils.trainer.html
- 2025-07-31T19:28:28.018Z
+ 2025-07-31T22:22:20.143Z
https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html
- 2025-07-31T19:28:27.611Z
+ 2025-07-31T22:22:19.742Z
https://docs.axolotl.ai/docs/api/index.html
- 2025-07-31T19:28:26.965Z
+ 2025-07-31T22:22:19.104Z
https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html
- 2025-07-31T19:28:27.563Z
+ 2025-07-31T22:22:19.695Z
https://docs.axolotl.ai/docs/api/core.training_args.html
- 2025-07-31T19:28:27.141Z
+ 2025-07-31T22:22:19.279Z
https://docs.axolotl.ai/docs/api/kernels.quantize.html
- 2025-07-31T19:28:27.831Z
+ 2025-07-31T22:22:19.960Z
https://docs.axolotl.ai/docs/api/convert.html
- 2025-07-31T19:28:27.062Z
+ 2025-07-31T22:22:19.200Z
https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html
- 2025-07-31T19:28:28.343Z
+ 2025-07-31T22:22:20.462Z
https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html
- 2025-07-31T19:28:27.628Z
+ 2025-07-31T22:22:19.759Z
https://docs.axolotl.ai/docs/api/utils.schemas.model.html
- 2025-07-31T19:28:28.131Z
+ 2025-07-31T22:22:20.253Z
https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html
- 2025-07-31T19:28:28.474Z
+ 2025-07-31T22:22:20.593Z
https://docs.axolotl.ai/docs/api/loaders.constants.html
- 2025-07-31T19:28:27.489Z
+ 2025-07-31T22:22:19.621Z
https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html
- 2025-07-31T19:28:27.379Z
+ 2025-07-31T22:22:19.513Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html
- 2025-07-31T19:28:27.661Z
+ 2025-07-31T22:22:19.792Z
https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html
- 2025-07-31T19:28:27.182Z
+ 2025-07-31T22:22:19.319Z
https://docs.axolotl.ai/docs/api/cli.utils.fetch.html
- 2025-07-31T19:28:27.368Z
+ 2025-07-31T22:22:19.501Z
https://docs.axolotl.ai/docs/api/core.trainers.mamba.html
- 2025-07-31T19:28:27.420Z
+ 2025-07-31T22:22:19.554Z
https://docs.axolotl.ai/docs/api/utils.schemas.enums.html
- 2025-07-31T19:28:28.197Z
+ 2025-07-31T22:22:20.317Z
https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html
- 2025-07-31T19:28:28.459Z
+ 2025-07-31T22:22:20.577Z
https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html
- 2025-07-31T19:28:27.634Z
+ 2025-07-31T22:22:19.765Z
https://docs.axolotl.ai/docs/api/core.trainers.trl.html
- 2025-07-31T19:28:27.415Z
+ 2025-07-31T22:22:19.549Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html
- 2025-07-31T19:28:27.638Z
+ 2025-07-31T22:22:19.769Z
https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html
- 2025-07-31T19:28:28.449Z
+ 2025-07-31T22:22:20.567Z
https://docs.axolotl.ai/docs/api/utils.schedulers.html
- 2025-07-31T19:28:28.046Z
+ 2025-07-31T22:22:20.171Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html
- 2025-07-31T19:28:27.438Z
+ 2025-07-31T22:22:19.572Z
https://docs.axolotl.ai/docs/api/prompt_tokenizers.html
- 2025-07-31T19:28:27.104Z
+ 2025-07-31T22:22:19.242Z
https://docs.axolotl.ai/docs/config-reference.html
- 2025-07-31T19:28:41.750Z
+ 2025-07-31T22:22:33.863Z
https://docs.axolotl.ai/docs/multimodal.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/mixed_precision.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/unsloth.html
- 2025-07-31T19:25:10.806Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/ray-integration.html
- 2025-07-31T19:25:10.806Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/dataset-formats/template_free.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/dataset-formats/index.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/dataset-formats/pretraining.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/multi-gpu.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/torchao.html
- 2025-07-31T19:25:10.806Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/cli.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/nccl.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/dataset_preprocessing.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/faq.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.247Z
https://docs.axolotl.ai/docs/qat.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/gradient_checkpointing.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.247Z
https://docs.axolotl.ai/docs/input_output.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.249Z
https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html
- 2025-07-31T19:25:10.826Z
+ 2025-07-31T22:18:52.270Z
https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html
- 2025-07-31T19:25:10.826Z
+ 2025-07-31T22:18:52.270Z
https://docs.axolotl.ai/docs/mac.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/lr_groups.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/dataset_loading.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/getting-started.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.247Z
https://docs.axolotl.ai/docs/lora_optims.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/multi-node.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/fsdp_qlora.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.247Z
https://docs.axolotl.ai/docs/inference.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.249Z
https://docs.axolotl.ai/docs/sequence_parallelism.html
- 2025-07-31T19:25:10.806Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/rlhf.html
- 2025-07-31T19:25:10.806Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/dataset-formats/tokenized.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/dataset-formats/conversation.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/reward_modelling.html
- 2025-07-31T19:25:10.806Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/docker.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.247Z
https://docs.axolotl.ai/docs/installation.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.249Z
https://docs.axolotl.ai/docs/quantize.html
- 2025-07-31T19:25:10.806Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/docs/custom_integrations.html
- 2025-07-31T19:25:10.802Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/batch_vs_grad.html
- 2025-07-31T19:25:10.801Z
+ 2025-07-31T22:18:52.246Z
https://docs.axolotl.ai/docs/api/cli.utils.train.html
- 2025-07-31T19:28:27.389Z
+ 2025-07-31T22:22:19.523Z
https://docs.axolotl.ai/docs/api/cli.art.html
- 2025-07-31T19:28:27.255Z
+ 2025-07-31T22:22:19.391Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html
- 2025-07-31T19:28:27.450Z
+ 2025-07-31T22:22:19.584Z
https://docs.axolotl.ai/docs/api/loaders.model.html
- 2025-07-31T19:28:27.462Z
+ 2025-07-31T22:22:19.595Z
https://docs.axolotl.ai/docs/api/cli.preprocess.html
- 2025-07-31T19:28:27.328Z
+ 2025-07-31T22:22:19.462Z
https://docs.axolotl.ai/docs/api/cli.utils.html
- 2025-07-31T19:28:27.351Z
+ 2025-07-31T22:22:19.484Z
https://docs.axolotl.ai/docs/api/cli.inference.html
- 2025-07-31T19:28:27.299Z
+ 2025-07-31T22:22:19.434Z
https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html
- 2025-07-31T19:28:27.920Z
+ 2025-07-31T22:22:20.047Z
https://docs.axolotl.ai/docs/api/datasets.html
- 2025-07-31T19:28:27.048Z
+ 2025-07-31T22:22:19.187Z
https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html
- 2025-07-31T19:28:27.937Z
+ 2025-07-31T22:22:20.063Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html
- 2025-07-31T19:28:27.859Z
+ 2025-07-31T22:22:19.987Z
https://docs.axolotl.ai/docs/api/monkeypatch.relora.html
- 2025-07-31T19:28:27.880Z
+ 2025-07-31T22:22:20.007Z
https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html
- 2025-07-31T19:28:27.927Z
+ 2025-07-31T22:22:20.054Z
https://docs.axolotl.ai/docs/api/loaders.adapter.html
- 2025-07-31T19:28:27.477Z
+ 2025-07-31T22:22:19.610Z
https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html
- 2025-07-31T19:28:27.427Z
+ 2025-07-31T22:22:19.561Z
https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html
- 2025-07-31T19:28:28.341Z
+ 2025-07-31T22:22:20.461Z
https://docs.axolotl.ai/docs/api/monkeypatch.utils.html
- 2025-07-31T19:28:27.918Z
+ 2025-07-31T22:22:20.045Z
https://docs.axolotl.ai/docs/api/loaders.processor.html
- 2025-07-31T19:28:27.471Z
+ 2025-07-31T22:22:19.605Z
https://docs.axolotl.ai/docs/api/cli.config.html
- 2025-07-31T19:28:27.280Z
+ 2025-07-31T22:22:19.415Z
https://docs.axolotl.ai/docs/api/integrations.liger.args.html
- 2025-07-31T19:28:28.354Z
+ 2025-07-31T22:22:20.473Z
https://docs.axolotl.ai/docs/api/loaders.tokenizer.html
- 2025-07-31T19:28:27.470Z
+ 2025-07-31T22:22:19.603Z
https://docs.axolotl.ai/docs/api/utils.schemas.config.html
- 2025-07-31T19:28:28.124Z
+ 2025-07-31T22:22:20.246Z
https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html
- 2025-07-31T19:28:27.529Z
+ 2025-07-31T22:22:19.661Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html
- 2025-07-31T19:28:27.504Z
+ 2025-07-31T22:22:19.637Z
https://docs.axolotl.ai/docs/api/core.trainers.base.html
- 2025-07-31T19:28:27.400Z
+ 2025-07-31T22:22:19.534Z
https://docs.axolotl.ai/docs/api/cli.utils.args.html
- 2025-07-31T19:28:27.362Z
+ 2025-07-31T22:22:19.496Z
https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html
- 2025-07-31T19:28:27.649Z
+ 2025-07-31T22:22:19.780Z
https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html
- 2025-07-31T19:28:27.910Z
+ 2025-07-31T22:22:20.037Z
https://docs.axolotl.ai/docs/api/kernels.lora.html
- 2025-07-31T19:28:27.803Z
+ 2025-07-31T22:22:19.931Z
https://docs.axolotl.ai/docs/api/cli.vllm_serve.html
- 2025-07-31T19:28:27.340Z
+ 2025-07-31T22:22:19.473Z
https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html
- 2025-07-31T19:28:28.174Z
+ 2025-07-31T22:22:20.295Z
https://docs.axolotl.ai/docs/api/utils.schemas.utils.html
- 2025-07-31T19:28:28.203Z
+ 2025-07-31T22:22:20.323Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html
- 2025-07-31T19:28:27.860Z
+ 2025-07-31T22:22:19.988Z
https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html
- 2025-07-31T19:28:28.357Z
+ 2025-07-31T22:22:20.476Z
https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html
- 2025-07-31T19:28:27.875Z
+ 2025-07-31T22:22:20.002Z
https://docs.axolotl.ai/docs/api/utils.collators.core.html
- 2025-07-31T19:28:28.381Z
+ 2025-07-31T22:22:20.500Z
https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html
- 2025-07-31T19:28:27.166Z
+ 2025-07-31T22:22:19.304Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html
- 2025-07-31T19:28:27.676Z
+ 2025-07-31T22:22:19.807Z
https://docs.axolotl.ai/docs/api/core.datasets.chat.html
- 2025-07-31T19:28:27.174Z
+ 2025-07-31T22:22:19.312Z
https://docs.axolotl.ai/docs/api/utils.bench.html
- 2025-07-31T19:28:27.993Z
+ 2025-07-31T22:22:20.119Z
https://docs.axolotl.ai/docs/api/utils.schemas.training.html
- 2025-07-31T19:28:28.138Z
+ 2025-07-31T22:22:20.260Z
https://docs.axolotl.ai/docs/api/utils.collators.batching.html
- 2025-07-31T19:28:28.399Z
+ 2025-07-31T22:22:20.519Z
https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html
- 2025-07-31T19:28:27.623Z
+ 2025-07-31T22:22:19.754Z
https://docs.axolotl.ai/docs/api/utils.lora.html
- 2025-07-31T19:28:27.984Z
+ 2025-07-31T22:22:20.110Z
https://docs.axolotl.ai/docs/api/prompt_strategies.base.html
- 2025-07-31T19:28:27.530Z
+ 2025-07-31T22:22:19.662Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html
- 2025-07-31T19:28:27.591Z
+ 2025-07-31T22:22:19.722Z
https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html
- 2025-07-31T19:28:28.156Z
+ 2025-07-31T22:22:20.278Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html
- 2025-07-31T19:28:27.674Z
+ 2025-07-31T22:22:19.805Z
https://docs.axolotl.ai/docs/api/utils.schemas.peft.html
- 2025-07-31T19:28:28.165Z
+ 2025-07-31T22:22:20.286Z
https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html
- 2025-07-31T19:28:27.645Z
+ 2025-07-31T22:22:19.776Z
https://docs.axolotl.ai/docs/api/common.architectures.html
- 2025-07-31T19:28:28.362Z
+ 2025-07-31T22:22:20.481Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html
- 2025-07-31T19:28:27.945Z
+ 2025-07-31T22:22:20.071Z
https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html
- 2025-07-31T19:28:28.468Z
+ 2025-07-31T22:22:20.586Z
https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html
- 2025-07-31T19:28:28.360Z
+ 2025-07-31T22:22:20.480Z
https://docs.axolotl.ai/docs/api/cli.quantize.html
- 2025-07-31T19:28:27.333Z
+ 2025-07-31T22:22:19.467Z
https://docs.axolotl.ai/docs/api/cli.checks.html
- 2025-07-31T19:28:27.261Z
+ 2025-07-31T22:22:19.397Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html
- 2025-07-31T19:28:27.684Z
+ 2025-07-31T22:22:19.815Z
https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html
- 2025-07-31T19:28:27.989Z
+ 2025-07-31T22:22:20.115Z
https://docs.axolotl.ai/docs/api/utils.quantization.html
- 2025-07-31T19:28:28.109Z
+ 2025-07-31T22:22:20.232Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html
- 2025-07-31T19:28:27.497Z
+ 2025-07-31T22:22:19.630Z
https://docs.axolotl.ai/docs/api/kernels.geglu.html
- 2025-07-31T19:28:27.813Z
+ 2025-07-31T22:22:19.942Z
https://docs.axolotl.ai/docs/api/utils.data.pretraining.html
- 2025-07-31T19:28:28.081Z
+ 2025-07-31T22:22:20.205Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html
- 2025-07-31T19:28:27.694Z
+ 2025-07-31T22:22:19.824Z
https://docs.axolotl.ai/docs/api/core.builders.base.html
- 2025-07-31T19:28:27.119Z
+ 2025-07-31T22:22:19.257Z
https://docs.axolotl.ai/docs/api/cli.merge_lora.html
- 2025-07-31T19:28:27.308Z
+ 2025-07-31T22:22:19.442Z
https://docs.axolotl.ai/docs/api/cli.utils.load.html
- 2025-07-31T19:28:27.373Z
+ 2025-07-31T22:22:19.507Z
https://docs.axolotl.ai/docs/api/utils.data.sft.html
- 2025-07-31T19:28:28.088Z
+ 2025-07-31T22:22:20.212Z
https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html
- 2025-07-31T19:28:27.599Z
+ 2025-07-31T22:22:19.730Z
https://docs.axolotl.ai/docs/api/utils.tokenization.html
- 2025-07-31T19:28:27.977Z
+ 2025-07-31T22:22:20.104Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html
- 2025-07-31T19:28:27.671Z
+ 2025-07-31T22:22:19.802Z
https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html
- 2025-07-31T19:28:28.379Z
+ 2025-07-31T22:22:20.498Z
https://docs.axolotl.ai/docs/api/cli.args.html
- 2025-07-31T19:28:27.251Z
+ 2025-07-31T22:22:19.388Z
https://docs.axolotl.ai/docs/api/evaluate.html
- 2025-07-31T19:28:27.037Z
+ 2025-07-31T22:22:19.176Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html
- 2025-07-31T19:28:27.579Z
+ 2025-07-31T22:22:19.710Z
https://docs.axolotl.ai/docs/api/utils.distributed.html
- 2025-07-31T19:28:28.066Z
+ 2025-07-31T22:22:20.191Z
https://docs.axolotl.ai/docs/multipack.html
- 2025-07-31T19:25:10.805Z
+ 2025-07-31T22:18:52.250Z
https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html
- 2025-07-31T19:25:10.810Z
+ 2025-07-31T22:18:52.254Z
https://docs.axolotl.ai/FAQS.html
- 2025-07-31T19:25:10.800Z
+ 2025-07-31T22:18:52.244Z