diff --git a/.nojekyll b/.nojekyll
index 3f9eb5c76..ee8927050 100644
--- a/.nojekyll
+++ b/.nojekyll
@@ -1 +1 @@
-18281ec0
\ No newline at end of file
+6c55d4f1
\ No newline at end of file
diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html
index 3d07cf47d..486294a80 100644
--- a/docs/custom_integrations.html
+++ b/docs/custom_integrations.html
@@ -577,7 +577,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
If you are installing from pip
-pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@849c3c5"
+pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@cbd58e0"
Usage
diff --git a/examples/colab-notebooks/colab-axolotl-example.html b/examples/colab-notebooks/colab-axolotl-example.html
index a783fb65b..25b069ec9 100644
--- a/examples/colab-notebooks/colab-axolotl-example.html
+++ b/examples/colab-notebooks/colab-axolotl-example.html
@@ -541,7 +541,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
%% capture
# This step can take ~5-10 minutes to install dependencies
! pip install -- no- build- isolation axolotl[flash- attn]>= 0.9.1
-! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@849c3c5"
+! pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@cbd58e0"
Demo: Talk Like a Pirate
diff --git a/search.json b/search.json
index eec472f44..199227f21 100644
--- a/search.json
+++ b/search.json
@@ -2896,7 +2896,7 @@
"href": "docs/custom_integrations.html#cut-cross-entropy",
"title": "Custom Integrations",
"section": "Cut Cross Entropy",
- "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@849c3c5\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\ncohere\ncohere2\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\ngranite\ngranitemoe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nsmollm3\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
+ "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@cbd58e0\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\ncohere\ncohere2\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\ngranite\ngranitemoe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nsmollm3\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
"crumbs": [
"Advanced Features",
"Custom Integrations"
diff --git a/sitemap.xml b/sitemap.xml
index abd656e4f..5a5dc7790 100644
--- a/sitemap.xml
+++ b/sitemap.xml
@@ -2,790 +2,790 @@
https://docs.axolotl.ai/TODO.html
- 2025-08-01T13:59:54.047Z
+ 2025-08-01T17:22:09.551Z
https://docs.axolotl.ai/index.html
- 2025-08-01T13:59:54.067Z
+ 2025-08-01T17:22:09.571Z
https://docs.axolotl.ai/docs/debugging.html
- 2025-08-01T13:59:54.049Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/amd_hpc.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.552Z
https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html
- 2025-08-01T14:03:01.648Z
+ 2025-08-01T17:25:25.650Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html
- 2025-08-01T14:03:01.078Z
+ 2025-08-01T17:25:25.074Z
https://docs.axolotl.ai/docs/api/loaders.patch_manager.html
- 2025-08-01T14:03:00.689Z
+ 2025-08-01T17:25:24.681Z
https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html
- 2025-08-01T14:03:00.374Z
+ 2025-08-01T17:25:24.363Z
https://docs.axolotl.ai/docs/api/cli.train.html
- 2025-08-01T14:03:00.431Z
+ 2025-08-01T17:25:24.420Z
https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html
- 2025-08-01T14:03:01.640Z
+ 2025-08-01T17:25:25.641Z
https://docs.axolotl.ai/docs/api/core.chat.messages.html
- 2025-08-01T14:03:00.372Z
+ 2025-08-01T17:25:24.360Z
https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html
- 2025-08-01T14:03:01.645Z
+ 2025-08-01T17:25:25.647Z
https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html
- 2025-08-01T14:03:00.524Z
+ 2025-08-01T17:25:24.514Z
https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html
- 2025-08-01T14:03:01.136Z
+ 2025-08-01T17:25:25.133Z
https://docs.axolotl.ai/docs/api/utils.chat_templates.html
- 2025-08-01T14:03:01.173Z
+ 2025-08-01T17:25:25.170Z
https://docs.axolotl.ai/docs/api/core.chat.format.shared.html
- 2025-08-01T14:03:00.376Z
+ 2025-08-01T17:25:24.364Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html
- 2025-08-01T14:03:00.696Z
+ 2025-08-01T17:25:24.688Z
https://docs.axolotl.ai/docs/api/utils.collators.mamba.html
- 2025-08-01T14:03:01.588Z
+ 2025-08-01T17:25:25.590Z
https://docs.axolotl.ai/docs/api/logging_config.html
- 2025-08-01T14:03:00.321Z
+ 2025-08-01T17:25:24.309Z
https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html
- 2025-08-01T14:03:01.593Z
+ 2025-08-01T17:25:25.595Z
https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html
- 2025-08-01T14:03:00.818Z
+ 2025-08-01T17:25:24.810Z
https://docs.axolotl.ai/docs/api/kernels.utils.html
- 2025-08-01T14:03:01.029Z
+ 2025-08-01T17:25:25.025Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html
- 2025-08-01T14:03:00.851Z
+ 2025-08-01T17:25:24.844Z
https://docs.axolotl.ai/docs/api/kernels.swiglu.html
- 2025-08-01T14:03:01.021Z
+ 2025-08-01T17:25:25.016Z
https://docs.axolotl.ai/docs/api/common.const.html
- 2025-08-01T14:03:01.549Z
+ 2025-08-01T17:25:25.550Z
https://docs.axolotl.ai/docs/api/cli.cloud.base.html
- 2025-08-01T14:03:00.547Z
+ 2025-08-01T17:25:24.537Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html
- 2025-08-01T14:03:00.913Z
+ 2025-08-01T17:25:24.908Z
https://docs.axolotl.ai/docs/api/core.builders.rl.html
- 2025-08-01T14:03:00.336Z
+ 2025-08-01T17:25:24.324Z
https://docs.axolotl.ai/docs/api/utils.dict.html
- 2025-08-01T14:03:01.264Z
+ 2025-08-01T17:25:25.261Z
https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html
- 2025-08-01T14:03:01.376Z
+ 2025-08-01T17:25:25.374Z
https://docs.axolotl.ai/docs/api/core.trainers.utils.html
- 2025-08-01T14:03:00.655Z
+ 2025-08-01T17:25:24.646Z
https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html
- 2025-08-01T14:03:01.126Z
+ 2025-08-01T17:25:25.122Z
https://docs.axolotl.ai/docs/api/cli.evaluate.html
- 2025-08-01T14:03:00.439Z
+ 2025-08-01T17:25:24.428Z
https://docs.axolotl.ai/docs/api/core.builders.causal.html
- 2025-08-01T14:03:00.332Z
+ 2025-08-01T17:25:24.320Z
https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html
- 2025-08-01T14:03:01.073Z
+ 2025-08-01T17:25:25.069Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html
- 2025-08-01T14:03:01.117Z
+ 2025-08-01T17:25:25.113Z
https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html
- 2025-08-01T14:03:00.490Z
+ 2025-08-01T17:25:24.479Z
https://docs.axolotl.ai/docs/api/utils.schemas.trl.html
- 2025-08-01T14:03:01.358Z
+ 2025-08-01T17:25:25.356Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html
- 2025-08-01T14:03:00.872Z
+ 2025-08-01T17:25:24.867Z
https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html
- 2025-08-01T14:03:01.536Z
+ 2025-08-01T17:25:25.537Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html
- 2025-08-01T14:03:01.165Z
+ 2025-08-01T17:25:25.162Z
https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html
- 2025-08-01T14:03:01.272Z
+ 2025-08-01T17:25:25.269Z
https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html
- 2025-08-01T14:03:01.135Z
+ 2025-08-01T17:25:25.131Z
https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html
- 2025-08-01T14:03:00.553Z
+ 2025-08-01T17:25:24.543Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html
- 2025-08-01T14:03:00.778Z
+ 2025-08-01T17:25:24.770Z
https://docs.axolotl.ai/docs/api/utils.freeze.html
- 2025-08-01T14:03:01.195Z
+ 2025-08-01T17:25:25.192Z
https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html
- 2025-08-01T14:03:00.917Z
+ 2025-08-01T17:25:24.912Z
https://docs.axolotl.ai/docs/api/integrations.base.html
- 2025-08-01T14:03:01.525Z
+ 2025-08-01T17:25:25.525Z
https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html
- 2025-08-01T14:03:01.134Z
+ 2025-08-01T17:25:25.130Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html
- 2025-08-01T14:03:00.891Z
+ 2025-08-01T17:25:24.886Z
https://docs.axolotl.ai/docs/api/cli.main.html
- 2025-08-01T14:03:00.422Z
+ 2025-08-01T17:25:24.411Z
https://docs.axolotl.ai/docs/api/common.datasets.html
- 2025-08-01T14:03:01.564Z
+ 2025-08-01T17:25:25.565Z
https://docs.axolotl.ai/docs/api/train.html
- 2025-08-01T14:03:00.235Z
+ 2025-08-01T17:25:24.223Z
https://docs.axolotl.ai/docs/api/utils.trainer.html
- 2025-08-01T14:03:01.212Z
+ 2025-08-01T17:25:25.209Z
https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html
- 2025-08-01T14:03:00.812Z
+ 2025-08-01T17:25:24.804Z
https://docs.axolotl.ai/docs/api/index.html
- 2025-08-01T14:03:00.174Z
+ 2025-08-01T17:25:24.161Z
https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html
- 2025-08-01T14:03:00.764Z
+ 2025-08-01T17:25:24.756Z
https://docs.axolotl.ai/docs/api/core.training_args.html
- 2025-08-01T14:03:00.349Z
+ 2025-08-01T17:25:24.337Z
https://docs.axolotl.ai/docs/api/kernels.quantize.html
- 2025-08-01T14:03:01.028Z
+ 2025-08-01T17:25:25.023Z
https://docs.axolotl.ai/docs/api/convert.html
- 2025-08-01T14:03:00.270Z
+ 2025-08-01T17:25:24.258Z
https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html
- 2025-08-01T14:03:01.529Z
+ 2025-08-01T17:25:25.529Z
https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html
- 2025-08-01T14:03:00.828Z
+ 2025-08-01T17:25:24.821Z
https://docs.axolotl.ai/docs/api/utils.schemas.model.html
- 2025-08-01T14:03:01.321Z
+ 2025-08-01T17:25:25.319Z
https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html
- 2025-08-01T14:03:01.658Z
+ 2025-08-01T17:25:25.661Z
https://docs.axolotl.ai/docs/api/loaders.constants.html
- 2025-08-01T14:03:00.690Z
+ 2025-08-01T17:25:24.682Z
https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html
- 2025-08-01T14:03:00.582Z
+ 2025-08-01T17:25:24.573Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html
- 2025-08-01T14:03:00.861Z
+ 2025-08-01T17:25:24.855Z
https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html
- 2025-08-01T14:03:00.389Z
+ 2025-08-01T17:25:24.377Z
https://docs.axolotl.ai/docs/api/cli.utils.fetch.html
- 2025-08-01T14:03:00.571Z
+ 2025-08-01T17:25:24.561Z
https://docs.axolotl.ai/docs/api/core.trainers.mamba.html
- 2025-08-01T14:03:00.624Z
+ 2025-08-01T17:25:24.615Z
https://docs.axolotl.ai/docs/api/utils.schemas.enums.html
- 2025-08-01T14:03:01.386Z
+ 2025-08-01T17:25:25.384Z
https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html
- 2025-08-01T14:03:01.643Z
+ 2025-08-01T17:25:25.645Z
https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html
- 2025-08-01T14:03:00.835Z
+ 2025-08-01T17:25:24.827Z
https://docs.axolotl.ai/docs/api/core.trainers.trl.html
- 2025-08-01T14:03:00.618Z
+ 2025-08-01T17:25:24.609Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html
- 2025-08-01T14:03:00.838Z
+ 2025-08-01T17:25:24.831Z
https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html
- 2025-08-01T14:03:01.633Z
+ 2025-08-01T17:25:25.635Z
https://docs.axolotl.ai/docs/api/utils.schedulers.html
- 2025-08-01T14:03:01.239Z
+ 2025-08-01T17:25:25.236Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html
- 2025-08-01T14:03:00.641Z
+ 2025-08-01T17:25:24.632Z
https://docs.axolotl.ai/docs/api/prompt_tokenizers.html
- 2025-08-01T14:03:00.311Z
+ 2025-08-01T17:25:24.299Z
https://docs.axolotl.ai/docs/config-reference.html
- 2025-08-01T14:03:14.306Z
+ 2025-08-01T17:25:37.925Z
https://docs.axolotl.ai/docs/multimodal.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/mixed_precision.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/unsloth.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.557Z
https://docs.axolotl.ai/docs/ray-integration.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.552Z
https://docs.axolotl.ai/docs/dataset-formats/template_free.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/dataset-formats/index.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.552Z
https://docs.axolotl.ai/docs/dataset-formats/pretraining.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.552Z
https://docs.axolotl.ai/docs/nd_parallelism.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/sequence_parallelism.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.557Z
https://docs.axolotl.ai/docs/inference.html
- 2025-08-01T13:59:54.051Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/fsdp_qlora.html
- 2025-08-01T13:59:54.049Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/multi-node.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/lora_optims.html
- 2025-08-01T13:59:54.051Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/getting-started.html
- 2025-08-01T13:59:54.049Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/dataset_loading.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/lr_groups.html
- 2025-08-01T13:59:54.051Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/mac.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html
- 2025-08-01T13:59:54.072Z
+ 2025-08-01T17:22:09.576Z
https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html
- 2025-08-01T13:59:54.071Z
+ 2025-08-01T17:22:09.576Z
https://docs.axolotl.ai/docs/input_output.html
- 2025-08-01T13:59:54.051Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/gradient_checkpointing.html
- 2025-08-01T13:59:54.049Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/qat.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/faq.html
- 2025-08-01T13:59:54.049Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/dataset_preprocessing.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/nccl.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/cli.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.552Z
https://docs.axolotl.ai/docs/torchao.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.557Z
https://docs.axolotl.ai/docs/multi-gpu.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/rlhf.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/dataset-formats/tokenized.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/dataset-formats/conversation.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.552Z
https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.552Z
https://docs.axolotl.ai/docs/reward_modelling.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/docker.html
- 2025-08-01T13:59:54.049Z
+ 2025-08-01T17:22:09.553Z
https://docs.axolotl.ai/docs/installation.html
- 2025-08-01T13:59:54.051Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/quantize.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/docs/custom_integrations.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.552Z
https://docs.axolotl.ai/docs/batch_vs_grad.html
- 2025-08-01T13:59:54.048Z
+ 2025-08-01T17:22:09.552Z
https://docs.axolotl.ai/docs/api/cli.utils.train.html
- 2025-08-01T14:03:00.593Z
+ 2025-08-01T17:25:24.583Z
https://docs.axolotl.ai/docs/api/cli.art.html
- 2025-08-01T14:03:00.461Z
+ 2025-08-01T17:25:24.450Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html
- 2025-08-01T14:03:00.653Z
+ 2025-08-01T17:25:24.644Z
https://docs.axolotl.ai/docs/api/loaders.model.html
- 2025-08-01T14:03:00.664Z
+ 2025-08-01T17:25:24.656Z
https://docs.axolotl.ai/docs/api/cli.preprocess.html
- 2025-08-01T14:03:00.532Z
+ 2025-08-01T17:25:24.522Z
https://docs.axolotl.ai/docs/api/cli.utils.html
- 2025-08-01T14:03:00.554Z
+ 2025-08-01T17:25:24.545Z
https://docs.axolotl.ai/docs/api/cli.inference.html
- 2025-08-01T14:03:00.504Z
+ 2025-08-01T17:25:24.493Z
https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html
- 2025-08-01T14:03:01.115Z
+ 2025-08-01T17:25:25.111Z
https://docs.axolotl.ai/docs/api/datasets.html
- 2025-08-01T14:03:00.257Z
+ 2025-08-01T17:25:24.244Z
https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html
- 2025-08-01T14:03:01.132Z
+ 2025-08-01T17:25:25.128Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html
- 2025-08-01T14:03:01.055Z
+ 2025-08-01T17:25:25.051Z
https://docs.axolotl.ai/docs/api/monkeypatch.relora.html
- 2025-08-01T14:03:01.076Z
+ 2025-08-01T17:25:25.072Z
https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html
- 2025-08-01T14:03:01.123Z
+ 2025-08-01T17:25:25.119Z
https://docs.axolotl.ai/docs/api/loaders.adapter.html
- 2025-08-01T14:03:00.679Z
+ 2025-08-01T17:25:24.671Z
https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html
- 2025-08-01T14:03:00.630Z
+ 2025-08-01T17:25:24.621Z
https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html
- 2025-08-01T14:03:01.528Z
+ 2025-08-01T17:25:25.528Z
https://docs.axolotl.ai/docs/api/monkeypatch.utils.html
- 2025-08-01T14:03:01.114Z
+ 2025-08-01T17:25:25.110Z
https://docs.axolotl.ai/docs/api/loaders.processor.html
- 2025-08-01T14:03:00.674Z
+ 2025-08-01T17:25:24.665Z
https://docs.axolotl.ai/docs/api/cli.config.html
- 2025-08-01T14:03:00.485Z
+ 2025-08-01T17:25:24.475Z
https://docs.axolotl.ai/docs/api/integrations.liger.args.html
- 2025-08-01T14:03:01.540Z
+ 2025-08-01T17:25:25.541Z
https://docs.axolotl.ai/docs/api/loaders.tokenizer.html
- 2025-08-01T14:03:00.672Z
+ 2025-08-01T17:25:24.664Z
https://docs.axolotl.ai/docs/api/utils.schemas.config.html
- 2025-08-01T14:03:01.314Z
+ 2025-08-01T17:25:25.312Z
https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html
- 2025-08-01T14:03:00.730Z
+ 2025-08-01T17:25:24.722Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html
- 2025-08-01T14:03:00.706Z
+ 2025-08-01T17:25:24.698Z
https://docs.axolotl.ai/docs/api/core.trainers.base.html
- 2025-08-01T14:03:00.603Z
+ 2025-08-01T17:25:24.594Z
https://docs.axolotl.ai/docs/api/cli.utils.args.html
- 2025-08-01T14:03:00.566Z
+ 2025-08-01T17:25:24.556Z
https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html
- 2025-08-01T14:03:00.849Z
+ 2025-08-01T17:25:24.842Z
https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html
- 2025-08-01T14:03:01.106Z
+ 2025-08-01T17:25:25.102Z
https://docs.axolotl.ai/docs/api/kernels.lora.html
- 2025-08-01T14:03:01.000Z
+ 2025-08-01T17:25:24.995Z
https://docs.axolotl.ai/docs/api/cli.vllm_serve.html
- 2025-08-01T14:03:00.544Z
+ 2025-08-01T17:25:24.533Z
https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html
- 2025-08-01T14:03:01.363Z
+ 2025-08-01T17:25:25.362Z
https://docs.axolotl.ai/docs/api/utils.schemas.utils.html
- 2025-08-01T14:03:01.391Z
+ 2025-08-01T17:25:25.390Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html
- 2025-08-01T14:03:01.057Z
+ 2025-08-01T17:25:25.053Z
https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html
- 2025-08-01T14:03:01.543Z
+ 2025-08-01T17:25:25.544Z
https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html
- 2025-08-01T14:03:01.071Z
+ 2025-08-01T17:25:25.067Z
https://docs.axolotl.ai/docs/api/utils.collators.core.html
- 2025-08-01T14:03:01.566Z
+ 2025-08-01T17:25:25.568Z
https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html
- 2025-08-01T14:03:00.373Z
+ 2025-08-01T17:25:24.361Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html
- 2025-08-01T14:03:00.875Z
+ 2025-08-01T17:25:24.870Z
https://docs.axolotl.ai/docs/api/core.datasets.chat.html
- 2025-08-01T14:03:00.381Z
+ 2025-08-01T17:25:24.369Z
https://docs.axolotl.ai/docs/api/utils.bench.html
- 2025-08-01T14:03:01.187Z
+ 2025-08-01T17:25:25.184Z
https://docs.axolotl.ai/docs/api/utils.schemas.training.html
- 2025-08-01T14:03:01.328Z
+ 2025-08-01T17:25:25.326Z
https://docs.axolotl.ai/docs/api/utils.collators.batching.html
- 2025-08-01T14:03:01.585Z
+ 2025-08-01T17:25:25.586Z
https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html
- 2025-08-01T14:03:00.823Z
+ 2025-08-01T17:25:24.816Z
https://docs.axolotl.ai/docs/api/utils.lora.html
- 2025-08-01T14:03:01.178Z
+ 2025-08-01T17:25:25.175Z
https://docs.axolotl.ai/docs/api/prompt_strategies.base.html
- 2025-08-01T14:03:00.731Z
+ 2025-08-01T17:25:24.724Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html
- 2025-08-01T14:03:00.791Z
+ 2025-08-01T17:25:24.784Z
https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html
- 2025-08-01T14:03:01.346Z
+ 2025-08-01T17:25:25.344Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html
- 2025-08-01T14:03:00.874Z
+ 2025-08-01T17:25:24.868Z
https://docs.axolotl.ai/docs/api/utils.schemas.peft.html
- 2025-08-01T14:03:01.355Z
+ 2025-08-01T17:25:25.353Z
https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html
- 2025-08-01T14:03:00.845Z
+ 2025-08-01T17:25:24.838Z
https://docs.axolotl.ai/docs/api/common.architectures.html
- 2025-08-01T14:03:01.548Z
+ 2025-08-01T17:25:25.549Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html
- 2025-08-01T14:03:01.140Z
+ 2025-08-01T17:25:25.136Z
https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html
- 2025-08-01T14:03:01.652Z
+ 2025-08-01T17:25:25.654Z
https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html
- 2025-08-01T14:03:01.546Z
+ 2025-08-01T17:25:25.547Z
https://docs.axolotl.ai/docs/api/cli.quantize.html
- 2025-08-01T14:03:00.537Z
+ 2025-08-01T17:25:24.527Z
https://docs.axolotl.ai/docs/api/cli.checks.html
- 2025-08-01T14:03:00.467Z
+ 2025-08-01T17:25:24.457Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html
- 2025-08-01T14:03:00.883Z
+ 2025-08-01T17:25:24.878Z
https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html
- 2025-08-01T14:03:01.184Z
+ 2025-08-01T17:25:25.181Z
https://docs.axolotl.ai/docs/api/utils.quantization.html
- 2025-08-01T14:03:01.300Z
+ 2025-08-01T17:25:25.298Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html
- 2025-08-01T14:03:00.699Z
+ 2025-08-01T17:25:24.691Z
https://docs.axolotl.ai/docs/api/kernels.geglu.html
- 2025-08-01T14:03:01.010Z
+ 2025-08-01T17:25:25.006Z
https://docs.axolotl.ai/docs/api/utils.data.pretraining.html
- 2025-08-01T14:03:01.273Z
+ 2025-08-01T17:25:25.270Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html
- 2025-08-01T14:03:00.893Z
+ 2025-08-01T17:25:24.887Z
https://docs.axolotl.ai/docs/api/core.builders.base.html
- 2025-08-01T14:03:00.327Z
+ 2025-08-01T17:25:24.315Z
https://docs.axolotl.ai/docs/api/cli.merge_lora.html
- 2025-08-01T14:03:00.512Z
+ 2025-08-01T17:25:24.502Z
https://docs.axolotl.ai/docs/api/cli.utils.load.html
- 2025-08-01T14:03:00.576Z
+ 2025-08-01T17:25:24.567Z
https://docs.axolotl.ai/docs/api/utils.data.sft.html
- 2025-08-01T14:03:01.280Z
+ 2025-08-01T17:25:25.277Z
https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html
- 2025-08-01T14:03:00.799Z
+ 2025-08-01T17:25:24.792Z
https://docs.axolotl.ai/docs/api/utils.tokenization.html
- 2025-08-01T14:03:01.172Z
+ 2025-08-01T17:25:25.169Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html
- 2025-08-01T14:03:00.871Z
+ 2025-08-01T17:25:24.865Z
https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html
- 2025-08-01T14:03:01.565Z
+ 2025-08-01T17:25:25.566Z
https://docs.axolotl.ai/docs/api/cli.args.html
- 2025-08-01T14:03:00.458Z
+ 2025-08-01T17:25:24.447Z
https://docs.axolotl.ai/docs/api/evaluate.html
- 2025-08-01T14:03:00.246Z
+ 2025-08-01T17:25:24.233Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html
- 2025-08-01T14:03:00.779Z
+ 2025-08-01T17:25:24.772Z
https://docs.axolotl.ai/docs/api/utils.distributed.html
- 2025-08-01T14:03:01.259Z
+ 2025-08-01T17:25:25.256Z
https://docs.axolotl.ai/docs/multipack.html
- 2025-08-01T13:59:54.052Z
+ 2025-08-01T17:22:09.556Z
https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html
- 2025-08-01T13:59:54.056Z
+ 2025-08-01T17:22:09.560Z
https://docs.axolotl.ai/FAQS.html
- 2025-08-01T13:59:54.046Z
+ 2025-08-01T17:22:09.551Z