From 3c93a11045a13639c50ef8da12d61122fb80f885 Mon Sep 17 00:00:00 2001 From: Quarto GHA Workflow Runner Date: Thu, 9 Oct 2025 15:56:25 +0000 Subject: [PATCH] Built site for gh-pages --- .nojekyll | 2 +- docs/custom_integrations.html | 6 +- .../colab-axolotl-example.html | 2 +- search.json | 2 +- sitemap.xml | 398 +++++++++--------- 5 files changed, 207 insertions(+), 203 deletions(-) diff --git a/.nojekyll b/.nojekyll index 9b61f7a3f..5eaebcec7 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -e6ac6d19 \ No newline at end of file +d96239da \ No newline at end of file diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html index b2a92abbd..cedfcd757 100644 --- a/docs/custom_integrations.html +++ b/docs/custom_integrations.html @@ -617,7 +617,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true}); -
pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@147ea28"
+
pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@49f3308"

Usage

@@ -650,9 +650,13 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
  • granitemoehybrid
  • hunyuan_v1_dense
  • hunyuan_v1_moe
  • +
  • lfm2
  • +
  • lfm2_moe
  • +
  • lfm2_vl
  • llama
  • llama4
  • llama4_text
  • +
  • llava
  • mistral
  • mistral3
  • mixtral
  • diff --git a/examples/colab-notebooks/colab-axolotl-example.html b/examples/colab-notebooks/colab-axolotl-example.html index 29e39ec4e..5d76178b4 100644 --- a/examples/colab-notebooks/colab-axolotl-example.html +++ b/examples/colab-notebooks/colab-axolotl-example.html @@ -565,7 +565,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
    %%capture
     # This step can take ~5-10 minutes to install dependencies
     !pip install --no-build-isolation axolotl[flash-attn]>=0.9.1
    -!pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@147ea28"
    +!pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@49f3308"

    Demo: Talk Like a Pirate

    diff --git a/search.json b/search.json index 3419dc1d6..002f8999c 100644 --- a/search.json +++ b/search.json @@ -2283,7 +2283,7 @@ "href": "docs/custom_integrations.html#cut-cross-entropy", "title": "Custom Integrations", "section": "Cut Cross Entropy", - "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@147ea28\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\napertus\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\nglm4v\nglm4v_moe\ngpt_oss\ngranite\ngranitemoe\ngranitemoeshared\ngranitemoehybrid\nhunyuan_v1_dense\nhunyuan_v1_moe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nqwen3_vl\nqwen3_vl_moe\nqwen3_next\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here", + "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@49f3308\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\napertus\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\nglm4v\nglm4v_moe\ngpt_oss\ngranite\ngranitemoe\ngranitemoeshared\ngranitemoehybrid\nhunyuan_v1_dense\nhunyuan_v1_moe\nlfm2\nlfm2_moe\nlfm2_vl\nllama\nllama4\nllama4_text\nllava\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nqwen3_vl\nqwen3_vl_moe\nqwen3_next\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here", "crumbs": [ "Advanced Features", "Custom Integrations" diff --git a/sitemap.xml b/sitemap.xml index 8a7c202ca..76aa2b525 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,798 +2,798 @@ https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html - 2025-10-08T14:43:50.007Z + 2025-10-09T15:50:46.514Z https://docs.axolotl.ai/docs/mac.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/cli.html - 2025-10-08T14:43:49.980Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/nccl.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/getting-started.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/lr_groups.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/qat.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/multipack.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/streaming.html - 2025-10-08T14:43:49.985Z + 2025-10-09T15:50:46.493Z https://docs.axolotl.ai/docs/lora_optims.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/amd_hpc.html - 2025-10-08T14:43:49.980Z + 2025-10-09T15:50:46.487Z https://docs.axolotl.ai/docs/debugging.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/dataset-formats/conversation.html - 2025-10-08T14:43:49.980Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/dataset-formats/index.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/config-reference.html - 2025-10-08T14:47:29.858Z + 2025-10-09T15:54:27.221Z https://docs.axolotl.ai/docs/multimodal.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/ray-integration.html - 2025-10-08T14:43:49.985Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/faq.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/dataset_preprocessing.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/torchao.html - 2025-10-08T14:43:49.985Z + 2025-10-09T15:50:46.493Z https://docs.axolotl.ai/docs/optimizers.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/api/utils.schedulers.html - 2025-10-08T14:47:14.552Z + 2025-10-09T15:54:11.136Z https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html - 2025-10-08T14:47:13.756Z + 2025-10-09T15:54:10.381Z https://docs.axolotl.ai/docs/api/datasets.html - 2025-10-08T14:47:13.354Z + 2025-10-09T15:54:10.000Z https://docs.axolotl.ai/docs/api/utils.tokenization.html - 2025-10-08T14:47:14.470Z + 2025-10-09T15:54:11.056Z https://docs.axolotl.ai/docs/api/loaders.tokenizer.html - 2025-10-08T14:47:13.874Z + 2025-10-09T15:54:10.493Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html - 2025-10-08T14:47:14.338Z + 2025-10-09T15:54:10.934Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html - 2025-10-08T14:47:14.427Z + 2025-10-09T15:54:11.015Z https://docs.axolotl.ai/docs/api/utils.data.sft.html - 2025-10-08T14:47:14.604Z + 2025-10-09T15:54:11.184Z https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html - 2025-10-08T14:47:14.408Z + 2025-10-09T15:54:10.997Z https://docs.axolotl.ai/docs/api/loaders.patch_manager.html - 2025-10-08T14:47:13.895Z + 2025-10-09T15:54:10.513Z https://docs.axolotl.ai/docs/api/integrations.liger.args.html - 2025-10-08T14:47:14.928Z + 2025-10-09T15:54:11.500Z https://docs.axolotl.ai/docs/api/utils.schemas.peft.html - 2025-10-08T14:47:14.695Z + 2025-10-09T15:54:11.277Z https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html - 2025-10-08T14:47:14.086Z + 2025-10-09T15:54:10.695Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html - 2025-10-08T14:47:14.005Z + 2025-10-09T15:54:10.618Z https://docs.axolotl.ai/docs/api/cli.cloud.base.html - 2025-10-08T14:47:13.712Z + 2025-10-09T15:54:10.339Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html - 2025-10-08T14:47:14.459Z + 2025-10-09T15:54:11.045Z https://docs.axolotl.ai/docs/api/kernels.swiglu.html - 2025-10-08T14:47:14.309Z + 2025-10-09T15:54:10.906Z https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html - 2025-10-08T14:47:14.913Z + 2025-10-09T15:54:11.486Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html - 2025-10-08T14:47:14.146Z + 2025-10-09T15:54:10.753Z https://docs.axolotl.ai/docs/api/monkeypatch.utils.html - 2025-10-08T14:47:14.385Z + 2025-10-09T15:54:10.976Z https://docs.axolotl.ai/docs/api/core.builders.rl.html - 2025-10-08T14:47:13.452Z + 2025-10-09T15:54:10.092Z https://docs.axolotl.ai/docs/api/loaders.processor.html - 2025-10-08T14:47:13.876Z + 2025-10-09T15:54:10.495Z https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html - 2025-10-08T14:47:15.059Z + 2025-10-09T15:54:11.622Z https://docs.axolotl.ai/docs/api/core.training_args.html - 2025-10-08T14:47:13.468Z + 2025-10-09T15:54:10.106Z https://docs.axolotl.ai/docs/api/loaders.adapter.html - 2025-10-08T14:47:13.882Z + 2025-10-09T15:54:10.501Z https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html - 2025-10-08T14:47:13.684Z + 2025-10-09T15:54:10.312Z https://docs.axolotl.ai/docs/api/cli.train.html - 2025-10-08T14:47:13.568Z + 2025-10-09T15:54:10.201Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html - 2025-10-08T14:47:13.907Z + 2025-10-09T15:54:10.525Z https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html - 2025-10-08T14:47:14.052Z + 2025-10-09T15:54:10.663Z https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html - 2025-10-08T14:47:14.065Z + 2025-10-09T15:54:10.675Z https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html - 2025-10-08T14:47:14.375Z + 2025-10-09T15:54:10.966Z https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html - 2025-10-08T14:47:14.091Z + 2025-10-09T15:54:10.700Z https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html - 2025-10-08T14:47:14.029Z + 2025-10-09T15:54:10.641Z https://docs.axolotl.ai/docs/api/core.chat.messages.html - 2025-10-08T14:47:13.497Z + 2025-10-09T15:54:10.132Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html - 2025-10-08T14:47:13.916Z + 2025-10-09T15:54:10.533Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html - 2025-10-08T14:47:14.122Z + 2025-10-09T15:54:10.730Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html - 2025-10-08T14:47:14.134Z + 2025-10-09T15:54:10.741Z https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html - 2025-10-08T14:47:14.721Z + 2025-10-09T15:54:11.302Z https://docs.axolotl.ai/docs/api/convert.html - 2025-10-08T14:47:13.371Z + 2025-10-09T15:54:10.015Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html - 2025-10-08T14:47:14.124Z + 2025-10-09T15:54:10.732Z https://docs.axolotl.ai/docs/api/utils.schemas.config.html - 2025-10-08T14:47:14.643Z + 2025-10-09T15:54:11.222Z https://docs.axolotl.ai/docs/api/utils.schemas.enums.html - 2025-10-08T14:47:14.732Z + 2025-10-09T15:54:11.312Z https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html - 2025-10-08T14:47:14.387Z + 2025-10-09T15:54:10.977Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html - 2025-10-08T14:47:14.093Z + 2025-10-09T15:54:10.702Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html - 2025-10-08T14:47:13.834Z + 2025-10-09T15:54:10.456Z https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html - 2025-10-08T14:47:14.932Z + 2025-10-09T15:54:11.503Z https://docs.axolotl.ai/docs/api/utils.collators.core.html - 2025-10-08T14:47:14.961Z + 2025-10-09T15:54:11.531Z https://docs.axolotl.ai/docs/api/core.chat.format.shared.html - 2025-10-08T14:47:13.502Z + 2025-10-09T15:54:10.137Z https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html - 2025-10-08T14:47:14.172Z + 2025-10-09T15:54:10.777Z https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html - 2025-10-08T14:47:15.045Z + 2025-10-09T15:54:11.609Z https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html - 2025-10-08T14:47:15.079Z + 2025-10-09T15:54:11.638Z https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html - 2025-10-08T14:47:13.987Z + 2025-10-09T15:54:10.600Z https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html - 2025-10-08T14:47:14.706Z + 2025-10-09T15:54:11.287Z https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html - 2025-10-08T14:47:15.071Z + 2025-10-09T15:54:11.630Z https://docs.axolotl.ai/docs/api/prompt_strategies.base.html - 2025-10-08T14:47:13.946Z + 2025-10-09T15:54:10.562Z https://docs.axolotl.ai/docs/api/kernels.utils.html - 2025-10-08T14:47:14.320Z + 2025-10-09T15:54:10.917Z https://docs.axolotl.ai/docs/api/cli.merge_lora.html - 2025-10-08T14:47:13.669Z + 2025-10-09T15:54:10.298Z https://docs.axolotl.ai/docs/api/cli.utils.html - 2025-10-08T14:47:13.722Z + 2025-10-09T15:54:10.349Z https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html - 2025-10-08T14:47:13.945Z + 2025-10-09T15:54:10.560Z https://docs.axolotl.ai/docs/api/index.html - 2025-10-08T14:47:13.254Z + 2025-10-09T15:54:09.906Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html - 2025-10-08T14:47:14.106Z + 2025-10-09T15:54:10.714Z https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html - 2025-10-08T14:47:14.423Z + 2025-10-09T15:54:11.011Z https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html - 2025-10-08T14:47:14.078Z + 2025-10-09T15:54:10.687Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html - 2025-10-08T14:47:13.849Z + 2025-10-09T15:54:10.470Z https://docs.axolotl.ai/docs/api/utils.lora.html - 2025-10-08T14:47:14.477Z + 2025-10-09T15:54:11.064Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html - 2025-10-08T14:47:13.903Z + 2025-10-09T15:54:10.521Z https://docs.axolotl.ai/docs/api/cli.config.html - 2025-10-08T14:47:13.635Z + 2025-10-09T15:54:10.266Z https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html - 2025-10-08T14:47:14.332Z + 2025-10-09T15:54:10.928Z https://docs.axolotl.ai/docs/api/utils.collators.batching.html - 2025-10-08T14:47:14.986Z + 2025-10-09T15:54:11.553Z https://docs.axolotl.ai/docs/api/utils.quantization.html - 2025-10-08T14:47:14.628Z + 2025-10-09T15:54:11.206Z https://docs.axolotl.ai/docs/api/utils.dict.html - 2025-10-08T14:47:14.586Z + 2025-10-09T15:54:11.166Z https://docs.axolotl.ai/docs/api/kernels.quantize.html - 2025-10-08T14:47:14.318Z + 2025-10-09T15:54:10.915Z https://docs.axolotl.ai/docs/api/utils.schemas.training.html - 2025-10-08T14:47:14.660Z + 2025-10-09T15:54:11.240Z https://docs.axolotl.ai/docs/api/train.html - 2025-10-08T14:47:13.334Z + 2025-10-09T15:54:09.979Z https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html - 2025-10-08T14:47:13.518Z + 2025-10-09T15:54:10.153Z https://docs.axolotl.ai/docs/inference.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.491Z https://docs.axolotl.ai/FAQS.html - 2025-10-08T14:43:49.979Z + 2025-10-09T15:50:46.486Z https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html - 2025-10-08T14:43:49.989Z + 2025-10-09T15:50:46.497Z https://docs.axolotl.ai/index.html - 2025-10-08T14:43:50.002Z + 2025-10-09T15:50:46.510Z https://docs.axolotl.ai/docs/custom_integrations.html - 2025-10-08T14:43:49.980Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/api/utils.schemas.utils.html - 2025-10-08T14:47:14.738Z + 2025-10-09T15:54:11.319Z https://docs.axolotl.ai/docs/api/kernels.geglu.html - 2025-10-08T14:47:14.297Z + 2025-10-09T15:54:10.894Z https://docs.axolotl.ai/docs/api/core.builders.causal.html - 2025-10-08T14:47:13.447Z + 2025-10-09T15:54:10.086Z https://docs.axolotl.ai/docs/api/core.trainers.mamba.html - 2025-10-08T14:47:13.813Z + 2025-10-09T15:54:10.436Z https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html - 2025-10-08T14:47:14.176Z + 2025-10-09T15:54:10.781Z https://docs.axolotl.ai/docs/api/core.datasets.chat.html - 2025-10-08T14:47:13.508Z + 2025-10-09T15:54:10.143Z https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html - 2025-10-08T14:47:14.996Z + 2025-10-09T15:54:11.562Z https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html - 2025-10-08T14:47:14.045Z + 2025-10-09T15:54:10.656Z https://docs.axolotl.ai/docs/api/common.const.html - 2025-10-08T14:47:14.940Z + 2025-10-09T15:54:11.511Z https://docs.axolotl.ai/docs/api/cli.quantize.html - 2025-10-08T14:47:13.700Z + 2025-10-09T15:54:10.327Z https://docs.axolotl.ai/docs/api/utils.trainer.html - 2025-10-08T14:47:14.519Z + 2025-10-09T15:54:11.103Z https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html - 2025-10-08T14:47:13.641Z + 2025-10-09T15:54:10.272Z https://docs.axolotl.ai/docs/api/evaluate.html - 2025-10-08T14:47:13.346Z + 2025-10-09T15:54:09.992Z https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html - 2025-10-08T14:47:14.330Z + 2025-10-09T15:54:10.926Z https://docs.axolotl.ai/docs/api/loaders.model.html - 2025-10-08T14:47:13.864Z + 2025-10-09T15:54:10.483Z https://docs.axolotl.ai/docs/api/utils.distributed.html - 2025-10-08T14:47:14.579Z + 2025-10-09T15:54:11.158Z https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html - 2025-10-08T14:47:14.484Z + 2025-10-09T15:54:11.070Z https://docs.axolotl.ai/docs/api/kernels.lora.html - 2025-10-08T14:47:14.284Z + 2025-10-09T15:54:10.882Z https://docs.axolotl.ai/docs/api/cli.main.html - 2025-10-08T14:47:13.558Z + 2025-10-09T15:54:10.191Z https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html - 2025-10-08T14:47:14.936Z + 2025-10-09T15:54:11.507Z https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html - 2025-10-08T14:47:14.595Z + 2025-10-09T15:54:11.174Z https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html - 2025-10-08T14:47:13.720Z + 2025-10-09T15:54:10.347Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html - 2025-10-08T14:47:14.327Z + 2025-10-09T15:54:10.923Z https://docs.axolotl.ai/docs/api/core.builders.base.html - 2025-10-08T14:47:13.441Z + 2025-10-09T15:54:10.081Z https://docs.axolotl.ai/docs/api/utils.schemas.trl.html - 2025-10-08T14:47:14.699Z + 2025-10-09T15:54:11.281Z https://docs.axolotl.ai/docs/api/cli.utils.args.html - 2025-10-08T14:47:13.736Z + 2025-10-09T15:54:10.362Z https://docs.axolotl.ai/docs/api/core.trainers.base.html - 2025-10-08T14:47:13.788Z + 2025-10-09T15:54:10.412Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html - 2025-10-08T14:47:14.389Z + 2025-10-09T15:54:10.979Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html - 2025-10-08T14:47:14.328Z + 2025-10-09T15:54:10.925Z https://docs.axolotl.ai/docs/api/utils.schemas.model.html - 2025-10-08T14:47:14.652Z + 2025-10-09T15:54:11.230Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html - 2025-10-08T14:47:14.144Z + 2025-10-09T15:54:10.751Z https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html - 2025-10-08T14:47:15.065Z + 2025-10-09T15:54:11.626Z https://docs.axolotl.ai/docs/api/common.datasets.html - 2025-10-08T14:47:14.958Z + 2025-10-09T15:54:11.528Z https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html - 2025-10-08T14:47:14.685Z + 2025-10-09T15:54:11.264Z https://docs.axolotl.ai/docs/api/cli.utils.fetch.html - 2025-10-08T14:47:13.742Z + 2025-10-09T15:54:10.368Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html - 2025-10-08T14:47:14.119Z + 2025-10-09T15:54:10.726Z https://docs.axolotl.ai/docs/api/monkeypatch.relora.html - 2025-10-08T14:47:14.336Z + 2025-10-09T15:54:10.932Z https://docs.axolotl.ai/docs/api/cli.evaluate.html - 2025-10-08T14:47:13.578Z + 2025-10-09T15:54:10.211Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html - 2025-10-08T14:47:14.121Z + 2025-10-09T15:54:10.728Z https://docs.axolotl.ai/docs/api/core.trainers.utils.html - 2025-10-08T14:47:13.851Z + 2025-10-09T15:54:10.472Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html - 2025-10-08T14:47:14.020Z + 2025-10-09T15:54:10.631Z https://docs.axolotl.ai/docs/api/utils.chat_templates.html - 2025-10-08T14:47:14.471Z + 2025-10-09T15:54:11.058Z https://docs.axolotl.ai/docs/api/utils.data.streaming.html - 2025-10-08T14:47:14.597Z + 2025-10-09T15:54:11.177Z https://docs.axolotl.ai/docs/api/utils.bench.html - 2025-10-08T14:47:14.488Z + 2025-10-09T15:54:11.075Z https://docs.axolotl.ai/docs/api/common.architectures.html - 2025-10-08T14:47:14.938Z + 2025-10-09T15:54:11.509Z https://docs.axolotl.ai/docs/api/cli.checks.html - 2025-10-08T14:47:13.614Z + 2025-10-09T15:54:10.245Z https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html - 2025-10-08T14:47:13.821Z + 2025-10-09T15:54:10.444Z https://docs.axolotl.ai/docs/api/integrations.base.html - 2025-10-08T14:47:14.909Z + 2025-10-09T15:54:11.482Z https://docs.axolotl.ai/docs/api/cli.utils.train.html - 2025-10-08T14:47:13.771Z + 2025-10-09T15:54:10.395Z https://docs.axolotl.ai/docs/api/utils.collators.mamba.html - 2025-10-08T14:47:14.991Z + 2025-10-09T15:54:11.557Z https://docs.axolotl.ai/docs/api/cli.art.html - 2025-10-08T14:47:13.606Z + 2025-10-09T15:54:10.238Z https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html - 2025-10-08T14:47:14.400Z + 2025-10-09T15:54:10.990Z https://docs.axolotl.ai/docs/api/logging_config.html - 2025-10-08T14:47:13.433Z + 2025-10-09T15:54:10.074Z https://docs.axolotl.ai/docs/api/utils.freeze.html - 2025-10-08T14:47:14.498Z + 2025-10-09T15:54:11.084Z https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html - 2025-10-08T14:47:14.074Z + 2025-10-09T15:54:10.683Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html - 2025-10-08T14:47:14.003Z + 2025-10-09T15:54:10.616Z https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html - 2025-10-08T14:47:14.396Z + 2025-10-09T15:54:10.986Z https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html - 2025-10-08T14:47:14.959Z + 2025-10-09T15:54:11.529Z https://docs.axolotl.ai/docs/api/core.trainers.trl.html - 2025-10-08T14:47:13.806Z + 2025-10-09T15:54:10.429Z https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html - 2025-10-08T14:47:14.060Z + 2025-10-09T15:54:10.670Z https://docs.axolotl.ai/docs/api/loaders.constants.html - 2025-10-08T14:47:13.896Z + 2025-10-09T15:54:10.514Z https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html - 2025-10-08T14:47:14.421Z + 2025-10-09T15:54:11.009Z https://docs.axolotl.ai/docs/api/cli.vllm_serve.html - 2025-10-08T14:47:13.708Z + 2025-10-09T15:54:10.335Z https://docs.axolotl.ai/docs/api/prompt_tokenizers.html - 2025-10-08T14:47:13.421Z + 2025-10-09T15:54:10.063Z https://docs.axolotl.ai/docs/api/cli.args.html - 2025-10-08T14:47:13.602Z + 2025-10-09T15:54:10.234Z https://docs.axolotl.ai/docs/api/cli.inference.html - 2025-10-08T14:47:13.658Z + 2025-10-09T15:54:10.288Z https://docs.axolotl.ai/docs/api/cli.utils.load.html - 2025-10-08T14:47:13.749Z + 2025-10-09T15:54:10.375Z https://docs.axolotl.ai/docs/api/cli.preprocess.html - 2025-10-08T14:47:13.694Z + 2025-10-09T15:54:10.321Z https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html - 2025-10-08T14:47:15.058Z + 2025-10-09T15:54:11.620Z https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html - 2025-10-08T14:47:15.053Z + 2025-10-09T15:54:11.616Z https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html - 2025-10-08T14:47:13.498Z + 2025-10-09T15:54:10.134Z https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html - 2025-10-08T14:47:14.915Z + 2025-10-09T15:54:11.487Z https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html - 2025-10-08T14:47:14.924Z + 2025-10-09T15:54:11.496Z https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html - 2025-10-08T14:47:14.410Z + 2025-10-09T15:54:10.999Z https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html - 2025-10-08T14:47:13.500Z + 2025-10-09T15:54:10.136Z https://docs.axolotl.ai/docs/reward_modelling.html - 2025-10-08T14:43:49.985Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/quantize.html - 2025-10-08T14:43:49.985Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/fsdp_qlora.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/nd_parallelism.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/batch_vs_grad.html - 2025-10-08T14:43:49.980Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/multi-node.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/rlhf.html - 2025-10-08T14:43:49.985Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/dataset-formats/pretraining.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/dataset-formats/tokenized.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/dataset-formats/template_free.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/multi-gpu.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/input_output.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.491Z https://docs.axolotl.ai/docs/docker.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/gradient_checkpointing.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.489Z https://docs.axolotl.ai/docs/optimizations.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/sequence_parallelism.html - 2025-10-08T14:43:49.985Z + 2025-10-09T15:50:46.493Z https://docs.axolotl.ai/docs/dataset_loading.html - 2025-10-08T14:43:49.981Z + 2025-10-09T15:50:46.488Z https://docs.axolotl.ai/docs/installation.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.491Z https://docs.axolotl.ai/docs/mixed_precision.html - 2025-10-08T14:43:49.984Z + 2025-10-09T15:50:46.492Z https://docs.axolotl.ai/docs/unsloth.html - 2025-10-08T14:43:49.985Z + 2025-10-09T15:50:46.493Z https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html - 2025-10-08T14:43:50.006Z + 2025-10-09T15:50:46.514Z