From f7c612a0326715b761d9bc4c38a49d503b926f75 Mon Sep 17 00:00:00 2001 From: Quarto GHA Workflow Runner Date: Tue, 23 Sep 2025 04:37:00 +0000 Subject: [PATCH] Built site for gh-pages --- .nojekyll | 2 +- docs/custom_integrations.html | 3 +- .../colab-axolotl-example.html | 2 +- search.json | 2 +- sitemap.xml | 396 +++++++++--------- 5 files changed, 203 insertions(+), 202 deletions(-) diff --git a/.nojekyll b/.nojekyll index 6651e5108..0843099f8 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -8569c582 \ No newline at end of file +394adab2 \ No newline at end of file diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html index 3c6557fdf..dfde3cbc5 100644 --- a/docs/custom_integrations.html +++ b/docs/custom_integrations.html @@ -611,7 +611,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true}); -
pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c564afc"
+
pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c5aa3ef"

Usage

@@ -655,6 +655,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
  • qwen2_5_vl
  • qwen3
  • qwen3_moe
  • +
  • qwen3_next
  • smollm3
  • seed_oss
  • voxtral
  • diff --git a/examples/colab-notebooks/colab-axolotl-example.html b/examples/colab-notebooks/colab-axolotl-example.html index 27e6e4f27..9a6ac5ed7 100644 --- a/examples/colab-notebooks/colab-axolotl-example.html +++ b/examples/colab-notebooks/colab-axolotl-example.html @@ -559,7 +559,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
    %%capture
     # This step can take ~5-10 minutes to install dependencies
     !pip install --no-build-isolation axolotl[flash-attn]>=0.9.1
    -!pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c564afc"
    +!pip install "cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c5aa3ef"

    Demo: Talk Like a Pirate

    diff --git a/search.json b/search.json index 31022a961..470ccb577 100644 --- a/search.json +++ b/search.json @@ -285,7 +285,7 @@ "href": "docs/custom_integrations.html#cut-cross-entropy", "title": "Custom Integrations", "section": "Cut Cross Entropy", - "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c564afc\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\ngpt_oss\ngranite\ngranitemoe\nhunyuan_v1_dense\nhunyuan_v1_moe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here", + "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/axolotl-ai-cloud/ml-cross-entropy.git@c5aa3ef\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\n\nSupported Models\n\narcee\ncohere\ncohere2\ndeepseek_v3\ngemma\ngemma2\ngemma3\ngemma3_text\ngemma3n\ngemma3n_text\nglm\nglm4\nglm4_moe\ngpt_oss\ngranite\ngranitemoe\nhunyuan_v1_dense\nhunyuan_v1_moe\nllama\nllama4\nllama4_text\nmistral\nmistral3\nmixtral\nmllama\nphi\nphi3\nphi4_multimodal\nqwen2\nqwen2_vl\nqwen2_moe\nqwen2_5_vl\nqwen3\nqwen3_moe\nqwen3_next\nsmollm3\nseed_oss\nvoxtral\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here", "crumbs": [ "Advanced Features", "Custom Integrations" diff --git a/sitemap.xml b/sitemap.xml index db6f35b92..b01ea6639 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,794 +2,794 @@ https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html - 2025-09-19T10:34:36.740Z + 2025-09-23T04:31:24.847Z https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html - 2025-09-19T10:34:36.757Z + 2025-09-23T04:31:24.864Z https://docs.axolotl.ai/FAQS.html - 2025-09-19T10:34:36.729Z + 2025-09-23T04:31:24.837Z https://docs.axolotl.ai/docs/unsloth.html - 2025-09-19T10:34:36.736Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/docs/reward_modelling.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/docs/docker.html - 2025-09-19T10:34:36.732Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/batch_vs_grad.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.838Z https://docs.axolotl.ai/docs/streaming.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/docs/nccl.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/quantize.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/docs/nd_parallelism.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/custom_integrations.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/debugging.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/gradient_checkpointing.html - 2025-09-19T10:34:36.732Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/multimodal.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/dataset_loading.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html - 2025-09-19T10:38:05.774Z + 2025-09-23T04:34:52.953Z https://docs.axolotl.ai/docs/api/loaders.adapter.html - 2025-09-19T10:38:04.915Z + 2025-09-23T04:34:52.101Z https://docs.axolotl.ai/docs/api/core.builders.base.html - 2025-09-19T10:38:04.547Z + 2025-09-23T04:34:51.738Z https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html - 2025-09-19T10:38:04.751Z + 2025-09-23T04:34:51.938Z https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html - 2025-09-19T10:38:04.781Z + 2025-09-23T04:34:51.967Z https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html - 2025-09-19T10:38:05.336Z + 2025-09-23T04:34:52.518Z https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html - 2025-09-19T10:38:05.764Z + 2025-09-23T04:34:52.943Z https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html - 2025-09-19T10:38:04.715Z + 2025-09-23T04:34:51.903Z https://docs.axolotl.ai/docs/api/cli.evaluate.html - 2025-09-19T10:38:04.662Z + 2025-09-23T04:34:51.851Z https://docs.axolotl.ai/docs/api/utils.schemas.model.html - 2025-09-19T10:38:05.546Z + 2025-09-23T04:34:52.725Z https://docs.axolotl.ai/docs/api/cli.art.html - 2025-09-19T10:38:04.686Z + 2025-09-23T04:34:51.874Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html - 2025-09-19T10:38:05.100Z + 2025-09-23T04:34:52.284Z https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html - 2025-09-19T10:38:04.595Z + 2025-09-23T04:34:51.786Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html - 2025-09-19T10:38:05.131Z + 2025-09-23T04:34:52.315Z https://docs.axolotl.ai/docs/api/cli.args.html - 2025-09-19T10:38:04.683Z + 2025-09-23T04:34:51.871Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html - 2025-09-19T10:38:05.361Z + 2025-09-23T04:34:52.543Z https://docs.axolotl.ai/docs/api/evaluate.html - 2025-09-19T10:38:04.469Z + 2025-09-23T04:34:51.661Z https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html - 2025-09-19T10:38:05.062Z + 2025-09-23T04:34:52.246Z https://docs.axolotl.ai/docs/api/cli.vllm_serve.html - 2025-09-19T10:38:04.771Z + 2025-09-23T04:34:51.958Z https://docs.axolotl.ai/docs/api/cli.quantize.html - 2025-09-19T10:38:04.764Z + 2025-09-23T04:34:51.951Z https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html - 2025-09-19T10:38:04.811Z + 2025-09-23T04:34:51.998Z https://docs.axolotl.ai/docs/api/core.builders.rl.html - 2025-09-19T10:38:04.556Z + 2025-09-23T04:34:51.748Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html - 2025-09-19T10:38:05.110Z + 2025-09-23T04:34:52.294Z https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html - 2025-09-19T10:38:05.073Z + 2025-09-23T04:34:52.257Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html - 2025-09-19T10:38:05.114Z + 2025-09-23T04:34:52.298Z https://docs.axolotl.ai/docs/api/core.datasets.chat.html - 2025-09-19T10:38:04.602Z + 2025-09-23T04:34:51.793Z https://docs.axolotl.ai/docs/api/utils.distributed.html - 2025-09-19T10:38:05.483Z + 2025-09-23T04:34:52.664Z https://docs.axolotl.ai/docs/api/integrations.base.html - 2025-09-19T10:38:05.752Z + 2025-09-23T04:34:52.931Z https://docs.axolotl.ai/docs/api/index.html - 2025-09-19T10:38:04.400Z + 2025-09-23T04:34:51.593Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html - 2025-09-19T10:38:05.387Z + 2025-09-23T04:34:52.569Z https://docs.axolotl.ai/docs/api/utils.quantization.html - 2025-09-19T10:38:05.524Z + 2025-09-23T04:34:52.704Z https://docs.axolotl.ai/docs/api/utils.dict.html - 2025-09-19T10:38:05.489Z + 2025-09-23T04:34:52.669Z https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html - 2025-09-19T10:38:04.865Z + 2025-09-23T04:34:52.051Z https://docs.axolotl.ai/docs/api/utils.schemas.config.html - 2025-09-19T10:38:05.538Z + 2025-09-23T04:34:52.718Z https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html - 2025-09-19T10:38:05.077Z + 2025-09-23T04:34:52.261Z https://docs.axolotl.ai/docs/api/utils.collators.mamba.html - 2025-09-19T10:38:05.817Z + 2025-09-23T04:34:52.996Z https://docs.axolotl.ai/docs/api/datasets.html - 2025-09-19T10:38:04.476Z + 2025-09-23T04:34:51.668Z https://docs.axolotl.ai/docs/api/convert.html - 2025-09-19T10:38:04.489Z + 2025-09-23T04:34:51.681Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html - 2025-09-19T10:38:05.123Z + 2025-09-23T04:34:52.307Z https://docs.axolotl.ai/docs/api/utils.tokenization.html - 2025-09-19T10:38:05.394Z + 2025-09-23T04:34:52.576Z https://docs.axolotl.ai/docs/api/core.trainers.base.html - 2025-09-19T10:38:04.837Z + 2025-09-23T04:34:52.024Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html - 2025-09-19T10:38:05.291Z + 2025-09-23T04:34:52.473Z https://docs.axolotl.ai/docs/api/loaders.model.html - 2025-09-19T10:38:04.899Z + 2025-09-23T04:34:52.086Z https://docs.axolotl.ai/docs/api/logging_config.html - 2025-09-19T10:38:04.541Z + 2025-09-23T04:34:51.732Z https://docs.axolotl.ai/docs/api/core.chat.format.shared.html - 2025-09-19T10:38:04.597Z + 2025-09-23T04:34:51.788Z https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html - 2025-09-19T10:38:05.793Z + 2025-09-23T04:34:52.972Z https://docs.axolotl.ai/docs/api/utils.schemas.enums.html - 2025-09-19T10:38:05.609Z + 2025-09-23T04:34:52.788Z https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html - 2025-09-19T10:38:05.874Z + 2025-09-23T04:34:53.052Z https://docs.axolotl.ai/docs/api/utils.bench.html - 2025-09-19T10:38:05.410Z + 2025-09-23T04:34:52.592Z https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html - 2025-09-19T10:38:05.863Z + 2025-09-23T04:34:53.042Z https://docs.axolotl.ai/docs/api/core.trainers.mamba.html - 2025-09-19T10:38:04.858Z + 2025-09-23T04:34:52.044Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html - 2025-09-19T10:38:05.015Z + 2025-09-23T04:34:52.200Z https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html - 2025-09-19T10:38:05.329Z + 2025-09-23T04:34:52.511Z https://docs.axolotl.ai/docs/api/core.chat.messages.html - 2025-09-19T10:38:04.592Z + 2025-09-23T04:34:51.783Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html - 2025-09-19T10:38:05.330Z + 2025-09-23T04:34:52.513Z https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html - 2025-09-19T10:38:05.358Z + 2025-09-23T04:34:52.540Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html - 2025-09-19T10:38:04.942Z + 2025-09-23T04:34:52.128Z https://docs.axolotl.ai/docs/api/loaders.patch_manager.html - 2025-09-19T10:38:04.925Z + 2025-09-23T04:34:52.111Z https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html - 2025-09-19T10:38:05.496Z + 2025-09-23T04:34:52.677Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html - 2025-09-19T10:38:05.283Z + 2025-09-23T04:34:52.465Z https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html - 2025-09-19T10:38:05.870Z + 2025-09-23T04:34:53.048Z https://docs.axolotl.ai/docs/api/loaders.tokenizer.html - 2025-09-19T10:38:04.908Z + 2025-09-23T04:34:52.094Z https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html - 2025-09-19T10:38:05.084Z + 2025-09-23T04:34:52.268Z https://docs.axolotl.ai/docs/api/utils.lora.html - 2025-09-19T10:38:05.401Z + 2025-09-23T04:34:52.583Z https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html - 2025-09-19T10:38:05.037Z + 2025-09-23T04:34:52.221Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html - 2025-09-19T10:38:04.935Z + 2025-09-23T04:34:52.121Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html - 2025-09-19T10:38:05.113Z + 2025-09-23T04:34:52.297Z https://docs.axolotl.ai/docs/api/kernels.swiglu.html - 2025-09-19T10:38:05.266Z + 2025-09-23T04:34:52.449Z https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html - 2025-09-19T10:38:05.588Z + 2025-09-23T04:34:52.767Z https://docs.axolotl.ai/docs/api/cli.main.html - 2025-09-19T10:38:04.645Z + 2025-09-23T04:34:51.835Z https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html - 2025-09-19T10:38:04.966Z + 2025-09-23T04:34:52.152Z https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html - 2025-09-19T10:38:05.286Z + 2025-09-23T04:34:52.468Z https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html - 2025-09-19T10:38:04.594Z + 2025-09-23T04:34:51.785Z https://docs.axolotl.ai/docs/api/cli.cloud.base.html - 2025-09-19T10:38:04.775Z + 2025-09-23T04:34:51.961Z https://docs.axolotl.ai/docs/api/core.trainers.trl.html - 2025-09-19T10:38:04.852Z + 2025-09-23T04:34:52.039Z https://docs.axolotl.ai/docs/mixed_precision.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/installation.html - 2025-09-19T10:34:36.734Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/mac.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/sequence_parallelism.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/docs/faq.html - 2025-09-19T10:34:36.732Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/dataset-formats/tokenized.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/dataset-formats/pretraining.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/dataset-formats/template_free.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/dataset-formats/index.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/dataset-formats/conversation.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/lr_groups.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/inference.html - 2025-09-19T10:34:36.734Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/lora_optims.html - 2025-09-19T10:34:36.734Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/multipack.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/amd_hpc.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.838Z https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html - 2025-09-19T10:38:05.339Z + 2025-09-23T04:34:52.521Z https://docs.axolotl.ai/docs/api/cli.inference.html - 2025-09-19T10:38:04.730Z + 2025-09-23T04:34:51.917Z https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html - 2025-09-19T10:38:05.822Z + 2025-09-23T04:34:53.001Z https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html - 2025-09-19T10:38:05.406Z + 2025-09-23T04:34:52.588Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html - 2025-09-19T10:38:05.281Z + 2025-09-23T04:34:52.463Z https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html - 2025-09-19T10:38:05.756Z + 2025-09-23T04:34:52.935Z https://docs.axolotl.ai/docs/api/utils.schemas.training.html - 2025-09-19T10:38:05.552Z + 2025-09-23T04:34:52.732Z https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html - 2025-09-19T10:38:05.600Z + 2025-09-23T04:34:52.779Z https://docs.axolotl.ai/docs/api/utils.schemas.utils.html - 2025-09-19T10:38:05.615Z + 2025-09-23T04:34:52.794Z https://docs.axolotl.ai/docs/api/cli.checks.html - 2025-09-19T10:38:04.692Z + 2025-09-23T04:34:51.880Z https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html - 2025-09-19T10:38:05.890Z + 2025-09-23T04:34:53.068Z https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html - 2025-09-19T10:38:05.284Z + 2025-09-23T04:34:52.466Z https://docs.axolotl.ai/docs/api/utils.data.sft.html - 2025-09-19T10:38:05.504Z + 2025-09-23T04:34:52.685Z https://docs.axolotl.ai/docs/api/utils.chat_templates.html - 2025-09-19T10:38:05.396Z + 2025-09-23T04:34:52.578Z https://docs.axolotl.ai/docs/api/monkeypatch.utils.html - 2025-09-19T10:38:05.327Z + 2025-09-23T04:34:52.510Z https://docs.axolotl.ai/docs/api/cli.utils.fetch.html - 2025-09-19T10:38:04.799Z + 2025-09-23T04:34:51.986Z https://docs.axolotl.ai/docs/api/core.builders.causal.html - 2025-09-19T10:38:04.552Z + 2025-09-23T04:34:51.743Z https://docs.axolotl.ai/docs/api/utils.schemas.trl.html - 2025-09-19T10:38:05.583Z + 2025-09-23T04:34:52.762Z https://docs.axolotl.ai/docs/api/utils.data.streaming.html - 2025-09-19T10:38:05.498Z + 2025-09-23T04:34:52.678Z https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html - 2025-09-19T10:38:05.347Z + 2025-09-23T04:34:52.529Z https://docs.axolotl.ai/docs/api/prompt_strategies.base.html - 2025-09-19T10:38:04.968Z + 2025-09-23T04:34:52.153Z https://docs.axolotl.ai/docs/api/cli.merge_lora.html - 2025-09-19T10:38:04.739Z + 2025-09-23T04:34:51.926Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html - 2025-09-19T10:38:05.017Z + 2025-09-23T04:34:52.201Z https://docs.axolotl.ai/docs/api/loaders.constants.html - 2025-09-19T10:38:04.926Z + 2025-09-23T04:34:52.112Z https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html - 2025-09-19T10:38:05.346Z + 2025-09-23T04:34:52.528Z https://docs.axolotl.ai/docs/api/monkeypatch.relora.html - 2025-09-19T10:38:05.289Z + 2025-09-23T04:34:52.471Z https://docs.axolotl.ai/docs/api/utils.schedulers.html - 2025-09-19T10:38:05.463Z + 2025-09-23T04:34:52.644Z https://docs.axolotl.ai/docs/api/kernels.lora.html - 2025-09-19T10:38:05.245Z + 2025-09-23T04:34:52.428Z https://docs.axolotl.ai/docs/api/utils.collators.batching.html - 2025-09-19T10:38:05.814Z + 2025-09-23T04:34:52.992Z https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html - 2025-09-19T10:38:05.056Z + 2025-09-23T04:34:52.240Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html - 2025-09-19T10:38:04.876Z + 2025-09-23T04:34:52.062Z https://docs.axolotl.ai/docs/api/common.architectures.html - 2025-09-19T10:38:05.775Z + 2025-09-23T04:34:52.954Z https://docs.axolotl.ai/docs/api/cli.utils.html - 2025-09-19T10:38:04.782Z + 2025-09-23T04:34:51.969Z https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html - 2025-09-19T10:38:05.153Z + 2025-09-23T04:34:52.337Z https://docs.axolotl.ai/docs/api/core.training_args.html - 2025-09-19T10:38:04.569Z + 2025-09-23T04:34:51.760Z https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html - 2025-09-19T10:38:05.571Z + 2025-09-23T04:34:52.750Z https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html - 2025-09-19T10:38:05.001Z + 2025-09-23T04:34:52.186Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html - 2025-09-19T10:38:05.029Z + 2025-09-23T04:34:52.213Z https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html - 2025-09-19T10:38:05.755Z + 2025-09-23T04:34:52.934Z https://docs.axolotl.ai/docs/api/common.const.html - 2025-09-19T10:38:05.777Z + 2025-09-23T04:34:52.956Z https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html - 2025-09-19T10:38:05.319Z + 2025-09-23T04:34:52.502Z https://docs.axolotl.ai/docs/api/kernels.quantize.html - 2025-09-19T10:38:05.274Z + 2025-09-23T04:34:52.456Z https://docs.axolotl.ai/docs/api/cli.config.html - 2025-09-19T10:38:04.711Z + 2025-09-23T04:34:51.898Z https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html - 2025-09-19T10:38:05.050Z + 2025-09-23T04:34:52.234Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html - 2025-09-19T10:38:05.112Z + 2025-09-23T04:34:52.295Z https://docs.axolotl.ai/docs/api/kernels.geglu.html - 2025-09-19T10:38:05.256Z + 2025-09-23T04:34:52.439Z https://docs.axolotl.ai/docs/api/utils.freeze.html - 2025-09-19T10:38:05.418Z + 2025-09-23T04:34:52.599Z https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html - 2025-09-19T10:38:05.879Z + 2025-09-23T04:34:53.057Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html - 2025-09-19T10:38:04.888Z + 2025-09-23T04:34:52.074Z https://docs.axolotl.ai/docs/api/cli.utils.train.html - 2025-09-19T10:38:04.823Z + 2025-09-23T04:34:52.009Z https://docs.axolotl.ai/docs/api/cli.utils.load.html - 2025-09-19T10:38:04.805Z + 2025-09-23T04:34:51.991Z https://docs.axolotl.ai/docs/api/utils.collators.core.html - 2025-09-19T10:38:05.794Z + 2025-09-23T04:34:52.973Z https://docs.axolotl.ai/docs/api/integrations.liger.args.html - 2025-09-19T10:38:05.767Z + 2025-09-23T04:34:52.946Z https://docs.axolotl.ai/docs/api/cli.preprocess.html - 2025-09-19T10:38:04.759Z + 2025-09-23T04:34:51.946Z https://docs.axolotl.ai/docs/api/kernels.utils.html - 2025-09-19T10:38:05.276Z + 2025-09-23T04:34:52.458Z https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html - 2025-09-19T10:38:05.875Z + 2025-09-23T04:34:53.053Z https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html - 2025-09-19T10:38:05.356Z + 2025-09-23T04:34:52.538Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html - 2025-09-19T10:38:04.932Z + 2025-09-23T04:34:52.118Z https://docs.axolotl.ai/docs/api/loaders.processor.html - 2025-09-19T10:38:04.909Z + 2025-09-23T04:34:52.095Z https://docs.axolotl.ai/docs/api/core.trainers.utils.html - 2025-09-19T10:38:04.890Z + 2025-09-23T04:34:52.076Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html - 2025-09-19T10:38:05.090Z + 2025-09-23T04:34:52.273Z https://docs.axolotl.ai/docs/api/prompt_tokenizers.html - 2025-09-19T10:38:04.531Z + 2025-09-23T04:34:51.723Z https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html - 2025-09-19T10:38:05.883Z + 2025-09-23T04:34:53.061Z https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html - 2025-09-19T10:38:04.610Z + 2025-09-23T04:34:51.801Z https://docs.axolotl.ai/docs/api/utils.trainer.html - 2025-09-19T10:38:05.435Z + 2025-09-23T04:34:52.616Z https://docs.axolotl.ai/docs/api/cli.train.html - 2025-09-19T10:38:04.654Z + 2025-09-23T04:34:51.843Z https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html - 2025-09-19T10:38:05.770Z + 2025-09-23T04:34:52.950Z https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html - 2025-09-19T10:38:05.088Z + 2025-09-23T04:34:52.272Z https://docs.axolotl.ai/docs/api/utils.schemas.peft.html - 2025-09-19T10:38:05.579Z + 2025-09-23T04:34:52.759Z https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html - 2025-09-19T10:38:05.156Z + 2025-09-23T04:34:52.341Z https://docs.axolotl.ai/docs/api/cli.utils.args.html - 2025-09-19T10:38:04.794Z + 2025-09-23T04:34:51.980Z https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html - 2025-09-19T10:38:05.066Z + 2025-09-23T04:34:52.250Z https://docs.axolotl.ai/docs/api/common.datasets.html - 2025-09-19T10:38:05.792Z + 2025-09-23T04:34:52.971Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html - 2025-09-19T10:38:05.132Z + 2025-09-23T04:34:52.316Z https://docs.axolotl.ai/docs/api/train.html - 2025-09-19T10:38:04.459Z + 2025-09-23T04:34:51.651Z https://docs.axolotl.ai/docs/multi-node.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/input_output.html - 2025-09-19T10:34:36.734Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/ray-integration.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/docs/getting-started.html - 2025-09-19T10:34:36.732Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/optimizers.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/docs/multi-gpu.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.842Z https://docs.axolotl.ai/docs/dataset_preprocessing.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/torchao.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/docs/config-reference.html - 2025-09-19T10:38:21.431Z + 2025-09-23T04:35:08.477Z https://docs.axolotl.ai/docs/rlhf.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/docs/cli.html - 2025-09-19T10:34:36.731Z + 2025-09-23T04:31:24.838Z https://docs.axolotl.ai/docs/fsdp_qlora.html - 2025-09-19T10:34:36.732Z + 2025-09-23T04:31:24.839Z https://docs.axolotl.ai/docs/qat.html - 2025-09-19T10:34:36.735Z + 2025-09-23T04:31:24.843Z https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html - 2025-09-19T10:34:36.757Z + 2025-09-23T04:31:24.864Z https://docs.axolotl.ai/index.html - 2025-09-19T10:34:36.752Z + 2025-09-23T04:31:24.859Z