diff --git a/.nojekyll b/.nojekyll
index 2b824870b..98d17ca0a 100644
--- a/.nojekyll
+++ b/.nojekyll
@@ -1 +1 @@
-6a3f1bdd
\ No newline at end of file
+818a088b
\ No newline at end of file
diff --git a/docs/lora_optims.html b/docs/lora_optims.html
index 8dda3a32a..7d07d16fc 100644
--- a/docs/lora_optims.html
+++ b/docs/lora_optims.html
@@ -551,10 +551,11 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
Inspired by Unsloth, we’ve implemented two
optimizations for LoRA and QLoRA fine-tuning, supporting both single GPU and multi-GPU
-(in the DDP and DeepSpeed settings) training. These include (1) SwiGLU and GEGLU activation function
-Triton kernels, and (2) LoRA MLP and attention custom autograd functions. Our goal was
-to leverage operator fusion and tensor re-use in order to improve speed and reduce
-memory usage during the forward and backward passes of these calculations.
+(including the DDP, DeepSpeed, and FSDP2 settings) training. These include (1) SwiGLU
+and GEGLU activation function Triton kernels, and (2) LoRA MLP and attention custom
+autograd functions. Our goal was to leverage operator fusion and tensor re-use in order
+to improve speed and reduce memory usage during the forward and backward passes of
+these calculations.
We currently support several common model architectures, including (but not limited to):
llama
@@ -687,7 +688,6 @@ computation path.
Future Work
- Support for additional model architectures
-- Support for the FSDP setting
- Support for dropout and bias
- Additional operator fusions
diff --git a/search.json b/search.json
index 0c00f8a24..6d768d62e 100644
--- a/search.json
+++ b/search.json
@@ -319,7 +319,7 @@
"href": "docs/lora_optims.html",
"title": "LoRA Optimizations",
"section": "",
- "text": "Inspired by Unsloth, we’ve implemented two\noptimizations for LoRA and QLoRA fine-tuning, supporting both single GPU and multi-GPU\n(in the DDP and DeepSpeed settings) training. These include (1) SwiGLU and GEGLU activation function\nTriton kernels, and (2) LoRA MLP and attention custom autograd functions. Our goal was\nto leverage operator fusion and tensor re-use in order to improve speed and reduce\nmemory usage during the forward and backward passes of these calculations.\nWe currently support several common model architectures, including (but not limited to):",
+ "text": "Inspired by Unsloth, we’ve implemented two\noptimizations for LoRA and QLoRA fine-tuning, supporting both single GPU and multi-GPU\n(including the DDP, DeepSpeed, and FSDP2 settings) training. These include (1) SwiGLU\nand GEGLU activation function Triton kernels, and (2) LoRA MLP and attention custom\nautograd functions. Our goal was to leverage operator fusion and tensor re-use in order\nto improve speed and reduce memory usage during the forward and backward passes of\nthese calculations.\nWe currently support several common model architectures, including (but not limited to):",
"crumbs": [
"How To Guides",
"LoRA Optimizations"
@@ -363,7 +363,7 @@
"href": "docs/lora_optims.html#future-work",
"title": "LoRA Optimizations",
"section": "Future Work",
- "text": "Future Work\n\nSupport for additional model architectures\nSupport for the FSDP setting\nSupport for dropout and bias\nAdditional operator fusions",
+ "text": "Future Work\n\nSupport for additional model architectures\nSupport for dropout and bias\nAdditional operator fusions",
"crumbs": [
"How To Guides",
"LoRA Optimizations"
diff --git a/sitemap.xml b/sitemap.xml
index 423d2054e..3155d5c0a 100644
--- a/sitemap.xml
+++ b/sitemap.xml
@@ -2,798 +2,798 @@
https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html
- 2025-09-26T09:24:08.905Z
+ 2025-09-26T13:55:24.802Z
https://docs.axolotl.ai/docs/mac.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/cli.html
- 2025-09-26T09:24:08.879Z
+ 2025-09-26T13:55:24.776Z
https://docs.axolotl.ai/docs/nccl.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/getting-started.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/lr_groups.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/qat.html
- 2025-09-26T09:24:08.884Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/multipack.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/streaming.html
- 2025-09-26T09:24:08.884Z
+ 2025-09-26T13:55:24.781Z
https://docs.axolotl.ai/docs/lora_optims.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/amd_hpc.html
- 2025-09-26T09:24:08.879Z
+ 2025-09-26T13:55:24.776Z
https://docs.axolotl.ai/docs/debugging.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/dataset-formats/conversation.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.776Z
https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/dataset-formats/index.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.776Z
https://docs.axolotl.ai/docs/config-reference.html
- 2025-09-26T09:31:04.207Z
+ 2025-09-26T13:59:10.877Z
https://docs.axolotl.ai/docs/multimodal.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/ray-integration.html
- 2025-09-26T09:24:08.884Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/faq.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/dataset_preprocessing.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/torchao.html
- 2025-09-26T09:24:08.884Z
+ 2025-09-26T13:55:24.781Z
https://docs.axolotl.ai/docs/optimizers.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/api/utils.schedulers.html
- 2025-09-26T09:30:49.631Z
+ 2025-09-26T13:58:55.909Z
https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html
- 2025-09-26T09:30:48.990Z
+ 2025-09-26T13:58:55.262Z
https://docs.axolotl.ai/docs/api/datasets.html
- 2025-09-26T09:30:48.662Z
+ 2025-09-26T13:58:54.932Z
https://docs.axolotl.ai/docs/api/utils.tokenization.html
- 2025-09-26T09:30:49.563Z
+ 2025-09-26T13:58:55.840Z
https://docs.axolotl.ai/docs/api/loaders.tokenizer.html
- 2025-09-26T09:30:49.085Z
+ 2025-09-26T13:58:55.358Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html
- 2025-09-26T09:30:49.460Z
+ 2025-09-26T13:58:55.737Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html
- 2025-09-26T09:30:49.530Z
+ 2025-09-26T13:58:55.807Z
https://docs.axolotl.ai/docs/api/utils.data.sft.html
- 2025-09-26T09:30:49.671Z
+ 2025-09-26T13:58:55.950Z
https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html
- 2025-09-26T09:30:49.515Z
+ 2025-09-26T13:58:55.792Z
https://docs.axolotl.ai/docs/api/loaders.patch_manager.html
- 2025-09-26T09:30:49.102Z
+ 2025-09-26T13:58:55.375Z
https://docs.axolotl.ai/docs/api/integrations.liger.args.html
- 2025-09-26T09:30:49.933Z
+ 2025-09-26T13:58:56.213Z
https://docs.axolotl.ai/docs/api/utils.schemas.peft.html
- 2025-09-26T09:30:49.746Z
+ 2025-09-26T13:58:56.024Z
https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html
- 2025-09-26T09:30:49.257Z
+ 2025-09-26T13:58:55.532Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html
- 2025-09-26T09:30:49.191Z
+ 2025-09-26T13:58:55.466Z
https://docs.axolotl.ai/docs/api/cli.cloud.base.html
- 2025-09-26T09:30:48.954Z
+ 2025-09-26T13:58:55.226Z
https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html
- 2025-09-26T09:30:49.556Z
+ 2025-09-26T13:58:55.834Z
https://docs.axolotl.ai/docs/api/kernels.swiglu.html
- 2025-09-26T09:30:49.436Z
+ 2025-09-26T13:58:55.713Z
https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html
- 2025-09-26T09:30:49.921Z
+ 2025-09-26T13:58:56.201Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html
- 2025-09-26T09:30:49.305Z
+ 2025-09-26T13:58:55.581Z
https://docs.axolotl.ai/docs/api/monkeypatch.utils.html
- 2025-09-26T09:30:49.497Z
+ 2025-09-26T13:58:55.773Z
https://docs.axolotl.ai/docs/api/core.builders.rl.html
- 2025-09-26T09:30:48.741Z
+ 2025-09-26T13:58:55.013Z
https://docs.axolotl.ai/docs/api/loaders.processor.html
- 2025-09-26T09:30:49.086Z
+ 2025-09-26T13:58:55.360Z
https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html
- 2025-09-26T09:30:50.039Z
+ 2025-09-26T13:58:56.320Z
https://docs.axolotl.ai/docs/api/core.training_args.html
- 2025-09-26T09:30:48.754Z
+ 2025-09-26T13:58:55.025Z
https://docs.axolotl.ai/docs/api/loaders.adapter.html
- 2025-09-26T09:30:49.092Z
+ 2025-09-26T13:58:55.365Z
https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html
- 2025-09-26T09:30:48.930Z
+ 2025-09-26T13:58:55.203Z
https://docs.axolotl.ai/docs/api/cli.train.html
- 2025-09-26T09:30:48.837Z
+ 2025-09-26T13:58:55.108Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html
- 2025-09-26T09:30:49.112Z
+ 2025-09-26T13:58:55.386Z
https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html
- 2025-09-26T09:30:49.230Z
+ 2025-09-26T13:58:55.505Z
https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html
- 2025-09-26T09:30:49.240Z
+ 2025-09-26T13:58:55.515Z
https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html
- 2025-09-26T09:30:49.489Z
+ 2025-09-26T13:58:55.765Z
https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html
- 2025-09-26T09:30:49.261Z
+ 2025-09-26T13:58:55.536Z
https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html
- 2025-09-26T09:30:49.211Z
+ 2025-09-26T13:58:55.486Z
https://docs.axolotl.ai/docs/api/core.chat.messages.html
- 2025-09-26T09:30:48.777Z
+ 2025-09-26T13:58:55.048Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html
- 2025-09-26T09:30:49.119Z
+ 2025-09-26T13:58:55.392Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html
- 2025-09-26T09:30:49.286Z
+ 2025-09-26T13:58:55.562Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html
- 2025-09-26T09:30:49.296Z
+ 2025-09-26T13:58:55.571Z
https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html
- 2025-09-26T09:30:49.766Z
+ 2025-09-26T13:58:56.045Z
https://docs.axolotl.ai/docs/api/convert.html
- 2025-09-26T09:30:48.675Z
+ 2025-09-26T13:58:54.946Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html
- 2025-09-26T09:30:49.288Z
+ 2025-09-26T13:58:55.563Z
https://docs.axolotl.ai/docs/api/utils.schemas.config.html
- 2025-09-26T09:30:49.705Z
+ 2025-09-26T13:58:55.984Z
https://docs.axolotl.ai/docs/api/utils.schemas.enums.html
- 2025-09-26T09:30:49.775Z
+ 2025-09-26T13:58:56.054Z
https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html
- 2025-09-26T09:30:49.498Z
+ 2025-09-26T13:58:55.775Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html
- 2025-09-26T09:30:49.263Z
+ 2025-09-26T13:58:55.538Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html
- 2025-09-26T09:30:49.054Z
+ 2025-09-26T13:58:55.327Z
https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html
- 2025-09-26T09:30:49.936Z
+ 2025-09-26T13:58:56.216Z
https://docs.axolotl.ai/docs/api/utils.collators.core.html
- 2025-09-26T09:30:49.960Z
+ 2025-09-26T13:58:56.240Z
https://docs.axolotl.ai/docs/api/core.chat.format.shared.html
- 2025-09-26T09:30:48.781Z
+ 2025-09-26T13:58:55.053Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html
- 2025-09-26T09:30:49.326Z
+ 2025-09-26T13:58:55.601Z
https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html
- 2025-09-26T09:30:50.028Z
+ 2025-09-26T13:58:56.309Z
https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html
- 2025-09-26T09:30:50.053Z
+ 2025-09-26T13:58:56.334Z
https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html
- 2025-09-26T09:30:49.176Z
+ 2025-09-26T13:58:55.451Z
https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html
- 2025-09-26T09:30:49.754Z
+ 2025-09-26T13:58:56.033Z
https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html
- 2025-09-26T09:30:50.046Z
+ 2025-09-26T13:58:56.327Z
https://docs.axolotl.ai/docs/api/prompt_strategies.base.html
- 2025-09-26T09:30:49.144Z
+ 2025-09-26T13:58:55.418Z
https://docs.axolotl.ai/docs/api/kernels.utils.html
- 2025-09-26T09:30:49.445Z
+ 2025-09-26T13:58:55.722Z
https://docs.axolotl.ai/docs/api/cli.merge_lora.html
- 2025-09-26T09:30:48.919Z
+ 2025-09-26T13:58:55.191Z
https://docs.axolotl.ai/docs/api/cli.utils.html
- 2025-09-26T09:30:48.961Z
+ 2025-09-26T13:58:55.234Z
https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html
- 2025-09-26T09:30:49.142Z
+ 2025-09-26T13:58:55.416Z
https://docs.axolotl.ai/docs/api/index.html
- 2025-09-26T09:30:48.587Z
+ 2025-09-26T13:58:54.857Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html
- 2025-09-26T09:30:49.273Z
+ 2025-09-26T13:58:55.548Z
https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html
- 2025-09-26T09:30:49.527Z
+ 2025-09-26T13:58:55.804Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html
- 2025-09-26T09:30:49.251Z
+ 2025-09-26T13:58:55.526Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html
- 2025-09-26T09:30:49.066Z
+ 2025-09-26T13:58:55.339Z
https://docs.axolotl.ai/docs/api/utils.lora.html
- 2025-09-26T09:30:49.569Z
+ 2025-09-26T13:58:55.847Z
https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html
- 2025-09-26T09:30:49.109Z
+ 2025-09-26T13:58:55.382Z
https://docs.axolotl.ai/docs/api/cli.config.html
- 2025-09-26T09:30:48.892Z
+ 2025-09-26T13:58:55.163Z
https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html
- 2025-09-26T09:30:49.455Z
+ 2025-09-26T13:58:55.732Z
https://docs.axolotl.ai/docs/api/utils.collators.batching.html
- 2025-09-26T09:30:49.979Z
+ 2025-09-26T13:58:56.260Z
https://docs.axolotl.ai/docs/api/utils.quantization.html
- 2025-09-26T09:30:49.691Z
+ 2025-09-26T13:58:55.969Z
https://docs.axolotl.ai/docs/api/utils.dict.html
- 2025-09-26T09:30:49.656Z
+ 2025-09-26T13:58:55.934Z
https://docs.axolotl.ai/docs/api/kernels.quantize.html
- 2025-09-26T09:30:49.444Z
+ 2025-09-26T13:58:55.720Z
https://docs.axolotl.ai/docs/api/utils.schemas.training.html
- 2025-09-26T09:30:49.719Z
+ 2025-09-26T13:58:55.998Z
https://docs.axolotl.ai/docs/api/train.html
- 2025-09-26T09:30:48.645Z
+ 2025-09-26T13:58:54.915Z
https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html
- 2025-09-26T09:30:48.794Z
+ 2025-09-26T13:58:55.066Z
https://docs.axolotl.ai/docs/inference.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/FAQS.html
- 2025-09-26T09:24:08.878Z
+ 2025-09-26T13:55:24.775Z
https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html
- 2025-09-26T09:24:08.888Z
+ 2025-09-26T13:55:24.785Z
https://docs.axolotl.ai/index.html
- 2025-09-26T09:24:08.900Z
+ 2025-09-26T13:55:24.797Z
https://docs.axolotl.ai/docs/custom_integrations.html
- 2025-09-26T09:24:08.879Z
+ 2025-09-26T13:55:24.776Z
https://docs.axolotl.ai/docs/api/utils.schemas.utils.html
- 2025-09-26T09:30:49.781Z
+ 2025-09-26T13:58:56.060Z
https://docs.axolotl.ai/docs/api/kernels.geglu.html
- 2025-09-26T09:30:49.426Z
+ 2025-09-26T13:58:55.703Z
https://docs.axolotl.ai/docs/api/core.builders.causal.html
- 2025-09-26T09:30:48.737Z
+ 2025-09-26T13:58:55.008Z
https://docs.axolotl.ai/docs/api/core.trainers.mamba.html
- 2025-09-26T09:30:49.036Z
+ 2025-09-26T13:58:55.309Z
https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html
- 2025-09-26T09:30:49.329Z
+ 2025-09-26T13:58:55.605Z
https://docs.axolotl.ai/docs/api/core.datasets.chat.html
- 2025-09-26T09:30:48.786Z
+ 2025-09-26T13:58:55.058Z
https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html
- 2025-09-26T09:30:49.987Z
+ 2025-09-26T13:58:56.268Z
https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html
- 2025-09-26T09:30:49.224Z
+ 2025-09-26T13:58:55.499Z
https://docs.axolotl.ai/docs/api/common.const.html
- 2025-09-26T09:30:49.942Z
+ 2025-09-26T13:58:56.223Z
https://docs.axolotl.ai/docs/api/cli.quantize.html
- 2025-09-26T09:30:48.944Z
+ 2025-09-26T13:58:55.216Z
https://docs.axolotl.ai/docs/api/utils.trainer.html
- 2025-09-26T09:30:49.603Z
+ 2025-09-26T13:58:55.881Z
https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html
- 2025-09-26T09:30:48.896Z
+ 2025-09-26T13:58:55.168Z
https://docs.axolotl.ai/docs/api/evaluate.html
- 2025-09-26T09:30:48.655Z
+ 2025-09-26T13:58:54.926Z
https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html
- 2025-09-26T09:30:49.454Z
+ 2025-09-26T13:58:55.730Z
https://docs.axolotl.ai/docs/api/loaders.model.html
- 2025-09-26T09:30:49.077Z
+ 2025-09-26T13:58:55.350Z
https://docs.axolotl.ai/docs/api/utils.distributed.html
- 2025-09-26T09:30:49.650Z
+ 2025-09-26T13:58:55.929Z
https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html
- 2025-09-26T09:30:49.575Z
+ 2025-09-26T13:58:55.853Z
https://docs.axolotl.ai/docs/api/kernels.lora.html
- 2025-09-26T09:30:49.416Z
+ 2025-09-26T13:58:55.692Z
https://docs.axolotl.ai/docs/api/cli.main.html
- 2025-09-26T09:30:48.828Z
+ 2025-09-26T13:58:55.099Z
https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html
- 2025-09-26T09:30:49.939Z
+ 2025-09-26T13:58:56.220Z
https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html
- 2025-09-26T09:30:49.664Z
+ 2025-09-26T13:58:55.942Z
https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html
- 2025-09-26T09:30:48.960Z
+ 2025-09-26T13:58:55.232Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html
- 2025-09-26T09:30:49.451Z
+ 2025-09-26T13:58:55.727Z
https://docs.axolotl.ai/docs/api/core.builders.base.html
- 2025-09-26T09:30:48.732Z
+ 2025-09-26T13:58:55.003Z
https://docs.axolotl.ai/docs/api/utils.schemas.trl.html
- 2025-09-26T09:30:49.749Z
+ 2025-09-26T13:58:56.028Z
https://docs.axolotl.ai/docs/api/cli.utils.args.html
- 2025-09-26T09:30:48.973Z
+ 2025-09-26T13:58:55.245Z
https://docs.axolotl.ai/docs/api/core.trainers.base.html
- 2025-09-26T09:30:49.015Z
+ 2025-09-26T13:58:55.288Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html
- 2025-09-26T09:30:49.500Z
+ 2025-09-26T13:58:55.776Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html
- 2025-09-26T09:30:49.452Z
+ 2025-09-26T13:58:55.729Z
https://docs.axolotl.ai/docs/api/utils.schemas.model.html
- 2025-09-26T09:30:49.712Z
+ 2025-09-26T13:58:55.991Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html
- 2025-09-26T09:30:49.304Z
+ 2025-09-26T13:58:55.579Z
https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html
- 2025-09-26T09:30:50.043Z
+ 2025-09-26T13:58:56.324Z
https://docs.axolotl.ai/docs/api/common.datasets.html
- 2025-09-26T09:30:49.958Z
+ 2025-09-26T13:58:56.238Z
https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html
- 2025-09-26T09:30:49.737Z
+ 2025-09-26T13:58:56.016Z
https://docs.axolotl.ai/docs/api/cli.utils.fetch.html
- 2025-09-26T09:30:48.978Z
+ 2025-09-26T13:58:55.251Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html
- 2025-09-26T09:30:49.283Z
+ 2025-09-26T13:58:55.559Z
https://docs.axolotl.ai/docs/api/monkeypatch.relora.html
- 2025-09-26T09:30:49.459Z
+ 2025-09-26T13:58:55.735Z
https://docs.axolotl.ai/docs/api/cli.evaluate.html
- 2025-09-26T09:30:48.845Z
+ 2025-09-26T13:58:55.116Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html
- 2025-09-26T09:30:49.285Z
+ 2025-09-26T13:58:55.560Z
https://docs.axolotl.ai/docs/api/core.trainers.utils.html
- 2025-09-26T09:30:49.067Z
+ 2025-09-26T13:58:55.340Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html
- 2025-09-26T09:30:49.203Z
+ 2025-09-26T13:58:55.478Z
https://docs.axolotl.ai/docs/api/utils.chat_templates.html
- 2025-09-26T09:30:49.564Z
+ 2025-09-26T13:58:55.842Z
https://docs.axolotl.ai/docs/api/utils.data.streaming.html
- 2025-09-26T09:30:49.665Z
+ 2025-09-26T13:58:55.943Z
https://docs.axolotl.ai/docs/api/utils.bench.html
- 2025-09-26T09:30:49.578Z
+ 2025-09-26T13:58:55.856Z
https://docs.axolotl.ai/docs/api/common.architectures.html
- 2025-09-26T09:30:49.941Z
+ 2025-09-26T13:58:56.221Z
https://docs.axolotl.ai/docs/api/cli.checks.html
- 2025-09-26T09:30:48.874Z
+ 2025-09-26T13:58:55.146Z
https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html
- 2025-09-26T09:30:49.043Z
+ 2025-09-26T13:58:55.316Z
https://docs.axolotl.ai/docs/api/integrations.base.html
- 2025-09-26T09:30:49.917Z
+ 2025-09-26T13:58:56.198Z
https://docs.axolotl.ai/docs/api/cli.utils.train.html
- 2025-09-26T09:30:49.001Z
+ 2025-09-26T13:58:55.274Z
https://docs.axolotl.ai/docs/api/utils.collators.mamba.html
- 2025-09-26T09:30:49.983Z
+ 2025-09-26T13:58:56.263Z
https://docs.axolotl.ai/docs/api/cli.art.html
- 2025-09-26T09:30:48.868Z
+ 2025-09-26T13:58:55.139Z
https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html
- 2025-09-26T09:30:49.509Z
+ 2025-09-26T13:58:55.785Z
https://docs.axolotl.ai/docs/api/logging_config.html
- 2025-09-26T09:30:48.726Z
+ 2025-09-26T13:58:54.997Z
https://docs.axolotl.ai/docs/api/utils.freeze.html
- 2025-09-26T09:30:49.586Z
+ 2025-09-26T13:58:55.864Z
https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html
- 2025-09-26T09:30:49.247Z
+ 2025-09-26T13:58:55.522Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html
- 2025-09-26T09:30:49.190Z
+ 2025-09-26T13:58:55.464Z
https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html
- 2025-09-26T09:30:49.505Z
+ 2025-09-26T13:58:55.782Z
https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html
- 2025-09-26T09:30:49.959Z
+ 2025-09-26T13:58:56.239Z
https://docs.axolotl.ai/docs/api/core.trainers.trl.html
- 2025-09-26T09:30:49.031Z
+ 2025-09-26T13:58:55.303Z
https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html
- 2025-09-26T09:30:49.236Z
+ 2025-09-26T13:58:55.511Z
https://docs.axolotl.ai/docs/api/loaders.constants.html
- 2025-09-26T09:30:49.103Z
+ 2025-09-26T13:58:55.377Z
https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html
- 2025-09-26T09:30:49.526Z
+ 2025-09-26T13:58:55.802Z
https://docs.axolotl.ai/docs/api/cli.vllm_serve.html
- 2025-09-26T09:30:48.950Z
+ 2025-09-26T13:58:55.223Z
https://docs.axolotl.ai/docs/api/prompt_tokenizers.html
- 2025-09-26T09:30:48.716Z
+ 2025-09-26T13:58:54.987Z
https://docs.axolotl.ai/docs/api/cli.args.html
- 2025-09-26T09:30:48.864Z
+ 2025-09-26T13:58:55.136Z
https://docs.axolotl.ai/docs/api/cli.inference.html
- 2025-09-26T09:30:48.910Z
+ 2025-09-26T13:58:55.182Z
https://docs.axolotl.ai/docs/api/cli.utils.load.html
- 2025-09-26T09:30:48.984Z
+ 2025-09-26T13:58:55.256Z
https://docs.axolotl.ai/docs/api/cli.preprocess.html
- 2025-09-26T09:30:48.939Z
+ 2025-09-26T13:58:55.211Z
https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html
- 2025-09-26T09:30:50.038Z
+ 2025-09-26T13:58:56.319Z
https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html
- 2025-09-26T09:30:50.034Z
+ 2025-09-26T13:58:56.315Z
https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html
- 2025-09-26T09:30:48.778Z
+ 2025-09-26T13:58:55.050Z
https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html
- 2025-09-26T09:30:49.922Z
+ 2025-09-26T13:58:56.202Z
https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html
- 2025-09-26T09:30:49.929Z
+ 2025-09-26T13:58:56.210Z
https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html
- 2025-09-26T09:30:49.517Z
+ 2025-09-26T13:58:55.793Z
https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html
- 2025-09-26T09:30:48.780Z
+ 2025-09-26T13:58:55.051Z
https://docs.axolotl.ai/docs/reward_modelling.html
- 2025-09-26T09:24:08.884Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/quantize.html
- 2025-09-26T09:24:08.884Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/fsdp_qlora.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/nd_parallelism.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/batch_vs_grad.html
- 2025-09-26T09:24:08.879Z
+ 2025-09-26T13:55:24.776Z
https://docs.axolotl.ai/docs/multi-node.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/rlhf.html
- 2025-09-26T09:24:08.884Z
+ 2025-09-26T13:55:24.781Z
https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/dataset-formats/pretraining.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/dataset-formats/tokenized.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/dataset-formats/template_free.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/multi-gpu.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/input_output.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/docker.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/gradient_checkpointing.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/optimizations.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/sequence_parallelism.html
- 2025-09-26T09:24:08.884Z
+ 2025-09-26T13:55:24.781Z
https://docs.axolotl.ai/docs/dataset_loading.html
- 2025-09-26T09:24:08.880Z
+ 2025-09-26T13:55:24.777Z
https://docs.axolotl.ai/docs/installation.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/mixed_precision.html
- 2025-09-26T09:24:08.883Z
+ 2025-09-26T13:55:24.780Z
https://docs.axolotl.ai/docs/unsloth.html
- 2025-09-26T09:24:08.884Z
+ 2025-09-26T13:55:24.781Z
https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html
- 2025-09-26T09:24:08.905Z
+ 2025-09-26T13:55:24.802Z