diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 4f772381f..580c4047c 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -180,6 +180,7 @@ jobs: if: ${{ ! contains(github.event.commits[0].message, '[skip docker]') && github.repository_owner == 'axolotl-ai-cloud' }} # this job needs to be run on self-hosted GPU runners... strategy: + fail-fast: false matrix: include: - cuda: 128 @@ -199,12 +200,6 @@ jobs: python_version: "3.11" pytorch: 2.9.1 axolotl_extras: - platforms: "linux/amd64,linux/arm64" - - cuda: 128 - cuda_version: 12.8.1 - python_version: "3.12" - pytorch: 2.9.1 - axolotl_extras: is_latest: true platforms: "linux/amd64,linux/arm64" - cuda: 128 @@ -271,6 +266,7 @@ jobs: if: ${{ ! contains(github.event.commits[0].message, '[skip docker]') && github.repository_owner == 'axolotl-ai-cloud' }} # this job needs to be run on self-hosted GPU runners... strategy: + fail-fast: false matrix: include: - cuda: 128 @@ -278,6 +274,12 @@ jobs: python_version: "3.11" pytorch: 2.9.1 axolotl_extras: + platforms: "linux/amd64,linux/arm64" + - cuda: 128 + cuda_version: 12.8.1 + python_version: "3.12" + pytorch: 2.9.1 + axolotl_extras: is_latest: true platforms: "linux/amd64,linux/arm64" - cuda: 128 @@ -338,6 +340,7 @@ jobs: if: ${{ ! contains(github.event.commits[0].message, '[skip docker]') && github.repository_owner == 'axolotl-ai-cloud' }} # this job needs to be run on self-hosted GPU runners... strategy: + fail-fast: false matrix: include: - cuda: 128 diff --git a/.nojekyll b/.nojekyll index 72acdf8d5..1d23a15d7 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -61d9674d \ No newline at end of file +0cf5395e \ No newline at end of file diff --git a/sitemap.xml b/sitemap.xml index e19848064..94572bd49 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,950 +2,950 @@ https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html - 2026-03-12T00:09:52.487Z + 2026-03-12T01:46:10.591Z https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html - 2026-03-12T00:09:52.509Z + 2026-03-12T01:46:10.620Z https://docs.axolotl.ai/docs/inference.html - 2026-03-12T00:09:52.481Z + 2026-03-12T01:46:10.583Z https://docs.axolotl.ai/docs/expert_quantization.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/installation.html - 2026-03-12T00:09:52.481Z + 2026-03-12T01:46:10.583Z https://docs.axolotl.ai/docs/models/ministral3/think.html - 2026-03-12T00:13:55.121Z + 2026-03-12T01:50:20.041Z https://docs.axolotl.ai/docs/models/granite4.html - 2026-03-12T00:13:55.127Z + 2026-03-12T01:50:20.051Z https://docs.axolotl.ai/docs/models/seed-oss.html - 2026-03-12T00:13:55.127Z + 2026-03-12T01:50:20.050Z https://docs.axolotl.ai/docs/models/orpheus.html - 2026-03-12T00:13:55.129Z + 2026-03-12T01:50:20.053Z https://docs.axolotl.ai/docs/models/internvl3_5.html - 2026-03-12T00:13:55.119Z + 2026-03-12T01:50:20.039Z https://docs.axolotl.ai/docs/models/magistral/vision.html - 2026-03-12T00:13:55.122Z + 2026-03-12T01:50:20.045Z https://docs.axolotl.ai/docs/models/mimo.html - 2026-03-12T00:13:55.118Z + 2026-03-12T01:50:19.999Z https://docs.axolotl.ai/docs/models/gpt-oss.html - 2026-03-12T00:13:55.126Z + 2026-03-12T01:50:20.050Z https://docs.axolotl.ai/docs/models/qwen3-next.html - 2026-03-12T00:13:55.125Z + 2026-03-12T01:50:20.048Z https://docs.axolotl.ai/docs/models/llama-2.html - 2026-03-12T00:13:55.125Z + 2026-03-12T01:50:20.047Z https://docs.axolotl.ai/docs/models/kimi-linear.html - 2026-03-12T00:13:55.117Z + 2026-03-12T01:50:19.999Z https://docs.axolotl.ai/docs/models/smolvlm2.html - 2026-03-12T00:13:55.127Z + 2026-03-12T01:50:20.051Z https://docs.axolotl.ai/docs/models/olmo3.html - 2026-03-12T00:13:55.119Z + 2026-03-12T01:50:20.040Z https://docs.axolotl.ai/docs/models/jamba.html - 2026-03-12T00:13:55.128Z + 2026-03-12T01:50:20.052Z https://docs.axolotl.ai/docs/models/mistral-small.html - 2026-03-12T00:13:55.123Z + 2026-03-12T01:50:20.046Z https://docs.axolotl.ai/docs/models/devstral.html - 2026-03-12T00:13:55.124Z + 2026-03-12T01:50:20.046Z https://docs.axolotl.ai/docs/models/index.html - 2026-03-12T00:13:55.129Z + 2026-03-12T01:50:20.053Z https://docs.axolotl.ai/docs/lora_optims.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/cli.html - 2026-03-12T00:09:52.478Z + 2026-03-12T01:46:10.579Z https://docs.axolotl.ai/docs/gradient_checkpointing.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/dataset_preprocessing.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/docker.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/attention.html - 2026-03-12T00:09:52.478Z + 2026-03-12T01:46:10.579Z https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html - 2026-03-12T00:13:32.687Z + 2026-03-12T01:49:58.875Z https://docs.axolotl.ai/docs/api/loaders.adapter.html - 2026-03-12T00:13:32.496Z + 2026-03-12T01:49:58.676Z https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html - 2026-03-12T00:13:33.020Z + 2026-03-12T01:49:59.214Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html - 2026-03-12T00:13:33.022Z + 2026-03-12T01:49:59.216Z https://docs.axolotl.ai/docs/api/core.trainers.utils.html - 2026-03-12T00:13:32.464Z + 2026-03-12T01:49:58.644Z https://docs.axolotl.ai/docs/api/utils.data.sft.html - 2026-03-12T00:13:33.237Z + 2026-03-12T01:49:59.434Z https://docs.axolotl.ai/docs/api/utils.schemas.peft.html - 2026-03-12T00:13:33.329Z + 2026-03-12T01:49:59.526Z https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html - 2026-03-12T00:13:33.008Z + 2026-03-12T01:49:59.202Z https://docs.axolotl.ai/docs/api/utils.collators.mamba.html - 2026-03-12T00:13:33.629Z + 2026-03-12T01:49:59.829Z https://docs.axolotl.ai/docs/api/prompt_strategies.base.html - 2026-03-12T00:13:32.570Z + 2026-03-12T01:49:58.757Z https://docs.axolotl.ai/docs/api/loaders.processor.html - 2026-03-12T00:13:32.489Z + 2026-03-12T01:49:58.669Z https://docs.axolotl.ai/docs/api/core.training_args.html - 2026-03-12T00:13:32.074Z + 2026-03-12T01:49:58.251Z https://docs.axolotl.ai/docs/api/loaders.tokenizer.html - 2026-03-12T00:13:32.487Z + 2026-03-12T01:49:58.668Z https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html - 2026-03-12T00:13:32.679Z + 2026-03-12T01:49:58.867Z https://docs.axolotl.ai/docs/api/loaders.constants.html - 2026-03-12T00:13:32.519Z + 2026-03-12T01:49:58.702Z https://docs.axolotl.ai/docs/api/cli.utils.train.html - 2026-03-12T00:13:32.382Z + 2026-03-12T01:49:58.562Z https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html - 2026-03-12T00:13:33.029Z + 2026-03-12T01:49:59.223Z https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html - 2026-03-12T00:13:33.318Z + 2026-03-12T01:49:59.515Z https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html - 2026-03-12T00:13:32.672Z + 2026-03-12T01:49:58.860Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html - 2026-03-12T00:13:32.963Z + 2026-03-12T01:49:59.156Z https://docs.axolotl.ai/docs/api/common.datasets.html - 2026-03-12T00:13:33.599Z + 2026-03-12T01:49:59.799Z https://docs.axolotl.ai/docs/api/logging_config.html - 2026-03-12T00:13:32.039Z + 2026-03-12T01:49:58.215Z https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html - 2026-03-12T00:13:33.043Z + 2026-03-12T01:49:59.237Z https://docs.axolotl.ai/docs/api/integrations.liger.args.html - 2026-03-12T00:13:33.568Z + 2026-03-12T01:49:59.767Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html - 2026-03-12T00:13:32.740Z + 2026-03-12T01:49:58.929Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html - 2026-03-12T00:13:32.462Z + 2026-03-12T01:49:58.643Z https://docs.axolotl.ai/docs/api/core.chat.messages.html - 2026-03-12T00:13:32.103Z + 2026-03-12T01:49:58.280Z https://docs.axolotl.ai/docs/api/integrations.base.html - 2026-03-12T00:13:33.549Z + 2026-03-12T01:49:59.748Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html - 2026-03-12T00:13:32.727Z + 2026-03-12T01:49:58.916Z https://docs.axolotl.ai/docs/api/train.html - 2026-03-12T00:13:31.936Z + 2026-03-12T01:49:58.110Z https://docs.axolotl.ai/docs/api/utils.distributed.html - 2026-03-12T00:13:33.211Z + 2026-03-12T01:49:59.407Z https://docs.axolotl.ai/docs/api/core.builders.causal.html - 2026-03-12T00:13:32.052Z + 2026-03-12T01:49:58.228Z https://docs.axolotl.ai/docs/api/core.builders.rl.html - 2026-03-12T00:13:32.058Z + 2026-03-12T01:49:58.234Z https://docs.axolotl.ai/docs/api/utils.collators.core.html - 2026-03-12T00:13:33.602Z + 2026-03-12T01:49:59.802Z https://docs.axolotl.ai/docs/api/utils.schemas.model.html - 2026-03-12T00:13:33.287Z + 2026-03-12T01:49:59.484Z https://docs.axolotl.ai/docs/api/kernels.quantize.html - 2026-03-12T00:13:32.952Z + 2026-03-12T01:49:59.145Z https://docs.axolotl.ai/docs/api/utils.schemas.enums.html - 2026-03-12T00:13:33.371Z + 2026-03-12T01:49:59.569Z https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html - 2026-03-12T00:13:32.701Z + 2026-03-12T01:49:58.889Z https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html - 2026-03-12T00:13:33.700Z + 2026-03-12T01:49:59.900Z https://docs.axolotl.ai/docs/api/cli.preprocess.html - 2026-03-12T00:13:32.303Z + 2026-03-12T01:49:58.482Z https://docs.axolotl.ai/docs/api/loaders.model.html - 2026-03-12T00:13:32.476Z + 2026-03-12T01:49:58.656Z https://docs.axolotl.ai/docs/api/cli.merge_lora.html - 2026-03-12T00:13:32.279Z + 2026-03-12T01:49:58.458Z https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html - 2026-03-12T00:13:32.367Z + 2026-03-12T01:49:58.547Z https://docs.axolotl.ai/docs/api/utils.bench.html - 2026-03-12T00:13:33.121Z + 2026-03-12T01:49:59.316Z https://docs.axolotl.ai/docs/api/core.trainers.mamba.html - 2026-03-12T00:13:32.425Z + 2026-03-12T01:49:58.605Z https://docs.axolotl.ai/docs/api/cli.vllm_serve.html - 2026-03-12T00:13:32.318Z + 2026-03-12T01:49:58.497Z https://docs.axolotl.ai/docs/api/kernels.utils.html - 2026-03-12T00:13:32.954Z + 2026-03-12T01:49:59.147Z https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html - 2026-03-12T00:13:32.612Z + 2026-03-12T01:49:58.800Z https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html - 2026-03-12T00:13:33.693Z + 2026-03-12T01:49:59.894Z https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html - 2026-03-12T00:13:33.635Z + 2026-03-12T01:49:59.835Z https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html - 2026-03-12T00:13:33.360Z + 2026-03-12T01:49:59.558Z https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html - 2026-03-12T00:13:32.807Z + 2026-03-12T01:49:58.997Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html - 2026-03-12T00:13:32.646Z + 2026-03-12T01:49:58.834Z https://docs.axolotl.ai/docs/api/cli.evaluate.html - 2026-03-12T00:13:32.187Z + 2026-03-12T01:49:58.364Z https://docs.axolotl.ai/docs/api/core.datasets.chat.html - 2026-03-12T00:13:32.115Z + 2026-03-12T01:49:58.293Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html - 2026-03-12T00:13:32.629Z + 2026-03-12T01:49:58.817Z https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html - 2026-03-12T00:13:32.706Z + 2026-03-12T01:49:58.894Z https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html - 2026-03-12T00:13:33.041Z + 2026-03-12T01:49:59.235Z https://docs.axolotl.ai/docs/api/kernels.lora.html - 2026-03-12T00:13:32.918Z + 2026-03-12T01:49:59.110Z https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html - 2026-03-12T00:13:33.698Z + 2026-03-12T01:49:59.899Z https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html - 2026-03-12T00:13:33.704Z + 2026-03-12T01:49:59.905Z https://docs.axolotl.ai/docs/api/utils.freeze.html - 2026-03-12T00:13:33.131Z + 2026-03-12T01:49:59.326Z https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html - 2026-03-12T00:13:33.564Z + 2026-03-12T01:49:59.763Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html - 2026-03-12T00:13:33.093Z + 2026-03-12T01:49:59.288Z https://docs.axolotl.ai/docs/api/utils.data.streaming.html - 2026-03-12T00:13:33.230Z + 2026-03-12T01:49:59.426Z https://docs.axolotl.ai/docs/api/prompt_tokenizers.html - 2026-03-12T00:13:32.027Z + 2026-03-12T01:49:58.202Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html - 2026-03-12T00:13:32.531Z + 2026-03-12T01:49:58.714Z https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html - 2026-03-12T00:13:32.330Z + 2026-03-12T01:49:58.509Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html - 2026-03-12T00:13:32.539Z + 2026-03-12T01:49:58.723Z https://docs.axolotl.ai/docs/api/convert.html - 2026-03-12T00:13:31.975Z + 2026-03-12T01:49:58.149Z https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html - 2026-03-12T00:13:33.600Z + 2026-03-12T01:49:59.800Z https://docs.axolotl.ai/docs/api/cli.args.html - 2026-03-12T00:13:32.212Z + 2026-03-12T01:49:58.389Z https://docs.axolotl.ai/docs/api/core.chat.format.shared.html - 2026-03-12T00:13:32.109Z + 2026-03-12T01:49:58.286Z https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html - 2026-03-12T00:13:32.812Z + 2026-03-12T01:49:59.002Z https://docs.axolotl.ai/docs/api/index.html - 2026-03-12T00:13:31.860Z + 2026-03-12T01:49:58.033Z https://docs.axolotl.ai/docs/fsdp_qlora.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/dataset-formats/template_free.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/dataset-formats/index.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/telemetry.html - 2026-03-12T00:09:52.483Z + 2026-03-12T01:46:10.586Z https://docs.axolotl.ai/docs/config-reference.html - 2026-03-12T00:13:54.269Z + 2026-03-12T01:50:19.090Z https://docs.axolotl.ai/docs/ray-integration.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/streaming.html - 2026-03-12T00:09:52.483Z + 2026-03-12T01:46:10.586Z https://docs.axolotl.ai/docs/sequence_parallelism.html - 2026-03-12T00:09:52.483Z + 2026-03-12T01:46:10.586Z https://docs.axolotl.ai/docs/unsloth.html - 2026-03-12T00:09:52.483Z + 2026-03-12T01:46:10.586Z https://docs.axolotl.ai/docs/mixed_precision.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/amd_hpc.html - 2026-03-12T00:09:52.478Z + 2026-03-12T01:46:10.579Z https://docs.axolotl.ai/docs/lr_groups.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/optimizations.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/mac.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/index.html - 2026-03-12T00:09:52.503Z + 2026-03-12T01:46:10.613Z https://docs.axolotl.ai/docs/optimizers.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/getting-started.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/multi-node.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/input_output.html - 2026-03-12T00:09:52.481Z + 2026-03-12T01:46:10.583Z https://docs.axolotl.ai/docs/nd_parallelism.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/dataset_loading.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/quantize.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/rlhf.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.585Z https://docs.axolotl.ai/docs/custom_integrations.html - 2026-03-12T00:09:52.478Z + 2026-03-12T01:46:10.579Z https://docs.axolotl.ai/docs/qat.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/checkpoint_saving.html - 2026-03-12T00:09:52.478Z + 2026-03-12T01:46:10.579Z https://docs.axolotl.ai/docs/dataset-formats/conversation.html - 2026-03-12T00:09:52.478Z + 2026-03-12T01:46:10.579Z https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/dataset-formats/tokenized.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/dataset-formats/pretraining.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/api/cli.main.html - 2026-03-12T00:13:32.166Z + 2026-03-12T01:49:58.344Z https://docs.axolotl.ai/docs/api/utils.schemas.trl.html - 2026-03-12T00:13:33.333Z + 2026-03-12T01:49:59.531Z https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html - 2026-03-12T00:13:32.125Z + 2026-03-12T01:49:58.302Z https://docs.axolotl.ai/docs/api/common.const.html - 2026-03-12T00:13:33.580Z + 2026-03-12T01:49:59.780Z https://docs.axolotl.ai/docs/api/cli.utils.load.html - 2026-03-12T00:13:32.360Z + 2026-03-12T01:49:58.539Z https://docs.axolotl.ai/docs/api/loaders.patch_manager.html - 2026-03-12T00:13:32.517Z + 2026-03-12T01:49:58.700Z https://docs.axolotl.ai/docs/api/utils.quantization.html - 2026-03-12T00:13:33.262Z + 2026-03-12T01:49:59.458Z https://docs.axolotl.ai/docs/api/monkeypatch.utils.html - 2026-03-12T00:13:33.018Z + 2026-03-12T01:49:59.212Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html - 2026-03-12T00:13:32.757Z + 2026-03-12T01:49:58.946Z https://docs.axolotl.ai/docs/api/cli.quantize.html - 2026-03-12T00:13:32.309Z + 2026-03-12T01:49:58.488Z https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html - 2026-03-12T00:13:32.656Z + 2026-03-12T01:49:58.844Z https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html - 2026-03-12T00:13:33.572Z + 2026-03-12T01:49:59.772Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html - 2026-03-12T00:13:33.061Z + 2026-03-12T01:49:59.255Z https://docs.axolotl.ai/docs/api/utils.schedulers.html - 2026-03-12T00:13:33.186Z + 2026-03-12T01:49:59.382Z https://docs.axolotl.ai/docs/api/kernels.geglu.html - 2026-03-12T00:13:32.931Z + 2026-03-12T01:49:59.123Z https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html - 2026-03-12T00:13:33.034Z + 2026-03-12T01:49:59.227Z https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html - 2026-03-12T00:13:32.714Z + 2026-03-12T01:49:58.902Z https://docs.axolotl.ai/docs/api/common.architectures.html - 2026-03-12T00:13:33.578Z + 2026-03-12T01:49:59.778Z https://docs.axolotl.ai/docs/api/cli.utils.html - 2026-03-12T00:13:32.332Z + 2026-03-12T01:49:58.511Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html - 2026-03-12T00:13:32.973Z + 2026-03-12T01:49:59.166Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html - 2026-03-12T00:13:32.961Z + 2026-03-12T01:49:59.154Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html - 2026-03-12T00:13:32.781Z + 2026-03-12T01:49:58.971Z https://docs.axolotl.ai/docs/api/cli.checks.html - 2026-03-12T00:13:32.224Z + 2026-03-12T01:49:58.402Z https://docs.axolotl.ai/docs/api/core.trainers.trl.html - 2026-03-12T00:13:32.418Z + 2026-03-12T01:49:58.599Z https://docs.axolotl.ai/docs/api/utils.tokenization.html - 2026-03-12T00:13:33.102Z + 2026-03-12T01:49:59.297Z https://docs.axolotl.ai/docs/api/cli.utils.fetch.html - 2026-03-12T00:13:32.353Z + 2026-03-12T01:49:58.533Z https://docs.axolotl.ai/docs/api/core.builders.base.html - 2026-03-12T00:13:32.047Z + 2026-03-12T01:49:58.223Z https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html - 2026-03-12T00:13:32.965Z + 2026-03-12T01:49:59.158Z https://docs.axolotl.ai/docs/api/utils.trainer.html - 2026-03-12T00:13:33.153Z + 2026-03-12T01:49:59.348Z https://docs.axolotl.ai/docs/api/cli.train.html - 2026-03-12T00:13:32.177Z + 2026-03-12T01:49:58.354Z https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html - 2026-03-12T00:13:32.107Z + 2026-03-12T01:49:58.284Z https://docs.axolotl.ai/docs/api/utils.lora.html - 2026-03-12T00:13:33.110Z + 2026-03-12T01:49:59.305Z https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html - 2026-03-12T00:13:33.340Z + 2026-03-12T01:49:59.538Z https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html - 2026-03-12T00:13:33.056Z + 2026-03-12T01:49:59.251Z https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html - 2026-03-12T00:13:32.433Z + 2026-03-12T01:49:58.614Z https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html - 2026-03-12T00:13:33.685Z + 2026-03-12T01:49:59.886Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html - 2026-03-12T00:13:32.447Z + 2026-03-12T01:49:58.627Z https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html - 2026-03-12T00:13:32.568Z + 2026-03-12T01:49:58.755Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html - 2026-03-12T00:13:32.780Z + 2026-03-12T01:49:58.969Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html - 2026-03-12T00:13:32.769Z + 2026-03-12T01:49:58.959Z https://docs.axolotl.ai/docs/api/datasets.html - 2026-03-12T00:13:31.958Z + 2026-03-12T01:49:58.132Z https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html - 2026-03-12T00:13:33.555Z + 2026-03-12T01:49:59.754Z https://docs.axolotl.ai/docs/api/cli.art.html - 2026-03-12T00:13:32.216Z + 2026-03-12T01:49:58.393Z https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html - 2026-03-12T00:13:33.717Z + 2026-03-12T01:49:59.918Z https://docs.axolotl.ai/docs/api/monkeypatch.relora.html - 2026-03-12T00:13:32.971Z + 2026-03-12T01:49:59.164Z https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html - 2026-03-12T00:13:32.719Z + 2026-03-12T01:49:58.908Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html - 2026-03-12T00:13:32.759Z + 2026-03-12T01:49:58.948Z https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html - 2026-03-12T00:13:32.105Z + 2026-03-12T01:49:58.282Z https://docs.axolotl.ai/docs/api/cli.utils.args.html - 2026-03-12T00:13:32.346Z + 2026-03-12T01:49:58.526Z https://docs.axolotl.ai/docs/api/core.trainers.base.html - 2026-03-12T00:13:32.400Z + 2026-03-12T01:49:58.580Z https://docs.axolotl.ai/docs/api/utils.schemas.training.html - 2026-03-12T00:13:33.296Z + 2026-03-12T01:49:59.492Z https://docs.axolotl.ai/docs/api/evaluate.html - 2026-03-12T00:13:31.950Z + 2026-03-12T01:49:58.124Z https://docs.axolotl.ai/docs/api/cli.config.html - 2026-03-12T00:13:32.245Z + 2026-03-12T01:49:58.423Z https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html - 2026-03-12T00:13:33.577Z + 2026-03-12T01:49:59.776Z https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html - 2026-03-12T00:13:32.692Z + 2026-03-12T01:49:58.880Z https://docs.axolotl.ai/docs/api/utils.collators.batching.html - 2026-03-12T00:13:33.625Z + 2026-03-12T01:49:59.825Z https://docs.axolotl.ai/docs/api/cli.cloud.base.html - 2026-03-12T00:13:32.322Z + 2026-03-12T01:49:58.501Z https://docs.axolotl.ai/docs/api/utils.schemas.config.html - 2026-03-12T00:13:33.278Z + 2026-03-12T01:49:59.475Z https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html - 2026-03-12T00:13:32.967Z + 2026-03-12T01:49:59.160Z https://docs.axolotl.ai/docs/api/utils.dict.html - 2026-03-12T00:13:33.218Z + 2026-03-12T01:49:59.414Z https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html - 2026-03-12T00:13:33.553Z + 2026-03-12T01:49:59.753Z https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html - 2026-03-12T00:13:32.251Z + 2026-03-12T01:49:58.430Z https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html - 2026-03-12T00:13:32.293Z + 2026-03-12T01:49:58.472Z https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html - 2026-03-12T00:13:33.117Z + 2026-03-12T01:49:59.312Z https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html - 2026-03-12T00:13:33.055Z + 2026-03-12T01:49:59.249Z https://docs.axolotl.ai/docs/api/utils.schemas.utils.html - 2026-03-12T00:13:33.378Z + 2026-03-12T01:49:59.576Z https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html - 2026-03-12T00:13:33.709Z + 2026-03-12T01:49:59.910Z https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html - 2026-03-12T00:13:33.228Z + 2026-03-12T01:49:59.424Z https://docs.axolotl.ai/docs/api/kernels.swiglu.html - 2026-03-12T00:13:32.943Z + 2026-03-12T01:49:59.136Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html - 2026-03-12T00:13:32.526Z + 2026-03-12T01:49:58.709Z https://docs.axolotl.ai/docs/api/cli.inference.html - 2026-03-12T00:13:32.269Z + 2026-03-12T01:49:58.447Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html - 2026-03-12T00:13:32.753Z + 2026-03-12T01:49:58.943Z https://docs.axolotl.ai/docs/api/utils.chat_templates.html - 2026-03-12T00:13:33.104Z + 2026-03-12T01:49:59.299Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html - 2026-03-12T00:13:32.631Z + 2026-03-12T01:49:58.819Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html - 2026-03-12T00:13:32.755Z + 2026-03-12T01:49:58.944Z https://docs.axolotl.ai/docs/multipack.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/torchao.html - 2026-03-12T00:09:52.483Z + 2026-03-12T01:46:10.586Z https://docs.axolotl.ai/docs/reward_modelling.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.585Z https://docs.axolotl.ai/docs/nccl.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/multi-gpu.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/batch_vs_grad.html - 2026-03-12T00:09:52.478Z + 2026-03-12T01:46:10.579Z https://docs.axolotl.ai/docs/multimodal.html - 2026-03-12T00:09:52.482Z + 2026-03-12T01:46:10.584Z https://docs.axolotl.ai/docs/models/LiquidAI.html - 2026-03-12T00:13:55.128Z + 2026-03-12T01:50:20.052Z https://docs.axolotl.ai/docs/models/mistral.html - 2026-03-12T00:13:55.124Z + 2026-03-12T01:50:20.047Z https://docs.axolotl.ai/docs/models/trinity.html - 2026-03-12T00:13:55.119Z + 2026-03-12T01:50:20.040Z https://docs.axolotl.ai/docs/models/hunyuan.html - 2026-03-12T00:13:55.128Z + 2026-03-12T01:50:20.052Z https://docs.axolotl.ai/docs/models/phi.html - 2026-03-12T00:13:55.127Z + 2026-03-12T01:50:20.051Z https://docs.axolotl.ai/docs/models/apertus.html - 2026-03-12T00:13:55.126Z + 2026-03-12T01:50:20.049Z https://docs.axolotl.ai/docs/models/plano.html - 2026-03-12T00:13:55.118Z + 2026-03-12T01:50:19.999Z https://docs.axolotl.ai/docs/models/gemma3n.html - 2026-03-12T00:13:55.126Z + 2026-03-12T01:50:20.049Z https://docs.axolotl.ai/docs/models/arcee.html - 2026-03-12T00:13:55.120Z + 2026-03-12T01:50:20.040Z https://docs.axolotl.ai/docs/models/ministral3.html - 2026-03-12T00:13:55.120Z + 2026-03-12T01:50:20.041Z https://docs.axolotl.ai/docs/models/magistral/think.html - 2026-03-12T00:13:55.122Z + 2026-03-12T01:50:20.044Z https://docs.axolotl.ai/docs/models/llama-4.html - 2026-03-12T00:13:55.124Z + 2026-03-12T01:50:20.047Z https://docs.axolotl.ai/docs/models/voxtral.html - 2026-03-12T00:13:55.123Z + 2026-03-12T01:50:20.046Z https://docs.axolotl.ai/docs/models/magistral.html - 2026-03-12T00:13:55.122Z + 2026-03-12T01:50:20.044Z https://docs.axolotl.ai/docs/models/qwen3.html - 2026-03-12T00:13:55.125Z + 2026-03-12T01:50:20.048Z https://docs.axolotl.ai/docs/models/ministral.html - 2026-03-12T00:13:55.123Z + 2026-03-12T01:50:20.045Z https://docs.axolotl.ai/docs/models/ministral3/vision.html - 2026-03-12T00:13:55.121Z + 2026-03-12T01:50:20.043Z https://docs.axolotl.ai/docs/debugging.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/docs/faq.html - 2026-03-12T00:09:52.479Z + 2026-03-12T01:46:10.580Z https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html - 2026-03-12T00:09:52.508Z + 2026-03-12T01:46:10.619Z https://docs.axolotl.ai/FAQS.html - 2026-03-12T00:09:52.477Z + 2026-03-12T01:46:10.577Z