diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 052f9aa72..19cef5de4 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -61,6 +61,7 @@ jobs: uses: docker/build-push-action@v5 with: context: . + platforms: linux/amd64,linux/arm64 build-args: | BASE_TAG=${{ github.ref_type == 'tag' && 'main' || github.ref_name }}-base-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }} CUDA=${{ matrix.cuda }} @@ -127,6 +128,7 @@ jobs: uses: docker/build-push-action@v5 with: context: . + platforms: linux/amd64,linux/arm64 build-args: | BASE_TAG=${{ github.ref_type == 'tag' && 'main' || github.ref_name }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }} CUDA=${{ matrix.cuda }} @@ -180,6 +182,7 @@ jobs: uses: docker/build-push-action@v5 with: context: . + platforms: linux/amd64,linux/arm64 build-args: | BASE_TAG=${{ github.ref_type == 'tag' && 'main' || github.ref_name }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }} CUDA=${{ matrix.cuda }} diff --git a/.nojekyll b/.nojekyll index 348a2e63a..f8b6058d6 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -9745622d \ No newline at end of file +67a6041d \ No newline at end of file diff --git a/sitemap.xml b/sitemap.xml index 03ab37ee7..408faf243 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,942 +2,942 @@ https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html - 2026-01-12T14:43:41.839Z + 2026-01-12T17:00:36.431Z https://docs.axolotl.ai/docs/mac.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.412Z https://docs.axolotl.ai/docs/cli.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/mixed_precision.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.412Z https://docs.axolotl.ai/docs/installation.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.412Z https://docs.axolotl.ai/docs/dataset_loading.html - 2026-01-12T14:43:41.811Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/sequence_parallelism.html - 2026-01-12T14:43:41.815Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/optimizations.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/gradient_checkpointing.html - 2026-01-12T14:43:41.811Z + 2026-01-12T17:00:36.410Z https://docs.axolotl.ai/docs/streaming.html - 2026-01-12T14:43:41.815Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/lora_optims.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.412Z https://docs.axolotl.ai/docs/amd_hpc.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/debugging.html - 2026-01-12T14:43:41.811Z + 2026-01-12T17:00:36.410Z https://docs.axolotl.ai/docs/dataset-formats/conversation.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/dataset-formats/index.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/config-reference.html - 2026-01-12T14:47:43.002Z + 2026-01-12T17:04:33.456Z https://docs.axolotl.ai/docs/multimodal.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/ray-integration.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/faq.html - 2026-01-12T14:43:41.811Z + 2026-01-12T17:00:36.410Z https://docs.axolotl.ai/docs/dataset_preprocessing.html - 2026-01-12T14:43:41.811Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/torchao.html - 2026-01-12T14:43:41.815Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/optimizers.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/models/apertus.html - 2026-01-12T14:47:43.652Z + 2026-01-12T17:04:34.189Z https://docs.axolotl.ai/docs/models/ministral3/think.html - 2026-01-12T14:47:43.646Z + 2026-01-12T17:04:34.185Z https://docs.axolotl.ai/docs/models/gpt-oss.html - 2026-01-12T14:47:43.652Z + 2026-01-12T17:04:34.190Z https://docs.axolotl.ai/docs/models/phi.html - 2026-01-12T14:47:43.653Z + 2026-01-12T17:04:34.190Z https://docs.axolotl.ai/docs/models/olmo3.html - 2026-01-12T14:47:43.644Z + 2026-01-12T17:04:34.184Z https://docs.axolotl.ai/docs/models/granite4.html - 2026-01-12T14:47:43.655Z + 2026-01-12T17:04:34.191Z https://docs.axolotl.ai/docs/models/seed-oss.html - 2026-01-12T14:47:43.652Z + 2026-01-12T17:04:34.190Z https://docs.axolotl.ai/docs/models/qwen3.html - 2026-01-12T14:47:43.651Z + 2026-01-12T17:04:34.189Z https://docs.axolotl.ai/docs/models/orpheus.html - 2026-01-12T14:47:43.656Z + 2026-01-12T17:04:34.192Z https://docs.axolotl.ai/docs/models/hunyuan.html - 2026-01-12T14:47:43.656Z + 2026-01-12T17:04:34.191Z https://docs.axolotl.ai/docs/models/mistral.html - 2026-01-12T14:47:43.650Z + 2026-01-12T17:04:34.188Z https://docs.axolotl.ai/docs/models/mistral-small.html - 2026-01-12T14:47:43.649Z + 2026-01-12T17:04:34.187Z https://docs.axolotl.ai/docs/models/smolvlm2.html - 2026-01-12T14:47:43.653Z + 2026-01-12T17:04:34.190Z https://docs.axolotl.ai/docs/models/llama-2.html - 2026-01-12T14:47:43.650Z + 2026-01-12T17:04:34.188Z https://docs.axolotl.ai/docs/models/magistral/vision.html - 2026-01-12T14:47:43.648Z + 2026-01-12T17:04:34.186Z https://docs.axolotl.ai/docs/models/jamba.html - 2026-01-12T14:47:43.656Z + 2026-01-12T17:04:34.191Z https://docs.axolotl.ai/docs/models/mimo.html - 2026-01-12T14:47:43.644Z + 2026-01-12T17:04:34.183Z https://docs.axolotl.ai/docs/api/utils.schedulers.html - 2026-01-12T14:47:24.720Z + 2026-01-12T17:04:17.913Z https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html - 2026-01-12T14:47:23.871Z + 2026-01-12T17:04:17.179Z https://docs.axolotl.ai/docs/api/datasets.html - 2026-01-12T14:47:23.449Z + 2026-01-12T17:04:16.810Z https://docs.axolotl.ai/docs/api/utils.tokenization.html - 2026-01-12T14:47:24.632Z + 2026-01-12T17:04:17.836Z https://docs.axolotl.ai/docs/api/loaders.tokenizer.html - 2026-01-12T14:47:23.993Z + 2026-01-12T17:04:17.287Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html - 2026-01-12T14:47:24.494Z + 2026-01-12T17:04:17.720Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html - 2026-01-12T14:47:24.587Z + 2026-01-12T17:04:17.799Z https://docs.axolotl.ai/docs/api/utils.data.sft.html - 2026-01-12T14:47:24.773Z + 2026-01-12T17:04:17.959Z https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html - 2026-01-12T14:47:24.566Z + 2026-01-12T17:04:17.782Z https://docs.axolotl.ai/docs/api/loaders.patch_manager.html - 2026-01-12T14:47:24.022Z + 2026-01-12T17:04:17.312Z https://docs.axolotl.ai/docs/api/integrations.liger.args.html - 2026-01-12T14:47:25.113Z + 2026-01-12T17:04:18.257Z https://docs.axolotl.ai/docs/api/utils.schemas.peft.html - 2026-01-12T14:47:24.868Z + 2026-01-12T17:04:18.043Z https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html - 2026-01-12T14:47:24.226Z + 2026-01-12T17:04:17.487Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html - 2026-01-12T14:47:24.138Z + 2026-01-12T17:04:17.413Z https://docs.axolotl.ai/docs/api/cli.cloud.base.html - 2026-01-12T14:47:23.824Z + 2026-01-12T17:04:17.138Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html - 2026-01-12T14:47:24.623Z + 2026-01-12T17:04:17.828Z https://docs.axolotl.ai/docs/api/kernels.swiglu.html - 2026-01-12T14:47:24.463Z + 2026-01-12T17:04:17.693Z https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html - 2026-01-12T14:47:25.098Z + 2026-01-12T17:04:18.244Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html - 2026-01-12T14:47:24.296Z + 2026-01-12T17:04:17.548Z https://docs.axolotl.ai/docs/api/monkeypatch.utils.html - 2026-01-12T14:47:24.540Z + 2026-01-12T17:04:17.761Z https://docs.axolotl.ai/docs/api/core.builders.rl.html - 2026-01-12T14:47:23.551Z + 2026-01-12T17:04:16.900Z https://docs.axolotl.ai/docs/api/loaders.processor.html - 2026-01-12T14:47:23.995Z + 2026-01-12T17:04:17.288Z https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html - 2026-01-12T14:47:25.251Z + 2026-01-12T17:04:18.377Z https://docs.axolotl.ai/docs/api/core.training_args.html - 2026-01-12T14:47:23.567Z + 2026-01-12T17:04:16.914Z https://docs.axolotl.ai/docs/api/loaders.adapter.html - 2026-01-12T14:47:24.002Z + 2026-01-12T17:04:17.295Z https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html - 2026-01-12T14:47:23.793Z + 2026-01-12T17:04:17.112Z https://docs.axolotl.ai/docs/api/cli.train.html - 2026-01-12T14:47:23.672Z + 2026-01-12T17:04:17.006Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html - 2026-01-12T14:47:24.035Z + 2026-01-12T17:04:17.323Z https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html - 2026-01-12T14:47:24.190Z + 2026-01-12T17:04:17.456Z https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html - 2026-01-12T14:47:24.204Z + 2026-01-12T17:04:17.468Z https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html - 2026-01-12T14:47:24.530Z + 2026-01-12T17:04:17.752Z https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html - 2026-01-12T14:47:24.231Z + 2026-01-12T17:04:17.492Z https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html - 2026-01-12T14:47:24.163Z + 2026-01-12T17:04:17.435Z https://docs.axolotl.ai/docs/api/core.chat.messages.html - 2026-01-12T14:47:23.596Z + 2026-01-12T17:04:16.940Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html - 2026-01-12T14:47:24.044Z + 2026-01-12T17:04:17.331Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html - 2026-01-12T14:47:24.271Z + 2026-01-12T17:04:17.526Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html - 2026-01-12T14:47:24.283Z + 2026-01-12T17:04:17.537Z https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html - 2026-01-12T14:47:24.900Z + 2026-01-12T17:04:18.071Z https://docs.axolotl.ai/docs/api/convert.html - 2026-01-12T14:47:23.466Z + 2026-01-12T17:04:16.825Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html - 2026-01-12T14:47:24.273Z + 2026-01-12T17:04:17.528Z https://docs.axolotl.ai/docs/api/utils.schemas.config.html - 2026-01-12T14:47:24.816Z + 2026-01-12T17:04:17.997Z https://docs.axolotl.ai/docs/api/utils.schemas.enums.html - 2026-01-12T14:47:24.911Z + 2026-01-12T17:04:18.081Z https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html - 2026-01-12T14:47:24.542Z + 2026-01-12T17:04:17.763Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html - 2026-01-12T14:47:24.240Z + 2026-01-12T17:04:17.500Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html - 2026-01-12T14:47:23.953Z + 2026-01-12T17:04:17.251Z https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html - 2026-01-12T14:47:25.118Z + 2026-01-12T17:04:18.261Z https://docs.axolotl.ai/docs/api/utils.collators.core.html - 2026-01-12T14:47:25.149Z + 2026-01-12T17:04:18.288Z https://docs.axolotl.ai/docs/api/core.chat.format.shared.html - 2026-01-12T14:47:23.602Z + 2026-01-12T17:04:16.945Z https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html - 2026-01-12T14:47:24.322Z + 2026-01-12T17:04:17.571Z https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html - 2026-01-12T14:47:25.236Z + 2026-01-12T17:04:18.364Z https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html - 2026-01-12T14:47:25.269Z + 2026-01-12T17:04:18.392Z https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html - 2026-01-12T14:47:24.118Z + 2026-01-12T17:04:17.396Z https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html - 2026-01-12T14:47:24.880Z + 2026-01-12T17:04:18.053Z https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html - 2026-01-12T14:47:25.260Z + 2026-01-12T17:04:18.385Z https://docs.axolotl.ai/docs/api/prompt_strategies.base.html - 2026-01-12T14:47:24.076Z + 2026-01-12T17:04:17.359Z https://docs.axolotl.ai/docs/api/kernels.utils.html - 2026-01-12T14:47:24.474Z + 2026-01-12T17:04:17.703Z https://docs.axolotl.ai/docs/api/cli.merge_lora.html - 2026-01-12T14:47:23.778Z + 2026-01-12T17:04:17.099Z https://docs.axolotl.ai/docs/api/cli.utils.html - 2026-01-12T14:47:23.834Z + 2026-01-12T17:04:17.147Z https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html - 2026-01-12T14:47:24.074Z + 2026-01-12T17:04:17.357Z https://docs.axolotl.ai/docs/api/index.html - 2026-01-12T14:47:23.346Z + 2026-01-12T17:04:16.721Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html - 2026-01-12T14:47:24.253Z + 2026-01-12T17:04:17.511Z https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html - 2026-01-12T14:47:24.583Z + 2026-01-12T17:04:17.795Z https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html - 2026-01-12T14:47:24.217Z + 2026-01-12T17:04:17.480Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html - 2026-01-12T14:47:23.968Z + 2026-01-12T17:04:17.265Z https://docs.axolotl.ai/docs/api/utils.lora.html - 2026-01-12T14:47:24.641Z + 2026-01-12T17:04:17.843Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html - 2026-01-12T14:47:24.031Z + 2026-01-12T17:04:17.320Z https://docs.axolotl.ai/docs/api/cli.config.html - 2026-01-12T14:47:23.743Z + 2026-01-12T17:04:17.068Z https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html - 2026-01-12T14:47:24.487Z + 2026-01-12T17:04:17.714Z https://docs.axolotl.ai/docs/api/utils.collators.batching.html - 2026-01-12T14:47:25.174Z + 2026-01-12T17:04:18.309Z https://docs.axolotl.ai/docs/api/utils.quantization.html - 2026-01-12T14:47:24.798Z + 2026-01-12T17:04:17.980Z https://docs.axolotl.ai/docs/api/utils.dict.html - 2026-01-12T14:47:24.753Z + 2026-01-12T17:04:17.941Z https://docs.axolotl.ai/docs/api/kernels.quantize.html - 2026-01-12T14:47:24.472Z + 2026-01-12T17:04:17.702Z https://docs.axolotl.ai/docs/api/utils.schemas.training.html - 2026-01-12T14:47:24.834Z + 2026-01-12T17:04:18.013Z https://docs.axolotl.ai/docs/api/train.html - 2026-01-12T14:47:23.427Z + 2026-01-12T17:04:16.791Z https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html - 2026-01-12T14:47:23.618Z + 2026-01-12T17:04:16.959Z https://docs.axolotl.ai/docs/inference.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.412Z https://docs.axolotl.ai/FAQS.html - 2026-01-12T14:43:41.808Z + 2026-01-12T17:00:36.408Z https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html - 2026-01-12T14:43:41.819Z + 2026-01-12T17:00:36.416Z https://docs.axolotl.ai/index.html - 2026-01-12T14:43:41.834Z + 2026-01-12T17:00:36.427Z https://docs.axolotl.ai/docs/custom_integrations.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/api/utils.schemas.utils.html - 2026-01-12T14:47:24.918Z + 2026-01-12T17:04:18.087Z https://docs.axolotl.ai/docs/api/kernels.geglu.html - 2026-01-12T14:47:24.450Z + 2026-01-12T17:04:17.682Z https://docs.axolotl.ai/docs/api/core.builders.causal.html - 2026-01-12T14:47:23.545Z + 2026-01-12T17:04:16.895Z https://docs.axolotl.ai/docs/api/core.trainers.mamba.html - 2026-01-12T14:47:23.930Z + 2026-01-12T17:04:17.231Z https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html - 2026-01-12T14:47:24.327Z + 2026-01-12T17:04:17.575Z https://docs.axolotl.ai/docs/api/core.datasets.chat.html - 2026-01-12T14:47:23.608Z + 2026-01-12T17:04:16.951Z https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html - 2026-01-12T14:47:25.184Z + 2026-01-12T17:04:18.318Z https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html - 2026-01-12T14:47:24.180Z + 2026-01-12T17:04:17.450Z https://docs.axolotl.ai/docs/api/common.const.html - 2026-01-12T14:47:25.126Z + 2026-01-12T17:04:18.268Z https://docs.axolotl.ai/docs/api/cli.quantize.html - 2026-01-12T14:47:23.810Z + 2026-01-12T17:04:17.127Z https://docs.axolotl.ai/docs/api/utils.trainer.html - 2026-01-12T14:47:24.685Z + 2026-01-12T17:04:17.882Z https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html - 2026-01-12T14:47:23.749Z + 2026-01-12T17:04:17.073Z https://docs.axolotl.ai/docs/api/evaluate.html - 2026-01-12T14:47:23.441Z + 2026-01-12T17:04:16.803Z https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html - 2026-01-12T14:47:24.485Z + 2026-01-12T17:04:17.713Z https://docs.axolotl.ai/docs/api/loaders.model.html - 2026-01-12T14:47:23.982Z + 2026-01-12T17:04:17.278Z https://docs.axolotl.ai/docs/api/utils.distributed.html - 2026-01-12T14:47:24.746Z + 2026-01-12T17:04:17.935Z https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html - 2026-01-12T14:47:24.648Z + 2026-01-12T17:04:17.850Z https://docs.axolotl.ai/docs/api/kernels.lora.html - 2026-01-12T14:47:24.436Z + 2026-01-12T17:04:17.670Z https://docs.axolotl.ai/docs/api/cli.main.html - 2026-01-12T14:47:23.661Z + 2026-01-12T17:04:16.996Z https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html - 2026-01-12T14:47:25.122Z + 2026-01-12T17:04:18.265Z https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html - 2026-01-12T14:47:24.763Z + 2026-01-12T17:04:17.950Z https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html - 2026-01-12T14:47:23.832Z + 2026-01-12T17:04:17.145Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html - 2026-01-12T14:47:24.482Z + 2026-01-12T17:04:17.710Z https://docs.axolotl.ai/docs/api/core.builders.base.html - 2026-01-12T14:47:23.539Z + 2026-01-12T17:04:16.889Z https://docs.axolotl.ai/docs/api/utils.schemas.trl.html - 2026-01-12T14:47:24.873Z + 2026-01-12T17:04:18.047Z https://docs.axolotl.ai/docs/api/cli.utils.args.html - 2026-01-12T14:47:23.849Z + 2026-01-12T17:04:17.160Z https://docs.axolotl.ai/docs/api/core.trainers.base.html - 2026-01-12T14:47:23.904Z + 2026-01-12T17:04:17.208Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html - 2026-01-12T14:47:24.544Z + 2026-01-12T17:04:17.764Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html - 2026-01-12T14:47:24.483Z + 2026-01-12T17:04:17.711Z https://docs.axolotl.ai/docs/api/utils.schemas.model.html - 2026-01-12T14:47:24.825Z + 2026-01-12T17:04:18.005Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html - 2026-01-12T14:47:24.294Z + 2026-01-12T17:04:17.546Z https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html - 2026-01-12T14:47:25.255Z + 2026-01-12T17:04:18.381Z https://docs.axolotl.ai/docs/api/common.datasets.html - 2026-01-12T14:47:25.145Z + 2026-01-12T17:04:18.285Z https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html - 2026-01-12T14:47:24.857Z + 2026-01-12T17:04:18.033Z https://docs.axolotl.ai/docs/api/cli.utils.fetch.html - 2026-01-12T14:47:23.856Z + 2026-01-12T17:04:17.166Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html - 2026-01-12T14:47:24.267Z + 2026-01-12T17:04:17.523Z https://docs.axolotl.ai/docs/api/monkeypatch.relora.html - 2026-01-12T14:47:24.492Z + 2026-01-12T17:04:17.718Z https://docs.axolotl.ai/docs/api/cli.evaluate.html - 2026-01-12T14:47:23.682Z + 2026-01-12T17:04:17.015Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html - 2026-01-12T14:47:24.269Z + 2026-01-12T17:04:17.525Z https://docs.axolotl.ai/docs/api/core.trainers.utils.html - 2026-01-12T14:47:23.970Z + 2026-01-12T17:04:17.267Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html - 2026-01-12T14:47:24.153Z + 2026-01-12T17:04:17.426Z https://docs.axolotl.ai/docs/api/utils.chat_templates.html - 2026-01-12T14:47:24.635Z + 2026-01-12T17:04:17.838Z https://docs.axolotl.ai/docs/api/utils.data.streaming.html - 2026-01-12T14:47:24.765Z + 2026-01-12T17:04:17.952Z https://docs.axolotl.ai/docs/api/utils.bench.html - 2026-01-12T14:47:24.653Z + 2026-01-12T17:04:17.854Z https://docs.axolotl.ai/docs/api/common.architectures.html - 2026-01-12T14:47:25.124Z + 2026-01-12T17:04:18.266Z https://docs.axolotl.ai/docs/api/cli.checks.html - 2026-01-12T14:47:23.720Z + 2026-01-12T17:04:17.048Z https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html - 2026-01-12T14:47:23.939Z + 2026-01-12T17:04:17.238Z https://docs.axolotl.ai/docs/api/integrations.base.html - 2026-01-12T14:47:25.093Z + 2026-01-12T17:04:18.240Z https://docs.axolotl.ai/docs/api/cli.utils.train.html - 2026-01-12T14:47:23.886Z + 2026-01-12T17:04:17.192Z https://docs.axolotl.ai/docs/api/utils.collators.mamba.html - 2026-01-12T14:47:25.178Z + 2026-01-12T17:04:18.313Z https://docs.axolotl.ai/docs/api/cli.art.html - 2026-01-12T14:47:23.712Z + 2026-01-12T17:04:17.041Z https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html - 2026-01-12T14:47:24.557Z + 2026-01-12T17:04:17.774Z https://docs.axolotl.ai/docs/api/logging_config.html - 2026-01-12T14:47:23.531Z + 2026-01-12T17:04:16.882Z https://docs.axolotl.ai/docs/api/utils.freeze.html - 2026-01-12T14:47:24.663Z + 2026-01-12T17:04:17.862Z https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html - 2026-01-12T14:47:24.212Z + 2026-01-12T17:04:17.476Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html - 2026-01-12T14:47:24.136Z + 2026-01-12T17:04:17.411Z https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html - 2026-01-12T14:47:24.552Z + 2026-01-12T17:04:17.771Z https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html - 2026-01-12T14:47:25.147Z + 2026-01-12T17:04:18.286Z https://docs.axolotl.ai/docs/api/core.trainers.trl.html - 2026-01-12T14:47:23.923Z + 2026-01-12T17:04:17.225Z https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html - 2026-01-12T14:47:24.198Z + 2026-01-12T17:04:17.463Z https://docs.axolotl.ai/docs/api/loaders.constants.html - 2026-01-12T14:47:24.024Z + 2026-01-12T17:04:17.313Z https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html - 2026-01-12T14:47:24.581Z + 2026-01-12T17:04:17.793Z https://docs.axolotl.ai/docs/api/cli.vllm_serve.html - 2026-01-12T14:47:23.819Z + 2026-01-12T17:04:17.135Z https://docs.axolotl.ai/docs/api/prompt_tokenizers.html - 2026-01-12T14:47:23.519Z + 2026-01-12T17:04:16.871Z https://docs.axolotl.ai/docs/api/cli.args.html - 2026-01-12T14:47:23.707Z + 2026-01-12T17:04:17.037Z https://docs.axolotl.ai/docs/api/cli.inference.html - 2026-01-12T14:47:23.767Z + 2026-01-12T17:04:17.089Z https://docs.axolotl.ai/docs/api/cli.utils.load.html - 2026-01-12T14:47:23.863Z + 2026-01-12T17:04:17.172Z https://docs.axolotl.ai/docs/api/cli.preprocess.html - 2026-01-12T14:47:23.804Z + 2026-01-12T17:04:17.121Z https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html - 2026-01-12T14:47:25.249Z + 2026-01-12T17:04:18.375Z https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html - 2026-01-12T14:47:25.244Z + 2026-01-12T17:04:18.371Z https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html - 2026-01-12T14:47:23.598Z + 2026-01-12T17:04:16.942Z https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html - 2026-01-12T14:47:25.099Z + 2026-01-12T17:04:18.245Z https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html - 2026-01-12T14:47:25.109Z + 2026-01-12T17:04:18.253Z https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html - 2026-01-12T14:47:24.568Z + 2026-01-12T17:04:17.783Z https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html - 2026-01-12T14:47:23.600Z + 2026-01-12T17:04:16.943Z https://docs.axolotl.ai/docs/models/gemma3n.html - 2026-01-12T14:47:43.651Z + 2026-01-12T17:04:34.189Z https://docs.axolotl.ai/docs/models/qwen3-next.html - 2026-01-12T14:47:43.651Z + 2026-01-12T17:04:34.189Z https://docs.axolotl.ai/docs/models/index.html - 2026-01-12T14:47:43.656Z + 2026-01-12T17:04:34.192Z https://docs.axolotl.ai/docs/models/magistral/think.html - 2026-01-12T14:47:43.648Z + 2026-01-12T17:04:34.186Z https://docs.axolotl.ai/docs/models/kimi-linear.html - 2026-01-12T14:47:43.643Z + 2026-01-12T17:04:34.183Z https://docs.axolotl.ai/docs/models/internvl3_5.html - 2026-01-12T14:47:43.644Z + 2026-01-12T17:04:34.184Z https://docs.axolotl.ai/docs/models/arcee.html - 2026-01-12T14:47:43.645Z + 2026-01-12T17:04:34.184Z https://docs.axolotl.ai/docs/models/LiquidAI.html - 2026-01-12T14:47:43.655Z + 2026-01-12T17:04:34.191Z https://docs.axolotl.ai/docs/models/magistral.html - 2026-01-12T14:47:43.647Z + 2026-01-12T17:04:34.186Z https://docs.axolotl.ai/docs/models/voxtral.html - 2026-01-12T14:47:43.649Z + 2026-01-12T17:04:34.187Z https://docs.axolotl.ai/docs/models/trinity.html - 2026-01-12T14:47:43.645Z + 2026-01-12T17:04:34.184Z https://docs.axolotl.ai/docs/models/ministral.html - 2026-01-12T14:47:43.648Z + 2026-01-12T17:04:34.187Z https://docs.axolotl.ai/docs/models/llama-4.html - 2026-01-12T14:47:43.650Z + 2026-01-12T17:04:34.188Z https://docs.axolotl.ai/docs/models/devstral.html - 2026-01-12T14:47:43.649Z + 2026-01-12T17:04:34.188Z https://docs.axolotl.ai/docs/models/ministral3.html - 2026-01-12T14:47:43.646Z + 2026-01-12T17:04:34.185Z https://docs.axolotl.ai/docs/models/ministral3/vision.html - 2026-01-12T14:47:43.647Z + 2026-01-12T17:04:34.185Z https://docs.axolotl.ai/docs/models/plano.html - 2026-01-12T14:47:43.643Z + 2026-01-12T17:04:34.183Z https://docs.axolotl.ai/docs/reward_modelling.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/quantize.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/fsdp_qlora.html - 2026-01-12T14:43:41.811Z + 2026-01-12T17:00:36.410Z https://docs.axolotl.ai/docs/nd_parallelism.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/batch_vs_grad.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/multi-node.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/rlhf.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/dataset-formats/pretraining.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/dataset-formats/tokenized.html - 2026-01-12T14:43:41.811Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/dataset-formats/template_free.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/multi-gpu.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.412Z https://docs.axolotl.ai/docs/input_output.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.412Z https://docs.axolotl.ai/docs/docker.html - 2026-01-12T14:43:41.811Z + 2026-01-12T17:00:36.410Z https://docs.axolotl.ai/docs/checkpoint_saving.html - 2026-01-12T14:43:41.810Z + 2026-01-12T17:00:36.409Z https://docs.axolotl.ai/docs/multipack.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/qat.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/lr_groups.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.412Z https://docs.axolotl.ai/docs/getting-started.html - 2026-01-12T14:43:41.811Z + 2026-01-12T17:00:36.410Z https://docs.axolotl.ai/docs/nccl.html - 2026-01-12T14:43:41.814Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/telemetry.html - 2026-01-12T14:43:41.815Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/docs/unsloth.html - 2026-01-12T14:43:41.815Z + 2026-01-12T17:00:36.413Z https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html - 2026-01-12T14:43:41.838Z + 2026-01-12T17:00:36.431Z