From f9e101605fe51aa6230c6c5a942a6022d77a041d Mon Sep 17 00:00:00 2001 From: Quarto GHA Workflow Runner Date: Mon, 10 Nov 2025 14:43:48 +0000 Subject: [PATCH] Built site for gh-pages --- .nojekyll | 2 +- docs/custom_integrations.html | 4 +- search.json | 2 +- sitemap.xml | 398 +++++++++++++++++----------------- 4 files changed, 204 insertions(+), 202 deletions(-) diff --git a/.nojekyll b/.nojekyll index 9369fc83b..22f7b7aed 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -e3c99217 \ No newline at end of file +7964ed8f \ No newline at end of file diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html index d4c8ec3e6..5c7c6224d 100644 --- a/docs/custom_integrations.html +++ b/docs/custom_integrations.html @@ -1022,7 +1022,9 @@ sparse model before inference for even greater performance benefits.:

liger_rms_norm: true liger_glu_activation: true liger_layer_norm: true -liger_fused_linear_cross_entropy: true +liger_fused_linear_cross_entropy: true + +liger_use_token_scaling: true

Supported Models

diff --git a/search.json b/search.json index 50fda5f5f..93f35ae93 100644 --- a/search.json +++ b/search.json @@ -2367,7 +2367,7 @@ "href": "docs/custom_integrations.html#liger-kernels", "title": "Custom Integrations", "section": "Liger Kernels", - "text": "Liger Kernels\nLiger Kernel provides efficient Triton kernels for LLM training, offering:\n\n20% increase in multi-GPU training throughput\n60% reduction in memory usage\nCompatibility with both FSDP and DeepSpeed\n\nSee https://github.com/linkedin/Liger-Kernel\n\nUsage\nplugins:\n - axolotl.integrations.liger.LigerPlugin\nliger_rope: true\nliger_rms_norm: true\nliger_glu_activation: true\nliger_layer_norm: true\nliger_fused_linear_cross_entropy: true\n\n\nSupported Models\n\ndeepseek_v2\ngemma\ngemma2\ngemma3\ngranite\njamba\nllama\nmistral\nmixtral\nmllama\nmllama_text_model\nolmo2\npaligemma\nphi3\nqwen2\nqwen2_5_vl\nqwen2_vl\n\n\n\nCitation\n@article{hsu2024ligerkernelefficienttriton,\n title={Liger Kernel: Efficient Triton Kernels for LLM Training},\n author={Pin-Lun Hsu and Yun Dai and Vignesh Kothapalli and Qingquan Song and Shao Tang and Siyu Zhu and Steven Shimizu and Shivam Sahni and Haowen Ning and Yanning Chen},\n year={2024},\n eprint={2410.10989},\n archivePrefix={arXiv},\n primaryClass={cs.LG},\n url={https://arxiv.org/abs/2410.10989},\n journal={arXiv preprint arXiv:2410.10989},\n}\nPlease see reference here", + "text": "Liger Kernels\nLiger Kernel provides efficient Triton kernels for LLM training, offering:\n\n20% increase in multi-GPU training throughput\n60% reduction in memory usage\nCompatibility with both FSDP and DeepSpeed\n\nSee https://github.com/linkedin/Liger-Kernel\n\nUsage\nplugins:\n - axolotl.integrations.liger.LigerPlugin\nliger_rope: true\nliger_rms_norm: true\nliger_glu_activation: true\nliger_layer_norm: true\nliger_fused_linear_cross_entropy: true\n\nliger_use_token_scaling: true\n\n\nSupported Models\n\ndeepseek_v2\ngemma\ngemma2\ngemma3\ngranite\njamba\nllama\nmistral\nmixtral\nmllama\nmllama_text_model\nolmo2\npaligemma\nphi3\nqwen2\nqwen2_5_vl\nqwen2_vl\n\n\n\nCitation\n@article{hsu2024ligerkernelefficienttriton,\n title={Liger Kernel: Efficient Triton Kernels for LLM Training},\n author={Pin-Lun Hsu and Yun Dai and Vignesh Kothapalli and Qingquan Song and Shao Tang and Siyu Zhu and Steven Shimizu and Shivam Sahni and Haowen Ning and Yanning Chen},\n year={2024},\n eprint={2410.10989},\n archivePrefix={arXiv},\n primaryClass={cs.LG},\n url={https://arxiv.org/abs/2410.10989},\n journal={arXiv preprint arXiv:2410.10989},\n}\nPlease see reference here", "crumbs": [ "Advanced Features", "Custom Integrations" diff --git a/sitemap.xml b/sitemap.xml index 3f652e50c..d073ca984 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,798 +2,798 @@ https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html - 2025-11-07T21:04:09.847Z + 2025-11-10T14:37:58.867Z https://docs.axolotl.ai/docs/mac.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/cli.html - 2025-11-07T21:04:09.820Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/nccl.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/getting-started.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.842Z https://docs.axolotl.ai/docs/lr_groups.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/qat.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/multipack.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/streaming.html - 2025-11-07T21:04:09.825Z + 2025-11-10T14:37:58.846Z https://docs.axolotl.ai/docs/lora_optims.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.844Z https://docs.axolotl.ai/docs/amd_hpc.html - 2025-11-07T21:04:09.820Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/debugging.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.842Z https://docs.axolotl.ai/docs/dataset-formats/conversation.html - 2025-11-07T21:04:09.820Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/dataset-formats/index.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/config-reference.html - 2025-11-07T21:09:23.654Z + 2025-11-10T14:41:46.431Z https://docs.axolotl.ai/docs/multimodal.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/ray-integration.html - 2025-11-07T21:04:09.825Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/faq.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.842Z https://docs.axolotl.ai/docs/dataset_preprocessing.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/torchao.html - 2025-11-07T21:04:09.825Z + 2025-11-10T14:37:58.846Z https://docs.axolotl.ai/docs/optimizers.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/api/utils.schedulers.html - 2025-11-07T21:09:08.707Z + 2025-11-10T14:41:31.364Z https://docs.axolotl.ai/docs/api/cli.utils.sweeps.html - 2025-11-07T21:09:07.915Z + 2025-11-10T14:41:30.584Z https://docs.axolotl.ai/docs/api/datasets.html - 2025-11-07T21:09:07.514Z + 2025-11-10T14:41:30.185Z https://docs.axolotl.ai/docs/api/utils.tokenization.html - 2025-11-07T21:09:08.625Z + 2025-11-10T14:41:31.283Z https://docs.axolotl.ai/docs/api/loaders.tokenizer.html - 2025-11-07T21:09:08.033Z + 2025-11-10T14:41:30.699Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html - 2025-11-07T21:09:08.499Z + 2025-11-10T14:41:31.159Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html - 2025-11-07T21:09:08.584Z + 2025-11-10T14:41:31.243Z https://docs.axolotl.ai/docs/api/utils.data.sft.html - 2025-11-07T21:09:08.756Z + 2025-11-10T14:41:31.413Z https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html - 2025-11-07T21:09:08.566Z + 2025-11-10T14:41:31.225Z https://docs.axolotl.ai/docs/api/loaders.patch_manager.html - 2025-11-07T21:09:08.054Z + 2025-11-10T14:41:30.719Z https://docs.axolotl.ai/docs/api/integrations.liger.args.html - 2025-11-07T21:09:09.076Z + 2025-11-10T14:41:31.729Z https://docs.axolotl.ai/docs/api/utils.schemas.peft.html - 2025-11-07T21:09:08.845Z + 2025-11-10T14:41:31.501Z https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html - 2025-11-07T21:09:08.244Z + 2025-11-10T14:41:30.908Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html - 2025-11-07T21:09:08.163Z + 2025-11-10T14:41:30.828Z https://docs.axolotl.ai/docs/api/cli.cloud.base.html - 2025-11-07T21:09:07.871Z + 2025-11-10T14:41:30.540Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html - 2025-11-07T21:09:08.616Z + 2025-11-10T14:41:31.275Z https://docs.axolotl.ai/docs/api/kernels.swiglu.html - 2025-11-07T21:09:08.470Z + 2025-11-10T14:41:31.131Z https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html - 2025-11-07T21:09:09.061Z + 2025-11-10T14:41:31.714Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html - 2025-11-07T21:09:08.310Z + 2025-11-10T14:41:30.973Z https://docs.axolotl.ai/docs/api/monkeypatch.utils.html - 2025-11-07T21:09:08.543Z + 2025-11-10T14:41:31.203Z https://docs.axolotl.ai/docs/api/core.builders.rl.html - 2025-11-07T21:09:07.613Z + 2025-11-10T14:41:30.282Z https://docs.axolotl.ai/docs/api/loaders.processor.html - 2025-11-07T21:09:08.035Z + 2025-11-10T14:41:30.701Z https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html - 2025-11-07T21:09:09.206Z + 2025-11-10T14:41:31.857Z https://docs.axolotl.ai/docs/api/core.training_args.html - 2025-11-07T21:09:07.629Z + 2025-11-10T14:41:30.298Z https://docs.axolotl.ai/docs/api/loaders.adapter.html - 2025-11-07T21:09:08.042Z + 2025-11-10T14:41:30.707Z https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html - 2025-11-07T21:09:07.843Z + 2025-11-10T14:41:30.512Z https://docs.axolotl.ai/docs/api/cli.train.html - 2025-11-07T21:09:07.728Z + 2025-11-10T14:41:30.398Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html - 2025-11-07T21:09:08.066Z + 2025-11-10T14:41:30.732Z https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html - 2025-11-07T21:09:08.211Z + 2025-11-10T14:41:30.875Z https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html - 2025-11-07T21:09:08.224Z + 2025-11-10T14:41:30.888Z https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html - 2025-11-07T21:09:08.533Z + 2025-11-10T14:41:31.193Z https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html - 2025-11-07T21:09:08.250Z + 2025-11-10T14:41:30.913Z https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html - 2025-11-07T21:09:08.188Z + 2025-11-10T14:41:30.852Z https://docs.axolotl.ai/docs/api/core.chat.messages.html - 2025-11-07T21:09:07.657Z + 2025-11-10T14:41:30.327Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html - 2025-11-07T21:09:08.075Z + 2025-11-10T14:41:30.740Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html - 2025-11-07T21:09:08.286Z + 2025-11-10T14:41:30.950Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html - 2025-11-07T21:09:08.298Z + 2025-11-10T14:41:30.962Z https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html - 2025-11-07T21:09:08.873Z + 2025-11-10T14:41:31.528Z https://docs.axolotl.ai/docs/api/convert.html - 2025-11-07T21:09:07.530Z + 2025-11-10T14:41:30.201Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html - 2025-11-07T21:09:08.288Z + 2025-11-10T14:41:30.952Z https://docs.axolotl.ai/docs/api/utils.schemas.config.html - 2025-11-07T21:09:08.796Z + 2025-11-10T14:41:31.452Z https://docs.axolotl.ai/docs/api/utils.schemas.enums.html - 2025-11-07T21:09:08.884Z + 2025-11-10T14:41:31.539Z https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html - 2025-11-07T21:09:08.545Z + 2025-11-10T14:41:31.205Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html - 2025-11-07T21:09:08.258Z + 2025-11-10T14:41:30.921Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html - 2025-11-07T21:09:07.993Z + 2025-11-10T14:41:30.661Z https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html - 2025-11-07T21:09:09.080Z + 2025-11-10T14:41:31.733Z https://docs.axolotl.ai/docs/api/utils.collators.core.html - 2025-11-07T21:09:09.109Z + 2025-11-10T14:41:31.762Z https://docs.axolotl.ai/docs/api/core.chat.format.shared.html - 2025-11-07T21:09:07.662Z + 2025-11-10T14:41:30.332Z https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html - 2025-11-07T21:09:08.335Z + 2025-11-10T14:41:30.998Z https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html - 2025-11-07T21:09:09.191Z + 2025-11-10T14:41:31.843Z https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html - 2025-11-07T21:09:09.223Z + 2025-11-10T14:41:31.874Z https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html - 2025-11-07T21:09:08.145Z + 2025-11-10T14:41:30.810Z https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html - 2025-11-07T21:09:08.856Z + 2025-11-10T14:41:31.511Z https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html - 2025-11-07T21:09:09.214Z + 2025-11-10T14:41:31.866Z https://docs.axolotl.ai/docs/api/prompt_strategies.base.html - 2025-11-07T21:09:08.105Z + 2025-11-10T14:41:30.770Z https://docs.axolotl.ai/docs/api/kernels.utils.html - 2025-11-07T21:09:08.481Z + 2025-11-10T14:41:31.141Z https://docs.axolotl.ai/docs/api/cli.merge_lora.html - 2025-11-07T21:09:07.829Z + 2025-11-10T14:41:30.498Z https://docs.axolotl.ai/docs/api/cli.utils.html - 2025-11-07T21:09:07.881Z + 2025-11-10T14:41:30.550Z https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html - 2025-11-07T21:09:08.103Z + 2025-11-10T14:41:30.768Z https://docs.axolotl.ai/docs/api/index.html - 2025-11-07T21:09:07.416Z + 2025-11-10T14:41:30.087Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html - 2025-11-07T21:09:08.270Z + 2025-11-10T14:41:30.934Z https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html - 2025-11-07T21:09:08.580Z + 2025-11-10T14:41:31.239Z https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html - 2025-11-07T21:09:08.236Z + 2025-11-10T14:41:30.900Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html - 2025-11-07T21:09:08.008Z + 2025-11-10T14:41:30.675Z https://docs.axolotl.ai/docs/api/utils.lora.html - 2025-11-07T21:09:08.632Z + 2025-11-10T14:41:31.291Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html - 2025-11-07T21:09:08.062Z + 2025-11-10T14:41:30.728Z https://docs.axolotl.ai/docs/api/cli.config.html - 2025-11-07T21:09:07.795Z + 2025-11-10T14:41:30.465Z https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html - 2025-11-07T21:09:08.493Z + 2025-11-10T14:41:31.153Z https://docs.axolotl.ai/docs/api/utils.collators.batching.html - 2025-11-07T21:09:09.132Z + 2025-11-10T14:41:31.784Z https://docs.axolotl.ai/docs/api/utils.quantization.html - 2025-11-07T21:09:08.780Z + 2025-11-10T14:41:31.437Z https://docs.axolotl.ai/docs/api/utils.dict.html - 2025-11-07T21:09:08.738Z + 2025-11-10T14:41:31.395Z https://docs.axolotl.ai/docs/api/kernels.quantize.html - 2025-11-07T21:09:08.479Z + 2025-11-10T14:41:31.139Z https://docs.axolotl.ai/docs/api/utils.schemas.training.html - 2025-11-07T21:09:08.813Z + 2025-11-10T14:41:31.469Z https://docs.axolotl.ai/docs/api/train.html - 2025-11-07T21:09:07.494Z + 2025-11-10T14:41:30.165Z https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html - 2025-11-07T21:09:07.678Z + 2025-11-10T14:41:30.348Z https://docs.axolotl.ai/docs/inference.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.844Z https://docs.axolotl.ai/FAQS.html - 2025-11-07T21:04:09.819Z + 2025-11-10T14:37:58.839Z https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html - 2025-11-07T21:04:09.829Z + 2025-11-10T14:37:58.850Z https://docs.axolotl.ai/index.html - 2025-11-07T21:04:09.842Z + 2025-11-10T14:37:58.862Z https://docs.axolotl.ai/docs/custom_integrations.html - 2025-11-07T21:04:09.820Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/api/utils.schemas.utils.html - 2025-11-07T21:09:08.890Z + 2025-11-10T14:41:31.545Z https://docs.axolotl.ai/docs/api/kernels.geglu.html - 2025-11-07T21:09:08.458Z + 2025-11-10T14:41:31.119Z https://docs.axolotl.ai/docs/api/core.builders.causal.html - 2025-11-07T21:09:07.608Z + 2025-11-10T14:41:30.277Z https://docs.axolotl.ai/docs/api/core.trainers.mamba.html - 2025-11-07T21:09:07.972Z + 2025-11-10T14:41:30.640Z https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html - 2025-11-07T21:09:08.339Z + 2025-11-10T14:41:31.002Z https://docs.axolotl.ai/docs/api/core.datasets.chat.html - 2025-11-07T21:09:07.668Z + 2025-11-10T14:41:30.338Z https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html - 2025-11-07T21:09:09.142Z + 2025-11-10T14:41:31.794Z https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html - 2025-11-07T21:09:08.203Z + 2025-11-10T14:41:30.868Z https://docs.axolotl.ai/docs/api/common.const.html - 2025-11-07T21:09:09.088Z + 2025-11-10T14:41:31.741Z https://docs.axolotl.ai/docs/api/cli.quantize.html - 2025-11-07T21:09:07.859Z + 2025-11-10T14:41:30.528Z https://docs.axolotl.ai/docs/api/utils.trainer.html - 2025-11-07T21:09:08.674Z + 2025-11-10T14:41:31.332Z https://docs.axolotl.ai/docs/api/cli.delinearize_llama4.html - 2025-11-07T21:09:07.801Z + 2025-11-10T14:41:30.471Z https://docs.axolotl.ai/docs/api/evaluate.html - 2025-11-07T21:09:07.506Z + 2025-11-10T14:41:30.177Z https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html - 2025-11-07T21:09:08.491Z + 2025-11-10T14:41:31.151Z https://docs.axolotl.ai/docs/api/loaders.model.html - 2025-11-07T21:09:08.023Z + 2025-11-10T14:41:30.689Z https://docs.axolotl.ai/docs/api/utils.distributed.html - 2025-11-07T21:09:08.731Z + 2025-11-10T14:41:31.389Z https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html - 2025-11-07T21:09:08.639Z + 2025-11-10T14:41:31.298Z https://docs.axolotl.ai/docs/api/kernels.lora.html - 2025-11-07T21:09:08.445Z + 2025-11-10T14:41:31.106Z https://docs.axolotl.ai/docs/api/cli.main.html - 2025-11-07T21:09:07.718Z + 2025-11-10T14:41:30.388Z https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html - 2025-11-07T21:09:09.084Z + 2025-11-10T14:41:31.737Z https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html - 2025-11-07T21:09:08.747Z + 2025-11-10T14:41:31.404Z https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html - 2025-11-07T21:09:07.879Z + 2025-11-10T14:41:30.548Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html - 2025-11-07T21:09:08.488Z + 2025-11-10T14:41:31.148Z https://docs.axolotl.ai/docs/api/core.builders.base.html - 2025-11-07T21:09:07.602Z + 2025-11-10T14:41:30.271Z https://docs.axolotl.ai/docs/api/utils.schemas.trl.html - 2025-11-07T21:09:08.849Z + 2025-11-10T14:41:31.505Z https://docs.axolotl.ai/docs/api/cli.utils.args.html - 2025-11-07T21:09:07.895Z + 2025-11-10T14:41:30.564Z https://docs.axolotl.ai/docs/api/core.trainers.base.html - 2025-11-07T21:09:07.947Z + 2025-11-10T14:41:30.615Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html - 2025-11-07T21:09:08.547Z + 2025-11-10T14:41:31.206Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html - 2025-11-07T21:09:08.489Z + 2025-11-10T14:41:31.150Z https://docs.axolotl.ai/docs/api/utils.schemas.model.html - 2025-11-07T21:09:08.804Z + 2025-11-10T14:41:31.460Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html - 2025-11-07T21:09:08.308Z + 2025-11-10T14:41:30.971Z https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html - 2025-11-07T21:09:09.210Z + 2025-11-10T14:41:31.862Z https://docs.axolotl.ai/docs/api/common.datasets.html - 2025-11-07T21:09:09.106Z + 2025-11-10T14:41:31.759Z https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html - 2025-11-07T21:09:08.835Z + 2025-11-10T14:41:31.490Z https://docs.axolotl.ai/docs/api/cli.utils.fetch.html - 2025-11-07T21:09:07.902Z + 2025-11-10T14:41:30.570Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html - 2025-11-07T21:09:08.283Z + 2025-11-10T14:41:30.946Z https://docs.axolotl.ai/docs/api/monkeypatch.relora.html - 2025-11-07T21:09:08.497Z + 2025-11-10T14:41:31.158Z https://docs.axolotl.ai/docs/api/cli.evaluate.html - 2025-11-07T21:09:07.738Z + 2025-11-10T14:41:30.408Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html - 2025-11-07T21:09:08.285Z + 2025-11-10T14:41:30.948Z https://docs.axolotl.ai/docs/api/core.trainers.utils.html - 2025-11-07T21:09:08.010Z + 2025-11-10T14:41:30.677Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html - 2025-11-07T21:09:08.178Z + 2025-11-10T14:41:30.842Z https://docs.axolotl.ai/docs/api/utils.chat_templates.html - 2025-11-07T21:09:08.626Z + 2025-11-10T14:41:31.285Z https://docs.axolotl.ai/docs/api/utils.data.streaming.html - 2025-11-07T21:09:08.749Z + 2025-11-10T14:41:31.406Z https://docs.axolotl.ai/docs/api/utils.bench.html - 2025-11-07T21:09:08.643Z + 2025-11-10T14:41:31.302Z https://docs.axolotl.ai/docs/api/common.architectures.html - 2025-11-07T21:09:09.086Z + 2025-11-10T14:41:31.739Z https://docs.axolotl.ai/docs/api/cli.checks.html - 2025-11-07T21:09:07.774Z + 2025-11-10T14:41:30.444Z https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html - 2025-11-07T21:09:07.980Z + 2025-11-10T14:41:30.648Z https://docs.axolotl.ai/docs/api/integrations.base.html - 2025-11-07T21:09:09.057Z + 2025-11-10T14:41:31.710Z https://docs.axolotl.ai/docs/api/cli.utils.train.html - 2025-11-07T21:09:07.930Z + 2025-11-10T14:41:30.598Z https://docs.axolotl.ai/docs/api/utils.collators.mamba.html - 2025-11-07T21:09:09.136Z + 2025-11-10T14:41:31.789Z https://docs.axolotl.ai/docs/api/cli.art.html - 2025-11-07T21:09:07.766Z + 2025-11-10T14:41:30.436Z https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html - 2025-11-07T21:09:08.558Z + 2025-11-10T14:41:31.217Z https://docs.axolotl.ai/docs/api/logging_config.html - 2025-11-07T21:09:07.594Z + 2025-11-10T14:41:30.263Z https://docs.axolotl.ai/docs/api/utils.freeze.html - 2025-11-07T21:09:08.653Z + 2025-11-10T14:41:31.311Z https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html - 2025-11-07T21:09:08.232Z + 2025-11-10T14:41:30.896Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html - 2025-11-07T21:09:08.162Z + 2025-11-10T14:41:30.826Z https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html - 2025-11-07T21:09:08.554Z + 2025-11-10T14:41:31.213Z https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html - 2025-11-07T21:09:09.107Z + 2025-11-10T14:41:31.760Z https://docs.axolotl.ai/docs/api/core.trainers.trl.html - 2025-11-07T21:09:07.965Z + 2025-11-10T14:41:30.633Z https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html - 2025-11-07T21:09:08.218Z + 2025-11-10T14:41:30.882Z https://docs.axolotl.ai/docs/api/loaders.constants.html - 2025-11-07T21:09:08.056Z + 2025-11-10T14:41:30.721Z https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html - 2025-11-07T21:09:08.579Z + 2025-11-10T14:41:31.238Z https://docs.axolotl.ai/docs/api/cli.vllm_serve.html - 2025-11-07T21:09:07.867Z + 2025-11-10T14:41:30.536Z https://docs.axolotl.ai/docs/api/prompt_tokenizers.html - 2025-11-07T21:09:07.583Z + 2025-11-10T14:41:30.251Z https://docs.axolotl.ai/docs/api/cli.args.html - 2025-11-07T21:09:07.762Z + 2025-11-10T14:41:30.432Z https://docs.axolotl.ai/docs/api/cli.inference.html - 2025-11-07T21:09:07.819Z + 2025-11-10T14:41:30.488Z https://docs.axolotl.ai/docs/api/cli.utils.load.html - 2025-11-07T21:09:07.908Z + 2025-11-10T14:41:30.577Z https://docs.axolotl.ai/docs/api/cli.preprocess.html - 2025-11-07T21:09:07.853Z + 2025-11-10T14:41:30.522Z https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html - 2025-11-07T21:09:09.204Z + 2025-11-10T14:41:31.855Z https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html - 2025-11-07T21:09:09.199Z + 2025-11-10T14:41:31.851Z https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html - 2025-11-07T21:09:07.659Z + 2025-11-10T14:41:30.328Z https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html - 2025-11-07T21:09:09.063Z + 2025-11-10T14:41:31.715Z https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html - 2025-11-07T21:09:09.072Z + 2025-11-10T14:41:31.725Z https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html - 2025-11-07T21:09:08.568Z + 2025-11-10T14:41:31.227Z https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html - 2025-11-07T21:09:07.661Z + 2025-11-10T14:41:30.330Z https://docs.axolotl.ai/docs/reward_modelling.html - 2025-11-07T21:04:09.825Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/quantize.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/fsdp_qlora.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.842Z https://docs.axolotl.ai/docs/nd_parallelism.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/batch_vs_grad.html - 2025-11-07T21:04:09.820Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/multi-node.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/rlhf.html - 2025-11-07T21:04:09.825Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/dataset-formats/pretraining.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/dataset-formats/tokenized.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/dataset-formats/template_free.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/multi-gpu.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/input_output.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.844Z https://docs.axolotl.ai/docs/docker.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.842Z https://docs.axolotl.ai/docs/gradient_checkpointing.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.842Z https://docs.axolotl.ai/docs/optimizations.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/sequence_parallelism.html - 2025-11-07T21:04:09.825Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/dataset_loading.html - 2025-11-07T21:04:09.821Z + 2025-11-10T14:37:58.841Z https://docs.axolotl.ai/docs/installation.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.844Z https://docs.axolotl.ai/docs/mixed_precision.html - 2025-11-07T21:04:09.824Z + 2025-11-10T14:37:58.845Z https://docs.axolotl.ai/docs/unsloth.html - 2025-11-07T21:04:09.825Z + 2025-11-10T14:37:58.846Z https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html - 2025-11-07T21:04:09.847Z + 2025-11-10T14:37:58.867Z