From 9fc08a1f2d67381354d07e816e1fd9d1cfcca704 Mon Sep 17 00:00:00 2001 From: Quarto GHA Workflow Runner Date: Tue, 3 Jun 2025 19:33:03 +0000 Subject: [PATCH] Built site for gh-pages --- .nojekyll | 2 +- docs/rlhf.html | 1 + search.json | 4 +- sitemap.xml | 380 ++++++++++++++++++++++++------------------------- 4 files changed, 194 insertions(+), 193 deletions(-) diff --git a/.nojekyll b/.nojekyll index b9a1fddc1..8a4672223 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -8a186fbf \ No newline at end of file +4ea7ed03 \ No newline at end of file diff --git a/docs/rlhf.html b/docs/rlhf.html index f82c78e54..f0f0c8360 100644 --- a/docs/rlhf.html +++ b/docs/rlhf.html @@ -556,6 +556,7 @@ feedback. Various methods include, but not limited to:

  • Identity Preference Optimization (IPO)
  • Kahneman-Tversky Optimization (KTO)
  • Odds Ratio Preference Optimization (ORPO)
  • +
  • Group Relative Policy Optimization (GRPO)
  • Proximal Policy Optimization (PPO) (not yet supported in axolotl, if you’re interested in contributing, please reach out!)
  • diff --git a/search.json b/search.json index 97ad2a8b8..e301e7fcd 100644 --- a/search.json +++ b/search.json @@ -155,7 +155,7 @@ "href": "docs/rlhf.html", "title": "RLHF (Beta)", "section": "", - "text": "Reinforcement Learning from Human Feedback is a method whereby a language model is optimized from data using human\nfeedback. Various methods include, but not limited to:\n\nDirect Preference Optimization (DPO)\nIdentity Preference Optimization (IPO)\nKahneman-Tversky Optimization (KTO)\nOdds Ratio Preference Optimization (ORPO)\nProximal Policy Optimization (PPO) (not yet supported in axolotl, if you’re interested in contributing, please reach out!)", + "text": "Reinforcement Learning from Human Feedback is a method whereby a language model is optimized from data using human\nfeedback. Various methods include, but not limited to:\n\nDirect Preference Optimization (DPO)\nIdentity Preference Optimization (IPO)\nKahneman-Tversky Optimization (KTO)\nOdds Ratio Preference Optimization (ORPO)\nGroup Relative Policy Optimization (GRPO)\nProximal Policy Optimization (PPO) (not yet supported in axolotl, if you’re interested in contributing, please reach out!)", "crumbs": [ "How To Guides", "RLHF (Beta)" @@ -166,7 +166,7 @@ "href": "docs/rlhf.html#overview", "title": "RLHF (Beta)", "section": "", - "text": "Reinforcement Learning from Human Feedback is a method whereby a language model is optimized from data using human\nfeedback. Various methods include, but not limited to:\n\nDirect Preference Optimization (DPO)\nIdentity Preference Optimization (IPO)\nKahneman-Tversky Optimization (KTO)\nOdds Ratio Preference Optimization (ORPO)\nProximal Policy Optimization (PPO) (not yet supported in axolotl, if you’re interested in contributing, please reach out!)", + "text": "Reinforcement Learning from Human Feedback is a method whereby a language model is optimized from data using human\nfeedback. Various methods include, but not limited to:\n\nDirect Preference Optimization (DPO)\nIdentity Preference Optimization (IPO)\nKahneman-Tversky Optimization (KTO)\nOdds Ratio Preference Optimization (ORPO)\nGroup Relative Policy Optimization (GRPO)\nProximal Policy Optimization (PPO) (not yet supported in axolotl, if you’re interested in contributing, please reach out!)", "crumbs": [ "How To Guides", "RLHF (Beta)" diff --git a/sitemap.xml b/sitemap.xml index e0f66241c..10c86af9e 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,762 +2,762 @@ https://docs.axolotl.ai/FAQS.html - 2025-06-02T22:54:37.550Z + 2025-06-03T19:30:48.979Z https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html - 2025-06-02T22:54:37.572Z + 2025-06-03T19:30:49.002Z https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html - 2025-06-02T22:54:37.557Z + 2025-06-03T19:30:48.986Z https://docs.axolotl.ai/docs/lr_groups.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/lora_optims.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/rlhf.html - 2025-06-02T22:54:37.556Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/qat.html - 2025-06-02T22:54:37.556Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/fsdp_qlora.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.982Z https://docs.axolotl.ai/docs/custom_integrations.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/dataset-formats/pretraining.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/dataset-formats/template_free.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/dataset-formats/conversation.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/dataset-formats/tokenized.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/multipack.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/mac.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/input_output.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.984Z https://docs.axolotl.ai/docs/quantize.html - 2025-06-02T22:54:37.556Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/cli.html - 2025-06-02T22:54:37.551Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/multi-node.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/nccl.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/api/utils.data.sft.html - 2025-06-02T22:55:12.740Z + 2025-06-03T19:31:21.155Z https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html - 2025-06-02T22:55:11.853Z + 2025-06-03T19:31:20.272Z https://docs.axolotl.ai/docs/api/evaluate.html - 2025-06-02T22:55:11.632Z + 2025-06-03T19:31:20.053Z https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html - 2025-06-02T22:55:12.596Z + 2025-06-03T19:31:21.013Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html - 2025-06-02T22:55:12.238Z + 2025-06-03T19:31:20.657Z https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html - 2025-06-02T22:55:12.991Z + 2025-06-03T19:31:21.405Z https://docs.axolotl.ai/docs/api/core.builders.rl.html - 2025-06-02T22:55:11.723Z + 2025-06-03T19:31:20.143Z https://docs.axolotl.ai/docs/api/common.const.html - 2025-06-02T22:55:12.994Z + 2025-06-03T19:31:21.408Z https://docs.axolotl.ai/docs/api/kernels.geglu.html - 2025-06-02T22:55:12.461Z + 2025-06-03T19:31:20.879Z https://docs.axolotl.ai/docs/api/index.html - 2025-06-02T22:55:11.560Z + 2025-06-03T19:31:19.981Z https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html - 2025-06-02T22:55:12.972Z + 2025-06-03T19:31:21.386Z https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html - 2025-06-02T22:55:12.246Z + 2025-06-03T19:31:20.665Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html - 2025-06-02T22:55:12.168Z + 2025-06-03T19:31:20.587Z https://docs.axolotl.ai/docs/api/core.datasets.chat.html - 2025-06-02T22:55:11.845Z + 2025-06-03T19:31:20.264Z https://docs.axolotl.ai/docs/api/train.html - 2025-06-02T22:55:11.622Z + 2025-06-03T19:31:20.042Z https://docs.axolotl.ai/docs/api/cli.preprocess.html - 2025-06-02T22:55:11.989Z + 2025-06-03T19:31:20.408Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html - 2025-06-02T22:55:12.321Z + 2025-06-03T19:31:20.740Z https://docs.axolotl.ai/docs/api/core.training_args.html - 2025-06-02T22:55:11.812Z + 2025-06-03T19:31:20.231Z https://docs.axolotl.ai/docs/api/datasets.html - 2025-06-02T22:55:11.639Z + 2025-06-03T19:31:20.060Z https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html - 2025-06-02T22:55:13.012Z + 2025-06-03T19:31:21.426Z https://docs.axolotl.ai/docs/api/kernels.utils.html - 2025-06-02T22:55:12.480Z + 2025-06-03T19:31:20.899Z https://docs.axolotl.ai/docs/api/loaders.adapter.html - 2025-06-02T22:55:12.143Z + 2025-06-03T19:31:20.562Z https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html - 2025-06-02T22:55:11.837Z + 2025-06-03T19:31:20.256Z https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html - 2025-06-02T22:55:12.094Z + 2025-06-03T19:31:20.512Z https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html - 2025-06-02T22:55:12.042Z + 2025-06-03T19:31:20.460Z https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html - 2025-06-02T22:55:12.276Z + 2025-06-03T19:31:20.695Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html - 2025-06-02T22:55:12.324Z + 2025-06-03T19:31:20.743Z https://docs.axolotl.ai/docs/api/monkeypatch.relora.html - 2025-06-02T22:55:12.531Z + 2025-06-03T19:31:20.949Z https://docs.axolotl.ai/docs/api/kernels.swiglu.html - 2025-06-02T22:55:12.471Z + 2025-06-03T19:31:20.890Z https://docs.axolotl.ai/docs/api/cli.cloud.base.html - 2025-06-02T22:55:12.035Z + 2025-06-03T19:31:20.454Z https://docs.axolotl.ai/docs/api/common.datasets.html - 2025-06-02T22:55:13.011Z + 2025-06-03T19:31:21.425Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html - 2025-06-02T22:55:12.117Z + 2025-06-03T19:31:20.535Z https://docs.axolotl.ai/docs/api/cli.merge_lora.html - 2025-06-02T22:55:11.969Z + 2025-06-03T19:31:20.388Z https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html - 2025-06-02T22:55:12.653Z + 2025-06-03T19:31:21.069Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html - 2025-06-02T22:55:12.309Z + 2025-06-03T19:31:20.728Z https://docs.axolotl.ai/docs/api/integrations.liger.args.html - 2025-06-02T22:55:12.984Z + 2025-06-03T19:31:21.398Z https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html - 2025-06-02T22:55:13.091Z + 2025-06-03T19:31:21.508Z https://docs.axolotl.ai/docs/api/utils.chat_templates.html - 2025-06-02T22:55:12.642Z + 2025-06-03T19:31:21.059Z https://docs.axolotl.ai/docs/api/core.builders.base.html - 2025-06-02T22:55:11.711Z + 2025-06-03T19:31:20.131Z https://docs.axolotl.ai/docs/api/core.trainers.mamba.html - 2025-06-02T22:55:12.083Z + 2025-06-03T19:31:20.501Z https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html - 2025-06-02T22:55:12.363Z + 2025-06-03T19:31:20.781Z https://docs.axolotl.ai/docs/api/utils.data.pretraining.html - 2025-06-02T22:55:12.738Z + 2025-06-03T19:31:21.154Z https://docs.axolotl.ai/docs/api/utils.schemas.peft.html - 2025-06-02T22:55:12.811Z + 2025-06-03T19:31:21.226Z https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html - 2025-06-02T22:55:12.578Z + 2025-06-03T19:31:20.996Z https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html - 2025-06-02T22:55:12.211Z + 2025-06-03T19:31:20.630Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html - 2025-06-02T22:55:12.341Z + 2025-06-03T19:31:20.759Z https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html - 2025-06-02T22:55:12.568Z + 2025-06-03T19:31:20.985Z https://docs.axolotl.ai/docs/api/core.chat.format.shared.html - 2025-06-02T22:55:11.840Z + 2025-06-03T19:31:20.259Z https://docs.axolotl.ai/docs/api/logging_config.html - 2025-06-02T22:55:11.704Z + 2025-06-03T19:31:20.124Z https://docs.axolotl.ai/docs/api/cli.sweeps.html - 2025-06-02T22:55:11.995Z + 2025-06-03T19:31:20.414Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html - 2025-06-02T22:55:12.299Z + 2025-06-03T19:31:20.718Z https://docs.axolotl.ai/docs/api/prompt_tokenizers.html - 2025-06-02T22:55:11.695Z + 2025-06-03T19:31:20.115Z https://docs.axolotl.ai/docs/api/kernels.quantize.html - 2025-06-02T22:55:12.479Z + 2025-06-03T19:31:20.897Z https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html - 2025-06-02T22:55:13.096Z + 2025-06-03T19:31:21.513Z https://docs.axolotl.ai/docs/api/utils.schemas.trl.html - 2025-06-02T22:55:12.814Z + 2025-06-03T19:31:21.229Z https://docs.axolotl.ai/docs/api/utils.schemas.config.html - 2025-06-02T22:55:12.772Z + 2025-06-03T19:31:21.187Z https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html - 2025-06-02T22:55:12.586Z + 2025-06-03T19:31:21.004Z https://docs.axolotl.ai/docs/api/cli.checks.html - 2025-06-02T22:55:11.928Z + 2025-06-03T19:31:20.347Z https://docs.axolotl.ai/docs/api/core.chat.messages.html - 2025-06-02T22:55:11.835Z + 2025-06-03T19:31:20.255Z https://docs.axolotl.ai/docs/api/loaders.patch_manager.html - 2025-06-02T22:55:12.151Z + 2025-06-03T19:31:20.570Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html - 2025-06-02T22:55:12.532Z + 2025-06-03T19:31:20.950Z https://docs.axolotl.ai/docs/api/utils.schemas.utils.html - 2025-06-02T22:55:12.848Z + 2025-06-03T19:31:21.263Z https://docs.axolotl.ai/docs/api/integrations.base.html - 2025-06-02T22:55:12.968Z + 2025-06-03T19:31:21.382Z https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html - 2025-06-02T22:55:13.081Z + 2025-06-03T19:31:21.498Z https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html - 2025-06-02T22:55:12.265Z + 2025-06-03T19:31:20.684Z https://docs.axolotl.ai/docs/api/utils.collators.mamba.html - 2025-06-02T22:55:13.036Z + 2025-06-03T19:31:21.452Z https://docs.axolotl.ai/docs/api/utils.schemas.model.html - 2025-06-02T22:55:12.779Z + 2025-06-03T19:31:21.194Z https://docs.axolotl.ai/docs/api/utils.schemas.training.html - 2025-06-02T22:55:12.784Z + 2025-06-03T19:31:21.199Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html - 2025-06-02T22:55:12.332Z + 2025-06-03T19:31:20.751Z https://docs.axolotl.ai/docs/api/core.trainers.utils.html - 2025-06-02T22:55:12.118Z + 2025-06-03T19:31:20.537Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html - 2025-06-02T22:55:12.158Z + 2025-06-03T19:31:20.577Z https://docs.axolotl.ai/docs/api/utils.freeze.html - 2025-06-02T22:55:12.664Z + 2025-06-03T19:31:21.080Z https://docs.axolotl.ai/docs/api/cli.utils.html - 2025-06-02T22:55:12.027Z + 2025-06-03T19:31:20.446Z https://docs.axolotl.ai/docs/multi-gpu.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/debugging.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.982Z https://docs.axolotl.ai/TODO.html - 2025-06-02T22:54:37.550Z + 2025-06-03T19:30:48.980Z https://docs.axolotl.ai/docs/amd_hpc.html - 2025-06-02T22:54:37.551Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/dataset_loading.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html - 2025-06-02T22:55:11.981Z + 2025-06-03T19:31:20.400Z https://docs.axolotl.ai/docs/api/monkeypatch.attention.mllama.html - 2025-06-02T22:55:12.593Z + 2025-06-03T19:31:21.010Z https://docs.axolotl.ai/docs/api/common.architectures.html - 2025-06-02T22:55:12.992Z + 2025-06-03T19:31:21.406Z https://docs.axolotl.ai/docs/api/utils.schedulers.html - 2025-06-02T22:55:12.706Z + 2025-06-03T19:31:21.122Z https://docs.axolotl.ai/docs/api/utils.collators.core.html - 2025-06-02T22:55:13.013Z + 2025-06-03T19:31:21.428Z https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html - 2025-06-02T22:55:12.819Z + 2025-06-03T19:31:21.234Z https://docs.axolotl.ai/docs/api/utils.distributed.html - 2025-06-02T22:55:12.726Z + 2025-06-03T19:31:21.141Z https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html - 2025-06-02T22:55:12.802Z + 2025-06-03T19:31:21.217Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html - 2025-06-02T22:55:12.342Z + 2025-06-03T19:31:20.761Z https://docs.axolotl.ai/docs/api/monkeypatch.utils.html - 2025-06-02T22:55:12.566Z + 2025-06-03T19:31:20.984Z https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html - 2025-06-02T22:55:12.832Z + 2025-06-03T19:31:21.246Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html - 2025-06-02T22:55:12.162Z + 2025-06-03T19:31:20.580Z https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html - 2025-06-02T22:55:12.987Z + 2025-06-03T19:31:21.401Z https://docs.axolotl.ai/docs/api/loaders.processor.html - 2025-06-02T22:55:12.138Z + 2025-06-03T19:31:20.556Z https://docs.axolotl.ai/docs/api/core.trainers.trl.html - 2025-06-02T22:55:12.078Z + 2025-06-03T19:31:20.496Z https://docs.axolotl.ai/docs/api/loaders.constants.html - 2025-06-02T22:55:12.153Z + 2025-06-03T19:31:20.571Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html - 2025-06-02T22:55:12.506Z + 2025-06-03T19:31:20.925Z https://docs.axolotl.ai/docs/api/cli.args.html - 2025-06-02T22:55:11.921Z + 2025-06-03T19:31:20.340Z https://docs.axolotl.ai/docs/api/core.builders.causal.html - 2025-06-02T22:55:11.715Z + 2025-06-03T19:31:20.135Z https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html - 2025-06-02T22:55:12.271Z + 2025-06-03T19:31:20.690Z https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html - 2025-06-02T22:55:11.838Z + 2025-06-03T19:31:20.258Z https://docs.axolotl.ai/docs/api/cli.train.html - 2025-06-02T22:55:11.893Z + 2025-06-03T19:31:20.312Z https://docs.axolotl.ai/docs/api/convert.html - 2025-06-02T22:55:11.653Z + 2025-06-03T19:31:20.073Z https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html - 2025-06-02T22:55:12.737Z + 2025-06-03T19:31:21.152Z https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html - 2025-06-02T22:55:12.293Z + 2025-06-03T19:31:20.712Z https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html - 2025-06-02T22:55:12.981Z + 2025-06-03T19:31:21.395Z https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html - 2025-06-02T22:55:13.106Z + 2025-06-03T19:31:21.524Z https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html - 2025-06-02T22:55:13.092Z + 2025-06-03T19:31:21.509Z https://docs.axolotl.ai/docs/api/loaders.tokenizer.html - 2025-06-02T22:55:12.136Z + 2025-06-03T19:31:20.555Z https://docs.axolotl.ai/docs/api/cli.main.html - 2025-06-02T22:55:11.885Z + 2025-06-03T19:31:20.304Z https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html - 2025-06-02T22:55:12.594Z + 2025-06-03T19:31:21.011Z https://docs.axolotl.ai/docs/api/cli.evaluate.html - 2025-06-02T22:55:11.902Z + 2025-06-03T19:31:20.320Z https://docs.axolotl.ai/docs/api/utils.bench.html - 2025-06-02T22:55:12.656Z + 2025-06-03T19:31:21.073Z https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html - 2025-06-02T22:55:12.585Z + 2025-06-03T19:31:21.002Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html - 2025-06-02T22:55:12.569Z + 2025-06-03T19:31:20.987Z https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html - 2025-06-02T22:55:12.523Z + 2025-06-03T19:31:20.941Z https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html - 2025-06-02T22:55:12.192Z + 2025-06-03T19:31:20.610Z https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html - 2025-06-02T22:55:12.973Z + 2025-06-03T19:31:21.387Z https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html - 2025-06-02T22:55:13.100Z + 2025-06-03T19:31:21.517Z https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html - 2025-06-02T22:55:12.524Z + 2025-06-03T19:31:20.942Z https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html - 2025-06-02T22:55:13.040Z + 2025-06-03T19:31:21.457Z https://docs.axolotl.ai/docs/api/utils.tokenization.html - 2025-06-02T22:55:12.632Z + 2025-06-03T19:31:21.049Z https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html - 2025-06-02T22:55:12.282Z + 2025-06-03T19:31:20.701Z https://docs.axolotl.ai/docs/api/utils.collators.batching.html - 2025-06-02T22:55:13.032Z + 2025-06-03T19:31:21.449Z https://docs.axolotl.ai/docs/api/core.trainers.base.html - 2025-06-02T22:55:12.061Z + 2025-06-03T19:31:20.479Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html - 2025-06-02T22:55:12.105Z + 2025-06-03T19:31:20.523Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html - 2025-06-02T22:55:12.320Z + 2025-06-03T19:31:20.738Z https://docs.axolotl.ai/docs/api/utils.quantization.html - 2025-06-02T22:55:12.761Z + 2025-06-03T19:31:21.176Z https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html - 2025-06-02T22:55:12.259Z + 2025-06-03T19:31:20.678Z https://docs.axolotl.ai/docs/api/cli.quantize.html - 2025-06-02T22:55:12.047Z + 2025-06-03T19:31:20.465Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html - 2025-06-02T22:55:12.226Z + 2025-06-03T19:31:20.646Z https://docs.axolotl.ai/docs/api/cli.vllm_serve.html - 2025-06-02T22:55:12.032Z + 2025-06-03T19:31:20.451Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html - 2025-06-02T22:55:12.225Z + 2025-06-03T19:31:20.644Z https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html - 2025-06-02T22:55:12.367Z + 2025-06-03T19:31:20.785Z https://docs.axolotl.ai/docs/api/utils.dict.html - 2025-06-02T22:55:12.729Z + 2025-06-03T19:31:21.145Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html - 2025-06-02T22:55:12.323Z + 2025-06-03T19:31:20.741Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html - 2025-06-02T22:55:12.508Z + 2025-06-03T19:31:20.926Z https://docs.axolotl.ai/docs/api/utils.lora.html - 2025-06-02T22:55:12.647Z + 2025-06-03T19:31:21.064Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html - 2025-06-02T22:55:12.599Z + 2025-06-03T19:31:21.016Z https://docs.axolotl.ai/docs/api/utils.trainer.html - 2025-06-02T22:55:12.682Z + 2025-06-03T19:31:21.097Z https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html - 2025-06-02T22:55:12.286Z + 2025-06-03T19:31:20.705Z https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html - 2025-06-02T22:55:12.297Z + 2025-06-03T19:31:20.716Z https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html - 2025-06-02T22:55:12.558Z + 2025-06-03T19:31:20.975Z https://docs.axolotl.ai/docs/api/utils.schemas.enums.html - 2025-06-02T22:55:12.842Z + 2025-06-03T19:31:21.257Z https://docs.axolotl.ai/docs/api/cli.config.html - 2025-06-02T22:55:11.946Z + 2025-06-03T19:31:20.365Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html - 2025-06-02T22:55:12.625Z + 2025-06-03T19:31:21.042Z https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html - 2025-06-02T22:55:12.575Z + 2025-06-03T19:31:20.992Z https://docs.axolotl.ai/docs/api/kernels.lora.html - 2025-06-02T22:55:12.450Z + 2025-06-03T19:31:20.868Z https://docs.axolotl.ai/docs/api/prompt_strategies.base.html - 2025-06-02T22:55:12.193Z + 2025-06-03T19:31:20.612Z https://docs.axolotl.ai/docs/api/core.trainers.relora.html - 2025-06-02T22:55:12.087Z + 2025-06-03T19:31:20.505Z https://docs.axolotl.ai/docs/api/loaders.model.html - 2025-06-02T22:55:12.128Z + 2025-06-03T19:31:20.546Z https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html - 2025-06-02T22:55:13.087Z + 2025-06-03T19:31:21.504Z https://docs.axolotl.ai/docs/api/cli.inference.html - 2025-06-02T22:55:11.960Z + 2025-06-03T19:31:20.380Z https://docs.axolotl.ai/docs/batch_vs_grad.html - 2025-06-02T22:54:37.551Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/sequence_parallelism.html - 2025-06-02T22:54:37.556Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/getting-started.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.982Z https://docs.axolotl.ai/docs/torchao.html - 2025-06-02T22:54:37.556Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/dataset_preprocessing.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.982Z https://docs.axolotl.ai/docs/docker.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.982Z https://docs.axolotl.ai/docs/ray-integration.html - 2025-06-02T22:54:37.556Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/dataset-formats/index.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/multimodal.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/reward_modelling.html - 2025-06-02T22:54:37.556Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/faq.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.982Z https://docs.axolotl.ai/docs/installation.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.984Z https://docs.axolotl.ai/docs/unsloth.html - 2025-06-02T22:54:37.556Z + 2025-06-03T19:30:48.985Z https://docs.axolotl.ai/docs/config.html - 2025-06-02T22:54:37.552Z + 2025-06-03T19:30:48.981Z https://docs.axolotl.ai/docs/inference.html - 2025-06-02T22:54:37.555Z + 2025-06-03T19:30:48.984Z https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html - 2025-06-02T22:54:37.572Z + 2025-06-03T19:30:49.002Z https://docs.axolotl.ai/index.html - 2025-06-02T22:54:37.568Z + 2025-06-03T19:30:48.998Z