From 04e0259d9df5a90914948a6f6cdeb642d7f4619e Mon Sep 17 00:00:00 2001 From: Quarto GHA Workflow Runner Date: Wed, 16 Apr 2025 22:05:16 +0000 Subject: [PATCH] Built site for gh-pages --- .nojekyll | 2 +- docs/custom_integrations.html | 201 ++++++++++---------- index.html | 1 + search.json | 2 +- sitemap.xml | 340 +++++++++++++++++----------------- 5 files changed, 276 insertions(+), 270 deletions(-) diff --git a/.nojekyll b/.nojekyll index 31b524309..ad6e5fc7e 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -6f1a4ebe \ No newline at end of file +5e50c0b5 \ No newline at end of file diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html index 1a1951e98..f67c90d90 100644 --- a/docs/custom_integrations.html +++ b/docs/custom_integrations.html @@ -519,16 +519,21 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin

Installation

Run the following command to install cut_cross_entropy[transformers] if you don’t have it already.

-
python scripts/cutcrossentropy_install.py | sh
-
-pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@bad6f7b49c75fdec69471abb71b4cddd0f0c6438"
+ +
python scripts/cutcrossentropy_install.py | sh
+ +
pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@bad6f7b49c75fdec69471abb71b4cddd0f0c6438"

Usage

-
plugins:
-  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
-
-cut_cross_entropy: true
+
plugins:
+  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
+
+cut_cross_entropy: true

Supported Models

@@ -551,17 +556,17 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin

Citation

-
@article{wijmans2024cut,
-  author       = {Erik Wijmans and
-                  Brody Huval and
-                  Alexander Hertzberg and
-                  Vladlen Koltun and
-                  Philipp Kr\"ahenb\"uhl},
-  title        = {Cut Your Losses in Large-Vocabulary Language Models},
-  journal      = {arXiv},
-  year         = {2024},
-  url          = {https://arxiv.org/abs/2411.09009},
-}
+
@article{wijmans2024cut,
+  author       = {Erik Wijmans and
+                  Brody Huval and
+                  Alexander Hertzberg and
+                  Vladlen Koltun and
+                  Philipp Kr\"ahenb\"uhl},
+  title        = {Cut Your Losses in Large-Vocabulary Language Models},
+  journal      = {arXiv},
+  year         = {2024},
+  url          = {https://arxiv.org/abs/2411.09009},
+}

Please see reference here

@@ -570,20 +575,20 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin

See https://github.com/ironjr/grokfast

Usage

-
plugins:
-  - axolotl.integrations.grokfast.GrokfastPlugin
-
-grokfast_alpha: 2.0
-grokfast_lamb: 0.98
+
plugins:
+  - axolotl.integrations.grokfast.GrokfastPlugin
+
+grokfast_alpha: 2.0
+grokfast_lamb: 0.98

Citation

-
@article{lee2024grokfast,
-    title={{Grokfast}: Accelerated Grokking by Amplifying Slow Gradients},
-    author={Lee, Jaerin and Kang, Bong Gyun and Kim, Kihoon and Lee, Kyoung Mu},
-    journal={arXiv preprint arXiv:2405.20233},
-    year={2024}
-}
+
@article{lee2024grokfast,
+    title={{Grokfast}: Accelerated Grokking by Amplifying Slow Gradients},
+    author={Lee, Jaerin and Kang, Bong Gyun and Kim, Kihoon and Lee, Kyoung Mu},
+    journal={arXiv preprint arXiv:2405.20233},
+    year={2024}
+}

Please see reference here

@@ -591,21 +596,21 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin

Knowledge Distillation (KD)

Usage

-
plugins:
-  - "axolotl.integrations.kd.KDPlugin"
-
-kd_trainer: True
-kd_ce_alpha: 0.1
-kd_alpha: 0.9
-kd_temperature: 1.0
-
-torch_compile: True  # torch>=2.5.1, recommended to reduce vram
-
-datasets:
-  - path: ...
-    type: "axolotl.integrations.kd.chat_template"
-    field_messages: "messages_combined"
-    logprobs_field: "llm_text_generation_vllm_logprobs"  # for kd only, field of logprobs
+
plugins:
+  - "axolotl.integrations.kd.KDPlugin"
+
+kd_trainer: True
+kd_ce_alpha: 0.1
+kd_alpha: 0.9
+kd_temperature: 1.0
+
+torch_compile: True  # torch>=2.5.1, recommended to reduce vram
+
+datasets:
+  - path: ...
+    type: "axolotl.integrations.kd.chat_template"
+    field_messages: "messages_combined"
+    logprobs_field: "llm_text_generation_vllm_logprobs"  # for kd only, field of logprobs

An example dataset can be found at axolotl-ai-co/evolkit-logprobs-pipeline-75k-v2-sample

Please see reference here

@@ -621,13 +626,13 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin

See https://github.com/linkedin/Liger-Kernel

Usage

-
plugins:
-  - axolotl.integrations.liger.LigerPlugin
-liger_rope: true
-liger_rms_norm: true
-liger_glu_activation: true
-liger_layer_norm: true
-liger_fused_linear_cross_entropy: true
+
plugins:
+  - axolotl.integrations.liger.LigerPlugin
+liger_rope: true
+liger_rms_norm: true
+liger_glu_activation: true
+liger_layer_norm: true
+liger_fused_linear_cross_entropy: true

Supported Models

@@ -653,16 +658,16 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin

Citation

-
@article{hsu2024ligerkernelefficienttriton,
-      title={Liger Kernel: Efficient Triton Kernels for LLM Training},
-      author={Pin-Lun Hsu and Yun Dai and Vignesh Kothapalli and Qingquan Song and Shao Tang and Siyu Zhu and Steven Shimizu and Shivam Sahni and Haowen Ning and Yanning Chen},
-      year={2024},
-      eprint={2410.10989},
-      archivePrefix={arXiv},
-      primaryClass={cs.LG},
-      url={https://arxiv.org/abs/2410.10989},
-      journal={arXiv preprint arXiv:2410.10989},
-}
+
@article{hsu2024ligerkernelefficienttriton,
+      title={Liger Kernel: Efficient Triton Kernels for LLM Training},
+      author={Pin-Lun Hsu and Yun Dai and Vignesh Kothapalli and Qingquan Song and Shao Tang and Siyu Zhu and Steven Shimizu and Shivam Sahni and Haowen Ning and Yanning Chen},
+      year={2024},
+      eprint={2410.10989},
+      archivePrefix={arXiv},
+      primaryClass={cs.LG},
+      url={https://arxiv.org/abs/2410.10989},
+      journal={arXiv preprint arXiv:2410.10989},
+}

Please see reference here

@@ -672,29 +677,29 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin

See https://github.com/EleutherAI/lm-evaluation-harness

Usage

-
plugins:
-  - axolotl.integrations.lm_eval.LMEvalPlugin
-
-lm_eval_tasks:
-  - gsm8k
-  - hellaswag
-  - arc_easy
-
-lm_eval_batch_size: # Batch size for evaluation
-output_dir: # Directory to save evaluation results
+
plugins:
+  - axolotl.integrations.lm_eval.LMEvalPlugin
+
+lm_eval_tasks:
+  - gsm8k
+  - hellaswag
+  - arc_easy
+
+lm_eval_batch_size: # Batch size for evaluation
+output_dir: # Directory to save evaluation results

Citation

-
@misc{eval-harness,
-  author       = {Gao, Leo and Tow, Jonathan and Abbasi, Baber and Biderman, Stella and Black, Sid and DiPofi, Anthony and Foster, Charles and Golding, Laurence and Hsu, Jeffrey and Le Noac'h, Alain and Li, Haonan and McDonell, Kyle and Muennighoff, Niklas and Ociepa, Chris and Phang, Jason and Reynolds, Laria and Schoelkopf, Hailey and Skowron, Aviya and Sutawika, Lintang and Tang, Eric and Thite, Anish and Wang, Ben and Wang, Kevin and Zou, Andy},
-  title        = {A framework for few-shot language model evaluation},
-  month        = 07,
-  year         = 2024,
-  publisher    = {Zenodo},
-  version      = {v0.4.3},
-  doi          = {10.5281/zenodo.12608602},
-  url          = {https://zenodo.org/records/12608602}
-}
+
@misc{eval-harness,
+  author       = {Gao, Leo and Tow, Jonathan and Abbasi, Baber and Biderman, Stella and Black, Sid and DiPofi, Anthony and Foster, Charles and Golding, Laurence and Hsu, Jeffrey and Le Noac'h, Alain and Li, Haonan and McDonell, Kyle and Muennighoff, Niklas and Ociepa, Chris and Phang, Jason and Reynolds, Laria and Schoelkopf, Hailey and Skowron, Aviya and Sutawika, Lintang and Tang, Eric and Thite, Anish and Wang, Ben and Wang, Kevin and Zou, Andy},
+  title        = {A framework for few-shot language model evaluation},
+  month        = 07,
+  year         = 2024,
+  publisher    = {Zenodo},
+  version      = {v0.4.3},
+  doi          = {10.5281/zenodo.12608602},
+  url          = {https://zenodo.org/records/12608602}
+}

Please see reference here

@@ -710,23 +715,23 @@ By identifying the top n% of layers with the highest SNR, you can optimize train

Usage

-
plugins:
-  - axolotl.integrations.spectrum.SpectrumPlugin
-
-spectrum_top_fraction: 0.5
-spectrum_model_name: meta-llama/Meta-Llama-3.1-8B
+
plugins:
+  - axolotl.integrations.spectrum.SpectrumPlugin
+
+spectrum_top_fraction: 0.5
+spectrum_model_name: meta-llama/Meta-Llama-3.1-8B

Citation

-
@misc{hartford2024spectrumtargetedtrainingsignal,
-      title={Spectrum: Targeted Training on Signal to Noise Ratio},
-      author={Eric Hartford and Lucas Atkins and Fernando Fernandes Neto and David Golchinfar},
-      year={2024},
-      eprint={2406.06623},
-      archivePrefix={arXiv},
-      primaryClass={cs.LG},
-      url={https://arxiv.org/abs/2406.06623},
-}
+
@misc{hartford2024spectrumtargetedtrainingsignal,
+      title={Spectrum: Targeted Training on Signal to Noise Ratio},
+      author={Eric Hartford and Lucas Atkins and Fernando Fernandes Neto and David Golchinfar},
+      year={2024},
+      eprint={2406.06623},
+      archivePrefix={arXiv},
+      primaryClass={cs.LG},
+      url={https://arxiv.org/abs/2406.06623},
+}

Please see reference here

@@ -770,10 +775,10 @@ Warning

If you could not load your integration, please ensure you are pip installing in editable mode.

-
pip install -e .
+
pip install -e .

and correctly spelled the integration name in the config file.

-
plugins:
-  - axolotl.integrations.your_integration_name.YourIntegrationPlugin
+
plugins:
+  - axolotl.integrations.your_integration_name.YourIntegrationPlugin
diff --git a/index.html b/index.html index 607a54490..0e4eebd82 100644 --- a/index.html +++ b/index.html @@ -475,6 +475,7 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin

GitHub License tests +codecov Releases
contributors diff --git a/search.json b/search.json index 4d96747b5..3621bd8a5 100644 --- a/search.json +++ b/search.json @@ -3033,7 +3033,7 @@ "href": "docs/custom_integrations.html#cut-cross-entropy", "title": "Custom Integrations", "section": "Cut Cross Entropy", - "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\npython scripts/cutcrossentropy_install.py | sh\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@bad6f7b49c75fdec69471abb71b4cddd0f0c6438\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\ncut_cross_entropy: true\n\n\nSupported Models\n\nllama\nllama4_text\nllama4\nmllama\nphi3\ngemma\ngemma2\ngemma3\ngemma3_text\nmistral\nmistral3\nqwen2\ncohere\ncohere2\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here", + "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@bad6f7b49c75fdec69471abb71b4cddd0f0c6438\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\ncut_cross_entropy: true\n\n\nSupported Models\n\nllama\nllama4_text\nllama4\nmllama\nphi3\ngemma\ngemma2\ngemma3\ngemma3_text\nmistral\nmistral3\nqwen2\ncohere\ncohere2\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here", "crumbs": [ "Advanced Features", "Custom Integrations" diff --git a/sitemap.xml b/sitemap.xml index 2da239fd5..ef82a9bf3 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,682 +2,682 @@ https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html - 2025-04-16T21:48:50.899Z + 2025-04-16T22:03:03.860Z https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/dataset-formats/template_free.html - 2025-04-16T21:48:50.895Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/dataset-formats/tokenized.html - 2025-04-16T21:48:50.895Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/nccl.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/amd_hpc.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/config.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/multi-gpu.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/installation.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.858Z https://docs.axolotl.ai/docs/torchao.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/reward_modelling.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/input_output.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.858Z https://docs.axolotl.ai/docs/multimodal.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html - 2025-04-16T21:49:37.177Z + 2025-04-16T22:03:33.307Z https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html - 2025-04-16T21:49:36.732Z + 2025-04-16T22:03:32.889Z https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html - 2025-04-16T21:49:36.753Z + 2025-04-16T22:03:32.906Z https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html - 2025-04-16T21:49:36.399Z + 2025-04-16T22:03:32.588Z https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html - 2025-04-16T21:49:36.672Z + 2025-04-16T22:03:32.834Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html - 2025-04-16T21:49:36.451Z + 2025-04-16T22:03:32.634Z https://docs.axolotl.ai/docs/api/integrations.liger.args.html - 2025-04-16T21:49:37.089Z + 2025-04-16T22:03:33.221Z https://docs.axolotl.ai/docs/api/utils.schemas.training.html - 2025-04-16T21:49:36.942Z + 2025-04-16T22:03:33.081Z https://docs.axolotl.ai/docs/api/datasets.html - 2025-04-16T21:49:35.848Z + 2025-04-16T22:03:32.076Z https://docs.axolotl.ai/docs/api/kernels.geglu.html - 2025-04-16T21:49:36.605Z + 2025-04-16T22:03:32.773Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html - 2025-04-16T21:49:36.654Z + 2025-04-16T22:03:32.818Z https://docs.axolotl.ai/docs/api/cli.sweeps.html - 2025-04-16T21:49:36.214Z + 2025-04-16T22:03:32.419Z https://docs.axolotl.ai/docs/api/utils.freeze.html - 2025-04-16T21:49:36.832Z + 2025-04-16T22:03:32.980Z https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html - 2025-04-16T21:49:36.673Z + 2025-04-16T22:03:32.835Z https://docs.axolotl.ai/docs/api/cli.main.html - 2025-04-16T21:49:36.101Z + 2025-04-16T22:03:32.312Z https://docs.axolotl.ai/docs/api/core.trainers.trl.html - 2025-04-16T21:49:36.299Z + 2025-04-16T22:03:32.497Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html - 2025-04-16T21:49:36.453Z + 2025-04-16T22:03:32.636Z https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html - 2025-04-16T21:49:36.052Z + 2025-04-16T22:03:32.267Z https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html - 2025-04-16T21:49:36.068Z + 2025-04-16T22:03:32.281Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html - 2025-04-16T21:49:36.472Z + 2025-04-16T22:03:32.653Z https://docs.axolotl.ai/docs/api/utils.collators.mamba.html - 2025-04-16T21:49:37.148Z + 2025-04-16T22:03:33.278Z https://docs.axolotl.ai/docs/api/integrations.base.html - 2025-04-16T21:49:37.073Z + 2025-04-16T22:03:33.206Z https://docs.axolotl.ai/docs/api/utils.bench.html - 2025-04-16T21:49:36.824Z + 2025-04-16T22:03:32.972Z https://docs.axolotl.ai/docs/api/kernels.swiglu.html - 2025-04-16T21:49:36.616Z + 2025-04-16T22:03:32.783Z https://docs.axolotl.ai/docs/api/core.chat.format.shared.html - 2025-04-16T21:49:36.054Z + 2025-04-16T22:03:32.268Z https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html - 2025-04-16T21:49:37.077Z + 2025-04-16T22:03:33.209Z https://docs.axolotl.ai/docs/api/core.datasets.chat.html - 2025-04-16T21:49:36.059Z + 2025-04-16T22:03:32.273Z https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html - 2025-04-16T21:49:37.174Z + 2025-04-16T22:03:33.303Z https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html - 2025-04-16T21:49:37.078Z + 2025-04-16T22:03:33.210Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html - 2025-04-16T21:49:36.343Z + 2025-04-16T22:03:32.537Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html - 2025-04-16T21:49:36.345Z + 2025-04-16T22:03:32.539Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html - 2025-04-16T21:49:36.471Z + 2025-04-16T22:03:32.652Z https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html - 2025-04-16T21:49:36.992Z + 2025-04-16T22:03:33.129Z https://docs.axolotl.ai/docs/api/utils.schemas.trl.html - 2025-04-16T21:49:36.973Z + 2025-04-16T22:03:33.111Z https://docs.axolotl.ai/docs/api/prompt_tokenizers.html - 2025-04-16T21:49:35.908Z + 2025-04-16T22:03:32.132Z https://docs.axolotl.ai/docs/api/utils.data.sft.html - 2025-04-16T21:49:36.916Z + 2025-04-16T22:03:33.057Z https://docs.axolotl.ai/docs/api/utils.schedulers.html - 2025-04-16T21:49:36.878Z + 2025-04-16T22:03:33.022Z https://docs.axolotl.ai/docs/api/utils.chat_templates.html - 2025-04-16T21:49:36.805Z + 2025-04-16T22:03:32.954Z https://docs.axolotl.ai/docs/api/utils.models.html - 2025-04-16T21:49:36.786Z + 2025-04-16T22:03:32.937Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html - 2025-04-16T21:49:36.448Z + 2025-04-16T22:03:32.631Z https://docs.axolotl.ai/docs/api/utils.distributed.html - 2025-04-16T21:49:36.900Z + 2025-04-16T22:03:33.043Z https://docs.axolotl.ai/docs/api/monkeypatch.utils.html - 2025-04-16T21:49:36.719Z + 2025-04-16T22:03:32.877Z https://docs.axolotl.ai/docs/api/utils.schemas.utils.html - 2025-04-16T21:49:37.006Z + 2025-04-16T22:03:33.142Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html - 2025-04-16T21:49:36.683Z + 2025-04-16T22:03:32.844Z https://docs.axolotl.ai/docs/api/common.datasets.html - 2025-04-16T21:49:37.116Z + 2025-04-16T22:03:33.247Z https://docs.axolotl.ai/docs/api/logging_config.html - 2025-04-16T21:49:35.914Z + 2025-04-16T22:03:32.137Z https://docs.axolotl.ai/docs/api/kernels.quantize.html - 2025-04-16T21:49:36.624Z + 2025-04-16T22:03:32.790Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html - 2025-04-16T21:49:36.722Z + 2025-04-16T22:03:32.880Z https://docs.axolotl.ai/docs/api/utils.schemas.model.html - 2025-04-16T21:49:36.936Z + 2025-04-16T22:03:33.075Z https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html - 2025-04-16T21:49:36.728Z + 2025-04-16T22:03:32.886Z https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html - 2025-04-16T21:49:36.754Z + 2025-04-16T22:03:32.907Z https://docs.axolotl.ai/docs/api/utils.tokenization.html - 2025-04-16T21:49:36.794Z + 2025-04-16T22:03:32.944Z https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html - 2025-04-16T21:49:37.086Z + 2025-04-16T22:03:33.218Z https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html - 2025-04-16T21:49:36.961Z + 2025-04-16T22:03:33.099Z https://docs.axolotl.ai/docs/api/utils.collators.core.html - 2025-04-16T21:49:37.119Z + 2025-04-16T22:03:33.250Z https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html - 2025-04-16T21:49:36.721Z + 2025-04-16T22:03:32.879Z https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html - 2025-04-16T21:49:36.912Z + 2025-04-16T22:03:33.054Z https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html - 2025-04-16T21:49:36.394Z + 2025-04-16T22:03:32.583Z https://docs.axolotl.ai/docs/api/index.html - 2025-04-16T21:49:35.760Z + 2025-04-16T22:03:31.998Z https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html - 2025-04-16T21:49:36.265Z + 2025-04-16T22:03:32.466Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html - 2025-04-16T21:49:36.437Z + 2025-04-16T22:03:32.621Z https://docs.axolotl.ai/docs/api/cli.train.html - 2025-04-16T21:49:36.110Z + 2025-04-16T22:03:32.321Z https://docs.axolotl.ai/docs/api/core.trainer_builder.html - 2025-04-16T21:49:35.930Z + 2025-04-16T22:03:32.153Z https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html - 2025-04-16T21:49:37.168Z + 2025-04-16T22:03:33.298Z https://docs.axolotl.ai/docs/getting-started.html - 2025-04-16T21:48:50.895Z + 2025-04-16T22:03:03.856Z https://docs.axolotl.ai/docs/dataset_loading.html - 2025-04-16T21:48:50.895Z + 2025-04-16T22:03:03.856Z https://docs.axolotl.ai/docs/batch_vs_grad.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/faq.html - 2025-04-16T21:48:50.895Z + 2025-04-16T22:03:03.856Z https://docs.axolotl.ai/docs/debugging.html - 2025-04-16T21:48:50.895Z + 2025-04-16T22:03:03.856Z https://docs.axolotl.ai/docs/lr_groups.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/TODO.html - 2025-04-16T21:48:50.893Z + 2025-04-16T22:03:03.854Z https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html - 2025-04-16T21:48:50.916Z + 2025-04-16T22:03:03.875Z https://docs.axolotl.ai/index.html - 2025-04-16T21:48:50.912Z + 2025-04-16T22:03:03.871Z https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html - 2025-04-16T21:48:50.916Z + 2025-04-16T22:03:03.875Z https://docs.axolotl.ai/FAQS.html - 2025-04-16T21:48:50.892Z + 2025-04-16T22:03:03.854Z https://docs.axolotl.ai/docs/multi-node.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/sequence_parallelism.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/multipack.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/inference.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.858Z https://docs.axolotl.ai/docs/lora_optims.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/api/utils.lora_embeddings.html - 2025-04-16T21:49:36.814Z + 2025-04-16T22:03:32.963Z https://docs.axolotl.ai/docs/api/kernels.utils.html - 2025-04-16T21:49:36.626Z + 2025-04-16T22:03:32.792Z https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html - 2025-04-16T21:49:36.328Z + 2025-04-16T22:03:32.523Z https://docs.axolotl.ai/docs/api/convert.html - 2025-04-16T21:49:35.862Z + 2025-04-16T22:03:32.090Z https://docs.axolotl.ai/docs/api/common.const.html - 2025-04-16T21:49:37.099Z + 2025-04-16T22:03:33.230Z https://docs.axolotl.ai/docs/api/cli.cloud.base.html - 2025-04-16T21:49:36.258Z + 2025-04-16T22:03:32.459Z https://docs.axolotl.ai/docs/api/monkeypatch.relora.html - 2025-04-16T21:49:36.681Z + 2025-04-16T22:03:32.842Z https://docs.axolotl.ai/docs/api/utils.lora.html - 2025-04-16T21:49:36.810Z + 2025-04-16T22:03:32.960Z https://docs.axolotl.ai/docs/api/cli.merge_lora.html - 2025-04-16T21:49:36.187Z + 2025-04-16T22:03:32.393Z https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html - 2025-04-16T21:49:36.499Z + 2025-04-16T22:03:32.678Z https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html - 2025-04-16T21:49:36.199Z + 2025-04-16T22:03:32.405Z https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html - 2025-04-16T21:49:37.096Z + 2025-04-16T22:03:33.227Z https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html - 2025-04-16T21:49:37.117Z + 2025-04-16T22:03:33.248Z https://docs.axolotl.ai/docs/api/common.architectures.html - 2025-04-16T21:49:37.097Z + 2025-04-16T22:03:33.229Z https://docs.axolotl.ai/docs/api/utils.trainer.html - 2025-04-16T21:49:36.850Z + 2025-04-16T22:03:32.997Z https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html - 2025-04-16T21:49:37.181Z + 2025-04-16T22:03:33.311Z https://docs.axolotl.ai/docs/api/cli.vllm_serve.html - 2025-04-16T21:49:36.254Z + 2025-04-16T22:03:32.456Z https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html - 2025-04-16T21:49:36.979Z + 2025-04-16T22:03:33.117Z https://docs.axolotl.ai/docs/api/utils.gradient_checkpointing.unsloth.html - 2025-04-16T21:49:36.919Z + 2025-04-16T22:03:33.060Z https://docs.axolotl.ai/docs/api/core.trainers.base.html - 2025-04-16T21:49:36.280Z + 2025-04-16T22:03:32.480Z https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html - 2025-04-16T21:49:36.741Z + 2025-04-16T22:03:32.898Z https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html - 2025-04-16T21:49:37.162Z + 2025-04-16T22:03:33.292Z https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html - 2025-04-16T21:49:37.172Z + 2025-04-16T22:03:33.302Z https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html - 2025-04-16T21:49:37.093Z + 2025-04-16T22:03:33.224Z https://docs.axolotl.ai/docs/api/utils.data.pretraining.html - 2025-04-16T21:49:36.914Z + 2025-04-16T22:03:33.055Z https://docs.axolotl.ai/docs/api/evaluate.html - 2025-04-16T21:49:35.839Z + 2025-04-16T22:03:32.069Z https://docs.axolotl.ai/docs/api/utils.dict.html - 2025-04-16T21:49:36.904Z + 2025-04-16T22:03:33.046Z https://docs.axolotl.ai/docs/api/cli.utils.html - 2025-04-16T21:49:36.249Z + 2025-04-16T22:03:32.451Z https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html - 2025-04-16T21:49:36.419Z + 2025-04-16T22:03:32.605Z https://docs.axolotl.ai/docs/api/core.training_args.html - 2025-04-16T21:49:36.025Z + 2025-04-16T22:03:32.241Z https://docs.axolotl.ai/docs/api/cli.inference.html - 2025-04-16T21:49:36.178Z + 2025-04-16T22:03:32.384Z https://docs.axolotl.ai/docs/api/kernels.lora.html - 2025-04-16T21:49:36.593Z + 2025-04-16T22:03:32.762Z https://docs.axolotl.ai/docs/api/cli.evaluate.html - 2025-04-16T21:49:36.119Z + 2025-04-16T22:03:32.329Z https://docs.axolotl.ai/docs/api/utils.collators.batching.html - 2025-04-16T21:49:37.144Z + 2025-04-16T22:03:33.274Z https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html - 2025-04-16T21:49:36.388Z + 2025-04-16T22:03:32.577Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html - 2025-04-16T21:49:36.449Z + 2025-04-16T22:03:32.633Z https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html - 2025-04-16T21:49:36.407Z + 2025-04-16T22:03:32.594Z https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html - 2025-04-16T21:49:36.495Z + 2025-04-16T22:03:32.674Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html - 2025-04-16T21:49:36.358Z + 2025-04-16T22:03:32.550Z https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html - 2025-04-16T21:49:36.820Z + 2025-04-16T22:03:32.969Z https://docs.axolotl.ai/docs/api/cli.config.html - 2025-04-16T21:49:36.163Z + 2025-04-16T22:03:32.370Z https://docs.axolotl.ai/docs/api/utils.schemas.enums.html - 2025-04-16T21:49:36.999Z + 2025-04-16T22:03:33.136Z https://docs.axolotl.ai/docs/api/cli.preprocess.html - 2025-04-16T21:49:36.208Z + 2025-04-16T22:03:32.413Z https://docs.axolotl.ai/docs/api/core.chat.messages.html - 2025-04-16T21:49:36.049Z + 2025-04-16T22:03:32.264Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html - 2025-04-16T21:49:36.426Z + 2025-04-16T22:03:32.611Z https://docs.axolotl.ai/docs/api/utils.schemas.peft.html - 2025-04-16T21:49:36.970Z + 2025-04-16T22:03:33.107Z https://docs.axolotl.ai/docs/api/train.html - 2025-04-16T21:49:35.828Z + 2025-04-16T22:03:32.059Z https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html - 2025-04-16T21:49:36.424Z + 2025-04-16T22:03:32.609Z https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html - 2025-04-16T21:49:36.412Z + 2025-04-16T22:03:32.598Z https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html - 2025-04-16T21:49:37.153Z + 2025-04-16T22:03:33.283Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html - 2025-04-16T21:49:36.462Z + 2025-04-16T22:03:32.644Z https://docs.axolotl.ai/docs/api/monkeypatch.attention.mllama.html - 2025-04-16T21:49:36.751Z + 2025-04-16T22:03:32.904Z https://docs.axolotl.ai/docs/api/cli.checks.html - 2025-04-16T21:49:36.144Z + 2025-04-16T22:03:32.352Z https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html - 2025-04-16T21:49:36.739Z + 2025-04-16T22:03:32.896Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html - 2025-04-16T21:49:36.656Z + 2025-04-16T22:03:32.819Z https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html - 2025-04-16T21:49:36.306Z + 2025-04-16T22:03:32.504Z https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html - 2025-04-16T21:49:36.367Z + 2025-04-16T22:03:32.558Z https://docs.axolotl.ai/docs/api/cli.args.html - 2025-04-16T21:49:36.137Z + 2025-04-16T22:03:32.346Z https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html - 2025-04-16T21:49:36.381Z + 2025-04-16T22:03:32.571Z https://docs.axolotl.ai/docs/api/utils.schemas.config.html - 2025-04-16T21:49:36.928Z + 2025-04-16T22:03:33.068Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html - 2025-04-16T21:49:36.310Z + 2025-04-16T22:03:32.507Z https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html - 2025-04-16T21:49:36.050Z + 2025-04-16T22:03:32.265Z https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html - 2025-04-16T21:49:36.711Z + 2025-04-16T22:03:32.869Z https://docs.axolotl.ai/docs/api/prompt_strategies.base.html - 2025-04-16T21:49:36.312Z + 2025-04-16T22:03:32.509Z https://docs.axolotl.ai/docs/rlhf.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/cli.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/unsloth.html - 2025-04-16T21:48:50.899Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/fsdp_qlora.html - 2025-04-16T21:48:50.895Z + 2025-04-16T22:03:03.856Z https://docs.axolotl.ai/docs/dataset_preprocessing.html - 2025-04-16T21:48:50.895Z + 2025-04-16T22:03:03.856Z https://docs.axolotl.ai/docs/custom_integrations.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/mac.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/docker.html - 2025-04-16T21:48:50.895Z + 2025-04-16T22:03:03.856Z https://docs.axolotl.ai/docs/ray-integration.html - 2025-04-16T21:48:50.898Z + 2025-04-16T22:03:03.859Z https://docs.axolotl.ai/docs/dataset-formats/index.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/dataset-formats/conversation.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/dataset-formats/pretraining.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html - 2025-04-16T21:48:50.894Z + 2025-04-16T22:03:03.855Z