diff --git a/.nojekyll b/.nojekyll
index 31b524309..ad6e5fc7e 100644
--- a/.nojekyll
+++ b/.nojekyll
@@ -1 +1 @@
-6f1a4ebe
\ No newline at end of file
+5e50c0b5
\ No newline at end of file
diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html
index 1a1951e98..f67c90d90 100644
--- a/docs/custom_integrations.html
+++ b/docs/custom_integrations.html
@@ -519,16 +519,21 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin
Installation
Run the following command to install cut_cross_entropy[transformers] if you don’t have it already.
-python scripts/cutcrossentropy_install.py | sh
-
-pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@bad6f7b49c75fdec69471abb71b4cddd0f0c6438"
+
+If you are in a dev environment
+
+python scripts/cutcrossentropy_install.py | sh
+
+If you are installing from pip
+
+pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@bad6f7b49c75fdec69471abb71b4cddd0f0c6438"
Usage
-plugins :
- - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
-
-cut_cross_entropy : true
+plugins :
+ - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
+
+cut_cross_entropy : true
Supported Models
@@ -551,17 +556,17 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin
Citation
-@article {wijmans2024cut ,
- author = {Erik Wijmans and
- Brody Huval and
- Alexander Hertzberg and
- Vladlen Koltun and
- Philipp Kr\" ahenb\" uhl},
- title = {Cut Your Losses in Large-Vocabulary Language Models},
- journal = {arXiv},
- year = {2024},
- url = {https://arxiv.org/abs/2411.09009},
- }
+@article {wijmans2024cut ,
+ author = {Erik Wijmans and
+ Brody Huval and
+ Alexander Hertzberg and
+ Vladlen Koltun and
+ Philipp Kr\" ahenb\" uhl},
+ title = {Cut Your Losses in Large-Vocabulary Language Models},
+ journal = {arXiv},
+ year = {2024},
+ url = {https://arxiv.org/abs/2411.09009},
+ }
Please see reference here
@@ -570,20 +575,20 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin
See https://github.com/ironjr/grokfast
Usage
-plugins :
- - axolotl.integrations.grokfast.GrokfastPlugin
-
-grokfast_alpha : 2.0
-grokfast_lamb : 0.98
+plugins :
+ - axolotl.integrations.grokfast.GrokfastPlugin
+
+grokfast_alpha : 2.0
+grokfast_lamb : 0.98
Citation
-@article {lee2024grokfast ,
- title ={{Grokfast}: Accelerated Grokking by Amplifying Slow Gradients},
- author ={Lee, Jaerin and Kang, Bong Gyun and Kim, Kihoon and Lee, Kyoung Mu},
- journal ={arXiv preprint arXiv:2405.20233},
- year ={2024}
- }
+@article {lee2024grokfast ,
+ title ={{Grokfast}: Accelerated Grokking by Amplifying Slow Gradients},
+ author ={Lee, Jaerin and Kang, Bong Gyun and Kim, Kihoon and Lee, Kyoung Mu},
+ journal ={arXiv preprint arXiv:2405.20233},
+ year ={2024}
+ }
Please see reference here
@@ -591,21 +596,21 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin
Knowledge Distillation (KD)
Usage
-plugins :
- - "axolotl.integrations.kd.KDPlugin"
-
-kd_trainer : True
-kd_ce_alpha : 0.1
-kd_alpha : 0.9
-kd_temperature : 1.0
-
-torch_compile : True # torch>=2.5.1, recommended to reduce vram
-
-datasets :
- - path : ...
- type : "axolotl.integrations.kd.chat_template"
- field_messages : "messages_combined"
- logprobs_field : "llm_text_generation_vllm_logprobs" # for kd only, field of logprobs
+plugins :
+ - "axolotl.integrations.kd.KDPlugin"
+
+kd_trainer : True
+kd_ce_alpha : 0.1
+kd_alpha : 0.9
+kd_temperature : 1.0
+
+torch_compile : True # torch>=2.5.1, recommended to reduce vram
+
+datasets :
+ - path : ...
+ type : "axolotl.integrations.kd.chat_template"
+ field_messages : "messages_combined"
+ logprobs_field : "llm_text_generation_vllm_logprobs" # for kd only, field of logprobs
An example dataset can be found at axolotl-ai-co/evolkit-logprobs-pipeline-75k-v2-sample
Please see reference here
@@ -621,13 +626,13 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin
See https://github.com/linkedin/Liger-Kernel
Usage
-plugins :
- - axolotl.integrations.liger.LigerPlugin
-liger_rope : true
-liger_rms_norm : true
-liger_glu_activation : true
-liger_layer_norm : true
-liger_fused_linear_cross_entropy : true
+plugins :
+ - axolotl.integrations.liger.LigerPlugin
+liger_rope : true
+liger_rms_norm : true
+liger_glu_activation : true
+liger_layer_norm : true
+liger_fused_linear_cross_entropy : true
Supported Models
@@ -653,16 +658,16 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin
Citation
-@article {hsu2024ligerkernelefficienttriton ,
- title ={Liger Kernel: Efficient Triton Kernels for LLM Training},
- author ={Pin-Lun Hsu and Yun Dai and Vignesh Kothapalli and Qingquan Song and Shao Tang and Siyu Zhu and Steven Shimizu and Shivam Sahni and Haowen Ning and Yanning Chen},
- year ={2024},
- eprint ={2410.10989},
- archivePrefix ={arXiv},
- primaryClass ={cs.LG},
- url ={https://arxiv.org/abs/2410.10989},
- journal ={arXiv preprint arXiv:2410.10989},
- }
+@article {hsu2024ligerkernelefficienttriton ,
+ title ={Liger Kernel: Efficient Triton Kernels for LLM Training},
+ author ={Pin-Lun Hsu and Yun Dai and Vignesh Kothapalli and Qingquan Song and Shao Tang and Siyu Zhu and Steven Shimizu and Shivam Sahni and Haowen Ning and Yanning Chen},
+ year ={2024},
+ eprint ={2410.10989},
+ archivePrefix ={arXiv},
+ primaryClass ={cs.LG},
+ url ={https://arxiv.org/abs/2410.10989},
+ journal ={arXiv preprint arXiv:2410.10989},
+ }
Please see reference here
@@ -672,29 +677,29 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin
See https://github.com/EleutherAI/lm-evaluation-harness
Usage
-plugins :
- - axolotl.integrations.lm_eval.LMEvalPlugin
-
-lm_eval_tasks :
- - gsm8k
- - hellaswag
- - arc_easy
-
-lm_eval_batch_size : # Batch size for evaluation
-output_dir : # Directory to save evaluation results
+plugins :
+ - axolotl.integrations.lm_eval.LMEvalPlugin
+
+lm_eval_tasks :
+ - gsm8k
+ - hellaswag
+ - arc_easy
+
+lm_eval_batch_size : # Batch size for evaluation
+output_dir : # Directory to save evaluation results
Citation
-@misc {eval -harness ,
- author = {Gao, Leo and Tow, Jonathan and Abbasi, Baber and Biderman, Stella and Black, Sid and DiPofi, Anthony and Foster, Charles and Golding, Laurence and Hsu, Jeffrey and Le Noac'h, Alain and Li, Haonan and McDonell, Kyle and Muennighoff, Niklas and Ociepa, Chris and Phang, Jason and Reynolds, Laria and Schoelkopf, Hailey and Skowron, Aviya and Sutawika, Lintang and Tang, Eric and Thite, Anish and Wang, Ben and Wang, Kevin and Zou, Andy},
- title = {A framework for few-shot language model evaluation},
- month = 07,
- year = 2024,
- publisher = {Zenodo},
- version = {v0.4.3},
- doi = {10.5281/zenodo.12608602},
- url = {https://zenodo.org/records/12608602}
- }
+@misc {eval -harness ,
+ author = {Gao, Leo and Tow, Jonathan and Abbasi, Baber and Biderman, Stella and Black, Sid and DiPofi, Anthony and Foster, Charles and Golding, Laurence and Hsu, Jeffrey and Le Noac'h, Alain and Li, Haonan and McDonell, Kyle and Muennighoff, Niklas and Ociepa, Chris and Phang, Jason and Reynolds, Laria and Schoelkopf, Hailey and Skowron, Aviya and Sutawika, Lintang and Tang, Eric and Thite, Anish and Wang, Ben and Wang, Kevin and Zou, Andy},
+ title = {A framework for few-shot language model evaluation},
+ month = 07,
+ year = 2024,
+ publisher = {Zenodo},
+ version = {v0.4.3},
+ doi = {10.5281/zenodo.12608602},
+ url = {https://zenodo.org/records/12608602}
+ }
Please see reference here
@@ -710,23 +715,23 @@ By identifying the top n% of layers with the highest SNR, you can optimize train
Usage
-plugins :
- - axolotl.integrations.spectrum.SpectrumPlugin
-
-spectrum_top_fraction : 0.5
-spectrum_model_name : meta-llama/Meta-Llama-3.1-8B
+plugins :
+ - axolotl.integrations.spectrum.SpectrumPlugin
+
+spectrum_top_fraction : 0.5
+spectrum_model_name : meta-llama/Meta-Llama-3.1-8B
Citation
-@misc {hartford2024spectrumtargetedtrainingsignal ,
- title ={Spectrum: Targeted Training on Signal to Noise Ratio},
- author ={Eric Hartford and Lucas Atkins and Fernando Fernandes Neto and David Golchinfar},
- year ={2024},
- eprint ={2406.06623},
- archivePrefix ={arXiv},
- primaryClass ={cs.LG},
- url ={https://arxiv.org/abs/2406.06623},
- }
+@misc {hartford2024spectrumtargetedtrainingsignal ,
+ title ={Spectrum: Targeted Training on Signal to Noise Ratio},
+ author ={Eric Hartford and Lucas Atkins and Fernando Fernandes Neto and David Golchinfar},
+ year ={2024},
+ eprint ={2406.06623},
+ archivePrefix ={arXiv},
+ primaryClass ={cs.LG},
+ url ={https://arxiv.org/abs/2406.06623},
+ }
Please see reference here
@@ -770,10 +775,10 @@ Warning
If you could not load your integration, please ensure you are pip installing in editable mode.
-
+
and correctly spelled the integration name in the config file.
-
plugins :
- - axolotl.integrations.your_integration_name.YourIntegrationPlugin
+
plugins :
+ - axolotl.integrations.your_integration_name.YourIntegrationPlugin
diff --git a/index.html b/index.html
index 607a54490..0e4eebd82 100644
--- a/index.html
+++ b/index.html
@@ -475,6 +475,7 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin
+
diff --git a/search.json b/search.json
index 4d96747b5..3621bd8a5 100644
--- a/search.json
+++ b/search.json
@@ -3033,7 +3033,7 @@
"href": "docs/custom_integrations.html#cut-cross-entropy",
"title": "Custom Integrations",
"section": "Cut Cross Entropy",
- "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\npython scripts/cutcrossentropy_install.py | sh\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@bad6f7b49c75fdec69471abb71b4cddd0f0c6438\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\ncut_cross_entropy: true\n\n\nSupported Models\n\nllama\nllama4_text\nllama4\nmllama\nphi3\ngemma\ngemma2\ngemma3\ngemma3_text\nmistral\nmistral3\nqwen2\ncohere\ncohere2\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
+ "text": "Cut Cross Entropy\nCut Cross Entropy (CCE) reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\n\nIf you are in a dev environment\n\npython scripts/cutcrossentropy_install.py | sh\n\nIf you are installing from pip\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@bad6f7b49c75fdec69471abb71b4cddd0f0c6438\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\ncut_cross_entropy: true\n\n\nSupported Models\n\nllama\nllama4_text\nllama4\nmllama\nphi3\ngemma\ngemma2\ngemma3\ngemma3_text\nmistral\nmistral3\nqwen2\ncohere\ncohere2\n\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
"crumbs": [
"Advanced Features",
"Custom Integrations"
diff --git a/sitemap.xml b/sitemap.xml
index 2da239fd5..ef82a9bf3 100644
--- a/sitemap.xml
+++ b/sitemap.xml
@@ -2,682 +2,682 @@
https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html
- 2025-04-16T21:48:50.899Z
+ 2025-04-16T22:03:03.860Z
https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/dataset-formats/template_free.html
- 2025-04-16T21:48:50.895Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/dataset-formats/tokenized.html
- 2025-04-16T21:48:50.895Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/nccl.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/amd_hpc.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/config.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/multi-gpu.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/installation.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.858Z
https://docs.axolotl.ai/docs/torchao.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/reward_modelling.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/input_output.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.858Z
https://docs.axolotl.ai/docs/multimodal.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html
- 2025-04-16T21:49:37.177Z
+ 2025-04-16T22:03:33.307Z
https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html
- 2025-04-16T21:49:36.732Z
+ 2025-04-16T22:03:32.889Z
https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html
- 2025-04-16T21:49:36.753Z
+ 2025-04-16T22:03:32.906Z
https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html
- 2025-04-16T21:49:36.399Z
+ 2025-04-16T22:03:32.588Z
https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html
- 2025-04-16T21:49:36.672Z
+ 2025-04-16T22:03:32.834Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html
- 2025-04-16T21:49:36.451Z
+ 2025-04-16T22:03:32.634Z
https://docs.axolotl.ai/docs/api/integrations.liger.args.html
- 2025-04-16T21:49:37.089Z
+ 2025-04-16T22:03:33.221Z
https://docs.axolotl.ai/docs/api/utils.schemas.training.html
- 2025-04-16T21:49:36.942Z
+ 2025-04-16T22:03:33.081Z
https://docs.axolotl.ai/docs/api/datasets.html
- 2025-04-16T21:49:35.848Z
+ 2025-04-16T22:03:32.076Z
https://docs.axolotl.ai/docs/api/kernels.geglu.html
- 2025-04-16T21:49:36.605Z
+ 2025-04-16T22:03:32.773Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html
- 2025-04-16T21:49:36.654Z
+ 2025-04-16T22:03:32.818Z
https://docs.axolotl.ai/docs/api/cli.sweeps.html
- 2025-04-16T21:49:36.214Z
+ 2025-04-16T22:03:32.419Z
https://docs.axolotl.ai/docs/api/utils.freeze.html
- 2025-04-16T21:49:36.832Z
+ 2025-04-16T22:03:32.980Z
https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html
- 2025-04-16T21:49:36.673Z
+ 2025-04-16T22:03:32.835Z
https://docs.axolotl.ai/docs/api/cli.main.html
- 2025-04-16T21:49:36.101Z
+ 2025-04-16T22:03:32.312Z
https://docs.axolotl.ai/docs/api/core.trainers.trl.html
- 2025-04-16T21:49:36.299Z
+ 2025-04-16T22:03:32.497Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html
- 2025-04-16T21:49:36.453Z
+ 2025-04-16T22:03:32.636Z
https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html
- 2025-04-16T21:49:36.052Z
+ 2025-04-16T22:03:32.267Z
https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html
- 2025-04-16T21:49:36.068Z
+ 2025-04-16T22:03:32.281Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html
- 2025-04-16T21:49:36.472Z
+ 2025-04-16T22:03:32.653Z
https://docs.axolotl.ai/docs/api/utils.collators.mamba.html
- 2025-04-16T21:49:37.148Z
+ 2025-04-16T22:03:33.278Z
https://docs.axolotl.ai/docs/api/integrations.base.html
- 2025-04-16T21:49:37.073Z
+ 2025-04-16T22:03:33.206Z
https://docs.axolotl.ai/docs/api/utils.bench.html
- 2025-04-16T21:49:36.824Z
+ 2025-04-16T22:03:32.972Z
https://docs.axolotl.ai/docs/api/kernels.swiglu.html
- 2025-04-16T21:49:36.616Z
+ 2025-04-16T22:03:32.783Z
https://docs.axolotl.ai/docs/api/core.chat.format.shared.html
- 2025-04-16T21:49:36.054Z
+ 2025-04-16T22:03:32.268Z
https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html
- 2025-04-16T21:49:37.077Z
+ 2025-04-16T22:03:33.209Z
https://docs.axolotl.ai/docs/api/core.datasets.chat.html
- 2025-04-16T21:49:36.059Z
+ 2025-04-16T22:03:32.273Z
https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html
- 2025-04-16T21:49:37.174Z
+ 2025-04-16T22:03:33.303Z
https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html
- 2025-04-16T21:49:37.078Z
+ 2025-04-16T22:03:33.210Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html
- 2025-04-16T21:49:36.343Z
+ 2025-04-16T22:03:32.537Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html
- 2025-04-16T21:49:36.345Z
+ 2025-04-16T22:03:32.539Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html
- 2025-04-16T21:49:36.471Z
+ 2025-04-16T22:03:32.652Z
https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html
- 2025-04-16T21:49:36.992Z
+ 2025-04-16T22:03:33.129Z
https://docs.axolotl.ai/docs/api/utils.schemas.trl.html
- 2025-04-16T21:49:36.973Z
+ 2025-04-16T22:03:33.111Z
https://docs.axolotl.ai/docs/api/prompt_tokenizers.html
- 2025-04-16T21:49:35.908Z
+ 2025-04-16T22:03:32.132Z
https://docs.axolotl.ai/docs/api/utils.data.sft.html
- 2025-04-16T21:49:36.916Z
+ 2025-04-16T22:03:33.057Z
https://docs.axolotl.ai/docs/api/utils.schedulers.html
- 2025-04-16T21:49:36.878Z
+ 2025-04-16T22:03:33.022Z
https://docs.axolotl.ai/docs/api/utils.chat_templates.html
- 2025-04-16T21:49:36.805Z
+ 2025-04-16T22:03:32.954Z
https://docs.axolotl.ai/docs/api/utils.models.html
- 2025-04-16T21:49:36.786Z
+ 2025-04-16T22:03:32.937Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html
- 2025-04-16T21:49:36.448Z
+ 2025-04-16T22:03:32.631Z
https://docs.axolotl.ai/docs/api/utils.distributed.html
- 2025-04-16T21:49:36.900Z
+ 2025-04-16T22:03:33.043Z
https://docs.axolotl.ai/docs/api/monkeypatch.utils.html
- 2025-04-16T21:49:36.719Z
+ 2025-04-16T22:03:32.877Z
https://docs.axolotl.ai/docs/api/utils.schemas.utils.html
- 2025-04-16T21:49:37.006Z
+ 2025-04-16T22:03:33.142Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html
- 2025-04-16T21:49:36.683Z
+ 2025-04-16T22:03:32.844Z
https://docs.axolotl.ai/docs/api/common.datasets.html
- 2025-04-16T21:49:37.116Z
+ 2025-04-16T22:03:33.247Z
https://docs.axolotl.ai/docs/api/logging_config.html
- 2025-04-16T21:49:35.914Z
+ 2025-04-16T22:03:32.137Z
https://docs.axolotl.ai/docs/api/kernels.quantize.html
- 2025-04-16T21:49:36.624Z
+ 2025-04-16T22:03:32.790Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html
- 2025-04-16T21:49:36.722Z
+ 2025-04-16T22:03:32.880Z
https://docs.axolotl.ai/docs/api/utils.schemas.model.html
- 2025-04-16T21:49:36.936Z
+ 2025-04-16T22:03:33.075Z
https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html
- 2025-04-16T21:49:36.728Z
+ 2025-04-16T22:03:32.886Z
https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html
- 2025-04-16T21:49:36.754Z
+ 2025-04-16T22:03:32.907Z
https://docs.axolotl.ai/docs/api/utils.tokenization.html
- 2025-04-16T21:49:36.794Z
+ 2025-04-16T22:03:32.944Z
https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html
- 2025-04-16T21:49:37.086Z
+ 2025-04-16T22:03:33.218Z
https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html
- 2025-04-16T21:49:36.961Z
+ 2025-04-16T22:03:33.099Z
https://docs.axolotl.ai/docs/api/utils.collators.core.html
- 2025-04-16T21:49:37.119Z
+ 2025-04-16T22:03:33.250Z
https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html
- 2025-04-16T21:49:36.721Z
+ 2025-04-16T22:03:32.879Z
https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html
- 2025-04-16T21:49:36.912Z
+ 2025-04-16T22:03:33.054Z
https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html
- 2025-04-16T21:49:36.394Z
+ 2025-04-16T22:03:32.583Z
https://docs.axolotl.ai/docs/api/index.html
- 2025-04-16T21:49:35.760Z
+ 2025-04-16T22:03:31.998Z
https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html
- 2025-04-16T21:49:36.265Z
+ 2025-04-16T22:03:32.466Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html
- 2025-04-16T21:49:36.437Z
+ 2025-04-16T22:03:32.621Z
https://docs.axolotl.ai/docs/api/cli.train.html
- 2025-04-16T21:49:36.110Z
+ 2025-04-16T22:03:32.321Z
https://docs.axolotl.ai/docs/api/core.trainer_builder.html
- 2025-04-16T21:49:35.930Z
+ 2025-04-16T22:03:32.153Z
https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html
- 2025-04-16T21:49:37.168Z
+ 2025-04-16T22:03:33.298Z
https://docs.axolotl.ai/docs/getting-started.html
- 2025-04-16T21:48:50.895Z
+ 2025-04-16T22:03:03.856Z
https://docs.axolotl.ai/docs/dataset_loading.html
- 2025-04-16T21:48:50.895Z
+ 2025-04-16T22:03:03.856Z
https://docs.axolotl.ai/docs/batch_vs_grad.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/faq.html
- 2025-04-16T21:48:50.895Z
+ 2025-04-16T22:03:03.856Z
https://docs.axolotl.ai/docs/debugging.html
- 2025-04-16T21:48:50.895Z
+ 2025-04-16T22:03:03.856Z
https://docs.axolotl.ai/docs/lr_groups.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/TODO.html
- 2025-04-16T21:48:50.893Z
+ 2025-04-16T22:03:03.854Z
https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html
- 2025-04-16T21:48:50.916Z
+ 2025-04-16T22:03:03.875Z
https://docs.axolotl.ai/index.html
- 2025-04-16T21:48:50.912Z
+ 2025-04-16T22:03:03.871Z
https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html
- 2025-04-16T21:48:50.916Z
+ 2025-04-16T22:03:03.875Z
https://docs.axolotl.ai/FAQS.html
- 2025-04-16T21:48:50.892Z
+ 2025-04-16T22:03:03.854Z
https://docs.axolotl.ai/docs/multi-node.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/sequence_parallelism.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/multipack.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/inference.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.858Z
https://docs.axolotl.ai/docs/lora_optims.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/api/utils.lora_embeddings.html
- 2025-04-16T21:49:36.814Z
+ 2025-04-16T22:03:32.963Z
https://docs.axolotl.ai/docs/api/kernels.utils.html
- 2025-04-16T21:49:36.626Z
+ 2025-04-16T22:03:32.792Z
https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html
- 2025-04-16T21:49:36.328Z
+ 2025-04-16T22:03:32.523Z
https://docs.axolotl.ai/docs/api/convert.html
- 2025-04-16T21:49:35.862Z
+ 2025-04-16T22:03:32.090Z
https://docs.axolotl.ai/docs/api/common.const.html
- 2025-04-16T21:49:37.099Z
+ 2025-04-16T22:03:33.230Z
https://docs.axolotl.ai/docs/api/cli.cloud.base.html
- 2025-04-16T21:49:36.258Z
+ 2025-04-16T22:03:32.459Z
https://docs.axolotl.ai/docs/api/monkeypatch.relora.html
- 2025-04-16T21:49:36.681Z
+ 2025-04-16T22:03:32.842Z
https://docs.axolotl.ai/docs/api/utils.lora.html
- 2025-04-16T21:49:36.810Z
+ 2025-04-16T22:03:32.960Z
https://docs.axolotl.ai/docs/api/cli.merge_lora.html
- 2025-04-16T21:49:36.187Z
+ 2025-04-16T22:03:32.393Z
https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html
- 2025-04-16T21:49:36.499Z
+ 2025-04-16T22:03:32.678Z
https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html
- 2025-04-16T21:49:36.199Z
+ 2025-04-16T22:03:32.405Z
https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html
- 2025-04-16T21:49:37.096Z
+ 2025-04-16T22:03:33.227Z
https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html
- 2025-04-16T21:49:37.117Z
+ 2025-04-16T22:03:33.248Z
https://docs.axolotl.ai/docs/api/common.architectures.html
- 2025-04-16T21:49:37.097Z
+ 2025-04-16T22:03:33.229Z
https://docs.axolotl.ai/docs/api/utils.trainer.html
- 2025-04-16T21:49:36.850Z
+ 2025-04-16T22:03:32.997Z
https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html
- 2025-04-16T21:49:37.181Z
+ 2025-04-16T22:03:33.311Z
https://docs.axolotl.ai/docs/api/cli.vllm_serve.html
- 2025-04-16T21:49:36.254Z
+ 2025-04-16T22:03:32.456Z
https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html
- 2025-04-16T21:49:36.979Z
+ 2025-04-16T22:03:33.117Z
https://docs.axolotl.ai/docs/api/utils.gradient_checkpointing.unsloth.html
- 2025-04-16T21:49:36.919Z
+ 2025-04-16T22:03:33.060Z
https://docs.axolotl.ai/docs/api/core.trainers.base.html
- 2025-04-16T21:49:36.280Z
+ 2025-04-16T22:03:32.480Z
https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html
- 2025-04-16T21:49:36.741Z
+ 2025-04-16T22:03:32.898Z
https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html
- 2025-04-16T21:49:37.162Z
+ 2025-04-16T22:03:33.292Z
https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html
- 2025-04-16T21:49:37.172Z
+ 2025-04-16T22:03:33.302Z
https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html
- 2025-04-16T21:49:37.093Z
+ 2025-04-16T22:03:33.224Z
https://docs.axolotl.ai/docs/api/utils.data.pretraining.html
- 2025-04-16T21:49:36.914Z
+ 2025-04-16T22:03:33.055Z
https://docs.axolotl.ai/docs/api/evaluate.html
- 2025-04-16T21:49:35.839Z
+ 2025-04-16T22:03:32.069Z
https://docs.axolotl.ai/docs/api/utils.dict.html
- 2025-04-16T21:49:36.904Z
+ 2025-04-16T22:03:33.046Z
https://docs.axolotl.ai/docs/api/cli.utils.html
- 2025-04-16T21:49:36.249Z
+ 2025-04-16T22:03:32.451Z
https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html
- 2025-04-16T21:49:36.419Z
+ 2025-04-16T22:03:32.605Z
https://docs.axolotl.ai/docs/api/core.training_args.html
- 2025-04-16T21:49:36.025Z
+ 2025-04-16T22:03:32.241Z
https://docs.axolotl.ai/docs/api/cli.inference.html
- 2025-04-16T21:49:36.178Z
+ 2025-04-16T22:03:32.384Z
https://docs.axolotl.ai/docs/api/kernels.lora.html
- 2025-04-16T21:49:36.593Z
+ 2025-04-16T22:03:32.762Z
https://docs.axolotl.ai/docs/api/cli.evaluate.html
- 2025-04-16T21:49:36.119Z
+ 2025-04-16T22:03:32.329Z
https://docs.axolotl.ai/docs/api/utils.collators.batching.html
- 2025-04-16T21:49:37.144Z
+ 2025-04-16T22:03:33.274Z
https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html
- 2025-04-16T21:49:36.388Z
+ 2025-04-16T22:03:32.577Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html
- 2025-04-16T21:49:36.449Z
+ 2025-04-16T22:03:32.633Z
https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html
- 2025-04-16T21:49:36.407Z
+ 2025-04-16T22:03:32.594Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html
- 2025-04-16T21:49:36.495Z
+ 2025-04-16T22:03:32.674Z
https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html
- 2025-04-16T21:49:36.358Z
+ 2025-04-16T22:03:32.550Z
https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html
- 2025-04-16T21:49:36.820Z
+ 2025-04-16T22:03:32.969Z
https://docs.axolotl.ai/docs/api/cli.config.html
- 2025-04-16T21:49:36.163Z
+ 2025-04-16T22:03:32.370Z
https://docs.axolotl.ai/docs/api/utils.schemas.enums.html
- 2025-04-16T21:49:36.999Z
+ 2025-04-16T22:03:33.136Z
https://docs.axolotl.ai/docs/api/cli.preprocess.html
- 2025-04-16T21:49:36.208Z
+ 2025-04-16T22:03:32.413Z
https://docs.axolotl.ai/docs/api/core.chat.messages.html
- 2025-04-16T21:49:36.049Z
+ 2025-04-16T22:03:32.264Z
https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html
- 2025-04-16T21:49:36.426Z
+ 2025-04-16T22:03:32.611Z
https://docs.axolotl.ai/docs/api/utils.schemas.peft.html
- 2025-04-16T21:49:36.970Z
+ 2025-04-16T22:03:33.107Z
https://docs.axolotl.ai/docs/api/train.html
- 2025-04-16T21:49:35.828Z
+ 2025-04-16T22:03:32.059Z
https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html
- 2025-04-16T21:49:36.424Z
+ 2025-04-16T22:03:32.609Z
https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html
- 2025-04-16T21:49:36.412Z
+ 2025-04-16T22:03:32.598Z
https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html
- 2025-04-16T21:49:37.153Z
+ 2025-04-16T22:03:33.283Z
https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html
- 2025-04-16T21:49:36.462Z
+ 2025-04-16T22:03:32.644Z
https://docs.axolotl.ai/docs/api/monkeypatch.attention.mllama.html
- 2025-04-16T21:49:36.751Z
+ 2025-04-16T22:03:32.904Z
https://docs.axolotl.ai/docs/api/cli.checks.html
- 2025-04-16T21:49:36.144Z
+ 2025-04-16T22:03:32.352Z
https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html
- 2025-04-16T21:49:36.739Z
+ 2025-04-16T22:03:32.896Z
https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html
- 2025-04-16T21:49:36.656Z
+ 2025-04-16T22:03:32.819Z
https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html
- 2025-04-16T21:49:36.306Z
+ 2025-04-16T22:03:32.504Z
https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html
- 2025-04-16T21:49:36.367Z
+ 2025-04-16T22:03:32.558Z
https://docs.axolotl.ai/docs/api/cli.args.html
- 2025-04-16T21:49:36.137Z
+ 2025-04-16T22:03:32.346Z
https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html
- 2025-04-16T21:49:36.381Z
+ 2025-04-16T22:03:32.571Z
https://docs.axolotl.ai/docs/api/utils.schemas.config.html
- 2025-04-16T21:49:36.928Z
+ 2025-04-16T22:03:33.068Z
https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html
- 2025-04-16T21:49:36.310Z
+ 2025-04-16T22:03:32.507Z
https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html
- 2025-04-16T21:49:36.050Z
+ 2025-04-16T22:03:32.265Z
https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html
- 2025-04-16T21:49:36.711Z
+ 2025-04-16T22:03:32.869Z
https://docs.axolotl.ai/docs/api/prompt_strategies.base.html
- 2025-04-16T21:49:36.312Z
+ 2025-04-16T22:03:32.509Z
https://docs.axolotl.ai/docs/rlhf.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/cli.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/unsloth.html
- 2025-04-16T21:48:50.899Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/fsdp_qlora.html
- 2025-04-16T21:48:50.895Z
+ 2025-04-16T22:03:03.856Z
https://docs.axolotl.ai/docs/dataset_preprocessing.html
- 2025-04-16T21:48:50.895Z
+ 2025-04-16T22:03:03.856Z
https://docs.axolotl.ai/docs/custom_integrations.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/mac.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/docker.html
- 2025-04-16T21:48:50.895Z
+ 2025-04-16T22:03:03.856Z
https://docs.axolotl.ai/docs/ray-integration.html
- 2025-04-16T21:48:50.898Z
+ 2025-04-16T22:03:03.859Z
https://docs.axolotl.ai/docs/dataset-formats/index.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/dataset-formats/conversation.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/dataset-formats/pretraining.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z
https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html
- 2025-04-16T21:48:50.894Z
+ 2025-04-16T22:03:03.855Z