diff --git a/.nojekyll b/.nojekyll
index a14f9e4e3..7a84e3030 100644
--- a/.nojekyll
+++ b/.nojekyll
@@ -1 +1 @@
-5da99456
\ No newline at end of file
+470da143
\ No newline at end of file
diff --git a/docs/custom_integrations.html b/docs/custom_integrations.html
index f5579bd25..6000487be 100644
--- a/docs/custom_integrations.html
+++ b/docs/custom_integrations.html
@@ -511,7 +511,7 @@ pre > code.sourceCode > span > a:first-child::before { text-decoration: underlin
Run the following command to install cut_cross_entropy[transformers] if you don’t have it already.
python scripts/cutcrossentropy_install.py | sh
-pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy @ git+https://github.com/apple/ml-cross-entropy.git@9c297c905f55b73594b5d650722d1e78183b77bd"'
+pip3 uninstall -y cut-cross-entropy && pip3 install "cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@24fbe4b5dab9a6c250a014573613c1890190536c"
Usage
diff --git a/search.json b/search.json
index 217e8a473..57c5ef57a 100644
--- a/search.json
+++ b/search.json
@@ -1054,7 +1054,7 @@
"href": "docs/custom_integrations.html#cut-cross-entropy",
"title": "Custom Integrations",
"section": "Cut Cross Entropy",
- "text": "Cut Cross Entropy\nCut Cross Entropy reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\npython scripts/cutcrossentropy_install.py | sh\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy @ git+https://github.com/apple/ml-cross-entropy.git@9c297c905f55b73594b5d650722d1e78183b77bd\"'\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\ncut_cross_entropy: true\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
+ "text": "Cut Cross Entropy\nCut Cross Entropy reduces VRAM usage through optimization on the cross-entropy operation during loss calculation.\nSee https://github.com/apple/ml-cross-entropy\n\nRequirements\n\nPyTorch 2.4.0 or higher\n\n\n\nInstallation\nRun the following command to install cut_cross_entropy[transformers] if you don’t have it already.\npython scripts/cutcrossentropy_install.py | sh\n\npip3 uninstall -y cut-cross-entropy && pip3 install \"cut-cross-entropy[transformers] @ git+https://github.com/apple/ml-cross-entropy.git@24fbe4b5dab9a6c250a014573613c1890190536c\"\n\n\nUsage\nplugins:\n - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin\n\ncut_cross_entropy: true\n\n\nCitation\n@article{wijmans2024cut,\n author = {Erik Wijmans and\n Brody Huval and\n Alexander Hertzberg and\n Vladlen Koltun and\n Philipp Kr\\\"ahenb\\\"uhl},\n title = {Cut Your Losses in Large-Vocabulary Language Models},\n journal = {arXiv},\n year = {2024},\n url = {https://arxiv.org/abs/2411.09009},\n}\nPlease see reference here",
"crumbs": [
"Advanced Features",
"Custom Integrations"
diff --git a/sitemap.xml b/sitemap.xml
index 9f170d926..efc7d5212 100644
--- a/sitemap.xml
+++ b/sitemap.xml
@@ -2,162 +2,162 @@
https://axolotl-ai-cloud.github.io/axolotl/examples/colab-notebooks/colab-axolotl-example.html
- 2025-03-10T09:26:02.164Z
+ 2025-03-10T09:26:53.684Z
https://axolotl-ai-cloud.github.io/axolotl/docs/dataset-formats/stepwise_supervised.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/dataset-formats/template_free.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/dataset-formats/tokenized.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/nccl.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/amd_hpc.html
- 2025-03-10T09:26:02.159Z
+ 2025-03-10T09:26:53.679Z
https://axolotl-ai-cloud.github.io/axolotl/docs/config.html
- 2025-03-10T09:26:02.159Z
+ 2025-03-10T09:26:53.679Z
https://axolotl-ai-cloud.github.io/axolotl/docs/multi-gpu.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/installation.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/torchao.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/reward_modelling.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/input_output.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/multimodal.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/getting-started.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/inference.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/multipack.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/debugging.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/lr_groups.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/TODO.html
- 2025-03-10T09:26:02.158Z
+ 2025-03-10T09:26:53.678Z
https://axolotl-ai-cloud.github.io/axolotl/src/axolotl/integrations/LICENSE.html
- 2025-03-10T09:26:02.178Z
+ 2025-03-10T09:26:53.698Z
https://axolotl-ai-cloud.github.io/axolotl/index.html
- 2025-03-10T09:26:02.175Z
+ 2025-03-10T09:26:53.695Z
https://axolotl-ai-cloud.github.io/axolotl/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html
- 2025-03-10T09:26:02.178Z
+ 2025-03-10T09:26:53.698Z
https://axolotl-ai-cloud.github.io/axolotl/FAQS.html
- 2025-03-10T09:26:02.158Z
+ 2025-03-10T09:26:53.678Z
https://axolotl-ai-cloud.github.io/axolotl/docs/multi-node.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/faq.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/batch_vs_grad.html
- 2025-03-10T09:26:02.159Z
+ 2025-03-10T09:26:53.679Z
https://axolotl-ai-cloud.github.io/axolotl/docs/lora_optims.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/rlhf.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/cli.html
- 2025-03-10T09:26:02.159Z
+ 2025-03-10T09:26:53.679Z
https://axolotl-ai-cloud.github.io/axolotl/docs/unsloth.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/fsdp_qlora.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/dataset_preprocessing.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/custom_integrations.html
- 2025-03-10T09:26:02.159Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/mac.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/docker.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/ray-integration.html
- 2025-03-10T09:26:02.163Z
+ 2025-03-10T09:26:53.683Z
https://axolotl-ai-cloud.github.io/axolotl/docs/dataset-formats/index.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/dataset-formats/conversation.html
- 2025-03-10T09:26:02.159Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/dataset-formats/pretraining.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z
https://axolotl-ai-cloud.github.io/axolotl/docs/dataset-formats/inst_tune.html
- 2025-03-10T09:26:02.160Z
+ 2025-03-10T09:26:53.680Z