diff --git a/.nojekyll b/.nojekyll index c0a39ee8d..3e9310b5e 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -923bd3c2 \ No newline at end of file +19010a02 \ No newline at end of file diff --git a/docs/multi-gpu.html b/docs/multi-gpu.html index 32635dfaf..9bb7626b9 100644 --- a/docs/multi-gpu.html +++ b/docs/multi-gpu.html @@ -658,7 +658,8 @@ also follow the config field mapping below to update field names.

-

For example, if you were using the following FSDP1 config:

+

For more details, please see the migration guide in the torchtitan repo. In Axolotl, +if you were using the following FSDP1 config:

fsdp_version: 1
 fsdp_config:
   fsdp_offload_params: false
@@ -1308,8 +1309,8 @@ single sequence causes OOM errors during model training.

fsdp_state_dict_type | state_dict_type fsdp_use_orig_params | **REMOVED** - -For example, if you were using the following FSDP1 config: +For more details, please see the migration guide in the [torchtitan repo](https://github.com/pytorch/torchtitan/blob/main/docs/fsdp.md). In Axolotl, +if you were using the following FSDP1 config: ```{.yaml} fsdp_version: 1 diff --git a/search.json b/search.json index 80575aebf..40f3d865d 100644 --- a/search.json +++ b/search.json @@ -1479,7 +1479,7 @@ "href": "docs/multi-gpu.html#sec-fsdp", "title": "Multi-GPU", "section": "3 Fully Sharded Data Parallel (FSDP)", - "text": "3 Fully Sharded Data Parallel (FSDP)\n\n\n\n\n\n\nNote\n\n\n\nFSDP2 is recommended for new users. FSDP1 is deprecated and will be removed in an upcoming release of Axolotl.\n\n\n\n3.1 Migrating from FSDP1 to FSDP2\nTo migrate your config from FSDP1 to FSDP2, you must use the fsdp_version top-level config field to specify the FSDP version, and\nalso follow the config field mapping below to update field names.\n\n3.1.1 Config mapping\n\n\n\nFSDP1\nFSDP2\n\n\n\n\nfsdp_sharding_strategy\nreshard_after_forward\n\n\nfsdp_backward_prefetch_policy\nREMOVED\n\n\nfsdp_backward_prefetch\nREMOVED\n\n\nfsdp_forward_prefetch\nREMOVED\n\n\nfsdp_sync_module_states\nREMOVED\n\n\nfsdp_cpu_ram_efficient_loading\ncpu_ram_efficient_loading\n\n\nfsdp_state_dict_type\nstate_dict_type\n\n\nfsdp_use_orig_params\nREMOVED\n\n\n\nFor example, if you were using the following FSDP1 config:\nfsdp_version: 1\nfsdp_config:\n fsdp_offload_params: false\n fsdp_cpu_ram_efficient_loading: true\n fsdp_auto_wrap_policy: TRANSFORMER_BASED_WRAP\n fsdp_transformer_layer_cls_to_wrap: Qwen3DecoderLayer\n fsdp_state_dict_type: FULL_STATE_DICT\n fsdp_sharding_strategy: FULL_SHARD\nYou can migrate to the following FSDP2 config:\nfsdp_version: 2\nfsdp_config:\n offload_params: false\n cpu_ram_efficient_loading: true\n auto_wrap_policy: TRANSFORMER_BASED_WRAP\n transformer_layer_cls_to_wrap: Qwen3DecoderLayer\n state_dict_type: FULL_STATE_DICT\n reshard_after_forward: true\n\n\n\n3.2 FSDP1 (deprecated)\n\n\n\n\n\n\nNote\n\n\n\nUsing fsdp to configure FSDP is deprecated and will be removed in an upcoming release of Axolotl. Please use fsdp_config as above instead.\n\n\nfsdp:\n - full_shard\n - auto_wrap\nfsdp_config:\n fsdp_offload_params: true\n fsdp_state_dict_type: FULL_STATE_DICT\n fsdp_transformer_layer_cls_to_wrap: LlamaDecoderLayer", + "text": "3 Fully Sharded Data Parallel (FSDP)\n\n\n\n\n\n\nNote\n\n\n\nFSDP2 is recommended for new users. FSDP1 is deprecated and will be removed in an upcoming release of Axolotl.\n\n\n\n3.1 Migrating from FSDP1 to FSDP2\nTo migrate your config from FSDP1 to FSDP2, you must use the fsdp_version top-level config field to specify the FSDP version, and\nalso follow the config field mapping below to update field names.\n\n3.1.1 Config mapping\n\n\n\nFSDP1\nFSDP2\n\n\n\n\nfsdp_sharding_strategy\nreshard_after_forward\n\n\nfsdp_backward_prefetch_policy\nREMOVED\n\n\nfsdp_backward_prefetch\nREMOVED\n\n\nfsdp_forward_prefetch\nREMOVED\n\n\nfsdp_sync_module_states\nREMOVED\n\n\nfsdp_cpu_ram_efficient_loading\ncpu_ram_efficient_loading\n\n\nfsdp_state_dict_type\nstate_dict_type\n\n\nfsdp_use_orig_params\nREMOVED\n\n\n\nFor more details, please see the migration guide in the torchtitan repo. In Axolotl,\nif you were using the following FSDP1 config:\nfsdp_version: 1\nfsdp_config:\n fsdp_offload_params: false\n fsdp_cpu_ram_efficient_loading: true\n fsdp_auto_wrap_policy: TRANSFORMER_BASED_WRAP\n fsdp_transformer_layer_cls_to_wrap: Qwen3DecoderLayer\n fsdp_state_dict_type: FULL_STATE_DICT\n fsdp_sharding_strategy: FULL_SHARD\nYou can migrate to the following FSDP2 config:\nfsdp_version: 2\nfsdp_config:\n offload_params: false\n cpu_ram_efficient_loading: true\n auto_wrap_policy: TRANSFORMER_BASED_WRAP\n transformer_layer_cls_to_wrap: Qwen3DecoderLayer\n state_dict_type: FULL_STATE_DICT\n reshard_after_forward: true\n\n\n\n3.2 FSDP1 (deprecated)\n\n\n\n\n\n\nNote\n\n\n\nUsing fsdp to configure FSDP is deprecated and will be removed in an upcoming release of Axolotl. Please use fsdp_config as above instead.\n\n\nfsdp:\n - full_shard\n - auto_wrap\nfsdp_config:\n fsdp_offload_params: true\n fsdp_state_dict_type: FULL_STATE_DICT\n fsdp_transformer_layer_cls_to_wrap: LlamaDecoderLayer", "crumbs": [ "Deployments", "Multi-GPU" diff --git a/sitemap.xml b/sitemap.xml index 4a32c3775..406dbe29e 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,762 +2,762 @@ https://docs.axolotl.ai/TODO.html - 2025-07-17T19:33:02.921Z + 2025-07-19T17:54:53.843Z https://docs.axolotl.ai/index.html - 2025-07-17T19:33:02.942Z + 2025-07-19T17:54:53.864Z https://docs.axolotl.ai/docs/debugging.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/amd_hpc.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.844Z https://docs.axolotl.ai/docs/api/utils.callbacks.mlflow_.html - 2025-07-17T19:36:15.935Z + 2025-07-19T17:58:01.053Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_expand_mask.html - 2025-07-17T19:36:15.367Z + 2025-07-19T17:58:00.483Z https://docs.axolotl.ai/docs/api/loaders.patch_manager.html - 2025-07-17T19:36:14.977Z + 2025-07-19T17:58:00.090Z https://docs.axolotl.ai/docs/api/core.chat.format.llama3x.html - 2025-07-17T19:36:14.670Z + 2025-07-19T17:57:59.784Z https://docs.axolotl.ai/docs/api/cli.train.html - 2025-07-17T19:36:14.724Z + 2025-07-19T17:57:59.838Z https://docs.axolotl.ai/docs/api/utils.callbacks.perplexity.html - 2025-07-17T19:36:15.926Z + 2025-07-19T17:58:01.044Z https://docs.axolotl.ai/docs/api/core.chat.messages.html - 2025-07-17T19:36:14.667Z + 2025-07-19T17:57:59.781Z https://docs.axolotl.ai/docs/api/utils.callbacks.lisa.html - 2025-07-17T19:36:15.931Z + 2025-07-19T17:58:01.050Z https://docs.axolotl.ai/docs/api/cli.merge_sharded_fsdp_weights.html - 2025-07-17T19:36:14.811Z + 2025-07-19T17:57:59.924Z https://docs.axolotl.ai/docs/api/cli.sweeps.html - 2025-07-17T19:36:14.825Z + 2025-07-19T17:57:59.938Z https://docs.axolotl.ai/docs/api/utils.chat_templates.html - 2025-07-17T19:36:15.463Z + 2025-07-19T17:58:00.580Z https://docs.axolotl.ai/docs/api/core.chat.format.shared.html - 2025-07-17T19:36:14.672Z + 2025-07-19T17:57:59.785Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.optimizer.html - 2025-07-17T19:36:14.984Z + 2025-07-19T17:58:00.097Z https://docs.axolotl.ai/docs/api/utils.collators.mamba.html - 2025-07-17T19:36:15.874Z + 2025-07-19T17:58:00.992Z https://docs.axolotl.ai/docs/api/logging_config.html - 2025-07-17T19:36:14.617Z + 2025-07-19T17:57:59.730Z https://docs.axolotl.ai/docs/api/utils.collators.mm_chat.html - 2025-07-17T19:36:15.879Z + 2025-07-19T17:58:00.997Z https://docs.axolotl.ai/docs/api/prompt_strategies.completion.html - 2025-07-17T19:36:15.104Z + 2025-07-19T17:58:00.218Z https://docs.axolotl.ai/docs/api/kernels.utils.html - 2025-07-17T19:36:15.316Z + 2025-07-19T17:58:00.432Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chat_template.html - 2025-07-17T19:36:15.137Z + 2025-07-19T17:58:00.251Z https://docs.axolotl.ai/docs/api/kernels.swiglu.html - 2025-07-17T19:36:15.307Z + 2025-07-19T17:58:00.423Z https://docs.axolotl.ai/docs/api/common.const.html - 2025-07-17T19:36:15.834Z + 2025-07-19T17:58:00.952Z https://docs.axolotl.ai/docs/api/cli.cloud.base.html - 2025-07-17T19:36:14.867Z + 2025-07-19T17:57:59.980Z https://docs.axolotl.ai/docs/api/utils.callbacks.comet_.html - 2025-07-17T19:36:15.938Z + 2025-07-19T17:58:01.057Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_cpu.html - 2025-07-17T19:36:15.429Z + 2025-07-19T17:58:00.546Z https://docs.axolotl.ai/docs/api/common.architectures.html - 2025-07-17T19:36:15.833Z + 2025-07-19T17:58:00.950Z https://docs.axolotl.ai/docs/api/prompt_strategies.pygmalion.html - 2025-07-17T19:36:15.132Z + 2025-07-19T17:58:00.246Z https://docs.axolotl.ai/docs/api/utils.schemas.peft.html - 2025-07-17T19:36:15.639Z + 2025-07-19T17:58:00.755Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.user_defined.html - 2025-07-17T19:36:15.161Z + 2025-07-19T17:58:00.275Z https://docs.axolotl.ai/docs/api/utils.schemas.datasets.html - 2025-07-17T19:36:15.630Z + 2025-07-19T17:58:00.747Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_w_system.html - 2025-07-17T19:36:15.077Z + 2025-07-19T17:58:00.191Z https://docs.axolotl.ai/docs/api/prompt_strategies.base.html - 2025-07-17T19:36:15.019Z + 2025-07-19T17:58:00.132Z https://docs.axolotl.ai/docs/api/utils.lora.html - 2025-07-17T19:36:15.468Z + 2025-07-19T17:58:00.585Z https://docs.axolotl.ai/docs/api/prompt_strategies.input_output.html - 2025-07-17T19:36:15.110Z + 2025-07-19T17:58:00.224Z https://docs.axolotl.ai/docs/api/utils.schemas.trl.html - 2025-07-17T19:36:15.642Z + 2025-07-19T17:58:00.759Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.zephyr.html - 2025-07-17T19:36:15.159Z + 2025-07-19T17:58:00.273Z https://docs.axolotl.ai/docs/api/integrations.kd.trainer.html - 2025-07-17T19:36:15.821Z + 2025-07-19T17:58:00.939Z https://docs.axolotl.ai/docs/api/monkeypatch.gradient_checkpointing.offload_disk.html - 2025-07-17T19:36:15.455Z + 2025-07-19T17:58:00.572Z https://docs.axolotl.ai/docs/api/utils.optimizers.adopt.html - 2025-07-17T19:36:15.558Z + 2025-07-19T17:58:00.675Z https://docs.axolotl.ai/docs/api/monkeypatch.data.batch_dataset_fetcher.html - 2025-07-17T19:36:15.424Z + 2025-07-19T17:58:00.541Z https://docs.axolotl.ai/docs/api/cli.cloud.modal_.html - 2025-07-17T19:36:14.873Z + 2025-07-19T17:57:59.987Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_chat.html - 2025-07-17T19:36:15.064Z + 2025-07-19T17:58:00.178Z https://docs.axolotl.ai/docs/api/utils.freeze.html - 2025-07-17T19:36:15.485Z + 2025-07-19T17:58:00.602Z https://docs.axolotl.ai/docs/api/prompt_strategies.bradley_terry.llama3.html - 2025-07-17T19:36:15.204Z + 2025-07-19T17:58:00.319Z https://docs.axolotl.ai/docs/api/integrations.base.html - 2025-07-17T19:36:15.810Z + 2025-07-19T17:58:00.927Z https://docs.axolotl.ai/docs/api/monkeypatch.unsloth_.html - 2025-07-17T19:36:15.423Z + 2025-07-19T17:58:00.540Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.chatml.html - 2025-07-17T19:36:15.178Z + 2025-07-19T17:58:00.293Z https://docs.axolotl.ai/docs/api/cli.main.html - 2025-07-17T19:36:14.716Z + 2025-07-19T17:57:59.830Z https://docs.axolotl.ai/docs/api/common.datasets.html - 2025-07-17T19:36:15.849Z + 2025-07-19T17:58:00.967Z https://docs.axolotl.ai/docs/api/train.html - 2025-07-17T19:36:14.531Z + 2025-07-19T17:57:59.644Z https://docs.axolotl.ai/docs/api/core.trainers.base.html - 2025-07-17T19:36:14.888Z + 2025-07-19T17:58:00.002Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.scheduler.html - 2025-07-17T19:36:14.994Z + 2025-07-19T17:58:00.107Z https://docs.axolotl.ai/docs/api/utils.ctx_managers.sequence_parallel.html - 2025-07-17T19:36:15.017Z + 2025-07-19T17:58:00.131Z https://docs.axolotl.ai/docs/api/utils.schemas.config.html - 2025-07-17T19:36:15.601Z + 2025-07-19T17:58:00.717Z https://docs.axolotl.ai/docs/api/loaders.tokenizer.html - 2025-07-17T19:36:14.962Z + 2025-07-19T17:58:00.075Z https://docs.axolotl.ai/docs/api/integrations.liger.args.html - 2025-07-17T19:36:15.825Z + 2025-07-19T17:58:00.942Z https://docs.axolotl.ai/docs/api/cli.config.html - 2025-07-17T19:36:14.776Z + 2025-07-19T17:57:59.890Z https://docs.axolotl.ai/docs/api/loaders.processor.html - 2025-07-17T19:36:14.963Z + 2025-07-19T17:58:00.077Z https://docs.axolotl.ai/docs/api/monkeypatch.utils.html - 2025-07-17T19:36:15.403Z + 2025-07-19T17:58:00.520Z https://docs.axolotl.ai/docs/api/integrations.cut_cross_entropy.args.html - 2025-07-17T19:36:15.813Z + 2025-07-19T17:58:00.930Z https://docs.axolotl.ai/docs/api/core.trainers.dpo.trainer.html - 2025-07-17T19:36:14.919Z + 2025-07-19T17:58:00.033Z https://docs.axolotl.ai/docs/api/loaders.adapter.html - 2025-07-17T19:36:14.969Z + 2025-07-19T17:58:00.082Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.llama3.html - 2025-07-17T19:36:15.148Z + 2025-07-19T17:58:00.262Z https://docs.axolotl.ai/docs/api/core.datasets.transforms.chat_builder.html - 2025-07-17T19:36:14.685Z + 2025-07-19T17:57:59.798Z https://docs.axolotl.ai/docs/api/monkeypatch.transformers_fa_utils.html - 2025-07-17T19:36:15.421Z + 2025-07-19T17:58:00.538Z https://docs.axolotl.ai/docs/api/datasets.html - 2025-07-17T19:36:14.552Z + 2025-07-19T17:57:59.666Z https://docs.axolotl.ai/docs/api/monkeypatch.btlm_attn_hijack_flash.html - 2025-07-17T19:36:15.405Z + 2025-07-19T17:58:00.521Z https://docs.axolotl.ai/docs/api/cli.inference.html - 2025-07-17T19:36:14.790Z + 2025-07-19T17:57:59.904Z https://docs.axolotl.ai/docs/api/cli.utils.html - 2025-07-17T19:36:14.856Z + 2025-07-19T17:57:59.970Z https://docs.axolotl.ai/docs/api/cli.preprocess.html - 2025-07-17T19:36:14.819Z + 2025-07-19T17:57:59.933Z https://docs.axolotl.ai/docs/api/loaders.model.html - 2025-07-17T19:36:14.953Z + 2025-07-19T17:58:00.067Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.sampler.html - 2025-07-17T19:36:14.942Z + 2025-07-19T17:58:00.056Z https://docs.axolotl.ai/docs/api/core.trainers.grpo.trainer.html - 2025-07-17T19:36:14.930Z + 2025-07-19T17:58:00.043Z https://docs.axolotl.ai/docs/batch_vs_grad.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.844Z https://docs.axolotl.ai/docs/custom_integrations.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/quantize.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.849Z https://docs.axolotl.ai/docs/unsloth.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.849Z https://docs.axolotl.ai/docs/ray-integration.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.849Z https://docs.axolotl.ai/docs/dataset-formats/stepwise_supervised.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/dataset-formats/template_free.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/dataset-formats/index.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/dataset-formats/pretraining.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/multi-gpu.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/torchao.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.849Z https://docs.axolotl.ai/docs/cli.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/nccl.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/dataset_preprocessing.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/faq.html - 2025-07-17T19:33:02.924Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/qat.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/gradient_checkpointing.html - 2025-07-17T19:33:02.924Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/input_output.html - 2025-07-17T19:33:02.926Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/src/axolotl/integrations/LICENSE.html - 2025-07-17T19:33:02.946Z + 2025-07-19T17:54:53.868Z https://docs.axolotl.ai/src/axolotl/integrations/cut_cross_entropy/ACKNOWLEDGEMENTS.html - 2025-07-17T19:33:02.946Z + 2025-07-19T17:54:53.868Z https://docs.axolotl.ai/docs/mac.html - 2025-07-17T19:33:02.926Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/lr_groups.html - 2025-07-17T19:33:02.926Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/dataset_loading.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/getting-started.html - 2025-07-17T19:33:02.924Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/lora_optims.html - 2025-07-17T19:33:02.926Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/multi-node.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/fsdp_qlora.html - 2025-07-17T19:33:02.924Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/inference.html - 2025-07-17T19:33:02.926Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/sequence_parallelism.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.849Z https://docs.axolotl.ai/docs/rlhf.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.849Z https://docs.axolotl.ai/docs/dataset-formats/tokenized.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/dataset-formats/conversation.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/dataset-formats/inst_tune.html - 2025-07-17T19:33:02.923Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/reward_modelling.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.849Z https://docs.axolotl.ai/docs/docker.html - 2025-07-17T19:33:02.924Z + 2025-07-19T17:54:53.845Z https://docs.axolotl.ai/docs/installation.html - 2025-07-17T19:33:02.926Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/multimodal.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/docs/config-reference.html - 2025-07-17T19:36:28.059Z + 2025-07-19T17:58:14.550Z https://docs.axolotl.ai/docs/api/prompt_tokenizers.html - 2025-07-17T19:36:14.607Z + 2025-07-19T17:57:59.720Z https://docs.axolotl.ai/docs/api/utils.schedulers.html - 2025-07-17T19:36:15.527Z + 2025-07-19T17:58:00.644Z https://docs.axolotl.ai/docs/api/utils.samplers.multipack.html - 2025-07-17T19:36:15.920Z + 2025-07-19T17:58:01.038Z https://docs.axolotl.ai/docs/api/prompt_strategies.orcamini.html - 2025-07-17T19:36:15.125Z + 2025-07-19T17:58:00.239Z https://docs.axolotl.ai/docs/api/core.trainers.trl.html - 2025-07-17T19:36:14.903Z + 2025-07-19T17:58:00.016Z https://docs.axolotl.ai/docs/api/prompt_strategies.metharme.html - 2025-07-17T19:36:15.121Z + 2025-07-19T17:58:00.235Z https://docs.axolotl.ai/docs/api/utils.callbacks.profiler.html - 2025-07-17T19:36:15.930Z + 2025-07-19T17:58:01.048Z https://docs.axolotl.ai/docs/api/utils.schemas.enums.html - 2025-07-17T19:36:15.670Z + 2025-07-19T17:58:00.786Z https://docs.axolotl.ai/docs/api/core.trainers.mamba.html - 2025-07-17T19:36:14.908Z + 2025-07-19T17:58:00.022Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_flash.html - 2025-07-17T19:36:15.341Z + 2025-07-19T17:58:00.457Z https://docs.axolotl.ai/docs/api/monkeypatch.relora.html - 2025-07-17T19:36:15.365Z + 2025-07-19T17:58:00.482Z https://docs.axolotl.ai/docs/api/monkeypatch.stablelm_attn_hijack_flash.html - 2025-07-17T19:36:15.412Z + 2025-07-19T17:58:00.529Z https://docs.axolotl.ai/docs/api/loaders.constants.html - 2025-07-17T19:36:14.978Z + 2025-07-19T17:58:00.092Z https://docs.axolotl.ai/docs/api/utils.callbacks.qat.html - 2025-07-17T19:36:15.945Z + 2025-07-19T17:58:01.064Z https://docs.axolotl.ai/docs/api/utils.schemas.model.html - 2025-07-17T19:36:15.607Z + 2025-07-19T17:58:00.724Z https://docs.axolotl.ai/docs/api/prompt_strategies.stepwise_supervised.html - 2025-07-17T19:36:15.114Z + 2025-07-19T17:58:00.228Z https://docs.axolotl.ai/docs/api/integrations.grokfast.optimizer.html - 2025-07-17T19:36:15.814Z + 2025-07-19T17:58:00.931Z https://docs.axolotl.ai/docs/api/convert.html - 2025-07-17T19:36:14.566Z + 2025-07-19T17:57:59.679Z https://docs.axolotl.ai/docs/api/kernels.quantize.html - 2025-07-17T19:36:15.314Z + 2025-07-19T17:58:00.430Z https://docs.axolotl.ai/docs/api/core.training_args.html - 2025-07-17T19:36:14.645Z + 2025-07-19T17:57:59.758Z https://docs.axolotl.ai/docs/api/prompt_strategies.chat_template.html - 2025-07-17T19:36:15.051Z + 2025-07-19T17:58:00.164Z https://docs.axolotl.ai/docs/api/index.html - 2025-07-17T19:36:14.469Z + 2025-07-19T17:57:59.583Z https://docs.axolotl.ai/docs/api/prompt_strategies.llama2_chat.html - 2025-07-17T19:36:15.098Z + 2025-07-19T17:58:00.212Z https://docs.axolotl.ai/docs/api/utils.trainer.html - 2025-07-17T19:36:15.503Z + 2025-07-19T17:58:00.619Z https://docs.axolotl.ai/docs/api/prompt_strategies.messages.chat.html - 2025-07-17T19:36:15.136Z + 2025-07-19T17:58:00.250Z https://docs.axolotl.ai/docs/api/monkeypatch.lora_kernels.html - 2025-07-17T19:36:15.395Z + 2025-07-19T17:58:00.512Z https://docs.axolotl.ai/docs/api/kernels.lora.html - 2025-07-17T19:36:15.286Z + 2025-07-19T17:58:00.402Z https://docs.axolotl.ai/docs/api/cli.vllm_serve.html - 2025-07-17T19:36:14.863Z + 2025-07-19T17:57:59.977Z https://docs.axolotl.ai/docs/api/utils.schemas.multimodal.html - 2025-07-17T19:36:15.647Z + 2025-07-19T17:58:00.764Z https://docs.axolotl.ai/docs/api/utils.schemas.utils.html - 2025-07-17T19:36:15.675Z + 2025-07-19T17:58:00.792Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_attn_hijack_xformers.html - 2025-07-17T19:36:15.343Z + 2025-07-19T17:58:00.459Z https://docs.axolotl.ai/docs/api/integrations.lm_eval.args.html - 2025-07-17T19:36:15.828Z + 2025-07-19T17:58:00.946Z https://docs.axolotl.ai/docs/api/monkeypatch.mistral_attn_hijack_flash.html - 2025-07-17T19:36:15.357Z + 2025-07-19T17:58:00.474Z https://docs.axolotl.ai/docs/api/utils.collators.core.html - 2025-07-17T19:36:15.852Z + 2025-07-19T17:58:00.969Z https://docs.axolotl.ai/docs/api/core.chat.format.chatml.html - 2025-07-17T19:36:14.669Z + 2025-07-19T17:57:59.782Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.passthrough.html - 2025-07-17T19:36:15.162Z + 2025-07-19T17:58:00.276Z https://docs.axolotl.ai/docs/api/core.datasets.chat.html - 2025-07-17T19:36:14.677Z + 2025-07-19T17:57:59.790Z https://docs.axolotl.ai/docs/api/utils.bench.html - 2025-07-17T19:36:15.477Z + 2025-07-19T17:58:00.594Z https://docs.axolotl.ai/docs/api/utils.schemas.training.html - 2025-07-17T19:36:15.612Z + 2025-07-19T17:58:00.729Z https://docs.axolotl.ai/docs/api/utils.collators.batching.html - 2025-07-17T19:36:15.870Z + 2025-07-19T17:58:00.988Z https://docs.axolotl.ai/docs/api/monkeypatch.llama_patch_multipack.html - 2025-07-17T19:36:15.406Z + 2025-07-19T17:58:00.523Z https://docs.axolotl.ai/docs/api/monkeypatch.multipack.html - 2025-07-17T19:36:15.359Z + 2025-07-19T17:58:00.475Z https://docs.axolotl.ai/docs/api/core.builders.causal.html - 2025-07-17T19:36:14.627Z + 2025-07-19T17:57:59.741Z https://docs.axolotl.ai/docs/api/cli.evaluate.html - 2025-07-17T19:36:14.732Z + 2025-07-19T17:57:59.846Z https://docs.axolotl.ai/docs/api/monkeypatch.trainer_fsdp_optim.html - 2025-07-17T19:36:15.415Z + 2025-07-19T17:58:00.532Z https://docs.axolotl.ai/docs/api/core.trainers.utils.html - 2025-07-17T19:36:14.944Z + 2025-07-19T17:58:00.057Z https://docs.axolotl.ai/docs/api/utils.schemas.integrations.html - 2025-07-17T19:36:15.659Z + 2025-07-19T17:58:00.776Z https://docs.axolotl.ai/docs/api/utils.dict.html - 2025-07-17T19:36:15.551Z + 2025-07-19T17:58:00.667Z https://docs.axolotl.ai/docs/api/core.builders.rl.html - 2025-07-17T19:36:14.632Z + 2025-07-19T17:57:59.745Z https://docs.axolotl.ai/docs/api/prompt_strategies.orpo.chat_template.html - 2025-07-17T19:36:15.200Z + 2025-07-19T17:58:00.315Z https://docs.axolotl.ai/docs/api/core.trainers.relora.html - 2025-07-17T19:36:14.913Z + 2025-07-19T17:58:00.026Z https://docs.axolotl.ai/docs/api/integrations.spectrum.args.html - 2025-07-17T19:36:15.831Z + 2025-07-19T17:58:00.949Z https://docs.axolotl.ai/docs/api/cli.quantize.html - 2025-07-17T19:36:14.878Z + 2025-07-19T17:57:59.991Z https://docs.axolotl.ai/docs/api/cli.checks.html - 2025-07-17T19:36:14.758Z + 2025-07-19T17:57:59.872Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.llama3.html - 2025-07-17T19:36:15.170Z + 2025-07-19T17:58:00.285Z https://docs.axolotl.ai/docs/api/utils.model_shard_quant.html - 2025-07-17T19:36:15.474Z + 2025-07-19T17:58:00.591Z https://docs.axolotl.ai/docs/api/utils.quantization.html - 2025-07-17T19:36:15.587Z + 2025-07-19T17:58:00.703Z https://docs.axolotl.ai/docs/api/core.trainers.mixins.rng_state_loader.html - 2025-07-17T19:36:14.987Z + 2025-07-19T17:58:00.100Z https://docs.axolotl.ai/docs/api/kernels.geglu.html - 2025-07-17T19:36:15.297Z + 2025-07-19T17:58:00.413Z https://docs.axolotl.ai/docs/api/utils.data.pretraining.html - 2025-07-17T19:36:15.560Z + 2025-07-19T17:58:00.676Z https://docs.axolotl.ai/docs/api/prompt_strategies.kto.user_defined.html - 2025-07-17T19:36:15.180Z + 2025-07-19T17:58:00.294Z https://docs.axolotl.ai/docs/api/core.builders.base.html - 2025-07-17T19:36:14.623Z + 2025-07-19T17:57:59.736Z https://docs.axolotl.ai/docs/api/cli.merge_lora.html - 2025-07-17T19:36:14.798Z + 2025-07-19T17:57:59.912Z https://docs.axolotl.ai/docs/api/monkeypatch.mixtral.html - 2025-07-17T19:36:15.426Z + 2025-07-19T17:58:00.543Z https://docs.axolotl.ai/docs/api/utils.data.sft.html - 2025-07-17T19:36:15.566Z + 2025-07-19T17:58:00.683Z https://docs.axolotl.ai/docs/api/prompt_strategies.user_defined.html - 2025-07-17T19:36:15.086Z + 2025-07-19T17:58:00.199Z https://docs.axolotl.ai/docs/api/utils.tokenization.html - 2025-07-17T19:36:15.462Z + 2025-07-19T17:58:00.579Z https://docs.axolotl.ai/docs/api/prompt_strategies.dpo.chatml.html - 2025-07-17T19:36:15.158Z + 2025-07-19T17:58:00.272Z https://docs.axolotl.ai/docs/api/models.mamba.modeling_mamba.html - 2025-07-17T19:36:15.850Z + 2025-07-19T17:58:00.968Z https://docs.axolotl.ai/docs/api/cli.args.html - 2025-07-17T19:36:14.752Z + 2025-07-19T17:57:59.866Z https://docs.axolotl.ai/docs/api/evaluate.html - 2025-07-17T19:36:14.542Z + 2025-07-19T17:57:59.655Z https://docs.axolotl.ai/docs/api/prompt_strategies.alpaca_instruct.html - 2025-07-17T19:36:15.066Z + 2025-07-19T17:58:00.179Z https://docs.axolotl.ai/docs/api/utils.distributed.html - 2025-07-17T19:36:15.547Z + 2025-07-19T17:58:00.664Z https://docs.axolotl.ai/docs/multipack.html - 2025-07-17T19:33:02.927Z + 2025-07-19T17:54:53.848Z https://docs.axolotl.ai/examples/colab-notebooks/colab-axolotl-example.html - 2025-07-17T19:33:02.931Z + 2025-07-19T17:54:53.852Z https://docs.axolotl.ai/FAQS.html - 2025-07-17T19:33:02.921Z + 2025-07-19T17:54:53.843Z