diff --git a/.nojekyll b/.nojekyll index 9dcb21eaf..05b0dc2f0 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -aeeb58bf \ No newline at end of file +4e4c1269 \ No newline at end of file diff --git a/docs/dataset-formats/index.html b/docs/dataset-formats/index.html index 9c1a1fbbd..5081bfca0 100644 --- a/docs/dataset-formats/index.html +++ b/docs/dataset-formats/index.html @@ -351,7 +351,7 @@ Description - + Pre-training @@ -359,7 +359,7 @@ Description Data format for a pre-training completion task. - + Instruction Tuning @@ -367,7 +367,7 @@ Description Instruction tuning formats for supervised fine-tuning. - + Conversation @@ -375,7 +375,7 @@ Description Conversation format for supervised fine-tuning. - + Template-Free @@ -383,7 +383,7 @@ Description Construct prompts without a template. - + Custom Pre-Tokenized Dataset diff --git a/examples/llama-2/qlora-fsdp.yml b/examples/llama-2/qlora-fsdp.yml index 30916ed45..93b3b2a60 100644 --- a/examples/llama-2/qlora-fsdp.yml +++ b/examples/llama-2/qlora-fsdp.yml @@ -65,12 +65,14 @@ deepspeed: weight_decay: 0.0 fsdp: - full_shard + - auto_wrap fsdp_config: fsdp_limit_all_gathers: true fsdp_sync_module_states: true fsdp_offload_params: true fsdp_use_orig_params: false fsdp_cpu_ram_efficient_loading: true + fsdp_auto_wrap_policy: TRANSFORMER_BASED_WRAP fsdp_transformer_layer_cls_to_wrap: LlamaDecoderLayer - fsdp_state_dict_type: SHARDED_STATE_DICT + fsdp_state_dict_type: FULL_STATE_DICT special_tokens: diff --git a/sitemap.xml b/sitemap.xml index b29d882a4..a7ad1a5c7 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -2,86 +2,86 @@ https://OpenAccess-AI-Collective.github.io/axolotl/TODO.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/debugging.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/fsdp_qlora.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/faq.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/rlhf.html - 2024-04-09T22:58:50.099Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/nccl.html - 2024-04-09T22:58:50.099Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/dataset-formats/inst_tune.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/dataset-formats/tokenized.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/dataset-formats/pretraining.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/FAQS.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/examples/colab-notebooks/colab-axolotl-example.html - 2024-04-09T22:58:50.099Z + 2024-04-12T13:02:53.470Z https://OpenAccess-AI-Collective.github.io/axolotl/index.html - 2024-04-09T22:58:50.107Z + 2024-04-12T13:02:53.478Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/dataset-formats/conversation.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/dataset-formats/index.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/dataset-formats/template_free.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/multipack.html - 2024-04-09T22:58:50.099Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/multi-node.html - 2024-04-09T22:58:50.099Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/mac.html - 2024-04-09T22:58:50.099Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/input_output.html - 2024-04-09T22:58:50.099Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/config.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z https://OpenAccess-AI-Collective.github.io/axolotl/docs/batch_vs_grad.html - 2024-04-09T22:58:50.095Z + 2024-04-12T13:02:53.466Z