From 60e32ff4576d5b0e0dc650d922b8882077b85526 Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Fri, 26 May 2023 11:09:28 +0900 Subject: [PATCH 1/4] Fix shard config --- README.md | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/README.md b/README.md index f79a49a1f..346ee6904 100644 --- a/README.md +++ b/README.md @@ -199,8 +199,7 @@ datasets: # The type of prompt to use for training. [alpaca, sharegpt, gpteacher, oasst, reflection] type: alpaca # format OR format:prompt_style (chat/instruct) data_files: # path to source data files - shards: # true if use subset data. make sure to set `shards` param also -shards: # number of shards to split dataset into + shards: # number of shards to split data into # axolotl attempts to save the dataset as an arrow after packing the data together so # subsequent training attempts load faster, relative path From d7d8bc739e00747d75ea83f48fedd8a29e270e7a Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Fri, 26 May 2023 11:10:59 +0900 Subject: [PATCH 2/4] Add strict yml --- README.md | 3 +++ 1 file changed, 3 insertions(+) diff --git a/README.md b/README.md index 346ee6904..0a593a30d 100644 --- a/README.md +++ b/README.md @@ -325,6 +325,9 @@ debug: # Seed seed: + +# Allow overwriting the yml config from the CLI +strict: ``` From e689069afdaf83045cad721e2b8e0d20dd536296 Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Fri, 26 May 2023 11:12:03 +0900 Subject: [PATCH 3/4] Add xformers error --- README.md | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/README.md b/README.md index 0a593a30d..7acdd2fb1 100644 --- a/README.md +++ b/README.md @@ -384,6 +384,10 @@ Please reduce any below Try set `fp16: true` +> NotImplementedError: No operator found for `memory_efficient_attention_forward` ... + +Try to turn off xformers. + ## Need help? 
🙋‍♂️ Join our [Discord server](https://discord.gg/HhrNrHJPRb) where we can help you From 85326bfbf35339c7a84a9cb576e299b04e5d7ccb Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Fri, 26 May 2023 11:15:57 +0900 Subject: [PATCH 4/4] Update quickstart config --- README.md | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/README.md b/README.md index 7acdd2fb1..a0e036566 100644 --- a/README.md +++ b/README.md @@ -33,12 +33,12 @@ pip3 install -e .[int4] accelerate config -# finetune -accelerate launch scripts/finetune.py examples/4bit-lora-7b/config.yml +# finetune lora +accelerate launch scripts/finetune.py examples/lora-openllama-3b/config.yml # inference -accelerate launch scripts/finetune.py examples/4bit-lora-7b/config.yml \ - --inference --lora_model_dir="./llama-7b-lora-int4" +accelerate launch scripts/finetune.py examples/lora-openllama-3b/config.yml \ + --inference --lora_model_dir="./lora-out" ``` ## Installation