add llama 7b config and fix lora_fan_in_fan_out for llama (copy-paste bug)

2023-04-15 14:26:52 -04:00
parent d33a975747
commit d060c803ce
2 changed files with 42 additions and 1 deletions
--- a/configs/llama_65B_alpaca.yml
+++ b/configs/llama_65B_alpaca.yml
@@ -22,7 +22,7 @@ lora_dropout: 0.05
 lora_target_modules:
  - q_proj
  - w_proj
-lora_fan_in_fan_out: true  # pythia/GPTNeoX lora specific
+lora_fan_in_fan_out: false
 wandb_project: llama-65b-lora
 wandb_watch:
 wandb_run_id:
--- a/configs/llama_7B_alpaca.yml
+++ b/configs/llama_7B_alpaca.yml
@@ -0,0 +1,41 @@
+base_model: huggyllama/llama-7b
+model_type: LlamaForCausalLM
+tokenizer_type: LlamaTokenizer
+load_in_8bit: true
+datasets:
+  - path: data/alpaca_data_gpt4.jsonl
+    type: alpaca
+  - path: data/vicuna_cleaned.jsonl
+    type: sharegpt
+  - path: data/gpt4-instruct-similarity-0.6-dataset.jsonl
+    type: gpteacher
+  - path: data/roleplay-similarity_0.6-instruct-dataset.jsonl
+    type: gpteacher
+dataset_prepared_path: data/last_run
+val_set_size: 0.04
+adapter: lora
+lora_model_dir:
+sequence_len: 2048
+lora_r: 8
+lora_alpha: 16
+lora_dropout: 0.05
+lora_target_modules:
+  - q_proj
+  - v_proj  # LLaMA attention exposes q/k/v/o_proj; there is no w_proj module
+lora_fan_in_fan_out: false  # true is pythia/GPTNeoX specific
+wandb_project: llama-7b-lora
+wandb_watch:
+wandb_run_id:
+wandb_log_model: checkpoint
+output_dir: ./lora-llama-alpaca
+batch_size: 128
+micro_batch_size: 16
+num_epochs: 5
+learning_rate: 0.00003
+train_on_inputs: false
+group_by_length: false
+bf16: true
+tf32: true
+resume_from_checkpoint:
+local_rank:
+deepspeed: