diff --git a/examples/llama-3/fft-8b.yaml b/examples/llama-3/fft-8b.yaml
index a36fd740e..908ef6e03 100644
--- a/examples/llama-3/fft-8b.yaml
+++ b/examples/llama-3/fft-8b.yaml
@@ -1,4 +1,4 @@
-base_model: meta-llama/Meta-Llama-3-8B
+base_model: NousResearch/Meta-Llama-3-8B
 model_type: LlamaForCausalLM
 tokenizer_type: AutoTokenizer
 
diff --git a/examples/llama-3/lora-8b.yml b/examples/llama-3/lora-8b.yml
index 76418ca3b..a20a529f5 100644
--- a/examples/llama-3/lora-8b.yml
+++ b/examples/llama-3/lora-8b.yml
@@ -1,4 +1,4 @@
-base_model: meta-llama/Meta-Llama-3-8B
+base_model: NousResearch/Meta-Llama-3-8B
 model_type: LlamaForCausalLM
 tokenizer_type: AutoTokenizer
 
diff --git a/examples/llama-3/qlora-fsdp-70b.yaml b/examples/llama-3/qlora-fsdp-70b.yaml
index 9b74f6b4d..7c9480ba0 100644
--- a/examples/llama-3/qlora-fsdp-70b.yaml
+++ b/examples/llama-3/qlora-fsdp-70b.yaml
@@ -1,4 +1,4 @@
-base_model: casperhansen/llama-3-70b-fp16
+base_model: NousResearch/Meta-Llama-3-70B
 model_type: LlamaForCausalLM
 tokenizer_type: AutoTokenizer # PreTrainedTokenizerFast
 
diff --git a/examples/llama-3/qlora.yml b/examples/llama-3/qlora.yml
index 44120d938..858a2fcfe 100644
--- a/examples/llama-3/qlora.yml
+++ b/examples/llama-3/qlora.yml
@@ -1,4 +1,4 @@
-base_model: meta-llama/Meta-Llama-3-8B
+base_model: NousResearch/Meta-Llama-3-8B
 model_type: AutoModelForCausalLM
 tokenizer_type: AutoTokenizer
 
@@ -7,7 +7,7 @@ load_in_4bit: true
 strict: false
 
 datasets:
-  - path: aaditya/alpaca_subset_1
+  - path: tatsu-lab/alpaca
     type: alpaca
 dataset_prepared_path:
 val_set_size: 0