# Patch: renames examples/llama-3/fft-1b-fsdp.yml to fft-8b-fsdp.yml, switching
# base_model to meta-llama/Llama-3.1-8B-Instruct and sequence_len to 8192.
# NOTE(review): this patch had been flattened onto a single line. The positions
# of the blank context lines below are inferred from the hunk line counts
# (-1,4 / -9,7) -- confirm with `git apply --check` before relying on it.
diff --git a/examples/llama-3/fft-1b-fsdp.yml b/examples/llama-3/fft-8b-fsdp.yml
similarity index 90%
rename from examples/llama-3/fft-1b-fsdp.yml
rename to examples/llama-3/fft-8b-fsdp.yml
index 84b4db48f..8efe1eb3d 100644
--- a/examples/llama-3/fft-1b-fsdp.yml
+++ b/examples/llama-3/fft-8b-fsdp.yml
@@ -1,4 +1,4 @@
-base_model: meta-llama/Llama-3.2-1B
+base_model: meta-llama/Llama-3.1-8B-Instruct
 
 save_safetensors: true
 
@@ -9,7 +9,7 @@ datasets:
 dataset_prepared_path: ./last_run_prepared
 output_dir: ./outputs/fft-out
 
-sequence_len: 2048
+sequence_len: 8192
 
 gradient_accumulation_steps: 1
 micro_batch_size: 1