fix(example): align example to correct adapter (#2478)

* fix(example): align example to correct adapter

* fix: add missing load in 4 bit
This commit is contained in:
NanoCode012
2025-04-03 19:48:14 +07:00
committed by GitHub
parent 5249e98058
commit 64d8035f50
2 changed files with 5 additions and 1 deletions

View File

@@ -1,6 +1,8 @@
base_model: google/gemma-3-4b-it
strict: false
+load_in_4bit: true
# gemma3 doesn't seem to play nice with ddp
ddp_find_unused_parameters: true
@@ -17,7 +19,7 @@ dataset_prepared_path: last_run_prepared
val_set_size: 0.01
output_dir: ./outputs/out
-adapter: lora
+adapter: qlora
lora_model_dir:
sequence_len: 2048

View File

@@ -2,6 +2,8 @@ base_model: google/gemma-3-4b-it
processor_type: AutoProcessor
strict: false
+load_in_4bit: true
# these 3 lines are needed for now to handle vision chat templates w images
skip_prepare_dataset: true
remove_unused_columns: false