fix(example): align example to correct adapter (#2478)
* fix(example): align example to correct adapter
* fix: add missing `load_in_4bit` setting
This commit is contained in:
@@ -1,6 +1,8 @@
|
|||||||
base_model: google/gemma-3-4b-it
|
base_model: google/gemma-3-4b-it
|
||||||
strict: false
|
strict: false
|
||||||
|
|
||||||
|
load_in_4bit: true
|
||||||
|
|
||||||
# gemma3 doesn't seem to play nice with ddp
|
# gemma3 doesn't seem to play nice with ddp
|
||||||
ddp_find_unused_parameters: true
|
ddp_find_unused_parameters: true
|
||||||
|
|
||||||
@@ -17,7 +19,7 @@ dataset_prepared_path: last_run_prepared
|
|||||||
val_set_size: 0.01
|
val_set_size: 0.01
|
||||||
output_dir: ./outputs/out
|
output_dir: ./outputs/out
|
||||||
|
|
||||||
adapter: lora
|
adapter: qlora
|
||||||
lora_model_dir:
|
lora_model_dir:
|
||||||
|
|
||||||
sequence_len: 2048
|
sequence_len: 2048
|
||||||
|
|||||||
@@ -2,6 +2,8 @@ base_model: google/gemma-3-4b-it
|
|||||||
processor_type: AutoProcessor
|
processor_type: AutoProcessor
|
||||||
strict: false
|
strict: false
|
||||||
|
|
||||||
|
load_in_4bit: true
|
||||||
|
|
||||||
# these 3 lines are needed for now to handle vision chat templates w images
|
# these 3 lines are needed for now to handle vision chat templates w images
|
||||||
skip_prepare_dataset: true
|
skip_prepare_dataset: true
|
||||||
remove_unused_columns: false
|
remove_unused_columns: false
|
||||||
|
|||||||
Reference in New Issue
Block a user