consolidate as peft_model_dir

This commit is contained in:
Wing Lian
2023-09-19 19:02:14 -04:00
parent ba85308720
commit 203369411e
33 changed files with 50 additions and 49 deletions

View File

@@ -18,7 +18,7 @@ dataset_prepared_path: last_prepared_run
val_set_size: 0.01
adapter:
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len:
sample_packing: false

View File

@@ -10,7 +10,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.01
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len: 2048
lora_r: 16

View File

@@ -20,7 +20,7 @@ sample_packing: true
pad_to_sequence_len: true
adapter: lora
lora_model_dir:
peft_model_dir:
lora_r: 32
lora_alpha: 16
lora_dropout: 0.05

View File

@@ -16,7 +16,7 @@ val_set_size: 0.01
output_dir: ./qlora-out
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 4096
sample_packing: true

View File

@@ -20,7 +20,7 @@ sample_packing: true
pad_to_sequence_len: true
adapter: lora
lora_model_dir:
peft_model_dir:
lora_r: 32
lora_alpha: 16
lora_dropout: 0.05

View File

@@ -16,7 +16,7 @@ val_set_size: 0.01
output_dir: ./qlora-out
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 4096
sample_packing: true

View File

@@ -20,7 +20,7 @@ sample_packing: true
pad_to_sequence_len: true
adapter: lora
lora_model_dir:
peft_model_dir:
lora_r: 32
lora_alpha: 16
lora_dropout: 0.05

View File

@@ -16,7 +16,7 @@ val_set_size: 0.01
output_dir: ./qlora-out
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 4096
sample_packing: true

View File

@@ -15,7 +15,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.01
adapter: lora
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len:
lora_r: 16

View File

@@ -22,7 +22,7 @@ dataset_prepared_path:
val_set_size: 0.01
# enable QLoRA
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len:

View File

@@ -15,7 +15,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.01
adapter:
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len:
lora_r: 64

View File

@@ -10,7 +10,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.01
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len:
lora_r: 8

View File

@@ -9,7 +9,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.02
adapter:
lora_model_dir:
peft_model_dir:
sequence_len: 512
max_packed_sequence_len:
lora_r:

View File

@@ -18,7 +18,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.01
adapter: lora
lora_model_dir:
peft_model_dir:
sequence_len: 4096
sample_packing:
lora_r: 8

View File

@@ -20,7 +20,7 @@ sample_packing: true
pad_to_sequence_len: true
adapter: ia3
ia3_model_dir:
peft_model_dir:
ia3_target_modules:
- k_proj
- v_proj

View File

@@ -20,7 +20,7 @@ sample_packing: true
pad_to_sequence_len: true
adapter: lora
lora_model_dir:
peft_model_dir:
lora_r: 32
lora_alpha: 16
lora_dropout: 0.05

View File

@@ -16,7 +16,7 @@ val_set_size: 0.01
output_dir: ./qlora-out
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 4096
sample_packing: true

View File

@@ -16,7 +16,7 @@ val_set_size: 0.01
output_dir: ./relora-out
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 4096
sample_packing: true

View File

@@ -20,7 +20,7 @@ sequence_len: 4096
sample_packing: true
adapter: lora
lora_model_dir:
peft_model_dir:
lora_r: 32
lora_alpha: 16
lora_dropout: 0.05

View File

@@ -9,7 +9,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.02
adapter:
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len:
lora_r: 8

View File

@@ -12,7 +12,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.02
adapter:
lora_model_dir:
peft_model_dir:
sequence_len: 1024
sample_packing: true
lora_r:

View File

@@ -12,7 +12,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.02
adapter: lora
lora_model_dir:
peft_model_dir:
sequence_len: 1024
sample_packing: true
lora_r: 8

View File

@@ -12,7 +12,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.01
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 1024
sample_packing: true
lora_r: 8

View File

@@ -22,7 +22,7 @@ sample_packing: true
pad_to_sequence_len:
adapter:
lora_model_dir:
peft_model_dir:
lora_r:
lora_alpha:
lora_dropout:

View File

@@ -22,7 +22,7 @@ sample_packing: false # not CURRENTLY compatible with LoRAs
pad_to_sequence_len:
adapter: qlora
lora_model_dir:
peft_model_dir:
lora_r: 64
lora_alpha: 32
lora_dropout: 0.05

View File

@@ -13,7 +13,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.05
adapter:
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len: 2048
lora_r: 64

View File

@@ -7,7 +7,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.05
adapter: lora
lora_model_dir:
peft_model_dir:
sequence_len: 512
lora_r: 16
lora_alpha: 32

View File

@@ -10,7 +10,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.02
adapter:
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len:
lora_r: 8

View File

@@ -8,7 +8,7 @@ datasets:
dataset_prepared_path:
val_set_size: 0.05
adapter: lora
lora_model_dir:
peft_model_dir:
sequence_len: 2048
max_packed_sequence_len:
lora_r: 8

View File

@@ -20,7 +20,7 @@ dataset_prepared_path:
val_set_size: 0.01
# enable QLoRA
adapter: qlora
lora_model_dir:
peft_model_dir:
sequence_len: 8192
max_packed_sequence_len: