address PR feedback

This commit is contained in:
Wing Lian
2023-06-10 14:21:43 -04:00
parent eea2731a5e
commit 0c6f928601
5 changed files with 9 additions and 8 deletions

View File

@@ -1,4 +1,4 @@
# Python 12B
# Pythia 12B
- Single-GPU A100 only (?)

View File

@@ -22,7 +22,7 @@ lora_dropout: 0.0
lora_target_modules:
lora_target_linear: true
lora_fan_in_fan_out: true # pythia/GPTNeoX lora specific
wandb_project: pythia-12b
wandb_project:
wandb_watch:
wandb_run_id:
wandb_log_model:
@@ -45,5 +45,5 @@ resume_from_checkpoint:
local_rank:
gradient_checkpointing: true
fsdp:
fsdp_transformer_layer_cls_to_wrap:
fsdp_config:
collator_pad_to_longest: true