set env var for FSDP layer to wrap (#453)
This commit is contained in:
@@ -377,6 +377,10 @@ def setup_fsdp_envs(cfg):
         os.environ["FSDP_SYNC_MODULE_STATES"] = "true"
     if cfg.fsdp_config.fsdp_state_dict_type:
         os.environ["FSDP_STATE_DICT_TYPE"] = cfg.fsdp_config.fsdp_state_dict_type
+    if cfg.fsdp_config.fsdp_transformer_layer_cls_to_wrap:
+        os.environ[
+            "FSDP_TRANSFORMER_CLS_TO_WRAP"
+        ] = cfg.fsdp_config.fsdp_transformer_layer_cls_to_wrap
 
 
 def setup_trainer(cfg, train_dataset, eval_dataset, model, tokenizer, total_num_steps):
Reference in New Issue
Block a user