diff --git a/deepspeed_configs/zero3.json b/deepspeed_configs/zero3.json index a648cbe81..f8c9cdfe0 100644 --- a/deepspeed_configs/zero3.json +++ b/deepspeed_configs/zero3.json @@ -5,8 +5,8 @@ "contiguous_gradients": true, "sub_group_size": 0, "reduce_bucket_size": "auto", - "prefetch_bucket_size": "auto", - "param_persistence_threshold": "auto", + "stage3_prefetch_bucket_size": "auto", + "stage3_param_persistence_threshold": "auto", "max_live_parameters": 0, "max_reuse_distance": 0, "gather_16bit_weights_on_model_save": true diff --git a/deepspeed_configs/zero3_bf16.json b/deepspeed_configs/zero3_bf16.json index 4d31a1531..a69e13cf7 100644 --- a/deepspeed_configs/zero3_bf16.json +++ b/deepspeed_configs/zero3_bf16.json @@ -5,8 +5,8 @@ "contiguous_gradients": true, "sub_group_size": 0, "reduce_bucket_size": "auto", - "prefetch_bucket_size": "auto", - "param_persistence_threshold": "auto", + "stage3_prefetch_bucket_size": "auto", + "stage3_param_persistence_threshold": "auto", "max_live_parameters": 0, "max_reuse_distance": 0, "gather_16bit_weights_on_model_save": true diff --git a/deepspeed_configs/zero3_bf16_cpuoffload_all.json b/deepspeed_configs/zero3_bf16_cpuoffload_all.json index 52fe9cdd4..5112c570b 100644 --- a/deepspeed_configs/zero3_bf16_cpuoffload_all.json +++ b/deepspeed_configs/zero3_bf16_cpuoffload_all.json @@ -15,8 +15,8 @@ "contiguous_gradients": true, "sub_group_size": 0, "reduce_bucket_size": "auto", - "prefetch_bucket_size": "auto", - "param_persistence_threshold": "auto", + "stage3_prefetch_bucket_size": "auto", + "stage3_param_persistence_threshold": "auto", "max_live_parameters": 0, "max_reuse_distance": 0, "gather_16bit_weights_on_model_save": true diff --git a/deepspeed_configs/zero3_bf16_cpuoffload_params.json b/deepspeed_configs/zero3_bf16_cpuoffload_params.json index 81ac1d1d8..a2ac82341 100644 --- a/deepspeed_configs/zero3_bf16_cpuoffload_params.json +++ b/deepspeed_configs/zero3_bf16_cpuoffload_params.json @@ -11,8 +11,8 @@ "contiguous_gradients": true, "sub_group_size": 0, "reduce_bucket_size": "auto", - "prefetch_bucket_size": "auto", - "param_persistence_threshold": "auto", + "stage3_prefetch_bucket_size": "auto", + "stage3_param_persistence_threshold": "auto", "max_live_parameters": 0, "max_reuse_distance": 0, "gather_16bit_weights_on_model_save": true