From 631268a0caa18250a30a1c837c4d7f4d9505adc0 Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Tue, 22 Jul 2025 20:59:47 +0700 Subject: [PATCH] revert renaming of deepspeed stage3 args that use auto (#2964) [skip ci] MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * Revert "fix deprecate deepspeed stage3_gather_16bit_weights_on_model_save arg…" This reverts commit e207762928fe066df2c9d2149e9f897fe2f8025f. * don't revert the values that don't use 'auto' --------- Co-authored-by: Wing Lian --- deepspeed_configs/zero3.json | 4 ++-- deepspeed_configs/zero3_bf16.json | 4 ++-- deepspeed_configs/zero3_bf16_cpuoffload_all.json | 4 ++-- deepspeed_configs/zero3_bf16_cpuoffload_params.json | 4 ++-- 4 files changed, 8 insertions(+), 8 deletions(-) diff --git a/deepspeed_configs/zero3.json b/deepspeed_configs/zero3.json index a648cbe81..f8c9cdfe0 100644 --- a/deepspeed_configs/zero3.json +++ b/deepspeed_configs/zero3.json @@ -5,8 +5,8 @@ "contiguous_gradients": true, "sub_group_size": 0, "reduce_bucket_size": "auto", - "prefetch_bucket_size": "auto", - "param_persistence_threshold": "auto", + "stage3_prefetch_bucket_size": "auto", + "stage3_param_persistence_threshold": "auto", "max_live_parameters": 0, "max_reuse_distance": 0, "gather_16bit_weights_on_model_save": true diff --git a/deepspeed_configs/zero3_bf16.json b/deepspeed_configs/zero3_bf16.json index 4d31a1531..a69e13cf7 100644 --- a/deepspeed_configs/zero3_bf16.json +++ b/deepspeed_configs/zero3_bf16.json @@ -5,8 +5,8 @@ "contiguous_gradients": true, "sub_group_size": 0, "reduce_bucket_size": "auto", - "prefetch_bucket_size": "auto", - "param_persistence_threshold": "auto", + "stage3_prefetch_bucket_size": "auto", + "stage3_param_persistence_threshold": "auto", "max_live_parameters": 0, "max_reuse_distance": 0, "gather_16bit_weights_on_model_save": true diff --git a/deepspeed_configs/zero3_bf16_cpuoffload_all.json b/deepspeed_configs/zero3_bf16_cpuoffload_all.json index 52fe9cdd4..5112c570b 100644 --- a/deepspeed_configs/zero3_bf16_cpuoffload_all.json +++ b/deepspeed_configs/zero3_bf16_cpuoffload_all.json @@ -15,8 +15,8 @@ "contiguous_gradients": true, "sub_group_size": 0, "reduce_bucket_size": "auto", - "prefetch_bucket_size": "auto", - "param_persistence_threshold": "auto", + "stage3_prefetch_bucket_size": "auto", + "stage3_param_persistence_threshold": "auto", "max_live_parameters": 0, "max_reuse_distance": 0, "gather_16bit_weights_on_model_save": true diff --git a/deepspeed_configs/zero3_bf16_cpuoffload_params.json b/deepspeed_configs/zero3_bf16_cpuoffload_params.json index 81ac1d1d8..a2ac82341 100644 --- a/deepspeed_configs/zero3_bf16_cpuoffload_params.json +++ b/deepspeed_configs/zero3_bf16_cpuoffload_params.json @@ -11,8 +11,8 @@ "contiguous_gradients": true, "sub_group_size": 0, "reduce_bucket_size": "auto", - "prefetch_bucket_size": "auto", - "param_persistence_threshold": "auto", + "stage3_prefetch_bucket_size": "auto", + "stage3_param_persistence_threshold": "auto", "max_live_parameters": 0, "max_reuse_distance": 0, "gather_16bit_weights_on_model_save": true