From 476a205cea4fe73d34811bd7d16a6808af4cf6d7 Mon Sep 17 00:00:00 2001 From: Haoxiang Wang Date: Mon, 4 Dec 2023 02:17:38 -0800 Subject: [PATCH] Remove learning rate scheduler in deepspeed config to avoid conflict (#909) --- deepspeed/zero1.json | 10 ---------- deepspeed/zero2.json | 10 ---------- deepspeed/zero3.json | 10 ---------- 3 files changed, 30 deletions(-) diff --git a/deepspeed/zero1.json b/deepspeed/zero1.json index 85bc58609..c76a20637 100644 --- a/deepspeed/zero1.json +++ b/deepspeed/zero1.json @@ -24,16 +24,6 @@ "weight_decay": "auto" } }, - "scheduler": { - "type": "WarmupDecayLR", - "params": { - "warmup_min_lr": "auto", - "warmup_max_lr": "auto", - "warmup_num_steps": "auto", - "warmup_type": "linear", - "total_num_steps": "auto" - } - }, "gradient_accumulation_steps": "auto", "train_batch_size": "auto", "train_micro_batch_size_per_gpu": "auto", diff --git a/deepspeed/zero2.json b/deepspeed/zero2.json index 18ec4bd0e..3f3baa3ec 100644 --- a/deepspeed/zero2.json +++ b/deepspeed/zero2.json @@ -28,16 +28,6 @@ "weight_decay": "auto" } }, - "scheduler": { - "type": "WarmupDecayLR", - "params": { - "warmup_min_lr": "auto", - "warmup_max_lr": "auto", - "warmup_num_steps": "auto", - "warmup_type": "linear", - "total_num_steps": "auto" - } - }, "gradient_accumulation_steps": "auto", "train_batch_size": "auto", "train_micro_batch_size_per_gpu": "auto", diff --git a/deepspeed/zero3.json b/deepspeed/zero3.json index 99ecbd4bf..cf64e83ac 100644 --- a/deepspeed/zero3.json +++ b/deepspeed/zero3.json @@ -32,16 +32,6 @@ "weight_decay": "auto" } }, - "scheduler": { - "type": "WarmupDecayLR", - "params": { - "warmup_min_lr": "auto", - "warmup_max_lr": "auto", - "warmup_num_steps": "auto", - "warmup_type": "linear", - "total_num_steps": "auto" - } - }, "gradient_accumulation_steps": "auto", "train_batch_size": "auto", "train_micro_batch_size_per_gpu": "auto",