From 4dbef0941f27ee5d8f95651daa8de2967c4b3623 Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Sun, 30 Apr 2023 04:24:58 -0400 Subject: [PATCH] update ds_config --- ds_config.json | 19 +++++++++++++++++++ 1 file changed, 19 insertions(+) diff --git a/ds_config.json b/ds_config.json index ffd6f2075..49de5f874 100644 --- a/ds_config.json +++ b/ds_config.json @@ -10,6 +10,15 @@ "hysteresis": 2, "min_loss_scale": 1 }, + "optimizer": { + "type": "Adam", + "params": { + "lr": "auto", + "betas": "auto", + "eps": "auto", + "weight_decay": "auto" + } + }, "scheduler": { "type": "OneCycle", "params": { @@ -19,12 +28,22 @@ }, "zero_optimization": { "stage": 2, + "offload_optimizer": { + "device": "cpu", + "pin_memory": true + }, + "offload_param": { + "device": "cpu", + "pin_memory": true + }, "overlap_comm": true, "allgather_partitions": true, "allgather_bucket_size": 5e8, "contiguous_gradients": true, "reduce_bucket_size": "auto", "reduce_scatter": true, + "stage3_max_live_parameters": 0, + "stage3_max_reuse_distance": 0, "stage3_gather_16bit_weights_on_model_save": true }, "gradient_accumulation_steps": "auto",