Spaces:

Dovakiins
/

qwerrwe

Build error

Teknium committed on Oct 28, 2023

Commit

d3193be

unverified ·

1 Parent(s): 2e71ff0

Fix Deepspeed Zero3 Config (#791)

* Update zero3.json

Remove CPU offload by default (it slows things down horribly; you are better off reducing the batch size), and change the LR scheduler to a properly decaying one

* Update zero3.json

fix something

Files changed (1) hide show

deepspeed/zero3.json +3 -10

deepspeed/zero3.json CHANGED Viewed

@@ -1,14 +1,6 @@
 {
   "zero_optimization": {
     "stage": 3,
-    "offload_optimizer": {
-      "device": "cpu",
-      "pin_memory": true
-    },
-    "offload_param": {
-      "device": "cpu",
-      "pin_memory": true
-    },
     "overlap_comm": true,
     "contiguous_gradients": true,
     "sub_group_size": 0,
@@ -41,12 +33,13 @@
     }
   },
   "scheduler": {
-    "type": "WarmupLR",
     "params": {
       "warmup_min_lr": "auto",
       "warmup_max_lr": "auto",
       "warmup_num_steps": "auto",
-      "warmup_type": "linear"
     }
   },
   "gradient_accumulation_steps": "auto",

 {
   "zero_optimization": {
     "stage": 3,
     "overlap_comm": true,
     "contiguous_gradients": true,
     "sub_group_size": 0,
     }
   },
   "scheduler": {
+    "type": "WarmupDecayLR",
     "params": {
       "warmup_min_lr": "auto",
       "warmup_max_lr": "auto",
       "warmup_num_steps": "auto",
+      "warmup_type": "linear",
+      "total_num_steps": "auto"
     }
   },
   "gradient_accumulation_steps": "auto",