George-API committed on
Commit
0a1769d
·
verified ·
1 Parent(s): d625213

Upload transformers_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. transformers_config.json +45 -0
transformers_config.json CHANGED
@@ -70,5 +70,50 @@
70
  "pre_tokenized": true,
71
  "input_ids_field": "input_ids",
72
  "skip_tokenization": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
73
  }
74
  }
 
70
  "pre_tokenized": true,
71
  "input_ids_field": "input_ids",
72
  "skip_tokenization": true
73
+ },
74
+ "deepspeed_config": {
75
+ "zero_optimization": {
76
+ "stage": 2,
77
+ "offload_optimizer": {
78
+ "device": "cpu",
79
+ "pin_memory": true
80
+ },
81
+ "contiguous_gradients": true,
82
+ "overlap_comm": true,
83
+ "reduce_scatter": true,
84
+ "reduce_bucket_size": 5e8,
85
+ "allgather_bucket_size": 5e8
86
+ },
87
+ "gradient_accumulation_steps": 4,
88
+ "gradient_clipping": 0.3,
89
+ "fp16": {
90
+ "enabled": true,
91
+ "loss_scale": 0,
92
+ "loss_scale_window": 1000,
93
+ "initial_scale_power": 16,
94
+ "hysteresis": 2,
95
+ "min_loss_scale": 1
96
+ },
97
+ "optimizer": {
98
+ "type": "AdamW",
99
+ "params": {
100
+ "lr": 2e-5,
101
+ "betas": [0.9, 0.999],
102
+ "eps": 1e-8,
103
+ "weight_decay": 0.01
104
+ }
105
+ },
106
+ "activation_checkpointing": {
107
+ "partition_activations": true,
108
+ "cpu_checkpointing": true,
109
+ "contiguous_memory_optimization": true,
110
+ "number_checkpoints": null,
111
+ "synchronize_checkpoint_boundary": false,
112
+ "profile": false
113
+ },
114
+ "steps_per_print": 10,
115
+ "train_batch_size": "auto",
116
+ "train_micro_batch_size_per_gpu": "auto",
117
+ "wall_clock_breakdown": false
118
  }
119
  }