guyhadad01 committed on
Commit
2a4bb55
·
verified ·
1 Parent(s): 33e79e0

Training in progress, step 52000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1193,6 +1193,10 @@ You can finetune this model on your own dataset.
1193
  | 0.9136 | 51700 | 0.3088 |
1194
  | 0.9145 | 51750 | 0.2287 |
1195
  | 0.9153 | 51800 | 0.2067 |
 
 
 
 
1196
 
1197
 
1198
  ### Framework Versions
 
1193
  | 0.9136 | 51700 | 0.3088 |
1194
  | 0.9145 | 51750 | 0.2287 |
1195
  | 0.9153 | 51800 | 0.2067 |
1196
+ | 0.9162 | 51850 | 0.2735 |
1197
+ | 0.9171 | 51900 | 0.3976 |
1198
+ | 0.9180 | 51950 | 0.2939 |
1199
+ | 0.9189 | 52000 | 0.3193 |
1200
 
1201
 
1202
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8adbf03525b39d3cbba1bbdde2da90cb7be2d698601f862e040d6383edf785e8
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64df739ab78548e5d75f993ab6041c207785adcb30fa9a57cf9234173976387d
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ddba7d83c634a4905db07a12f6761ec90e0847d3c3a75cb805e5a2c45f6f055e
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3798d7d967dd27d94d9da8c3b443a2ae8d98157d0a447c72ba241256385ef3
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed3acf2d762800b6693f2eadfe02d38f79ee54f3a4fcf7d7f00a5e20954d4a73
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bf77e2ef33f60ef48f8a5fc09cb1943760ae6ba4d88634c23d14cfcf6cad117
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e37c94dad9c27aa070c66f020f85050e7628adbe8df381c470c2f01ed333d243
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12597bbc3e3311f727af17ce6725c67e2c62ce8d20a5da4fcf3ead6fc2b4cd3a
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad4fc38cbd3a40df512cafd836390b147d408874f4ecc602c76931ee4bd316f8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69967b924386ed794e36fcb2fe2f94715b55410c1d3076df0af1214b0c14df7b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9153398950363132,
6
  "eval_steps": 500,
7
- "global_step": 51800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7260,6 +7260,34 @@
7260
  "learning_rate": 4.724038404900748e-06,
7261
  "loss": 0.2067,
7262
  "step": 51800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7263
  }
7264
  ],
7265
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9188740259051793,
6
  "eval_steps": 500,
7
+ "global_step": 52000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7260
  "learning_rate": 4.724038404900748e-06,
7261
  "loss": 0.2067,
7262
  "step": 51800
7263
+ },
7264
+ {
7265
+ "epoch": 0.9162234277535297,
7266
+ "grad_norm": 1.1146478652954102,
7267
+ "learning_rate": 4.674952386562212e-06,
7268
+ "loss": 0.2735,
7269
+ "step": 51850
7270
+ },
7271
+ {
7272
+ "epoch": 0.9171069604707462,
7273
+ "grad_norm": 2.2454397678375244,
7274
+ "learning_rate": 4.625866368223675e-06,
7275
+ "loss": 0.3976,
7276
+ "step": 51900
7277
+ },
7278
+ {
7279
+ "epoch": 0.9179904931879628,
7280
+ "grad_norm": 1.902377724647522,
7281
+ "learning_rate": 4.576780349885139e-06,
7282
+ "loss": 0.2939,
7283
+ "step": 51950
7284
+ },
7285
+ {
7286
+ "epoch": 0.9188740259051793,
7287
+ "grad_norm": 4.320808410644531,
7288
+ "learning_rate": 4.527694331546602e-06,
7289
+ "loss": 0.3193,
7290
+ "step": 52000
7291
  }
7292
  ],
7293
  "logging_steps": 50,