guyhadad01 commited on
Commit
47417d4
·
verified ·
1 Parent(s): 5d26d8d

Training in progress, step 53400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1221,6 +1221,10 @@ You can finetune this model on your own dataset.
1221
  | 0.9383 | 53100 | 0.2066 |
1222
  | 0.9392 | 53150 | 0.2957 |
1223
  | 0.9401 | 53200 | 0.3931 |
 
 
 
 
1224
 
1225
 
1226
  ### Framework Versions
 
1221
  | 0.9383 | 53100 | 0.2066 |
1222
  | 0.9392 | 53150 | 0.2957 |
1223
  | 0.9401 | 53200 | 0.3931 |
1224
+ | 0.9410 | 53250 | 0.3384 |
1225
+ | 0.9418 | 53300 | 0.234 |
1226
+ | 0.9427 | 53350 | 0.2244 |
1227
+ | 0.9436 | 53400 | 0.2736 |
1228
 
1229
 
1230
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2487922e51e359a9f1ecb6a445d3e636440e65c32739f52f813e51dba1e67cff
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39c1a96a93254cf31ffb70f6814ad348fc844266fcb793b7212c9e8b11daf19d
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb6a3019423076f9d2bcde60bdb5789ba741f63b281497780b4c7a5a01452766
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1b5b98b6da8546e8a7a2cc62e31dd4b93cce07de3e6e6f9ce4ce52ad9cdab9b
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:703c575158d027ee9439c8f4b7cba9394179cb8e338f46e41a82b465fd641366
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca41761b8d788c104936e19f7e170bfd0a6d6a882f10f2b6319094786889629a
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d78afd0a4dfa1ad614feedb884bc52a6d0ef53d711277b9eb7759daf275b74c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afe990ada4836e3b8da06b332bb1effcb8ba00456aa80c3ca264f6cde84a1b18
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c6628a730df5612a115afdb07517d1848beb0c28c4d9cd90e5531c3a4536e32
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b096fb0b9d4b123e0ea98d85fa01bcdb3622620e30def8e03e9a27f4fc9f25b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9400788111183758,
6
  "eval_steps": 500,
7
- "global_step": 53200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7456,6 +7456,34 @@
7456
  "learning_rate": 3.3506116117884983e-06,
7457
  "loss": 0.3931,
7458
  "step": 53200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7459
  }
7460
  ],
7461
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9436129419872418,
6
  "eval_steps": 500,
7
+ "global_step": 53400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7456
  "learning_rate": 3.3506116117884983e-06,
7457
  "loss": 0.3931,
7458
  "step": 53200
7459
+ },
7460
+ {
7461
+ "epoch": 0.9409623438355922,
7462
+ "grad_norm": 1.065996766090393,
7463
+ "learning_rate": 3.3015255934499617e-06,
7464
+ "loss": 0.3384,
7465
+ "step": 53250
7466
+ },
7467
+ {
7468
+ "epoch": 0.9418458765528087,
7469
+ "grad_norm": 1.57516610622406,
7470
+ "learning_rate": 3.252439575111425e-06,
7471
+ "loss": 0.234,
7472
+ "step": 53300
7473
+ },
7474
+ {
7475
+ "epoch": 0.9427294092700252,
7476
+ "grad_norm": 1.2013062238693237,
7477
+ "learning_rate": 3.203353556772889e-06,
7478
+ "loss": 0.2244,
7479
+ "step": 53350
7480
+ },
7481
+ {
7482
+ "epoch": 0.9436129419872418,
7483
+ "grad_norm": 1.448370099067688,
7484
+ "learning_rate": 3.1542675384343524e-06,
7485
+ "loss": 0.2736,
7486
+ "step": 53400
7487
  }
7488
  ],
7489
  "logging_steps": 50,