guyhadad01 committed on
Commit
07ce260
·
verified ·
1 Parent(s): b3b9901

Training in progress, step 53600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1225,6 +1225,10 @@ You can finetune this model on your own dataset.
1225
  | 0.9418 | 53300 | 0.234 |
1226
  | 0.9427 | 53350 | 0.2244 |
1227
  | 0.9436 | 53400 | 0.2736 |
 
 
 
 
1228
 
1229
 
1230
  ### Framework Versions
 
1225
  | 0.9418 | 53300 | 0.234 |
1226
  | 0.9427 | 53350 | 0.2244 |
1227
  | 0.9436 | 53400 | 0.2736 |
1228
+ | 0.9445 | 53450 | 0.3088 |
1229
+ | 0.9454 | 53500 | 0.3135 |
1230
+ | 0.9463 | 53550 | 0.2813 |
1231
+ | 0.9471 | 53600 | 0.2333 |
1232
 
1233
 
1234
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39c1a96a93254cf31ffb70f6814ad348fc844266fcb793b7212c9e8b11daf19d
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46322e2fdae84cb4d149624b40324ba603107423e0ed811b11c103af6014e1e4
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1b5b98b6da8546e8a7a2cc62e31dd4b93cce07de3e6e6f9ce4ce52ad9cdab9b
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:068f22c1d711e17dfced7140337b436095f34a8fa926c1703ed0a4e7970380ec
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca41761b8d788c104936e19f7e170bfd0a6d6a882f10f2b6319094786889629a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:738e43c027de9571a26dc41c2c90188ad15bc024b7fa4548c553209c415b7ff9
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afe990ada4836e3b8da06b332bb1effcb8ba00456aa80c3ca264f6cde84a1b18
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41033b29e66c9e9264898026bd8259ffc51d8197a6199f012e6c4fab4d2b8853
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b096fb0b9d4b123e0ea98d85fa01bcdb3622620e30def8e03e9a27f4fc9f25b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:225f37a4049625453028403228c6e91c80694c7d0b9a5b2f9a1f983bafdfc1df
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9436129419872418,
6
  "eval_steps": 500,
7
- "global_step": 53400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7484,6 +7484,34 @@
7484
  "learning_rate": 3.1542675384343524e-06,
7485
  "loss": 0.2736,
7486
  "step": 53400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7487
  }
7488
  ],
7489
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9471470728561079,
6
  "eval_steps": 500,
7
+ "global_step": 53600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7484
  "learning_rate": 3.1542675384343524e-06,
7485
  "loss": 0.2736,
7486
  "step": 53400
7487
+ },
7488
+ {
7489
+ "epoch": 0.9444964747044583,
7490
+ "grad_norm": 1.7333183288574219,
7491
+ "learning_rate": 3.105181520095816e-06,
7492
+ "loss": 0.3088,
7493
+ "step": 53450
7494
+ },
7495
+ {
7496
+ "epoch": 0.9453800074216748,
7497
+ "grad_norm": 1.5718059539794922,
7498
+ "learning_rate": 3.0560955017572796e-06,
7499
+ "loss": 0.3135,
7500
+ "step": 53500
7501
+ },
7502
+ {
7503
+ "epoch": 0.9462635401388914,
7504
+ "grad_norm": 1.3086848258972168,
7505
+ "learning_rate": 3.007009483418743e-06,
7506
+ "loss": 0.2813,
7507
+ "step": 53550
7508
+ },
7509
+ {
7510
+ "epoch": 0.9471470728561079,
7511
+ "grad_norm": 1.3118650913238525,
7512
+ "learning_rate": 2.9579234650802064e-06,
7513
+ "loss": 0.2333,
7514
+ "step": 53600
7515
  }
7516
  ],
7517
  "logging_steps": 50,