guyhadad01 committed on
Commit
a36bb8e
·
verified ·
1 Parent(s): 5eddccc

Training in progress, step 54200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1237,6 +1237,10 @@ You can finetune this model on your own dataset.
1237
  | 0.9524 | 53900 | 0.2253 |
1238
  | 0.9533 | 53950 | 0.2942 |
1239
  | 0.9542 | 54000 | 0.2997 |
 
 
 
 
1240
 
1241
 
1242
  ### Framework Versions
 
1237
  | 0.9524 | 53900 | 0.2253 |
1238
  | 0.9533 | 53950 | 0.2942 |
1239
  | 0.9542 | 54000 | 0.2997 |
1240
+ | 0.9551 | 54050 | 0.3954 |
1241
+ | 0.9560 | 54100 | 0.3496 |
1242
+ | 0.9569 | 54150 | 0.2609 |
1243
+ | 0.9577 | 54200 | 0.3942 |
1244
 
1245
 
1246
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d367b7e3094b9509638dc3aab8cd20aa7d72d8a2079791ccc62c560157ab98a0
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23c626c07a484cf440299aeab5250215215dc9a9504ba76a2c4d8cbb2ee9f703
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebfbc0071777229c33761182ed33d399969ad60e886668928a56deda972d74c1
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31a1ca22d51c4852d7b597cdc6df536f10b0a83016c09217dd4a746f81603dfe
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b32f599e36a2e355058567f81a1cf5fcee6ab44b38d16fa4944caffd04dfbb3
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f12eb5ebd31ffd5667160725a966706229b611b4915c7e9e0942936f7af1fe3f
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8db4dd2df84f2b4b00fc6674bde1c97fccefdb7d0ae1f644ab8647d522122a7c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecc3972897ec297e0f8185ac88e544940af5d6dbb43a2cbce3b08ddf982f52c7
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f315466204b131c92fd6cdb19db01462071017aa8244ad37245b5ffab5418efa
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c74d3b4e96c259643bb77262d75e1f23a0f31a3e975d23f8db0d5e5def888ead
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.95421533459384,
6
  "eval_steps": 500,
7
- "global_step": 54000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7568,6 +7568,34 @@
7568
  "learning_rate": 2.5652353183719152e-06,
7569
  "loss": 0.2997,
7570
  "step": 54000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7571
  }
7572
  ],
7573
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9577494654627061,
6
  "eval_steps": 500,
7
+ "global_step": 54200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7568
  "learning_rate": 2.5652353183719152e-06,
7569
  "loss": 0.2997,
7570
  "step": 54000
7571
+ },
7572
+ {
7573
+ "epoch": 0.9550988673110565,
7574
+ "grad_norm": 1.0720359086990356,
7575
+ "learning_rate": 2.5161493000333786e-06,
7576
+ "loss": 0.3954,
7577
+ "step": 54050
7578
+ },
7579
+ {
7580
+ "epoch": 0.9559824000282731,
7581
+ "grad_norm": 1.608279824256897,
7582
+ "learning_rate": 2.467063281694842e-06,
7583
+ "loss": 0.3496,
7584
+ "step": 54100
7585
+ },
7586
+ {
7587
+ "epoch": 0.9568659327454896,
7588
+ "grad_norm": 1.2330106496810913,
7589
+ "learning_rate": 2.4179772633563054e-06,
7590
+ "loss": 0.2609,
7591
+ "step": 54150
7592
+ },
7593
+ {
7594
+ "epoch": 0.9577494654627061,
7595
+ "grad_norm": 1.4279929399490356,
7596
+ "learning_rate": 2.3688912450177693e-06,
7597
+ "loss": 0.3942,
7598
+ "step": 54200
7599
  }
7600
  ],
7601
  "logging_steps": 50,