guyhadad01 commited on
Commit
8e989cb
·
verified ·
1 Parent(s): 624aca9

Training in progress, step 55400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1261,6 +1261,10 @@ You can finetune this model on your own dataset.
1261
  | 0.9737 | 55100 | 0.2965 |
1262
  | 0.9745 | 55150 | 0.2382 |
1263
  | 0.9754 | 55200 | 0.3863 |
 
 
 
 
1264
 
1265
 
1266
  ### Framework Versions
 
1261
  | 0.9737 | 55100 | 0.2965 |
1262
  | 0.9745 | 55150 | 0.2382 |
1263
  | 0.9754 | 55200 | 0.3863 |
1264
+ | 0.9763 | 55250 | 0.2909 |
1265
+ | 0.9772 | 55300 | 0.3787 |
1266
+ | 0.9781 | 55350 | 0.3196 |
1267
+ | 0.9790 | 55400 | 0.3738 |
1268
 
1269
 
1270
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84dfa838d5d08ff2f7ba730d306c0960dd6da737376547d2bfca93e1966bc1dd
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7e0a1455740180aedb80f8bb0aec516cb7153da241701244132cb399617a794
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:014ea2c017260d23539bf2018a3aeecb9f09815bf6c03db5f9a232664f2814fd
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3a83cdaa07d04d231b900b829ca00bf94bbd812391baa3af8be0f339dc5c09a
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74c101267c3a81601197ccbb38d2e72ad72f0ccd27fd0e0454beeffecf5ebfa6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c32e0fe828ffd94931d917ede7d98af8f116069bcef2571793c504c5a05f607
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d0369b7df9f4f6057f54d12203a572c70823bfca8ac268e71fe1a019e47a330
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:380ffdc8abce86595967f2c6febf85c303c1ae3d84e66897af982ed22c990884
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7a98fbd51768bffd64a896f3250670354d9f2cc8cf54c04f0d410e34f028552
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67d3a94240ec5e377beed092b82635ec739c5c48243fbb51753d92a8d8f55ac7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9754201198070365,
6
  "eval_steps": 500,
7
- "global_step": 55200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7736,6 +7736,34 @@
7736
  "learning_rate": 1.388152598613811e-06,
7737
  "loss": 0.3863,
7738
  "step": 55200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7739
  }
7740
  ],
7741
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9789542506759026,
6
  "eval_steps": 500,
7
+ "global_step": 55400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7736
  "learning_rate": 1.388152598613811e-06,
7737
  "loss": 0.3863,
7738
  "step": 55200
7739
+ },
7740
+ {
7741
+ "epoch": 0.976303652524253,
7742
+ "grad_norm": 1.0731230974197388,
7743
+ "learning_rate": 1.3390665802752744e-06,
7744
+ "loss": 0.2909,
7745
+ "step": 55250
7746
+ },
7747
+ {
7748
+ "epoch": 0.9771871852414695,
7749
+ "grad_norm": 1.6253186464309692,
7750
+ "learning_rate": 1.289980561936738e-06,
7751
+ "loss": 0.3787,
7752
+ "step": 55300
7753
+ },
7754
+ {
7755
+ "epoch": 0.978070717958686,
7756
+ "grad_norm": 1.9667285680770874,
7757
+ "learning_rate": 1.2408945435982016e-06,
7758
+ "loss": 0.3196,
7759
+ "step": 55350
7760
+ },
7761
+ {
7762
+ "epoch": 0.9789542506759026,
7763
+ "grad_norm": 1.1798194646835327,
7764
+ "learning_rate": 1.191808525259665e-06,
7765
+ "loss": 0.3738,
7766
+ "step": 55400
7767
  }
7768
  ],
7769
  "logging_steps": 50,