guyhadad01 committed on
Commit
a1cefc8
·
verified ·
1 Parent(s): a3fecd9

Training in progress, step 55000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1253,6 +1253,10 @@ You can finetune this model on your own dataset.
1253
  | 0.9666 | 54700 | 0.2484 |
1254
  | 0.9675 | 54750 | 0.3228 |
1255
  | 0.9684 | 54800 | 0.2935 |
 
 
 
 
1256
 
1257
 
1258
  ### Framework Versions
 
1253
  | 0.9666 | 54700 | 0.2484 |
1254
  | 0.9675 | 54750 | 0.3228 |
1255
  | 0.9684 | 54800 | 0.2935 |
1256
+ | 0.9692 | 54850 | 0.3085 |
1257
+ | 0.9701 | 54900 | 0.3112 |
1258
+ | 0.9710 | 54950 | 0.2889 |
1259
+ | 0.9719 | 55000 | 0.2746 |
1260
 
1261
 
1262
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4660d5cc04b8230e366c2507b6edc6eb9740e5655f078f06d7fa8b708868348d
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7de782f93f57348bf850bc04f35cc7f6059cfdc1487661cd5cf4f11ce0e636f
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7ddc79258480305b86c7de987bf66efad05525fb132f3c4537096562844858a
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dc1a5e4533471281ab4208b72f4dd16330451bdcbc3512cd1466d1a94c0279b
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe80331ddc64a10f3922d2d2aa6e1345a324e582ebfcde4acd33dd3c01a97f23
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:035838ab30ab4d07fb2aaaa81eb5cd5230f5b5f92e211ace87a3143ca1c3c17c
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a394d9ef4969559c2e748a44250c8baede91e41491cb79bd3a87fcd799d229f
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d88e34fed71326e402519391fc702de0ba4ca1011f3b15e76161c4e72df1f1c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:175e278f8a42116e02058ec0c5ec6fdf92f24c652abe7967b071b8b6350190f1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73e5c254a90680845431aa779809105481c9b9fb095d05b8d7eb9127bf1f4c4d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9683518580693043,
6
  "eval_steps": 500,
7
- "global_step": 54800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7680,6 +7680,34 @@
7680
  "learning_rate": 1.779859024955332e-06,
7681
  "loss": 0.2935,
7682
  "step": 54800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7683
  }
7684
  ],
7685
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9718859889381704,
6
  "eval_steps": 500,
7
+ "global_step": 55000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7680
  "learning_rate": 1.779859024955332e-06,
7681
  "loss": 0.2935,
7682
  "step": 54800
7683
+ },
7684
+ {
7685
+ "epoch": 0.9692353907865209,
7686
+ "grad_norm": 1.5993742942810059,
7687
+ "learning_rate": 1.7307730066167953e-06,
7688
+ "loss": 0.3085,
7689
+ "step": 54850
7690
+ },
7691
+ {
7692
+ "epoch": 0.9701189235037373,
7693
+ "grad_norm": 4.223308086395264,
7694
+ "learning_rate": 1.681686988278259e-06,
7695
+ "loss": 0.3112,
7696
+ "step": 54900
7697
+ },
7698
+ {
7699
+ "epoch": 0.9710024562209538,
7700
+ "grad_norm": 1.7939913272857666,
7701
+ "learning_rate": 1.6326009699397223e-06,
7702
+ "loss": 0.2889,
7703
+ "step": 54950
7704
+ },
7705
+ {
7706
+ "epoch": 0.9718859889381704,
7707
+ "grad_norm": 1.1405465602874756,
7708
+ "learning_rate": 1.583514951601186e-06,
7709
+ "loss": 0.2746,
7710
+ "step": 55000
7711
  }
7712
  ],
7713
  "logging_steps": 50,