guyhadad01 commited on
Commit
c827ebe
·
verified ·
1 Parent(s): 8e989cb

Training in progress, step 55600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1265,6 +1265,10 @@ You can finetune this model on your own dataset.
1265
  | 0.9772 | 55300 | 0.3787 |
1266
  | 0.9781 | 55350 | 0.3196 |
1267
  | 0.9790 | 55400 | 0.3738 |
 
 
 
 
1268
 
1269
 
1270
  ### Framework Versions
 
1265
  | 0.9772 | 55300 | 0.3787 |
1266
  | 0.9781 | 55350 | 0.3196 |
1267
  | 0.9790 | 55400 | 0.3738 |
1268
+ | 0.9798 | 55450 | 0.3588 |
1269
+ | 0.9807 | 55500 | 0.3559 |
1270
+ | 0.9816 | 55550 | 0.4382 |
1271
+ | 0.9825 | 55600 | 0.2588 |
1272
 
1273
 
1274
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7e0a1455740180aedb80f8bb0aec516cb7153da241701244132cb399617a794
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4757af97769f9bf496f79482c67b4ad52305ab54793692a8f0992bfb1b3e1d99
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3a83cdaa07d04d231b900b829ca00bf94bbd812391baa3af8be0f339dc5c09a
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc0ad85e5b5865c2909f3ef475b6781df3d6695ce915b04da508edcabe1e676c
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c32e0fe828ffd94931d917ede7d98af8f116069bcef2571793c504c5a05f607
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53cd51ebdd8de8dece2e081300401e55897bd6527506b231b719e81675496d96
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:380ffdc8abce86595967f2c6febf85c303c1ae3d84e66897af982ed22c990884
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cadf5e13e62099775fee57e6f6e29864a5e8da9a1f19033bf424bca204d48d8
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67d3a94240ec5e377beed092b82635ec739c5c48243fbb51753d92a8d8f55ac7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40c3ccdbd565485480694df123a18cb3bc6089aca7ac0b1c3670702db7f9e007
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9789542506759026,
6
  "eval_steps": 500,
7
- "global_step": 55400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7764,6 +7764,34 @@
7764
  "learning_rate": 1.191808525259665e-06,
7765
  "loss": 0.3738,
7766
  "step": 55400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7767
  }
7768
  ],
7769
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9824883815447686,
6
  "eval_steps": 500,
7
+ "global_step": 55600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7764
  "learning_rate": 1.191808525259665e-06,
7765
  "loss": 0.3738,
7766
  "step": 55400
7767
+ },
7768
+ {
7769
+ "epoch": 0.979837783393119,
7770
+ "grad_norm": 1.5018582344055176,
7771
+ "learning_rate": 1.1427225069211286e-06,
7772
+ "loss": 0.3588,
7773
+ "step": 55450
7774
+ },
7775
+ {
7776
+ "epoch": 0.9807213161103355,
7777
+ "grad_norm": 1.1979721784591675,
7778
+ "learning_rate": 1.0936364885825922e-06,
7779
+ "loss": 0.3559,
7780
+ "step": 55500
7781
+ },
7782
+ {
7783
+ "epoch": 0.9816048488275521,
7784
+ "grad_norm": 3.014507532119751,
7785
+ "learning_rate": 1.0445504702440556e-06,
7786
+ "loss": 0.4382,
7787
+ "step": 55550
7788
+ },
7789
+ {
7790
+ "epoch": 0.9824883815447686,
7791
+ "grad_norm": 1.5364562273025513,
7792
+ "learning_rate": 9.954644519055192e-07,
7793
+ "loss": 0.2588,
7794
+ "step": 55600
7795
  }
7796
  ],
7797
  "logging_steps": 50,