guyhadad01 committed on
Commit
2bca8e8
·
verified ·
1 Parent(s): b46def2

Training in progress, step 52600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1205,6 +1205,10 @@ You can finetune this model on your own dataset.
1205
  | 0.9242 | 52300 | 0.3196 |
1206
  | 0.9251 | 52350 | 0.3322 |
1207
  | 0.9259 | 52400 | 0.3258 |
 
 
 
 
1208
 
1209
 
1210
  ### Framework Versions
 
1205
  | 0.9242 | 52300 | 0.3196 |
1206
  | 0.9251 | 52350 | 0.3322 |
1207
  | 0.9259 | 52400 | 0.3258 |
1208
+ | 0.9268 | 52450 | 0.3419 |
1209
+ | 0.9277 | 52500 | 0.2997 |
1210
+ | 0.9286 | 52550 | 0.2425 |
1211
+ | 0.9295 | 52600 | 0.2708 |
1212
 
1213
 
1214
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b6ccee8235180e0fcb744d9c9527b2c600512f7ecc4b3d25488b384822838a3
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d488dc3a5445f93dc6d891e374112fcf40bd92f3df49a02fa164a7b7e3f0939
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:002e9ce3d93da778bb4fe1c95037789e052796647a41c67b89002e6d3a8a69ff
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ade7229380655a5e5d3053eb6b8da0b8461494cbbd9ca16bd058175900faab5
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3763a2915178d87a90c93bc33c9a17dd8d33e1ee286d4f530459bdee03d15b6d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8bc5e9aadcf53514c913a3f624aee68ac8959f84c12938e1ebd53df4add3fd5
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0315f631d073b9e84cefc9abe7ee2e75af036769039c7a2bf20f3d81a5e6f752
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16fabdbfb525bb124af89aae1d7ac043f5eac6bfe2d8462a555cfc01bdf7a82a
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:acf725a620db2293e4b5f5ac9e35cb4f2f88cf44a5a0884c22a06b906efee164
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0c8184ff5d3c53c23e51683855f8ef56aed39b4067ed958d2a6305ca37d4bf3
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9259422876429114,
6
  "eval_steps": 500,
7
- "global_step": 52400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7344,6 +7344,34 @@
7344
  "learning_rate": 4.135006184838311e-06,
7345
  "loss": 0.3258,
7346
  "step": 52400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7347
  }
7348
  ],
7349
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9294764185117775,
6
  "eval_steps": 500,
7
+ "global_step": 52600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7344
  "learning_rate": 4.135006184838311e-06,
7345
  "loss": 0.3258,
7346
  "step": 52400
7347
+ },
7348
+ {
7349
+ "epoch": 0.926825820360128,
7350
+ "grad_norm": 4.394749164581299,
7351
+ "learning_rate": 4.085920166499775e-06,
7352
+ "loss": 0.3419,
7353
+ "step": 52450
7354
+ },
7355
+ {
7356
+ "epoch": 0.9277093530773445,
7357
+ "grad_norm": 0.856221616268158,
7358
+ "learning_rate": 4.036834148161238e-06,
7359
+ "loss": 0.2997,
7360
+ "step": 52500
7361
+ },
7362
+ {
7363
+ "epoch": 0.928592885794561,
7364
+ "grad_norm": 1.1520658731460571,
7365
+ "learning_rate": 3.9877481298227014e-06,
7366
+ "loss": 0.2425,
7367
+ "step": 52550
7368
+ },
7369
+ {
7370
+ "epoch": 0.9294764185117775,
7371
+ "grad_norm": 1.2415558099746704,
7372
+ "learning_rate": 3.938662111484165e-06,
7373
+ "loss": 0.2708,
7374
+ "step": 52600
7375
  }
7376
  ],
7377
  "logging_steps": 50,