guyhadad01 commited on
Commit
1553ca7
·
verified ·
1 Parent(s): ad8d4bb

Training in progress, step 52800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1209,6 +1209,10 @@ You can finetune this model on your own dataset.
1209
  | 0.9277 | 52500 | 0.2997 |
1210
  | 0.9286 | 52550 | 0.2425 |
1211
  | 0.9295 | 52600 | 0.2708 |
 
 
 
 
1212
 
1213
 
1214
  ### Framework Versions
 
1209
  | 0.9277 | 52500 | 0.2997 |
1210
  | 0.9286 | 52550 | 0.2425 |
1211
  | 0.9295 | 52600 | 0.2708 |
1212
+ | 0.9304 | 52650 | 0.2201 |
1213
+ | 0.9312 | 52700 | 0.2958 |
1214
+ | 0.9321 | 52750 | 0.2647 |
1215
+ | 0.9330 | 52800 | 0.2329 |
1216
 
1217
 
1218
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d488dc3a5445f93dc6d891e374112fcf40bd92f3df49a02fa164a7b7e3f0939
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a329281b62dee04f25df2a1445a6d06e38a118403d00dfd2047a9f0451d6a236
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ade7229380655a5e5d3053eb6b8da0b8461494cbbd9ca16bd058175900faab5
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1a7c65d7edd786206cd29e1711b41b5ec57296920cd7f0363e9e1febcd4786d
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8bc5e9aadcf53514c913a3f624aee68ac8959f84c12938e1ebd53df4add3fd5
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a39806bf7f5ccc564dfbcbf96185e5776a4d453cf6ceeebfa61e6b15fd77f05f
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16fabdbfb525bb124af89aae1d7ac043f5eac6bfe2d8462a555cfc01bdf7a82a
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15f8eff2e31e5d461c8d76e9f3c73436b8f99cd51de4fc3b3a328f9ccbf1dbdd
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0c8184ff5d3c53c23e51683855f8ef56aed39b4067ed958d2a6305ca37d4bf3
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d76c0e19f4170b3811b1d648f816f3a3f40e357234c62ca57c1c93ddc1c338c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9294764185117775,
6
  "eval_steps": 500,
7
- "global_step": 52600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7372,6 +7372,34 @@
7372
  "learning_rate": 3.938662111484165e-06,
7373
  "loss": 0.2708,
7374
  "step": 52600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7375
  }
7376
  ],
7377
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9330105493806435,
6
  "eval_steps": 500,
7
+ "global_step": 52800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7372
  "learning_rate": 3.938662111484165e-06,
7373
  "loss": 0.2708,
7374
  "step": 52600
7375
+ },
7376
+ {
7377
+ "epoch": 0.9303599512289941,
7378
+ "grad_norm": 2.747580051422119,
7379
+ "learning_rate": 3.889576093145628e-06,
7380
+ "loss": 0.2201,
7381
+ "step": 52650
7382
+ },
7383
+ {
7384
+ "epoch": 0.9312434839462105,
7385
+ "grad_norm": 2.005228281021118,
7386
+ "learning_rate": 3.840490074807092e-06,
7387
+ "loss": 0.2958,
7388
+ "step": 52700
7389
+ },
7390
+ {
7391
+ "epoch": 0.932127016663427,
7392
+ "grad_norm": 1.6022164821624756,
7393
+ "learning_rate": 3.791404056468556e-06,
7394
+ "loss": 0.2647,
7395
+ "step": 52750
7396
+ },
7397
+ {
7398
+ "epoch": 0.9330105493806435,
7399
+ "grad_norm": 1.7913720607757568,
7400
+ "learning_rate": 3.7423180381300193e-06,
7401
+ "loss": 0.2329,
7402
+ "step": 52800
7403
  }
7404
  ],
7405
  "logging_steps": 50,