guyhadad01 commited on
Commit
946dbc0
·
verified ·
1 Parent(s): a8b0bac

Training in progress, step 5400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.6341, 0.1285],
290
- # [0.6341, 1.0000, 0.1635],
291
- # [0.1285, 0.1635, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1330,6 +1330,10 @@ You can finetune this model on your own dataset.
1330
  | 0.0901 | 5100 | 0.4469 |
1331
  | 0.0910 | 5150 | 0.5283 |
1332
  | 0.0919 | 5200 | 0.4826 |
 
 
 
 
1333
 
1334
  </details>
1335
 
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.6268, 0.1112],
290
+ # [0.6268, 1.0000, 0.1476],
291
+ # [0.1112, 0.1476, 1.0000]])
292
  ```
293
 
294
  <!--
 
1330
  | 0.0901 | 5100 | 0.4469 |
1331
  | 0.0910 | 5150 | 0.5283 |
1332
  | 0.0919 | 5200 | 0.4826 |
1333
+ | 0.0928 | 5250 | 0.3895 |
1334
+ | 0.0937 | 5300 | 0.4873 |
1335
+ | 0.0945 | 5350 | 0.4895 |
1336
+ | 0.0954 | 5400 | 0.4686 |
1337
 
1338
  </details>
1339
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4af90c7f23b49e51d466a6d8a0d86939bf37e4d8ea5c0b655ab35b7c151a05cf
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a7b3038038d614d02d13200e3426ce1cee9998e3dd720f3ef8373fd32bc320c
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:544baf7d60ab6e318f100fc6c2fccfb140e19ae226f8f7d820d236577b1da105
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da23c5a242ed1a18ccfa540abf270f8af47081a60b90b0528855f1e52bf8ac00
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11c0cb9bd2c9c6c5c964ae0bb4e4e4872958c4dc97ac96f40f1c118dec4c9803
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43b1cabcf4d622f4eeb0e2e256d17e427254b320b0d958e0925925fc3965ffc2
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afb655591367e732af512c0b489f6652e710a205ef4e8286da8729a948980ee0
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93d3edcb87fa33fd6a7048f57178907c582fac7657ef4f6ed7cd1a489f3a9b01
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:407fdddb74e20b064ec7452aeeae963d95b777da5e4cde56c489f916bcf701b2
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cde96e015f065de3d9994d1a7735820057fec16cad19c67655b731af60c92ecc
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.09188740259051793,
6
  "eval_steps": 500,
7
- "global_step": 5200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -736,6 +736,34 @@
736
  "learning_rate": 4.5927561837455834e-05,
737
  "loss": 0.4826,
738
  "step": 5200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
739
  }
740
  ],
741
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.095421533459384,
6
  "eval_steps": 500,
7
+ "global_step": 5400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
736
  "learning_rate": 4.5927561837455834e-05,
737
  "loss": 0.4826,
738
  "step": 5200
739
+ },
740
+ {
741
+ "epoch": 0.09277093530773445,
742
+ "grad_norm": 3.52422833442688,
743
+ "learning_rate": 4.636925795053004e-05,
744
+ "loss": 0.3895,
745
+ "step": 5250
746
+ },
747
+ {
748
+ "epoch": 0.09365446802495096,
749
+ "grad_norm": 2.1975631713867188,
750
+ "learning_rate": 4.681095406360424e-05,
751
+ "loss": 0.4873,
752
+ "step": 5300
753
+ },
754
+ {
755
+ "epoch": 0.09453800074216748,
756
+ "grad_norm": 3.4910616874694824,
757
+ "learning_rate": 4.725265017667845e-05,
758
+ "loss": 0.4895,
759
+ "step": 5350
760
+ },
761
+ {
762
+ "epoch": 0.095421533459384,
763
+ "grad_norm": 2.1225690841674805,
764
+ "learning_rate": 4.769434628975265e-05,
765
+ "loss": 0.4686,
766
+ "step": 5400
767
  }
768
  ],
769
  "logging_steps": 50,