Training in progress, step 1280, checkpoint

Browse files

Files changed (12) hide show

last-checkpoint/model.safetensors +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +47 -3

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7a7a5bf2ae53fe913692899a49310566217dbeffbb0199ff9046888fb5aa7575
 size 2433024

 version https://git-lfs.github.com/spec/v1
+oid sha256:76da35fcd2eceb4682b02e4d6f4efd1f654fac0b25429d515156667dd817308a
 size 2433024

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5b51ee5c39f2196a17052a3369869248cbff6bb81824726e673d7bacb4845000
 size 2498406

 version https://git-lfs.github.com/spec/v1
+oid sha256:f660c44323f7dc691c0421faf42c40cc765dca5c21d11bff643a623b003967a0
 size 2498406

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a69f6ea192cfcf54ef28bb2d6bd807102ec49e655245cd88a8999a1025beaa56
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:1b3ba644702b51ab6ceb3cfb78b0712e10c56d7a898133b9cf775673605d71a6
 size 15984

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cd5bf2b6b2f2b239cbf378c9ab279dbd312ccd339731dbb40b178c5d2117f1fa
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:7a575d13944792443c2e0faf6af7562460ac52c5628f17b918747a2fad55be01
 size 15984

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc3d6b5de9f89ae92adeb3ebb45551760dedacf84ef470629b9572c81c7e5e15
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:3378545ae3c0bb849e88bd71db9a81f0556e610f7a1d6ea4af902425e910afa6
 size 15984

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8a659c65d62a0ad4ef2400d4a9efa53bb95f33c9a3510b01c06df806373098fd
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:d3581eff136704b2f763bfac1cfe6d4ca215660e05f32de8938f8c598bdd09e1
 size 15984

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7945d23ad3f18f8d933786bc7ca2663bfc4a07a89b86602528c15c8de525cba4
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:4710f39f928214c6084305a96ed4d69309abcb477c5fe9ea3b79644e92349f58
 size 15984

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e3564e5e1fb5118c052847f294bdd8157abfa1387eac82f725487e3fb9285512
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:17f2040b06510c4ed4dae6986e8f9b63891a60d4b9fa2e8045fc74b430abf05b
 size 15984

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cd61a764da978cdc05855ec977013888fcda81d8e3f693f0b43c1fa27207c8cf
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:3f0418024306b84efbd06ecb22274609094ccd51161118b224af78a4c9aa3c2e
 size 15984

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c21d6eb44e4c3a4a2aa63996253ecd1b46d24a99d863d3828abc8a3058eb6753
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d46bb0bbf258912802dbc17d20db208430fc3ab3a923169293e1cbe07fb7ae7
 size 15984

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cd12f9f53e74c951a51712fa65ed54e535568d6d68567892b5b94a3a28396fca
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:25cf578d94ac1a7be20caf3c6bf3d856ece0554beb81a56caa6f17d994e34988
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.467455621301775,
   "eval_steps": 20,
-  "global_step": 1240,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1379,6 +1379,50 @@
       "eval_samples_per_second": 412.352,
       "eval_steps_per_second": 25.806,
       "step": 1240
     }
   ],
   "logging_steps": 10,
@@ -1398,7 +1442,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 485882265600.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.514792899408284,
   "eval_steps": 20,
+  "global_step": 1280,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 412.352,
       "eval_steps_per_second": 25.806,
       "step": 1240
+    },
+    {
+      "epoch": 1.4792899408284024,
+      "grad_norm": 0.51171875,
+      "learning_rate": 0.00010825793454723325,
+      "loss": 10.4014,
+      "step": 1250
+    },
+    {
+      "epoch": 1.4911242603550297,
+      "grad_norm": 0.453125,
+      "learning_rate": 0.00010693899263660441,
+      "loss": 10.4494,
+      "step": 1260
+    },
+    {
+      "epoch": 1.4911242603550297,
+      "eval_loss": 10.489725112915039,
+      "eval_runtime": 3.7506,
+      "eval_samples_per_second": 400.469,
+      "eval_steps_per_second": 25.063,
+      "step": 1260
+    },
+    {
+      "epoch": 1.502958579881657,
+      "grad_norm": 0.66015625,
+      "learning_rate": 0.00010561883660318455,
+      "loss": 10.4229,
+      "step": 1270
+    },
+    {
+      "epoch": 1.514792899408284,
+      "grad_norm": 0.5,
+      "learning_rate": 0.00010429769743605407,
+      "loss": 10.4095,
+      "step": 1280
+    },
+    {
+      "epoch": 1.514792899408284,
+      "eval_loss": 10.488317489624023,
+      "eval_runtime": 3.5347,
+      "eval_samples_per_second": 424.926,
+      "eval_steps_per_second": 26.593,
+      "step": 1280
     }
   ],
   "logging_steps": 10,
       "attributes": {}
     }
   },
+  "total_flos": 501547991040.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null