Training in progress, epoch 3

Browse files

Files changed (5) hide show

model-00001-of-00004.safetensors +1 -1
model-00002-of-00004.safetensors +1 -1
model-00003-of-00004.safetensors +1 -1
model-00004-of-00004.safetensors +1 -1
trainer_log.jsonl +11 -0

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0b38f25c26533a5ef7afcf9abbbf19f9271a5163b3d4a8aa45588d73fb4d08f9
 size 4877660776

 version https://git-lfs.github.com/spec/v1
+oid sha256:5e3e94e7ab0127c34bc63db5e4fbfbc6f1ccb3a2789727f91f551916b22cc1b0
 size 4877660776

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:66791ba1b919246b48f8dd85a88f6f89c4035d4befb4ce18058844b419bf72ac
 size 4932751008

 version https://git-lfs.github.com/spec/v1
+oid sha256:c6031ce48cdec407a6c353f4d75e68b1b272ba9694d211cb850097ab524df234
 size 4932751008

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f0def7cbde5a449a4c013d07f36dee04a72a12caee77edf2b044ef70734ada2
 size 4330865200

 version https://git-lfs.github.com/spec/v1
+oid sha256:f62b25c79fcb2c8aed1e4d18fe75a29c2645620f5b1944fd5fe1d34ac17f0ecf
 size 4330865200

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9015e9f0ee7984e347c7a5fdcc7dfb395e31979fdcffe080d0d28971c383e0ef
 size 1089994880

 version https://git-lfs.github.com/spec/v1
+oid sha256:8567cf6b6a60df86529506982690524e576db267592e2efd684fd8b942f70901
 size 1089994880

trainer_log.jsonl CHANGED Viewed

@@ -30,3 +30,14 @@
 {"current_steps": 30, "total_steps": 70, "loss": 0.6531, "lr": 1.4112871031306118e-05, "epoch": 2.88, "percentage": 42.86, "elapsed_time": "1:03:40", "remaining_time": "1:24:54"}
 {"current_steps": 31, "total_steps": 70, "loss": 0.6383, "lr": 1.3653410243663953e-05, "epoch": 2.976, "percentage": 44.29, "elapsed_time": "1:05:40", "remaining_time": "1:22:37"}
 {"current_steps": 32, "total_steps": 70, "loss": 0.6244, "lr": 1.3184866502516846e-05, "epoch": 3.072, "percentage": 45.71, "elapsed_time": "1:08:27", "remaining_time": "1:21:17"}

 {"current_steps": 30, "total_steps": 70, "loss": 0.6531, "lr": 1.4112871031306118e-05, "epoch": 2.88, "percentage": 42.86, "elapsed_time": "1:03:40", "remaining_time": "1:24:54"}
 {"current_steps": 31, "total_steps": 70, "loss": 0.6383, "lr": 1.3653410243663953e-05, "epoch": 2.976, "percentage": 44.29, "elapsed_time": "1:05:40", "remaining_time": "1:22:37"}
 {"current_steps": 32, "total_steps": 70, "loss": 0.6244, "lr": 1.3184866502516846e-05, "epoch": 3.072, "percentage": 45.71, "elapsed_time": "1:08:27", "remaining_time": "1:21:17"}
+{"current_steps": 33, "total_steps": 70, "loss": 0.5952, "lr": 1.2708404681430054e-05, "epoch": 3.168, "percentage": 47.14, "elapsed_time": "1:10:31", "remaining_time": "1:19:04"}
+{"current_steps": 34, "total_steps": 70, "loss": 0.5929, "lr": 1.2225209339563144e-05, "epoch": 3.2640000000000002, "percentage": 48.57, "elapsed_time": "1:12:32", "remaining_time": "1:16:48"}
+{"current_steps": 35, "total_steps": 70, "loss": 0.5952, "lr": 1.1736481776669307e-05, "epoch": 3.36, "percentage": 50.0, "elapsed_time": "1:14:50", "remaining_time": "1:14:50"}
+{"current_steps": 36, "total_steps": 70, "loss": 0.5883, "lr": 1.1243437046474854e-05, "epoch": 3.456, "percentage": 51.43, "elapsed_time": "1:16:54", "remaining_time": "1:12:38"}
+{"current_steps": 37, "total_steps": 70, "loss": 0.5908, "lr": 1.0747300935864245e-05, "epoch": 3.552, "percentage": 52.86, "elapsed_time": "1:18:57", "remaining_time": "1:10:25"}
+{"current_steps": 38, "total_steps": 70, "loss": 0.5882, "lr": 1.0249306917380731e-05, "epoch": 3.648, "percentage": 54.29, "elapsed_time": "1:20:58", "remaining_time": "1:08:11"}
+{"current_steps": 39, "total_steps": 70, "loss": 0.6026, "lr": 9.750693082619274e-06, "epoch": 3.7439999999999998, "percentage": 55.71, "elapsed_time": "1:22:49", "remaining_time": "1:05:50"}
+{"current_steps": 40, "total_steps": 70, "loss": 0.5629, "lr": 9.252699064135759e-06, "epoch": 3.84, "percentage": 57.14, "elapsed_time": "1:24:53", "remaining_time": "1:03:40"}
+{"current_steps": 41, "total_steps": 70, "loss": 0.5778, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:26:46", "remaining_time": "1:01:22"}
+{"current_steps": 42, "total_steps": 70, "loss": 0.5831, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:29:35", "remaining_time": "0:59:43"}
+{"current_steps": 43, "total_steps": 70, "loss": 0.562, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:31:35", "remaining_time": "0:57:30"}