SystemAdmin123 committed on
Commit
ae43565
·
verified ·
1 Parent(s): 33e7a44

Training in progress, step 40, checkpoint

Browse files
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49abecc3012aa33040e2fb01e32e561bb0b599ef920d57e5804dbf05cce2f142
3
  size 4943178720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b907ba68261a733495a2decc931e4839e4907e6e52a97528b167a0a5a0ebd392
3
  size 4943178720
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e268892504057e819d6c86952d153640cfeab12dfde0c669137107e7bbaa9a7
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf95b6219ea0c58409934588c2a66dc9c8321e127f35cf06df02c3acd88afc0e
3
  size 4999819336
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba955cd0f1842463cd22c00dad17603532a55cb793303e24c624588deaf5affc
3
  size 4540532728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76053a4a789be6b616ea43ab19cf1a53cfc29041a95eebbb8627e860734e1f52
3
  size 4540532728
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ea56f435222638b51353e98a7a59318640daf28906ee7970d8fea972ee2fd54
3
  size 14710155092
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22617f0b8389a6d4fa5a7e5e259a2a6e9ac793955c55c10b715b8d4f9596c212
3
  size 14710155092
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5829e55a74209d86a905d56c797173146629e2a97eb8f2567e78aab055ee715
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:572996e9dc190ff3f3a6efdf58de929f593fa2dd2f97d74fed7646828651b17f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -11,44 +11,44 @@
11
  {
12
  "epoch": 0.019230769230769232,
13
  "eval_loss": 1.8673125505447388,
14
- "eval_runtime": 15.0658,
15
- "eval_samples_per_second": 99.63,
16
- "eval_steps_per_second": 6.239,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.19230769230769232,
21
- "grad_norm": 346.0,
22
- "learning_rate": 0.00013333333333333334,
23
- "loss": 7.3336,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.38461538461538464,
28
- "grad_norm": 63.75,
29
- "learning_rate": 0.00019984815164333163,
30
- "loss": 10.1286,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.5769230769230769,
35
- "grad_norm": 1776.0,
36
- "learning_rate": 0.00019863613034027224,
37
- "loss": 10.0786,
38
  "step": 30
39
  },
40
  {
41
  "epoch": 0.7692307692307693,
42
- "grad_norm": 45.0,
43
- "learning_rate": 0.00019622680003092503,
44
- "loss": 9.0353,
45
  "step": 40
46
  }
47
  ],
48
  "logging_steps": 10,
49
- "max_steps": 300,
50
  "num_input_tokens_seen": 0,
51
- "num_train_epochs": 6,
52
  "save_steps": 40,
53
  "stateful_callbacks": {
54
  "TrainerControl": {
 
11
  {
12
  "epoch": 0.019230769230769232,
13
  "eval_loss": 1.8673125505447388,
14
+ "eval_runtime": 15.1011,
15
+ "eval_samples_per_second": 99.397,
16
+ "eval_steps_per_second": 6.225,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.19230769230769232,
21
+ "grad_norm": 36.0,
22
+ "learning_rate": 6.666666666666667e-05,
23
+ "loss": 2.4526,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.38461538461538464,
28
+ "grad_norm": 231.0,
29
+ "learning_rate": 0.00013333333333333334,
30
+ "loss": 2.8068,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.5769230769230769,
35
+ "grad_norm": 105.0,
36
+ "learning_rate": 0.0002,
37
+ "loss": 6.5887,
38
  "step": 30
39
  },
40
  {
41
  "epoch": 0.7692307692307693,
42
+ "grad_norm": 67.0,
43
+ "learning_rate": 0.00019984815164333163,
44
+ "loss": 9.409,
45
  "step": 40
46
  }
47
  ],
48
  "logging_steps": 10,
49
+ "max_steps": 600,
50
  "num_input_tokens_seen": 0,
51
+ "num_train_epochs": 12,
52
  "save_steps": 40,
53
  "stateful_callbacks": {
54
  "TrainerControl": {
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa8dcd878159cc59f87447028fd2e09931ebdac776af71b4ee5edce164448ac3
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b41a9fb463c0db3738bb35eb54493dd7cd16792db1e56184a9c9b31d58bd7b14
3
  size 6776