SystemAdmin123 committed on
Commit
936b728
·
verified ·
1 Parent(s): f536751

Training in progress, step 40, checkpoint

Browse files
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b907ba68261a733495a2decc931e4839e4907e6e52a97528b167a0a5a0ebd392
3
  size 4943178720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:681a208ef373053824021017b27708b23a588064e7003361364981ae70fa09cc
3
  size 4943178720
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf95b6219ea0c58409934588c2a66dc9c8321e127f35cf06df02c3acd88afc0e
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3b773cef476437d526f7c17ec504cec44088b25420cde09e2273e473904f2e5
3
  size 4999819336
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76053a4a789be6b616ea43ab19cf1a53cfc29041a95eebbb8627e860734e1f52
3
  size 4540532728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64e632ea54fafa03fa867d58aa1615bc784b20c0be1d236538bd55ebff650daa
3
  size 4540532728
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22617f0b8389a6d4fa5a7e5e259a2a6e9ac793955c55c10b715b8d4f9596c212
3
  size 14710155092
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe9951bfdfc286622c846de580f1aec65c1e44f78aa8094a852f758e9ef7b3ca
3
  size 14710155092
last-checkpoint/trainer_state.json CHANGED
@@ -11,37 +11,37 @@
11
  {
12
  "epoch": 0.019230769230769232,
13
  "eval_loss": 1.8673125505447388,
14
- "eval_runtime": 15.1011,
15
- "eval_samples_per_second": 99.397,
16
- "eval_steps_per_second": 6.225,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.19230769230769232,
21
- "grad_norm": 36.0,
22
  "learning_rate": 6.666666666666667e-05,
23
- "loss": 2.4526,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.38461538461538464,
28
- "grad_norm": 231.0,
29
  "learning_rate": 0.00013333333333333334,
30
- "loss": 2.8068,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.5769230769230769,
35
- "grad_norm": 105.0,
36
  "learning_rate": 0.0002,
37
- "loss": 6.5887,
38
  "step": 30
39
  },
40
  {
41
  "epoch": 0.7692307692307693,
42
- "grad_norm": 67.0,
43
  "learning_rate": 0.00019984815164333163,
44
- "loss": 9.409,
45
  "step": 40
46
  }
47
  ],
 
11
  {
12
  "epoch": 0.019230769230769232,
13
  "eval_loss": 1.8673125505447388,
14
+ "eval_runtime": 14.8131,
15
+ "eval_samples_per_second": 101.329,
16
+ "eval_steps_per_second": 6.346,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.19230769230769232,
21
+ "grad_norm": 29.625,
22
  "learning_rate": 6.666666666666667e-05,
23
+ "loss": 2.4447,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.38461538461538464,
28
+ "grad_norm": 246.0,
29
  "learning_rate": 0.00013333333333333334,
30
+ "loss": 3.8293,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.5769230769230769,
35
+ "grad_norm": 96.5,
36
  "learning_rate": 0.0002,
37
+ "loss": 6.931,
38
  "step": 30
39
  },
40
  {
41
  "epoch": 0.7692307692307693,
42
+ "grad_norm": 804.0,
43
  "learning_rate": 0.00019984815164333163,
44
+ "loss": 11.6713,
45
  "step": 40
46
  }
47
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b41a9fb463c0db3738bb35eb54493dd7cd16792db1e56184a9c9b31d58bd7b14
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0acef938a7d9ffe7b10254d7cbe4256ddc2dc212f47d8b0cfb76c4ad76b57933
3
  size 6776