SystemAdmin123 committed on
Commit
c8cb36c
·
verified ·
1 Parent(s): 0c1e3e3

Training in progress, step 160, checkpoint

Browse files
last-checkpoint/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "peft-internal-testing/tiny-dummy-qwen2",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
 
1
  {
2
+ "_name_or_path": "fxmarty/tiny-dummy-qwen2",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
last-checkpoint/trainer_state.json CHANGED
@@ -11,9 +11,9 @@
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 11.929322242736816,
14
- "eval_runtime": 3.6275,
15
- "eval_samples_per_second": 414.056,
16
- "eval_steps_per_second": 25.913,
17
  "step": 1
18
  },
19
  {
@@ -33,9 +33,9 @@
33
  {
34
  "epoch": 0.023668639053254437,
35
  "eval_loss": 11.92916488647461,
36
- "eval_runtime": 3.5124,
37
- "eval_samples_per_second": 427.632,
38
- "eval_steps_per_second": 26.763,
39
  "step": 20
40
  },
41
  {
@@ -55,9 +55,9 @@
55
  {
56
  "epoch": 0.047337278106508875,
57
  "eval_loss": 11.928914070129395,
58
- "eval_runtime": 3.5866,
59
- "eval_samples_per_second": 418.781,
60
- "eval_steps_per_second": 26.209,
61
  "step": 40
62
  },
63
  {
@@ -77,9 +77,9 @@
77
  {
78
  "epoch": 0.07100591715976332,
79
  "eval_loss": 11.92799186706543,
80
- "eval_runtime": 3.5352,
81
- "eval_samples_per_second": 424.864,
82
- "eval_steps_per_second": 26.589,
83
  "step": 60
84
  },
85
  {
@@ -99,9 +99,9 @@
99
  {
100
  "epoch": 0.09467455621301775,
101
  "eval_loss": 11.925419807434082,
102
- "eval_runtime": 3.5978,
103
- "eval_samples_per_second": 417.483,
104
- "eval_steps_per_second": 26.127,
105
  "step": 80
106
  },
107
  {
@@ -121,9 +121,9 @@
121
  {
122
  "epoch": 0.11834319526627218,
123
  "eval_loss": 11.913871765136719,
124
- "eval_runtime": 3.568,
125
- "eval_samples_per_second": 420.97,
126
- "eval_steps_per_second": 26.346,
127
  "step": 100
128
  },
129
  {
@@ -143,9 +143,9 @@
143
  {
144
  "epoch": 0.14201183431952663,
145
  "eval_loss": 11.85535717010498,
146
- "eval_runtime": 3.581,
147
- "eval_samples_per_second": 419.431,
148
- "eval_steps_per_second": 26.249,
149
  "step": 120
150
  },
151
  {
@@ -165,9 +165,9 @@
165
  {
166
  "epoch": 0.16568047337278108,
167
  "eval_loss": 11.73879337310791,
168
- "eval_runtime": 3.5748,
169
- "eval_samples_per_second": 420.168,
170
- "eval_steps_per_second": 26.295,
171
  "step": 140
172
  },
173
  {
@@ -187,9 +187,9 @@
187
  {
188
  "epoch": 0.1893491124260355,
189
  "eval_loss": 11.629658699035645,
190
- "eval_runtime": 3.5281,
191
- "eval_samples_per_second": 425.721,
192
- "eval_steps_per_second": 26.643,
193
  "step": 160
194
  }
195
  ],
 
11
  {
12
  "epoch": 0.001183431952662722,
13
  "eval_loss": 11.929322242736816,
14
+ "eval_runtime": 3.5424,
15
+ "eval_samples_per_second": 424.005,
16
+ "eval_steps_per_second": 26.536,
17
  "step": 1
18
  },
19
  {
 
33
  {
34
  "epoch": 0.023668639053254437,
35
  "eval_loss": 11.92916488647461,
36
+ "eval_runtime": 3.5376,
37
+ "eval_samples_per_second": 424.587,
38
+ "eval_steps_per_second": 26.572,
39
  "step": 20
40
  },
41
  {
 
55
  {
56
  "epoch": 0.047337278106508875,
57
  "eval_loss": 11.928914070129395,
58
+ "eval_runtime": 3.5225,
59
+ "eval_samples_per_second": 426.404,
60
+ "eval_steps_per_second": 26.686,
61
  "step": 40
62
  },
63
  {
 
77
  {
78
  "epoch": 0.07100591715976332,
79
  "eval_loss": 11.92799186706543,
80
+ "eval_runtime": 3.5615,
81
+ "eval_samples_per_second": 421.727,
82
+ "eval_steps_per_second": 26.393,
83
  "step": 60
84
  },
85
  {
 
99
  {
100
  "epoch": 0.09467455621301775,
101
  "eval_loss": 11.925419807434082,
102
+ "eval_runtime": 3.5961,
103
+ "eval_samples_per_second": 417.672,
104
+ "eval_steps_per_second": 26.139,
105
  "step": 80
106
  },
107
  {
 
121
  {
122
  "epoch": 0.11834319526627218,
123
  "eval_loss": 11.913871765136719,
124
+ "eval_runtime": 3.5719,
125
+ "eval_samples_per_second": 420.504,
126
+ "eval_steps_per_second": 26.316,
127
  "step": 100
128
  },
129
  {
 
143
  {
144
  "epoch": 0.14201183431952663,
145
  "eval_loss": 11.85535717010498,
146
+ "eval_runtime": 3.5396,
147
+ "eval_samples_per_second": 424.345,
148
+ "eval_steps_per_second": 26.557,
149
  "step": 120
150
  },
151
  {
 
165
  {
166
  "epoch": 0.16568047337278108,
167
  "eval_loss": 11.73879337310791,
168
+ "eval_runtime": 3.4959,
169
+ "eval_samples_per_second": 429.652,
170
+ "eval_steps_per_second": 26.889,
171
  "step": 140
172
  },
173
  {
 
187
  {
188
  "epoch": 0.1893491124260355,
189
  "eval_loss": 11.629658699035645,
190
+ "eval_runtime": 3.5771,
191
+ "eval_samples_per_second": 419.895,
192
+ "eval_steps_per_second": 26.278,
193
  "step": 160
194
  }
195
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9932170e7e73ee2b0df54dc82e7d5237bddfcbc5bea68ea5e6421bff5f7c8a3
3
- size 6712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20af897fff432dad9da1232d2f5e6ab4040448b601443dcf983c39a3e47a3b26
3
+ size 6648