Upload model
Browse files- README.md +1 -0
- all_results.json +4 -4
- start_end.json +1 -1
- train_results.json +4 -4
- trainer_log.jsonl +2 -0
- trainer_state.json +4 -4
- training_args.bin +2 -2
README.md
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
---
|
2 |
library_name: transformers
|
3 |
license: other
|
|
|
4 |
tags:
|
5 |
- llama-factory
|
6 |
- full
|
|
|
1 |
---
|
2 |
library_name: transformers
|
3 |
license: other
|
4 |
+
base_model: Qwen/Qwen2.5-7B-Instruct
|
5 |
tags:
|
6 |
- llama-factory
|
7 |
- full
|
all_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
"total_flos": 4.772812472451072e+16,
|
4 |
-
"train_loss": 0.
|
5 |
-
"train_runtime":
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second":
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
"total_flos": 4.772812472451072e+16,
|
4 |
+
"train_loss": 0.0,
|
5 |
+
"train_runtime": 8.8002,
|
6 |
+
"train_samples_per_second": 165280.93,
|
7 |
+
"train_steps_per_second": 323.289
|
8 |
}
|
start_end.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"start_time": "2025-06-
|
|
|
1 |
+
{"start_time": "2025-06-28 20:43:56", "end_time": "2025-06-28 20:45:49"}
|
train_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
"total_flos": 4.772812472451072e+16,
|
4 |
-
"train_loss": 0.
|
5 |
-
"train_runtime":
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second":
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
"total_flos": 4.772812472451072e+16,
|
4 |
+
"train_loss": 0.0,
|
5 |
+
"train_runtime": 8.8002,
|
6 |
+
"train_samples_per_second": 165280.93,
|
7 |
+
"train_steps_per_second": 323.289
|
8 |
}
|
trainer_log.jsonl
CHANGED
@@ -2844,3 +2844,5 @@
|
|
2844 |
{"current_steps": 2844, "total_steps": 2845, "loss": 0.4757, "lr": 3.011963855659161e-11, "epoch": 4.998242530755712, "percentage": 99.96, "elapsed_time": "14:28:40", "remaining_time": "0:00:18"}
|
2845 |
{"current_steps": 2845, "total_steps": 2845, "loss": 0.4687, "lr": 0.0, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "14:29:00", "remaining_time": "0:00:00"}
|
2846 |
{"current_steps": 2845, "total_steps": 2845, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "14:30:15", "remaining_time": "0:00:00"}
|
|
|
|
|
|
2844 |
{"current_steps": 2844, "total_steps": 2845, "loss": 0.4757, "lr": 3.011963855659161e-11, "epoch": 4.998242530755712, "percentage": 99.96, "elapsed_time": "14:28:40", "remaining_time": "0:00:18"}
|
2845 |
{"current_steps": 2845, "total_steps": 2845, "loss": 0.4687, "lr": 0.0, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "14:29:00", "remaining_time": "0:00:00"}
|
2846 |
{"current_steps": 2845, "total_steps": 2845, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "14:30:15", "remaining_time": "0:00:00"}
|
2847 |
+
{"current_steps": 2845, "total_steps": 2845, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"}
|
2848 |
+
{"current_steps": 2845, "total_steps": 2845, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"}
|
trainer_state.json
CHANGED
@@ -19927,10 +19927,10 @@
|
|
19927 |
"epoch": 5.0,
|
19928 |
"step": 2845,
|
19929 |
"total_flos": 4.772812472451072e+16,
|
19930 |
-
"train_loss": 0.
|
19931 |
-
"train_runtime":
|
19932 |
-
"train_samples_per_second":
|
19933 |
-
"train_steps_per_second":
|
19934 |
}
|
19935 |
],
|
19936 |
"logging_steps": 1,
|
|
|
19927 |
"epoch": 5.0,
|
19928 |
"step": 2845,
|
19929 |
"total_flos": 4.772812472451072e+16,
|
19930 |
+
"train_loss": 0.0,
|
19931 |
+
"train_runtime": 8.8002,
|
19932 |
+
"train_samples_per_second": 165280.93,
|
19933 |
+
"train_steps_per_second": 323.289
|
19934 |
}
|
19935 |
],
|
19936 |
"logging_steps": 1,
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:515f9e72ee63ddb994fed5d03f3c6b90c4e6ce89629a14e0c19db16c1232fe69
|
3 |
+
size 7544
|