EtashGuha commited on
Commit
dba4169
·
verified ·
1 Parent(s): bfe1753

Upload model

Browse files
README.md CHANGED
@@ -1,6 +1,7 @@
1
  ---
2
  library_name: transformers
3
  license: other
 
4
  tags:
5
  - llama-factory
6
  - full
 
1
  ---
2
  library_name: transformers
3
  license: other
4
+ base_model: Qwen/Qwen2.5-7B-Instruct
5
  tags:
6
  - llama-factory
7
  - full
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
  "total_flos": 4.772812472451072e+16,
4
- "train_loss": 0.5341540531345327,
5
- "train_runtime": 52223.946,
6
- "train_samples_per_second": 27.851,
7
- "train_steps_per_second": 0.054
8
  }
 
1
  {
2
  "epoch": 5.0,
3
  "total_flos": 4.772812472451072e+16,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 8.8002,
6
+ "train_samples_per_second": 165280.93,
7
+ "train_steps_per_second": 323.289
8
  }
start_end.json CHANGED
@@ -1 +1 @@
1
- {"start_time": "2025-06-27 04:50:36", "end_time": "2025-06-27 19:22:51"}
 
1
+ {"start_time": "2025-06-28 20:43:56", "end_time": "2025-06-28 20:45:49"}
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
  "total_flos": 4.772812472451072e+16,
4
- "train_loss": 0.5341540531345327,
5
- "train_runtime": 52223.946,
6
- "train_samples_per_second": 27.851,
7
- "train_steps_per_second": 0.054
8
  }
 
1
  {
2
  "epoch": 5.0,
3
  "total_flos": 4.772812472451072e+16,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 8.8002,
6
+ "train_samples_per_second": 165280.93,
7
+ "train_steps_per_second": 323.289
8
  }
trainer_log.jsonl CHANGED
@@ -2844,3 +2844,5 @@
2844
  {"current_steps": 2844, "total_steps": 2845, "loss": 0.4757, "lr": 3.011963855659161e-11, "epoch": 4.998242530755712, "percentage": 99.96, "elapsed_time": "14:28:40", "remaining_time": "0:00:18"}
2845
  {"current_steps": 2845, "total_steps": 2845, "loss": 0.4687, "lr": 0.0, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "14:29:00", "remaining_time": "0:00:00"}
2846
  {"current_steps": 2845, "total_steps": 2845, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "14:30:15", "remaining_time": "0:00:00"}
 
 
 
2844
  {"current_steps": 2844, "total_steps": 2845, "loss": 0.4757, "lr": 3.011963855659161e-11, "epoch": 4.998242530755712, "percentage": 99.96, "elapsed_time": "14:28:40", "remaining_time": "0:00:18"}
2845
  {"current_steps": 2845, "total_steps": 2845, "loss": 0.4687, "lr": 0.0, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "14:29:00", "remaining_time": "0:00:00"}
2846
  {"current_steps": 2845, "total_steps": 2845, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "14:30:15", "remaining_time": "0:00:00"}
2847
+ {"current_steps": 2845, "total_steps": 2845, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"}
2848
+ {"current_steps": 2845, "total_steps": 2845, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"}
trainer_state.json CHANGED
@@ -19927,10 +19927,10 @@
19927
  "epoch": 5.0,
19928
  "step": 2845,
19929
  "total_flos": 4.772812472451072e+16,
19930
- "train_loss": 0.5341540531345327,
19931
- "train_runtime": 52223.946,
19932
- "train_samples_per_second": 27.851,
19933
- "train_steps_per_second": 0.054
19934
  }
19935
  ],
19936
  "logging_steps": 1,
 
19927
  "epoch": 5.0,
19928
  "step": 2845,
19929
  "total_flos": 4.772812472451072e+16,
19930
+ "train_loss": 0.0,
19931
+ "train_runtime": 8.8002,
19932
+ "train_samples_per_second": 165280.93,
19933
+ "train_steps_per_second": 323.289
19934
  }
19935
  ],
19936
  "logging_steps": 1,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f9bd04a28c05161cdf4fe4f55751b25e0094c30a2486ae53c8d3d880a6c0175
3
- size 7416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:515f9e72ee63ddb994fed5d03f3c6b90c4e6ce89629a14e0c19db16c1232fe69
3
+ size 7544