aisuko committed on
Commit
4d97fc7
·
verified ·
1 Parent(s): 686c44d
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [microsoft/Phi-3.5-mini-instruct](https://huggingface.co/microsoft/Phi-3.5-mini-instruct) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 0.7631
20
  - Exact Match Ratio: 0.0
21
  - Sequence Accuracy: 0.0
22
 
@@ -49,9 +49,9 @@ The following hyperparameters were used during training:
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | Exact Match Ratio | Sequence Accuracy |
51
  |:-------------:|:-----:|:----:|:---------------:|:-----------------:|:-----------------:|
52
- | 8.1148 | 1.0 | 50 | 1.6942 | 0.0 | 0.0 |
53
- | 1.2769 | 2.0 | 100 | 0.8926 | 0.0 | 0.0 |
54
- | 0.8832 | 3.0 | 150 | 0.7631 | 0.0 | 0.0 |
55
 
56
 
57
  ### Framework versions
 
16
 
17
  This model is a fine-tuned version of [microsoft/Phi-3.5-mini-instruct](https://huggingface.co/microsoft/Phi-3.5-mini-instruct) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 0.7111
20
  - Exact Match Ratio: 0.0
21
  - Sequence Accuracy: 0.0
22
 
 
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | Exact Match Ratio | Sequence Accuracy |
51
  |:-------------:|:-----:|:----:|:---------------:|:-----------------:|:-----------------:|
52
+ | 1.3755 | 1.0 | 500 | 0.7111 | 0.0 | 0.0 |
53
+ | 1.1658 | 2.0 | 1000 | 1.0461 | 0.0 | 0.0 |
54
+ | 1.0217 | 3.0 | 1500 | 0.7995 | 0.0 | 0.0 |
55
 
56
 
57
  ### Framework versions
adapter_config.json CHANGED
@@ -26,10 +26,10 @@
26
  "rank_pattern": {},
27
  "revision": null,
28
  "target_modules": [
29
- "down_proj",
30
  "qkv_proj",
31
- "o_proj",
32
- "gate_up_proj"
 
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
 
26
  "rank_pattern": {},
27
  "revision": null,
28
  "target_modules": [
 
29
  "qkv_proj",
30
+ "down_proj",
31
+ "gate_up_proj",
32
+ "o_proj"
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f15bd442fe3e4d1b515b51f3d64667e033497c8f4e4a635f2a227d6d8078cec8
3
  size 888703384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23ff80ac0881d0b146286fe51c47ae8c659ded1fb958af8712edcd2195100df7
3
  size 888703384
runs/Dec06_22-36-31_default/events.out.tfevents.1733524591.default.1440.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94da49524d4103dc2f614ac5215a63a546f7036473b873a5cf9a326a4497825c
3
+ size 10573
runs/Dec06_22-36-31_default/events.out.tfevents.1733526287.default.1440.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:867b30cdd9b00502689ddae1e0c2a603595def98c8b472bb5578b5e41aa76f1f
3
+ size 481
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb9a6430bbb63abb7745d79404d46877785336574cf79a89fd40d253e0990ea9
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12510a0bc410ceb3b1133e6fd17f26c3a9340e3895a0abf3208ec5cf3e778526
3
  size 5304