Add model weights
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +81 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-06,
|
11 |
+
"vocab_size": 32256,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 100000,
|
14 |
+
"rope_scaling": null,
|
15 |
+
"context_window_size": 16384,
|
16 |
+
"prefill_chunk_size": 8192,
|
17 |
+
"num_key_value_heads": 32,
|
18 |
+
"head_dim": 128,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"pipeline_parallel_stages": 1,
|
21 |
+
"max_batch_size": 128,
|
22 |
+
"disaggregation": false
|
23 |
+
},
|
24 |
+
"vocab_size": 32256,
|
25 |
+
"context_window_size": 16384,
|
26 |
+
"sliding_window_size": -1,
|
27 |
+
"prefill_chunk_size": 8192,
|
28 |
+
"attention_sink_size": -1,
|
29 |
+
"tensor_parallel_shards": 1,
|
30 |
+
"pipeline_parallel_stages": 1,
|
31 |
+
"temperature": 1.0,
|
32 |
+
"presence_penalty": 0.0,
|
33 |
+
"frequency_penalty": 0.0,
|
34 |
+
"repetition_penalty": 1.0,
|
35 |
+
"top_p": 1.0,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.json",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"tokenizer_info": {
|
41 |
+
"token_postproc_method": "byte_level",
|
42 |
+
"prepend_space_in_encode": false,
|
43 |
+
"strip_space_in_decode": false
|
44 |
+
},
|
45 |
+
"conv_template": {
|
46 |
+
"name": "deepseek",
|
47 |
+
"system_template": "{system_message}",
|
48 |
+
"system_message": "",
|
49 |
+
"system_prefix_token_ids": [
|
50 |
+
100000
|
51 |
+
],
|
52 |
+
"add_role_after_system_message": true,
|
53 |
+
"roles": {
|
54 |
+
"user": "User",
|
55 |
+
"assistant": "Assistant"
|
56 |
+
},
|
57 |
+
"role_templates": {
|
58 |
+
"user": "{user_message}",
|
59 |
+
"assistant": "{assistant_message}",
|
60 |
+
"tool": "{tool_message}"
|
61 |
+
},
|
62 |
+
"messages": [],
|
63 |
+
"seps": [
|
64 |
+
"\n\n",
|
65 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
66 |
+
],
|
67 |
+
"role_content_sep": ": ",
|
68 |
+
"role_empty_sep": ":",
|
69 |
+
"stop_str": [
|
70 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
71 |
+
],
|
72 |
+
"stop_token_ids": [
|
73 |
+
100001
|
74 |
+
],
|
75 |
+
"function_string": "",
|
76 |
+
"use_function_calling": false
|
77 |
+
},
|
78 |
+
"pad_token_id": 0,
|
79 |
+
"bos_token_id": 32013,
|
80 |
+
"eos_token_id": 32021
|
81 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:113958fd244846a2e6e13c320cf9a43cf353fa64a609e22ddc89a540a46fda36
|
3 |
+
size 66060288
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bce1a81e94d0d8ff7b91a2a6d62aec3a62510a50dc3a9408c78d94a754850630
|
3 |
+
size 30810112
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01ccf5a123ea107faf5a26570f22d39ac4191e465a203f8b6a7ca820e96877a9
|
3 |
+
size 25165824
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad2f637652d0e20971efbc890fdf6a060dc69310adf662210ea03675f8c60f32
|
3 |
+
size 22544384
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afff688fc7c83b8538edc03f428f9cc203e4834a2e3d1184dab87fcc01c422a9
|
3 |
+
size 45088768
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9552929bdc3fb84029aa8404818eb14d42627a22148902f3f1641dda0c5d3677
|
3 |
+
size 25165824
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95ee006c0fb4bd23dfacbf802eb886f40cab2cb480f2dd1fc0d465b0e1f78e97
|
3 |
+
size 32661504
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8706a346c201a4a622757313d9c6d0449206df7ce699600009887a222d3ab90
|
3 |
+
size 31989760
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d56bb91f54ac698416150196771bfc41e0f1121451c5371c4aa26deeada6f5f0
|
3 |
+
size 45088768
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c479d370ffc0cf90b57fcd870e5cbdb497f33dc020a1067e33ae44d9a40d4443
|
3 |
+
size 25165824
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f51d88ace9a217309ae40405a612c83417fa318d692c78a54f4d8a55da7ac7e
|
3 |
+
size 22544384
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:870f89dba3db76adebda7b05c868e55a0a3791fda92f22b73cc5ae2761d0de0f
|
3 |
+
size 45088768
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c567a2afe492dc5e835f1d694149a1042bf721bdbf0dbb4c14335efe5ea0d63
|
3 |
+
size 25165824
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c99129a962f42acef05bb70d31b2b6c1dbabaee3d9341d5e8d4027c454aca2f9
|
3 |
+
size 22544384
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e67143a4eecfaa46754db1373468143b1b5f8e4c8d400892a969afc7b4f907ed
|
3 |
+
size 32661504
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:add9b58e37d9a9e7a43e513d87b0b7b761d8a13c93f0b63c3db4e1070b9c3a6e
|
3 |
+
size 31989760
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28ab2be4d1f87d6f29666ad7a0c3c2ebebb7daac81ae8e02626e188f0592844c
|
3 |
+
size 45088768
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40a9140268a3b5ea13b22918c4128b6f555bdeac6e2ea1230624cd258b2ca706
|
3 |
+
size 25165824
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34f092937983aac5edcd11309c497a32caf8c6c3c05de89a8eb31f2c8913ac6e
|
3 |
+
size 21045248
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8c129b94b0c53454dbb77b40a73beb573422b6fb0c89d79829cd82d414978f0
|
3 |
+
size 45088768
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5652c03ede5b4fc81a3bcc71c89522e5d77ad5ce1e17416de9aa9246baca863
|
3 |
+
size 25165824
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75010a067f6257d08a004be043f7aea4288878745bc060f09b4092f46b935bd3
|
3 |
+
size 32661504
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea9d436c35bfa99bf55ebdbfb0aa0e4f5b3dd12b6e97aae7c4f50bec0335a0f3
|
3 |
+
size 31989760
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61760427459ddb894308572f59ddde2fc15051575b0fd91e5f014001a77c226d
|
3 |
+
size 45088768
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a1177a1e54144d47e8ad87ce4412fc5a2b2eb7ea22d9ea47782c19b01ff5694
|
3 |
+
size 25165824
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e1b3af1c5c695643f784b1683c6d1386483da56f13d2373a1bf5cac74d15696
|
3 |
+
size 22544384
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c60f81ba3bb3f99b143da63a2c3eafe8425f8e2ef9ec4a767418f40b23b65834
|
3 |
+
size 45088768
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be299961cba208ba443ed2f7115e993c0dbf3095db4240b0609ea094e60c2b71
|
3 |
+
size 45088768
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf83be195aeda5ba31838c32c859eeb2abba58e680ac8d68e673df4b662217cb
|
3 |
+
size 25165824
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5e717d960c8b5c362e3b83b596909e1921277c908835b56f5d1b190d51220bc
|
3 |
+
size 32661504
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7598f884bb9ca51595c89b322b7a5207e5326b82525342d660414886de34584b
|
3 |
+
size 31989760
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47311236eafb86b11099b63f5caec4fcdcb559f90e634a013254cfc335ee1f5c
|
3 |
+
size 45088768
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:376d5d03ec3a17e4e0057686aaa6451c22178a34dbec90db0580d3907e09fd59
|
3 |
+
size 25165824
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:545ebe12ba509a2a5173e4c3fd7bc90bac5536258b34c76158a175fb7907c3cf
|
3 |
+
size 22544384
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:086c0a3396aa52cf068346e0d7724cb6981b57c68eb17a7c26d5239eed4b9116
|
3 |
+
size 45088768
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:742ec521135eb4e52a5565f8c63f8f1d69620a98736ace85a665ac72eec402f1
|
3 |
+
size 25165824
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:022f570277c5c38691c3aee47733f3164af3ae5a13c964667e9d441e2ab03050
|
3 |
+
size 32661504
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3071953dc57ee9eadf4a21fcf980017c5337df34893e9ffd5f0f5c856b3b84f
|
3 |
+
size 66060288
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0000630e1dde6becf1f595ceeb2e6e6255fa3c7adf0155b6dcbef388fe39a84c
|
3 |
+
size 25165824
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e8b41b93ddfdc0bfb51e634b5675a91bcb7d0324ebc334eae8a29fd0e139add
|
3 |
+
size 22544384
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4946587ab4348355a8030cddf8f004c9e66d2337696dfe51f1195203030fc33c
|
3 |
+
size 45088768
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74a2fb3d206e1ba7ead8a05ec12063231b7a2658d3df56e78ff981284eb92188
|
3 |
+
size 25165824
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05361117c01b30cbe8c725ab490595566b92aecbb329c2b2b3c95c4bad1d686f
|
3 |
+
size 29319168
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:059b0e0dacc79f51abc5d05e1cf76f6bcda70d0f4b7609d3d382e099ad5ecc56
|
3 |
+
size 31989760
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c89b2529678fde2f902475f42ace6624aa45641a51463193273644d632d54ab9
|
3 |
+
size 45088768
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8202ffe9343eff354c4f67d584cd842b7576e3f45f1c7e3aced2ce542be62af7
|
3 |
+
size 25165824
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7b94d4139623c6137a70f0fb2dca05d8fc852022961ea7c8c9f2d1321d74192
|
3 |
+
size 22544384
|