Add weights
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +9 -0
- merges.txt +0 -0
- mlc-chat-config.json +84 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
README.md
CHANGED
@@ -1,3 +1,12 @@
|
|
1 |
---
|
2 |
license: apache-2.0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
---
|
|
|
1 |
---
|
2 |
license: apache-2.0
|
3 |
+
license_link: https://huggingface.co/Qwen/Qwen2.5-7B-Instruct-GPTQ-Int4/blob/main/LICENSE
|
4 |
+
language:
|
5 |
+
- en
|
6 |
+
base_model: Qwen/Qwen2.5-7B-Instruct
|
7 |
+
base_model_relation: quantized
|
8 |
+
library_name: mlc-llm
|
9 |
+
pipeline_tag: text-generation
|
10 |
+
tags:
|
11 |
+
- chat
|
12 |
---
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,84 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen2",
|
4 |
+
"quantization": "GPTQ-Int4",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 3584,
|
8 |
+
"intermediate_size": 18944,
|
9 |
+
"num_attention_heads": 28,
|
10 |
+
"num_hidden_layers": 28,
|
11 |
+
"num_key_value_heads": 4,
|
12 |
+
"rms_norm_eps": 1e-06,
|
13 |
+
"rope_theta": 1000000.0,
|
14 |
+
"vocab_size": 152064,
|
15 |
+
"tie_word_embeddings": false,
|
16 |
+
"context_window_size": 8192,
|
17 |
+
"prefill_chunk_size": 128,
|
18 |
+
"tensor_parallel_shards": 1,
|
19 |
+
"head_dim": 128,
|
20 |
+
"dtype": "float32",
|
21 |
+
"max_batch_size": 128
|
22 |
+
},
|
23 |
+
"vocab_size": 152064,
|
24 |
+
"context_window_size": 8192,
|
25 |
+
"sliding_window_size": -1,
|
26 |
+
"prefill_chunk_size": 128,
|
27 |
+
"attention_sink_size": -1,
|
28 |
+
"tensor_parallel_shards": 1,
|
29 |
+
"pipeline_parallel_stages": 1,
|
30 |
+
"temperature": 0.7,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.05,
|
34 |
+
"top_p": 0.8,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.json",
|
37 |
+
"vocab.json",
|
38 |
+
"merges.txt",
|
39 |
+
"tokenizer_config.json"
|
40 |
+
],
|
41 |
+
"tokenizer_info": {
|
42 |
+
"token_postproc_method": "byte_level",
|
43 |
+
"prepend_space_in_encode": false,
|
44 |
+
"strip_space_in_decode": false
|
45 |
+
},
|
46 |
+
"conv_template": {
|
47 |
+
"name": "qwen2",
|
48 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
49 |
+
"system_message": "You are a helpful assistant.",
|
50 |
+
"system_prefix_token_ids": null,
|
51 |
+
"add_role_after_system_message": true,
|
52 |
+
"roles": {
|
53 |
+
"user": "<|im_start|>user",
|
54 |
+
"assistant": "<|im_start|>assistant"
|
55 |
+
},
|
56 |
+
"role_templates": {
|
57 |
+
"user": "{user_message}",
|
58 |
+
"assistant": "{assistant_message}",
|
59 |
+
"tool": "{tool_message}"
|
60 |
+
},
|
61 |
+
"messages": [],
|
62 |
+
"seps": [
|
63 |
+
"<|im_end|>\n"
|
64 |
+
],
|
65 |
+
"role_content_sep": "\n",
|
66 |
+
"role_empty_sep": "\n",
|
67 |
+
"stop_str": [
|
68 |
+
"<|endoftext|>",
|
69 |
+
"<|im_end|>"
|
70 |
+
],
|
71 |
+
"stop_token_ids": [
|
72 |
+
151643,
|
73 |
+
151645
|
74 |
+
],
|
75 |
+
"function_string": "",
|
76 |
+
"use_function_calling": false
|
77 |
+
},
|
78 |
+
"pad_token_id": 151643,
|
79 |
+
"bos_token_id": 151643,
|
80 |
+
"eos_token_id": [
|
81 |
+
151645,
|
82 |
+
151643
|
83 |
+
]
|
84 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c39365f4790e5fa7cb1a7ac7ceb462b7b1c5a10a9eee3ea31fcc6648439ca66
|
3 |
+
size 272498688
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42cd75b4b6dca34f137469d0355035076a5fe406b9d19170438c05ad8e55e774
|
3 |
+
size 33947648
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52e6a42f3010eac2a27281f5a3d17e5150801563ed616f9af8a4bd440ae586c2
|
3 |
+
size 33490944
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b227fb322752c994fb5268bf4c17d3802b4373a77c56c352ad41dd078ebdc220
|
3 |
+
size 67895296
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fbd151eafa8ba5200e4580753b19c5d95a22a3c05aa27bba3ca0d3c1ab0605e
|
3 |
+
size 33947648
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07e9c703e6190eb517945004ea561887734cf6f31ffe29a56d8cb04457aff31c
|
3 |
+
size 67895296
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a8f22c554c700c2b9795fcdb33232ebfbedc99f745460fc5d9f5c606913464b
|
3 |
+
size 30059520
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a8076edd62294be9893059260db0d3d72e1232e486a978f5f1ad26aded56f57
|
3 |
+
size 272498688
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d903fde7fb6a318fb15aa8f1c05f2d4a8062d320df627a3d61e487fd6cf1ebfe
|
3 |
+
size 33947648
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bdcb062fad2f529134437a25cf9b1c58c1a29f049503b221bf30d5c9d212a87
|
3 |
+
size 67895296
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51f3fd84236fcd3ed2b3176cb63cb881c22b42d8e45d65eca9c5ffdbd27b897e
|
3 |
+
size 33947648
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91d6405c46c2c9d08276691f540ad3f15a9fe70e13e294a9b1b69d71a3d08656
|
3 |
+
size 33498112
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbd31ca8a52674f58cbe698e36dd7feff337a76f36a35582e8e1f7f8b7d6d552
|
3 |
+
size 33947648
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc559510f0afcd766f42bd9e2edcbab71df5b435036aa5d31937e510073f0589
|
3 |
+
size 67895296
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0daeaab6c083d2fa0a2323f3def85b137d1ae62cce585c63caca4ff9a57ce02
|
3 |
+
size 33947648
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ef3583b58b29a449bc0b49659599c013332e49e49e33b791bc0a83540c9106c
|
3 |
+
size 67895296
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b441923c12abe1a71c11ab650daf1a107f326b8c2c65acc41d0981e66cc32240
|
3 |
+
size 30059520
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af31b1e4112976023dd6ce549ea06db220d9ea43000007774a256b27f516ac63
|
3 |
+
size 33947648
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ebaff4e41f93bd0de7683ae5bc910b7d2d99508337d465912353da95b084437
|
3 |
+
size 67895296
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6b89b86bde9af82be9ec930e44c4d5db667fd869849c8655e0c6dace374c20d
|
3 |
+
size 33947648
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28c2f703db5c737c8df5e432e3fd627dd78fb2c290c67685dbb9257c5091d27a
|
3 |
+
size 67895296
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c279c682fabe024c7c136b73c3ae170b1eb116e0a4ded50e602a45066e78a255
|
3 |
+
size 28174336
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca1d7df32ac4a57bb9b507c861a2d2213f9118972aa5f38ec14e15178e449b25
|
3 |
+
size 33947648
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aacbdce1c8765e800fa78ae52f2a4c4cf39f27daafb78bd0b377ad33344f85e0
|
3 |
+
size 67895296
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:738ea0b178203a40f29125da674f28599b475e46ed93ffa001bf9505cf29ecbf
|
3 |
+
size 67895296
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c2fed3412f385650bc942bd2f71af527f88761293ab0958f5f8430d9c5fa6cd
|
3 |
+
size 33507328
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf8623b53fa80ea54eaef1b1f8c1c064b95b03a1f8af7ab37fd97255c8434fe5
|
3 |
+
size 33947648
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98039d027fe1e6132d4c1ddf1e5ddaa3792209ecbb0308db35e65d7de8c3dabe
|
3 |
+
size 67895296
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:971d9768b3e5cb33f2df070caa5c6ffb73108f53409eec7407290959e403ba45
|
3 |
+
size 33947648
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6981e486f9d4014287ca7e90842d6ec2f4786cbeb8fafcd5bf40203ba8c9e95
|
3 |
+
size 33490944
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dee11fade35709888792f1b7f100a5e9294cb3791f78f7cce9c732a8df63edef
|
3 |
+
size 67895296
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:273972d533017082d51f90521ad790e049613b6a7fd3797745fa44fbf5fa6051
|
3 |
+
size 33947648
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52c4d1c54b03595b9dc68841aa163eaa2f72b9c938dbe22d6649d2479c89ac00
|
3 |
+
size 67895296
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd6dff59dc4a65544b29f4f0e982288e162b9b82bc15eeb9e5ffdb61dfd39ef8
|
3 |
+
size 30059520
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0198735f0f0565ea7bfcd57b61fbe9e4b4e51b71bd41065cd0bbc0ba7898f161
|
3 |
+
size 33947648
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf1d00a8bc5cdd50febf34607dceae1ecd550316827b2fd40d1fa59bf7049333
|
3 |
+
size 33947648
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e47f031b4f0883556de4d0bae1f336748103b665756f5efb270a6d5ea794f56
|
3 |
+
size 67895296
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0e54c8f402b544e1d4551e46e281c5cb79e3886a7364128eb361550138ea324
|
3 |
+
size 67895296
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8c6a5f726faeac81d67b17c9c736e099caca48a733eac6a8295d8ead3dfa907
|
3 |
+
size 27113472
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f5557f843b495558b933fdb5c8822853fd3b1c058fcfb06aee0da71cc9afbe9
|
3 |
+
size 33947648
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44396b48da8c8afce5bf5cbf9730b9881fef5a08aa4559d2769e66db46a5cae3
|
3 |
+
size 67895296
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51d48ddf1c417049fd8f0105f46644638792c5a3972fe99eeffa111ee2208eea
|
3 |
+
size 33947648
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:789192ad047d7e68e9d55b82cbeeb9bc69d34ec64a15ac1de0e0525cc51e961e
|
3 |
+
size 67895296
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3810cdee708527c2ea40caf2fa53cac841ed46a443de73c9dce1e8f22b4c1d90
|
3 |
+
size 30043136
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef022f0b7a38ecd6f3c0ea9df49f19ed361b7e23323e1f57b318c5e6c8af8289
|
3 |
+
size 33947648
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:827dacdf095507c29d5f09a42bdc629287472df927a39d0333f4057ba5fb1497
|
3 |
+
size 67895296
|