add model
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +73 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_6.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q4f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 4096,
|
6 |
+
"intermediate_size": 11008,
|
7 |
+
"num_attention_heads": 32,
|
8 |
+
"num_hidden_layers": 26,
|
9 |
+
"rms_norm_eps": 1e-06,
|
10 |
+
"vocab_size": 32000,
|
11 |
+
"position_embedding_base": 10000.0,
|
12 |
+
"context_window_size": 768,
|
13 |
+
"prefill_chunk_size": 768,
|
14 |
+
"num_key_value_heads": 32,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 80
|
18 |
+
},
|
19 |
+
"vocab_size": 32000,
|
20 |
+
"context_window_size": 768,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 768,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": {
|
34 |
+
"name": "llava",
|
35 |
+
"system_template": "{system_message}",
|
36 |
+
"system_message": "\n",
|
37 |
+
"system_prefix_token_ids": [
|
38 |
+
1
|
39 |
+
],
|
40 |
+
"add_role_after_system_message": false,
|
41 |
+
"roles": {
|
42 |
+
"user": "USER",
|
43 |
+
"assistant": "ASSISTANT"
|
44 |
+
},
|
45 |
+
"role_templates": {
|
46 |
+
"user": "{user_message}",
|
47 |
+
"assistant": "{assistant_message}",
|
48 |
+
"tool": "{tool_message}"
|
49 |
+
},
|
50 |
+
"messages": [],
|
51 |
+
"seps": [
|
52 |
+
" "
|
53 |
+
],
|
54 |
+
"role_content_sep": ": ",
|
55 |
+
"role_empty_sep": ":",
|
56 |
+
"stop_str": [
|
57 |
+
"</s>"
|
58 |
+
],
|
59 |
+
"stop_token_ids": [
|
60 |
+
2
|
61 |
+
],
|
62 |
+
"function_string": "",
|
63 |
+
"use_function_calling": false
|
64 |
+
},
|
65 |
+
"pad_token_id": -1,
|
66 |
+
"bos_token_id": 0,
|
67 |
+
"eos_token_id": 1,
|
68 |
+
"tokenizer_files": [
|
69 |
+
"tokenizer.model",
|
70 |
+
"tokenizer_config.json"
|
71 |
+
],
|
72 |
+
"version": "0.1.0"
|
73 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94c758e07af583dcc01863d18547217d4b3d059fd4bed5bc3c6f18e4aa61466a
|
3 |
+
size 65536000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d603f95e51fb25717469170b116224779b22adc0d3834174c58449baa290675
|
3 |
+
size 30744576
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b983bf04a304ac1ef90cd60e6ca3cef1383ad7c8e4abf27828348f52c748a9d6
|
3 |
+
size 45088768
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93b5e684891404e449b6882a01f58fff52563dacdb5acd66fa22d07402cae000
|
3 |
+
size 25165824
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5148d25e0c97157754257b27e6ec78d3ab6323ec43f2c77e772527a12038ec21
|
3 |
+
size 29253632
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4b567da0367f4879411203245be74d6b833a2e891195de507afb4d666f6db52
|
3 |
+
size 31989760
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff04e5bee464c377b99d83775faf380490227197892e55e4b1742e058b2eba2d
|
3 |
+
size 45088768
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81632cd5900922f94bd7878e4d9346bd7720c620f8f14fdeb8ea5ff74cc2a300
|
3 |
+
size 25165824
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdfed809301c15854419fbb101320c8a6c238326f50ca661e5d0cb26b61f5148
|
3 |
+
size 22544384
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:386e83c6b822ec62bcaad461c864cd5b8687a093dea51d8c93b68e48726eeb86
|
3 |
+
size 45088768
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ba3d32d3613be2c2d8d40078234e9f8f13f95955659aae97e8192ef6b6b5921
|
3 |
+
size 25165824
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a0c970fe2a40c2c6a0c2981c0bf124ed48686a87344aa604c3156dbb29def82
|
3 |
+
size 32661504
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46da39690add5d9901005cf08eda566a3753a476254e2a0e8e84995aeca9e2a6
|
3 |
+
size 45088768
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e9931948eb35ca909cac3d5cc2904bc7f32b24492ba733b9531ad2eb6901cda
|
3 |
+
size 31989760
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c239c2b51363ddfbf6911962a66dc80e67242959d8cc4c3a973099a114122b37
|
3 |
+
size 45088768
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b50974dd548767b7e770cef03db8bdecf6d94aa3cf3e73c86e6c5ae8ffed2243
|
3 |
+
size 25165824
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9237242ea688d8c0dc53ca00292c689d8dc5cd4e012f0bec18d3855bdcfba07a
|
3 |
+
size 22544384
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1890029a8a5abf8338f5907383022aae3aac4ba78bcfe9f6099c71d3ea1255d
|
3 |
+
size 45088768
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68291f6252be529ac78623e575f7bd77d7d8d9e1e4ade7e825d0fca1d15217ca
|
3 |
+
size 25165824
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ec0ebaba388e28d9f4cbe813fbd5007e43437379020398911d3830421d463e6
|
3 |
+
size 32661504
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e683532317c485995996f388cfb7dff430321d53bbee6ceef30c57bdf52838db
|
3 |
+
size 31989760
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36c0f03ef97033a6753b3a07cef7a90235fcfe937a72ea6d1d6b63591754658f
|
3 |
+
size 45088768
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c128def5b1dfb9d9d39648345b9e864609d4074a9df19a3d8a5c2fa177ed1c80
|
3 |
+
size 25165824
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:857f352956609916ddfd571f63ef8a5f8561936b189b80b0511bfeb05593173e
|
3 |
+
size 25165824
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:955d43a44891dd23ed7ae9db4af512c05493167b265d0512bf6c1378b36859d2
|
3 |
+
size 22544384
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3193e8470d5d6fa7b3be21e3498e6cfcd84504c1479a14f32524c0fe2563debd
|
3 |
+
size 45088768
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cdd1339a764277b227759516f3c81b45af75e5c8a53d2c22073cfa7f91dc6dd
|
3 |
+
size 25165824
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51e93e75249e38d056725ea660c6a2139d41b2d35e6f909afb3a195dce72867d
|
3 |
+
size 32661504
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ad7990ee36f062326fe0922c1f6b99fcb22c9aa65f6d66343db8c55eeeb32c2
|
3 |
+
size 31989760
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e95761e30e456e7932578b0aa7d5bb7588ff467b51209b8ebced1c84eb47601
|
3 |
+
size 45088768
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25100a211f61d9f7754f99406b7e9f0385499b70c418b0e5b592e2af887423b5
|
3 |
+
size 25165824
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99e81e824da5017d9f2319155cd3e2fd8610e4706d602432748e6b179b2ec65c
|
3 |
+
size 22544384
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88b807fd3054d64d422a0688f333bde43f531208f8afe965770fd258299ee915
|
3 |
+
size 45088768
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e802936a08ada9fbb6a56ec4f64390851a8b89e1c03d5e13a39f4d20dddb4125
|
3 |
+
size 25165824
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfb8d6d6e0762484adaa6f3dcc0953b379f2680020d8e9c54ca3e14353db8bb3
|
3 |
+
size 22544384
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c54c2f4008430e634115b593d0ec8dcb0cee3987b394d0e9cd1415f41206f40d
|
3 |
+
size 32661504
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dc546ba54d3e65c9164193ad9c9e27fafb98fc3ac9a787df59d63ce233a7b36
|
3 |
+
size 31989760
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c182ebd5ab5c4954ed3102c7ad0cfdd7b340af30ffa56f7b9705d3e3c7ce014
|
3 |
+
size 45088768
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b0ad38b6aee9ba2cb3a0bff8c0f978ea737ad5aec5eef3bf1b2b33b84b9d7d9
|
3 |
+
size 25165824
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5772ed2fc1ae414cd54d54fef6f5760b28975c405dfeb4728c0ca4a7059b5c2d
|
3 |
+
size 22544384
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:875bb6a7a073632ffe7038d967bb22e519049b7939cfabe7333211f9243c5a44
|
3 |
+
size 45088768
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85ff619ab13eacca9fafc7bc9f57f545260dd41f075bcb9fc1d3cd13cf59a161
|
3 |
+
size 25165824
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3188b73f7a06dd74797cf54123e830756da0190c03a7a407ba10eb347fd4a22f
|
3 |
+
size 32661504
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d0b7edede12d165f2a351843fd87468b8f13df1f7ef49c153e17c3933f22f78
|
3 |
+
size 31989760
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:924a6a03d6066fdc9146b3423eec37d709fad40e3832b16486b0e53099e56d5a
|
3 |
+
size 45088768
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0779291b1307d0a4492c5aba5cbbc57717ef93ddfaf910df40bb88b0b647540
|
3 |
+
size 45088768
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b181eb582fe73b90db5480d60005e914acce5b3373a6c663bab79e94484023b4
|
3 |
+
size 25165824
|
params_shard_6.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31a10047f5da60ed808805ae3e3a6a070aa9d357a9a48f8577ed6e5ca1d72db1
|
3 |
+
size 25165824
|