KLMFOREVER committed on
Commit
742258f
1 Parent(s): 26e5956

Upload 2 files

Browse files
Files changed (2) hide show
  1. mlc-chat-config.json +79 -0
  2. ndarray-cache.json +0 -0
mlc-chat-config.json ADDED
@@ -0,0 +1,79 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "mistral",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "hidden_size": 4096,
7
+ "intermediate_size": 14336,
8
+ "num_attention_heads": 32,
9
+ "num_hidden_layers": 32,
10
+ "rms_norm_eps": 1e-05,
11
+ "vocab_size": 32000,
12
+ "position_embedding_base": 10000.0,
13
+ "num_key_value_heads": 8,
14
+ "head_dim": 128,
15
+ "context_window_size": -1,
16
+ "sliding_window_size": 4096,
17
+ "prefill_chunk_size": 2048,
18
+ "attention_sink_size": 4,
19
+ "tensor_parallel_shards": 1,
20
+ "max_batch_size": 80
21
+ },
22
+ "vocab_size": 32000,
23
+ "context_window_size": -1,
24
+ "sliding_window_size": 4096,
25
+ "prefill_chunk_size": 2048,
26
+ "attention_sink_size": 4,
27
+ "tensor_parallel_shards": 1,
28
+ "temperature": 1.0,
29
+ "presence_penalty": 0.0,
30
+ "frequency_penalty": 0.0,
31
+ "repetition_penalty": 1.0,
32
+ "top_p": 1.0,
33
+ "tokenizer_files": [
34
+ "tokenizer.model",
35
+ "tokenizer_config.json",
36
+ "tokenizer.json"
37
+ ],
38
+ "tokenizer_info": {
39
+ "token_postproc_method": "byte_fallback",
40
+ "prepend_space_in_encode": true,
41
+ "strip_space_in_decode": true
42
+ },
43
+ "conv_template": {
44
+ "name": "mistral_default",
45
+ "system_template": "[INST] {system_message}",
46
+ "system_message": "Always assist with care, respect, and truth. Respond with utmost utility yet securely. Avoid harmful, unethical, prejudiced, or negative content. Ensure replies promote fairness and positivity.",
47
+ "system_prefix_token_ids": [
48
+ 1
49
+ ],
50
+ "add_role_after_system_message": false,
51
+ "roles": {
52
+ "user": "[INST]",
53
+ "assistant": "[/INST]",
54
+ "tool": "[INST]"
55
+ },
56
+ "role_templates": {
57
+ "user": "{user_message}",
58
+ "assistant": "{assistant_message}",
59
+ "tool": "{tool_message}"
60
+ },
61
+ "messages": [],
62
+ "seps": [
63
+ " "
64
+ ],
65
+ "role_content_sep": " ",
66
+ "role_empty_sep": "",
67
+ "stop_str": [
68
+ "</s>"
69
+ ],
70
+ "stop_token_ids": [
71
+ 2
72
+ ],
73
+ "function_string": "",
74
+ "use_function_calling": false
75
+ },
76
+ "pad_token_id": 0,
77
+ "bos_token_id": 1,
78
+ "eos_token_id": 2
79
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff