3thn committed on
Commit
3dd8287
1 Parent(s): 4882e4c

Upload folder using huggingface_hub (#1)

Browse files

- 3230888cad9ff1ca0d769ca478ab352482a4ac539a7760cad3f9cc4048eed8e2 (4f3d4ba3aac5135a623c69e2b25e93bdbb7214fb)
- a85c84204410d5047ebe8c079ddd90cba2cf6e0a604a63829549a31fc4233209 (7506ef17bb90c4d04cbdf9dbd81aed2c133ac797)
- 5d1c51e15f5077905d0a1a55cf1904f28fe309037e78007a4e0395c282cc6fcd (3ecec28d3c921118bb39c67ab9dd183d1f00db74)
- 0e36d108ffdc6471d9bd96ef996395064273ef9bdf1a15ac8d8b6936dd0eb8f1 (a2c12e564f758e458736bf7c25653d5c3ea0d1f8)
- b9c65ce7fd43240a9ac55cefae9d3c2d2dd28cfae1941bd5e55851f4125a2566 (60045b6604631c65a8146f8dedefa23c1483f53c)
- d624bc4df1104c7c1df40b83e5aa5c32d3be404358e1742de1685c42a6e40ff5 (4b91dc0baa334c1fd5366ae5b7cc02e5d2254adf)
- 8944a80ca322b046d071649cd4cf2e6c9ed42e7ea173a19f1260764d9b849e36 (4a55df16787180ac69edb6699538645f73234d78)
- 480553f2838ca2f96975f810fb38d241f6db81a3d7c49205902390134f58dfd2 (33ae5c56308dcd46ac0405fd4011db7dff925c1a)
- 02ff3823e4c5de4b768947b0589624fb98e007d9391a026e6d75c576b15b1423 (cf477e728efd643e9d5bab9436a576c8e7e2c955)

README.md ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: other
3
+ tags:
4
+ - generated_from_trainer
5
+ - axolotl
6
+ - mlx
7
+ base_model: Qwen/Qwen2-72B
8
+ datasets:
9
+ - cognitivecomputations/Dolphin-2.9
10
+ - teknium/OpenHermes-2.5
11
+ - m-a-p/CodeFeedback-Filtered-Instruction
12
+ - cognitivecomputations/dolphin-coder
13
+ - cognitivecomputations/samantha-data
14
+ - microsoft/orca-math-word-problems-200k
15
+ - Locutusque/function-calling-chatml
16
+ - internlm/Agent-FLAN
17
+ license_name: tongyi-qianwen
18
+ license_link: https://huggingface.co/Qwen/Qwen1.5-110B/blob/main/LICENSE
19
+ ---
20
+
21
+ # mlx-community/dolphin-2.9.2-qwen2-72b-4bit
22
+ This model was converted to MLX format from [`cognitivecomputations/dolphin-2.9.2-qwen2-72b`](https://huggingface.co/cognitivecomputations/dolphin-2.9.2-qwen2-72b) using mlx-lm version **0.12.1**.
23
+ Refer to the [original model card](https://huggingface.co/cognitivecomputations/dolphin-2.9.2-qwen2-72b) for more details on the model.
24
+ ## Use with mlx
25
+
26
+ ```bash
27
+ pip install mlx-lm
28
+ ```
29
+
30
+ ```python
31
+ from mlx_lm import load, generate
32
+
33
+ model, tokenizer = load("mlx-community/dolphin-2.9.2-qwen2-72b-4bit")
34
+ response = generate(model, tokenizer, prompt="hello", verbose=True)
35
+ ```
added_tokens.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "<|endoftext|>": 151643,
3
+ "<|im_end|>": 151645,
4
+ "<|im_start|>": 151644
5
+ }
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen2ForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "eos_token_id": 151645,
7
+ "hidden_act": "silu",
8
+ "hidden_size": 8192,
9
+ "initializer_range": 0.02,
10
+ "intermediate_size": 29568,
11
+ "max_position_embeddings": 131072,
12
+ "max_window_layers": 28,
13
+ "model_type": "qwen2",
14
+ "num_attention_heads": 64,
15
+ "num_hidden_layers": 80,
16
+ "num_key_value_heads": 8,
17
+ "quantization": {
18
+ "group_size": 64,
19
+ "bits": 4
20
+ },
21
+ "rms_norm_eps": 1e-05,
22
+ "rope_theta": 1000000.0,
23
+ "sliding_window": 4096,
24
+ "tie_word_embeddings": false,
25
+ "torch_dtype": "bfloat16",
26
+ "transformers_version": "4.40.2",
27
+ "use_cache": false,
28
+ "use_sliding_window": false,
29
+ "vocab_size": 152064
30
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0c94e0e1bbb82619ebfe6cfb86c87b53ae4375f2fea0dc772820c074e4b28af
3
+ size 5365567671
model-00002-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a11bf1358b13490e40c60c50a0c458e07e752b1b55aecfed28e8b61dd6c3a26f
3
+ size 5294878244
model-00003-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b8c855edc3165ba6a1e08302012effc13cfdee4abb9c254108c6eb5d4fc6c52
3
+ size 5346171127
model-00004-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68c8b931377cef73ede7f4ee4e23a1afa2448e2711ade94d72cf16234515b0a8
3
+ size 5294845211
model-00005-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc138df328cbce47b87765b1db5568de1ab9b57223d9a9a014fc13c36ee354ce
3
+ size 5294878277
model-00006-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b3a9f8758c6e763bc9574bc4a11a045995fbdb7eec1e9d3f71c69ef31ccc681
3
+ size 5294878236
model-00007-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93ceed3dabaf5d8302800e3984bbdf080f337921f2e77cf7ec3852034dec312f
3
+ size 5346171153
model-00008-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:993d15d1b45426b016f9cf3b972740aae407c07ea39c3ba4681f650985932fb3
3
+ size 3663161114
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>"
5
+ ],
6
+ "eos_token": {
7
+ "content": "<|im_end|>",
8
+ "lstrip": false,
9
+ "normalized": false,
10
+ "rstrip": false,
11
+ "single_word": false
12
+ },
13
+ "pad_token": {
14
+ "content": "<|endoftext|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false
19
+ }
20
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "151643": {
5
+ "content": "<|endoftext|>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "151644": {
13
+ "content": "<|im_start|>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "151645": {
21
+ "content": "<|im_end|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ }
28
+ },
29
+ "additional_special_tokens": [
30
+ "<|im_start|>",
31
+ "<|im_end|>"
32
+ ],
33
+ "bos_token": null,
34
+ "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
35
+ "clean_up_tokenization_spaces": false,
36
+ "eos_token": "<|im_end|>",
37
+ "errors": "replace",
38
+ "model_max_length": 32768,
39
+ "pad_token": "<|endoftext|>",
40
+ "split_special_tokens": false,
41
+ "tokenizer_class": "Qwen2Tokenizer",
42
+ "unk_token": null
43
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff