Files changed (40)
  1. README.md +11 -4
  2. WizardLM-2-8x22B.IQ4_XS-00003-of-00005.gguf +3 -0
  3. WizardLM-2-8x22B.IQ4_XS-00004-of-00005.gguf +3 -0
  4. tokenizer.model → WizardLM-2-8x22B.IQ4_XS-00005-of-00005.gguf +2 -2
  5. WizardLM-2-8x22B.Q3_K_L-00001-of-00005.gguf +3 -0
  6. WizardLM-2-8x22B.Q3_K_L-00002-of-00005.gguf +3 -0
  7. WizardLM-2-8x22B.Q3_K_L-00003-of-00005.gguf +3 -0
  8. WizardLM-2-8x22B.Q3_K_L-00004-of-00005.gguf +3 -0
  9. WizardLM-2-8x22B.Q3_K_L-00005-of-00005.gguf +3 -0
  10. WizardLM-2-8x22B.Q3_K_M-00001-of-00005.gguf +3 -0
  11. WizardLM-2-8x22B.Q3_K_M-00002-of-00005.gguf +3 -0
  12. WizardLM-2-8x22B.Q3_K_M-00003-of-00005.gguf +3 -0
  13. WizardLM-2-8x22B.Q3_K_M-00004-of-00005.gguf +3 -0
  14. WizardLM-2-8x22B.Q3_K_M-00005-of-00005.gguf +3 -0
  15. WizardLM-2-8x22B.Q3_K_S-00001-of-00005.gguf +3 -0
  16. WizardLM-2-8x22B.Q3_K_S-00002-of-00005.gguf +3 -0
  17. WizardLM-2-8x22B.Q3_K_S-00003-of-00005.gguf +3 -0
  18. WizardLM-2-8x22B.Q3_K_S-00004-of-00005.gguf +3 -0
  19. WizardLM-2-8x22B.Q3_K_S-00005-of-00005.gguf +3 -0
  20. WizardLM-2-8x22B.Q4_K_M-00001-of-00005.gguf +3 -0
  21. WizardLM-2-8x22B.Q4_K_M-00002-of-00005.gguf +3 -0
  22. WizardLM-2-8x22B.Q4_K_M-00003-of-00005.gguf +3 -0
  23. WizardLM-2-8x22B.Q4_K_M-00004-of-00005.gguf +3 -0
  24. WizardLM-2-8x22B.Q4_K_M-00005-of-00005.gguf +3 -0
  25. WizardLM-2-8x22B.Q4_K_S-00001-of-00005.gguf +3 -0
  26. WizardLM-2-8x22B.Q4_K_S-00002-of-00005.gguf +3 -0
  27. WizardLM-2-8x22B.Q4_K_S-00003-of-00005.gguf +3 -0
  28. WizardLM-2-8x22B.Q4_K_S-00004-of-00005.gguf +3 -0
  29. WizardLM-2-8x22B.Q4_K_S-00005-of-00005.gguf +3 -0
  30. WizardLM-2-8x22B.Q5_K_M-00001-of-00005.gguf +3 -0
  31. WizardLM-2-8x22B.Q5_K_M-00002-of-00005.gguf +3 -0
  32. WizardLM-2-8x22B.Q5_K_M-00003-of-00005.gguf +3 -0
  33. WizardLM-2-8x22B.Q5_K_M-00004-of-00005.gguf +3 -0
  34. WizardLM-2-8x22B.Q5_K_S-00001-of-00005.gguf +3 -0
  35. WizardLM-2-8x22B.Q5_K_S-00004-of-00005.gguf +3 -0
  36. config.json +0 -31
  37. generation_config.json +0 -6
  38. model.safetensors.index.json +0 -0
  39. special_tokens_map.json +0 -24
  40. tokenizer_config.json +0 -44
README.md CHANGED
@@ -2,6 +2,11 @@
 tags:
 - quantized
 - 2-bit
+- 3-bit
+- 4-bit
+- 5-bit
+- 6-bit
+- 8-bit
 - GGUF
 - transformers
 - safetensors
@@ -17,16 +22,18 @@ tags:
 - region:us
 - text-generation
 model_name: WizardLM-2-8x22B-GGUF
-inference: true
-base_model: mistral-community/Mixtral-8x22B-v0.1
+base_model: microsoft/WizardLM-2-8x22B
+inference: false
+model_creator: microsoft
 pipeline_tag: text-generation
 quantized_by: MaziyarPanahi
 ---
 # [MaziyarPanahi/WizardLM-2-8x22B-GGUF](https://huggingface.co/MaziyarPanahi/WizardLM-2-8x22B-GGUF)
-- Base model: [mistral-community/Mixtral-8x22B-v0.1](https://huggingface.co/mistral-community/Mixtral-8x22B-v0.1)
+- Model creator: [microsoft](https://huggingface.co/microsoft)
+- Original model: [microsoft/WizardLM-2-8x22B](https://huggingface.co/microsoft/WizardLM-2-8x22B)

 ## Description
-[MaziyarPanahi/WizardLM-2-8x22B-GGUF](https://huggingface.co/MaziyarPanahi/WizardLM-2-8x22B-GGUF) contains GGUF format model files for [mistral-community/Mixtral-8x22B-v0.1](https://huggingface.co/mistral-community/Mixtral-8x22B-v0.1).
+[MaziyarPanahi/WizardLM-2-8x22B-GGUF](https://huggingface.co/MaziyarPanahi/WizardLM-2-8x22B-GGUF) contains GGUF format model files for [microsoft/WizardLM-2-8x22B](https://huggingface.co/microsoft/WizardLM-2-8x22B).

 ## How to download
 You can download only the quants you need instead of cloning the entire repository as follows:
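The README's "How to download" section is truncated in this diff view before the actual commands. As a rough sketch only (not necessarily the exact commands in the README), a single quant can be fetched with `huggingface_hub`; the repo id comes from the README above, while the filename pattern and local directory are illustrative:

```python
# Sketch: download only the Q4_K_M shards instead of cloning the whole repo.
# Repo id is from the README; the pattern and local_dir are examples.
from huggingface_hub import snapshot_download

snapshot_download(
    repo_id="MaziyarPanahi/WizardLM-2-8x22B-GGUF",
    allow_patterns=["WizardLM-2-8x22B.Q4_K_M*"],  # matches all five Q4_K_M split files
    local_dir="WizardLM-2-8x22B-GGUF",
)
```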
WizardLM-2-8x22B.IQ4_XS-00003-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:52ae1b3b1b75dabaf96484ec1e0141f0ce65225f1b98a73d2261a50d6cae3f15
+size 16187875456
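Entries like the one above are Git LFS pointers: the repository itself stores only the blob's SHA-256 (`oid`) and byte `size`, while the GGUF shard lives in LFS storage. A minimal verification sketch using the hash and size recorded above (the local file path is only an example):

```python
# Sketch: check a downloaded shard against the oid/size in its LFS pointer.
# Expected values are copied from the pointer entry above; the path is hypothetical.
import hashlib

EXPECTED_OID = "52ae1b3b1b75dabaf96484ec1e0141f0ce65225f1b98a73d2261a50d6cae3f15"
EXPECTED_SIZE = 16187875456

path = "WizardLM-2-8x22B.IQ4_XS-00003-of-00005.gguf"
digest, size = hashlib.sha256(), 0
with open(path, "rb") as f:
    for chunk in iter(lambda: f.read(1 << 20), b""):  # stream in 1 MiB chunks
        digest.update(chunk)
        size += len(chunk)
assert digest.hexdigest() == EXPECTED_OID and size == EXPECTED_SIZE, "shard corrupted"
```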
WizardLM-2-8x22B.IQ4_XS-00004-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ce912e4e6c0948169b3b192268cbdb04af0c1bd8f3790bfcb9cd2fc39d4f0291
+size 17432699040

tokenizer.model → WizardLM-2-8x22B.IQ4_XS-00005-of-00005.gguf RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
-size 493443
+oid sha256:762ac686d247b8b7499ea8076c432df8f409807401819c47f7042be617ad8bce
+size 6869523776
WizardLM-2-8x22B.Q3_K_L-00001-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:677254a8764e9cdc736e638e6634c960c3dbb305c99eb15963f5edb28b4f81f2
+size 16530777024

WizardLM-2-8x22B.Q3_K_L-00002-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b3c810fd9c410f7d21effb1d75fb1255a3a06770a696755d8bdadd618f07bf58
+size 17108099264

WizardLM-2-8x22B.Q3_K_L-00003-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5129af244ebaaecbf40f89cb6eede1b2035c4f9a8f1df066ed97413e87fb4eec
+size 15552635008

WizardLM-2-8x22B.Q3_K_L-00004-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ecef6b5d484ae03d0684ec579fb086e3864cf2b50805c85dd3a6dbffb69fd8fe
+size 16775340192

WizardLM-2-8x22B.Q3_K_L-00005-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af2364a5dc9bde78cfccf90063df9b01658410629124ceadb40eef2edb9f628b
+size 6612950336

WizardLM-2-8x22B.Q3_K_M-00001-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b4132b1115f0fa12451c9049c24c0f3d1ab3348f70fa4609a94d193a6d58da1
+size 15650661312

WizardLM-2-8x22B.Q3_K_M-00002-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:001d7eb7125217a694781fecf9ca2cb49c655fb5b0bd124a4025b198dd140bae
+size 15916261568

WizardLM-2-8x22B.Q3_K_M-00003-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:577ea20c1fcc89ee42e5fabdd372dc7974857bf0eaedfab111ca94c6ba0fc607
+size 14480924800

WizardLM-2-8x22B.Q3_K_M-00004-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a96a5ad47fa40eebd46723a2db791e5834430bbb1a25014839028fa64db87bf
+size 15583502496

WizardLM-2-8x22B.Q3_K_M-00005-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f79c807121753e7c4d8312f02330c5315a37e47ac1e1feb6a64f395416fb6af1
+size 6158294336
WizardLM-2-8x22B.Q3_K_S-00001-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:02c67f83658f8039c146642741936c7a1ad18d786af0364e7486f616c45508fc
+size 13958259648

WizardLM-2-8x22B.Q3_K_S-00002-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4578f7ef6150c93b7347bdb77c6f2c3f839bec145ec9022bccea8900d8e3caf2
+size 14525849792

WizardLM-2-8x22B.Q3_K_S-00003-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bbf516d44516ac5f1478f48dfb37c45ebd91940111b32af93edbcf629441e8a5
+size 13197467776

WizardLM-2-8x22B.Q3_K_S-00004-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f4433ced22748b00fabffe18ef41b93aa164214029603286ecc55ad7ef6f8e1
+size 14193090720

WizardLM-2-8x22B.Q3_K_S-00005-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:13b984ca43dcbf4d0a873d7658400060ab00629cc784716142819dbb045da01c
+size 5623520576
WizardLM-2-8x22B.Q4_K_M-00001-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1ff155aaade7d6d9c208e5ad3933cbc02974c30a6742ee3404f7b51e617a4f3e
+size 19982390208

WizardLM-2-8x22B.Q4_K_M-00002-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cda9d26caeeb40eb916e04b4ef5efc0117b90ffe63d5f8fe997262fb04b4b333
+size 19699687616

WizardLM-2-8x22B.Q4_K_M-00003-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2765d9a73e1d558781fcd77b908d3a26ce92772b02a2cf38ac0717f95f1ab58f
+size 17938473088

WizardLM-2-8x22B.Q4_K_M-00004-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ee19ae577798150ee11f6cffe220f9257e4658dcfb6eec6b430aaf97aaa42ba6
+size 19675209888

WizardLM-2-8x22B.Q4_K_M-00005-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bef8ea8f78d69ad3b9b13f59ee6b69234732670e31580b201f56e4091e1419f
+size 8290999616
WizardLM-2-8x22B.Q4_K_S-00001-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:92456ec422ddf695a19c990df3ac4186f0b12cc757504e3970d200d449044e3a
+size 18818470848

WizardLM-2-8x22B.Q4_K_S-00002-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0c5c0adcd16f8254086b04498820138236615e71c7a50b01a78523530a2da260
+size 18869215424

WizardLM-2-8x22B.Q4_K_S-00003-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7ab35ad5d7f7e4e8cd8cfafb2291b7ff5e8baa595cfcfaca209fa4dfc7c022bc
+size 17108000896

WizardLM-2-8x22B.Q4_K_S-00004-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e84aa55e44859ffb4da18f320bdef3b705ede320ad5118ed5d3bc3fd8717d39
+size 18429501600

WizardLM-2-8x22B.Q4_K_S-00005-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:966d15e0c80a8305614d44b0337fbad8c4253bd8bf0973161d39ae2695769110
+size 7252909376
WizardLM-2-8x22B.Q5_K_M-00001-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8fa60ba9d5be2dae5875904f22716eb3cf7fdf99a9871304e324e403369cfc58
+size 22987543488

WizardLM-2-8x22B.Q5_K_M-00002-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0acd9445e3681da199b3243ba9467952106a5d599af0226626c63d2431da6129
+size 23384907968

WizardLM-2-8x22B.Q5_K_M-00003-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:29febc013ad3af2c7201bb81433f596e25fa75c060821e20edb65cb1eacb708f
+size 21216321664

WizardLM-2-8x22B.Q5_K_M-00004-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df9a71ae9a4e57454c1812a51171a5729dee28f0ff1f657cf10aaf79ecd094e9
+size 23058440352

WizardLM-2-8x22B.Q5_K_S-00001-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:72fa0b4a2b0b09a62e751473c4fa04f0e60fc71ca7b3dbc127cd7dd658375ec0
+size 22024950720

WizardLM-2-8x22B.Q5_K_S-00004-of-00005.gguf ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8e1e46cf212b7fdeb2e97dd13d902386b58e47e6041d8136b33b31a67af88fcf
+size 22416711840
config.json DELETED
@@ -1,31 +0,0 @@
-{
-  "_name_or_path": "",
-  "architectures": [
-    "MixtralForCausalLM"
-  ],
-  "attention_dropout": 0.0,
-  "bos_token_id": 1,
-  "eos_token_id": 2,
-  "hidden_act": "silu",
-  "hidden_size": 6144,
-  "initializer_range": 0.02,
-  "intermediate_size": 16384,
-  "max_position_embeddings": 65536,
-  "model_type": "mixtral",
-  "num_attention_heads": 48,
-  "num_experts_per_tok": 2,
-  "num_hidden_layers": 56,
-  "num_key_value_heads": 8,
-  "num_local_experts": 8,
-  "output_router_logits": false,
-  "rms_norm_eps": 1e-05,
-  "rope_theta": 1000000,
-  "router_aux_loss_coef": 0.001,
-  "router_jitter_noise": 0.0,
-  "sliding_window": null,
-  "tie_word_embeddings": false,
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.36.2",
-  "use_cache": false,
-  "vocab_size": 32000
-}
generation_config.json DELETED
@@ -1,6 +0,0 @@
-{
-  "_from_model_config": true,
-  "bos_token_id": 1,
-  "eos_token_id": 2,
-  "transformers_version": "4.36.2"
-}
model.safetensors.index.json DELETED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json DELETED
@@ -1,24 +0,0 @@
-{
-  "bos_token": {
-    "content": "<s>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "eos_token": {
-    "content": "</s>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "pad_token": "<unk>",
-  "unk_token": {
-    "content": "<unk>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  }
-}
tokenizer_config.json DELETED
@@ -1,44 +0,0 @@
-{
-  "add_bos_token": true,
-  "add_eos_token": false,
-  "added_tokens_decoder": {
-    "0": {
-      "content": "<unk>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "1": {
-      "content": "<s>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "2": {
-      "content": "</s>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    }
-  },
-  "additional_special_tokens": [],
-  "bos_token": "<s>",
-  "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{{ messages[0]['content'].strip() }}{% else %}{% set loop_messages = messages %}{{ 'A chat between a curious user and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the user\\'s questions.' }}{% endif %}{% for message in loop_messages %}{% if loop.index0 == 0 %}{% if message['role'] == 'system' or message['role'] == 'user' %}{{ ' USER: ' + message['content'].strip() }}{% else %}{{ ' ASSISTANT: ' + message['content'].strip() + eos_token }}{% endif %}{% else %}{% if message['role'] == 'system' or message['role'] == 'user' %}{{ '\nUSER: ' + message['content'].strip() }}{% else %}{{ ' ASSISTANT: ' + message['content'].strip() + eos_token }}{% endif %}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ ' ASSISTANT:' }}{% endif %}",
-  "clean_up_tokenization_spaces": false,
-  "eos_token": "</s>",
-  "legacy": true,
-  "model_max_length": 1000000000000000019884624838656,
-  "pad_token": "<unk>",
-  "padding_side": "right",
-  "sp_model_kwargs": {},
-  "spaces_between_special_tokens": false,
-  "tokenizer_class": "LlamaTokenizer",
-  "unk_token": "<unk>",
-  "use_default_system_prompt": true
-}
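The deleted tokenizer_config.json carried a Vicuna-style chat_template (the long Jinja string above). As a reference-only sketch, the same layout re-implemented in plain Python — the helper name is invented, and the logic simply mirrors that template:

```python
# Sketch of the Vicuna-style layout encoded in the removed chat_template.
# Hypothetical helper, not part of any library.
def render_wizardlm_prompt(messages, eos_token="</s>", add_generation_prompt=True):
    # Default system prompt used when the conversation does not start with a system turn.
    default_system = (
        "A chat between a curious user and an artificial intelligence assistant. "
        "The assistant gives helpful, detailed, and polite answers to the user's questions."
    )
    if messages and messages[0]["role"] == "system":
        prompt, turns = messages[0]["content"].strip(), messages[1:]
    else:
        prompt, turns = default_system, messages
    for i, msg in enumerate(turns):
        if msg["role"] in ("system", "user"):
            # The first turn is prefixed with a space, later user turns with a newline.
            prompt += (" USER: " if i == 0 else "\nUSER: ") + msg["content"].strip()
        else:
            prompt += " ASSISTANT: " + msg["content"].strip() + eos_token
    if add_generation_prompt:
        prompt += " ASSISTANT:"
    return prompt

print(render_wizardlm_prompt([{"role": "user", "content": "Hello!"}]))
```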