MaziyarPanahi committed
Commit: aca5eb3
1 Parent(s): 9a0c65b
Upload folder using huggingface_hub

Files changed:
- README.md (+130, -0)
- config.json (+29, -0)
- generation_config.json (+6, -0)
- model-00058-of-00059.safetensors (+3, -0)
- model-00059-of-00059.safetensors (+3, -0)
- model.safetensors.index.json (+0, -0)
- special_tokens_map.json (+7, -0)
- tokenizer.json (+0, -0)
- tokenizer_config.json (+52, -0)
README.md
ADDED
@@ -0,0 +1,130 @@
---
license: apache-2.0
language:
- en
- es
- it
- de
- fr
---

# Model Card for Mixtral-8x22B-Instruct-v0.1
The Mixtral-8x22B-Instruct-v0.1 Large Language Model (LLM) is an instruct fine-tuned version of the [Mixtral-8x22B-v0.1](https://huggingface.co/mistralai/Mixtral-8x22B-v0.1).

## Run the model
```python
import torch
from transformers import AutoModelForCausalLM
from mistral_common.protocol.instruct.messages import (
    AssistantMessage,
    UserMessage,
)
from mistral_common.protocol.instruct.tool_calls import (
    Tool,
    Function,
)
from mistral_common.tokens.tokenizers.mistral import MistralTokenizer
from mistral_common.tokens.instruct.normalize import ChatCompletionRequest

device = "cuda"  # the device to load the model onto

tokenizer_v3 = MistralTokenizer.v3()

mistral_query = ChatCompletionRequest(
    tools=[
        Tool(
            function=Function(
                name="get_current_weather",
                description="Get the current weather",
                parameters={
                    "type": "object",
                    "properties": {
                        "location": {
                            "type": "string",
                            "description": "The city and state, e.g. San Francisco, CA",
                        },
                        "format": {
                            "type": "string",
                            "enum": ["celsius", "fahrenheit"],
                            "description": "The temperature unit to use. Infer this from the user's location.",
                        },
                    },
                    "required": ["location", "format"],
                },
            )
        )
    ],
    messages=[
        UserMessage(content="What's the weather like today in Paris"),
    ],
    model="test",
)

encodeds = tokenizer_v3.encode_chat_completion(mistral_query).tokens
model = AutoModelForCausalLM.from_pretrained("mistralai/Mixtral-8x22B-Instruct-v0.1")
# encode_chat_completion returns a plain list of token ids, so wrap it in a
# batched tensor before moving it to the device.
model_inputs = torch.tensor([encodeds]).to(device)
model.to(device)

generated_ids = model.generate(model_inputs, max_new_tokens=1000, do_sample=True)
sp_tokenizer = tokenizer_v3.instruct_tokenizer.tokenizer
decoded = sp_tokenizer.decode(generated_ids[0].tolist())  # decode expects a plain list of ints
print(decoded)
```
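Note that the full bfloat16 checkpoint is on the order of 280 GB (roughly 141B parameters), so it will not fit on a single GPU. Below is a minimal multi-device loading sketch, assuming `accelerate` is installed so that `device_map="auto"` can shard the 59 safetensors files across the available GPUs (and CPU RAM if needed); adjust to your hardware:

```python
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

model_id = "mistralai/Mixtral-8x22B-Instruct-v0.1"

# Let accelerate spread the checkpoint shards across all visible devices
# instead of trying to place the whole model on one GPU.
model = AutoModelForCausalLM.from_pretrained(
    model_id,
    torch_dtype=torch.bfloat16,  # matches the "torch_dtype" in config.json
    device_map="auto",
)
tokenizer = AutoTokenizer.from_pretrained(model_id)

# Build the prompt with the tokenizer's built-in chat template.
inputs = tokenizer.apply_chat_template(
    [{"role": "user", "content": "What's the weather like today in Paris"}],
    return_tensors="pt",
).to(model.device)

out = model.generate(inputs, max_new_tokens=256, do_sample=True)
print(tokenizer.decode(out[0], skip_special_tokens=True))
```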

# Instruct tokenizer
The HuggingFace tokenizer included in this release should match our own. To compare:
`pip install mistral-common`

```py
from mistral_common.protocol.instruct.messages import (
    AssistantMessage,
    UserMessage,
)
from mistral_common.tokens.tokenizers.mistral import MistralTokenizer
from mistral_common.tokens.instruct.normalize import ChatCompletionRequest

from transformers import AutoTokenizer

tokenizer_v3 = MistralTokenizer.v3()

mistral_query = ChatCompletionRequest(
    messages=[
        UserMessage(content="How many experts ?"),
        AssistantMessage(content="8"),
        UserMessage(content="How big ?"),
        AssistantMessage(content="22B"),
        UserMessage(content="Noice 🎉 !"),
    ],
    model="test",
)
hf_messages = mistral_query.model_dump()['messages']

tokenized_mistral = tokenizer_v3.encode_chat_completion(mistral_query).tokens

tokenizer_hf = AutoTokenizer.from_pretrained('mistralai/Mixtral-8x22B-Instruct-v0.1')
tokenized_hf = tokenizer_hf.apply_chat_template(hf_messages, tokenize=True)

assert tokenized_hf == tokenized_mistral
```
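To inspect the actual prompt string behind those ids (not just check that they match), both tokenizers can decode them back; a tiny sketch, reusing the variables from the snippet above:

```py
# Both decodes should show the same [INST] ... [/INST]-wrapped conversation.
print(tokenizer_hf.decode(tokenized_hf))
print(tokenizer_v3.instruct_tokenizer.tokenizer.decode(tokenized_mistral))
```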

# Function calling and special tokens
This tokenizer includes additional special tokens related to function calling:
- [TOOL_CALLS]
- [AVAILABLE_TOOLS]
- [/AVAILABLE_TOOLS]
- [TOOL_RESULTS]
- [/TOOL_RESULTS]

If you want to use this model with function calling, make sure to apply these tokens in the same way as our [SentencePieceTokenizerV3](https://github.com/mistralai/mistral-common/blob/main/src/mistral_common/tokens/tokenizers/sentencepiece.py#L299) does; the `tool_use` chat template sketched below follows the same layout.

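The `tokenizer_config.json` uploaded here also ships a named `tool_use` chat template that wraps messages in these tokens. A minimal sketch of driving it through `transformers`, assuming a version recent enough to support named chat templates and the `tools=` argument; the tool schema and message contents are made-up illustrations, and the `tool_calls` / `tool_results` role names come from that template:

```python
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("mistralai/Mixtral-8x22B-Instruct-v0.1")

# JSON-schema style tool description; the tool_use template inserts the available
# tools between [AVAILABLE_TOOLS] ... [/AVAILABLE_TOOLS] before the last user turn.
weather_tool = {
    "type": "function",
    "function": {
        "name": "get_current_weather",
        "description": "Get the current weather",
        "parameters": {
            "type": "object",
            "properties": {
                "location": {"type": "string"},
                "format": {"type": "string", "enum": ["celsius", "fahrenheit"]},
            },
            "required": ["location", "format"],
        },
    },
}

messages = [
    {"role": "user", "content": "What's the weather like today in Paris"},
    # Roles understood by the tool_use template: a prior model tool call
    # ([TOOL_CALLS] ...) and the tool's result ([TOOL_RESULTS] ... [/TOOL_RESULTS]).
    {"role": "tool_calls", "content": '[{"name": "get_current_weather", "arguments": {"location": "Paris, FR", "format": "celsius"}}]'},
    {"role": "tool_results", "content": '{"temperature": 21}'},
    {"role": "user", "content": "Summarize that for me"},
]

prompt = tokenizer.apply_chat_template(
    messages,
    chat_template="tool_use",  # select the named template from tokenizer_config.json
    tools=[weather_tool],
    tokenize=False,
)
print(prompt)
```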

# The Mistral AI Team
Albert Jiang, Alexandre Sablayrolles, Alexis Tacnet, Antoine Roux,
Arthur Mensch, Audrey Herblin-Stoop, Baptiste Bout, Baudouin de Monicault,
Blanche Savary, Bam4d, Caroline Feldman, Devendra Singh Chaplot,
Diego de las Casas, Eleonore Arcelin, Emma Bou Hanna, Etienne Metzger,
Gianna Lengyel, Guillaume Bour, Guillaume Lample, Harizo Rajaona,
Jean-Malo Delignon, Jia Li, Justus Murke, Louis Martin, Louis Ternon,
Lucile Saulnier, Lélio Renard Lavaud, Margaret Jennings, Marie Pellat,
Marie Torelli, Marie-Anne Lachaux, Nicolas Schuhl, Patrick von Platen,
Pierre Stock, Sandeep Subramanian, Sophia Yang, Szymon Antoniak, Teven Le Scao,
Thibaut Lavril, Timothée Lacroix, Théophile Gervet, Thomas Wang,
Valera Nemychnikova, William El Sayed, William Marshall
config.json
ADDED
@@ -0,0 +1,29 @@
```json
{
  "architectures": [
    "MixtralForCausalLM"
  ],
  "attention_dropout": 0.0,
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 6144,
  "initializer_range": 0.02,
  "intermediate_size": 16384,
  "max_position_embeddings": 65536,
  "model_type": "mixtral",
  "num_attention_heads": 48,
  "num_experts_per_tok": 2,
  "num_hidden_layers": 56,
  "num_key_value_heads": 8,
  "num_local_experts": 8,
  "output_router_logits": false,
  "rms_norm_eps": 1e-05,
  "rope_theta": 1000000.0,
  "router_aux_loss_coef": 0.001,
  "sliding_window": null,
  "tie_word_embeddings": false,
  "torch_dtype": "bfloat16",
  "transformers_version": "4.38.0",
  "use_cache": true,
  "vocab_size": 32768
}
```
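A few numbers worth reading out of this config: 56 layers, 8 local experts per layer with 2 routed per token, grouped-query attention with 48 query heads sharing 8 key/value heads, and a per-head dimension of 6144 / 48 = 128. A small sketch that derives these values directly from the config object; the printout is purely for orientation:

```python
from transformers import AutoConfig

config = AutoConfig.from_pretrained("mistralai/Mixtral-8x22B-Instruct-v0.1")

head_dim = config.hidden_size // config.num_attention_heads           # 6144 // 48 = 128
kv_groups = config.num_attention_heads // config.num_key_value_heads  # 48 // 8 = 6 query heads per KV head
active = f"{config.num_experts_per_tok} of {config.num_local_experts}"  # "2 of 8" experts per token

print(f"layers={config.num_hidden_layers}, head_dim={head_dim}, "
      f"kv_groups={kv_groups}, experts per token={active}, "
      f"context={config.max_position_embeddings} tokens")
```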
generation_config.json
ADDED
@@ -0,0 +1,6 @@
```json
{
  "_from_model_config": true,
  "bos_token_id": 1,
  "eos_token_id": 2,
  "transformers_version": "4.34.0.dev0"
}
```
model-00058-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
```
version https://git-lfs.github.com/spec/v1
oid sha256:4e2de705aefc7b98a4394b9b691fd733d19633370ec8c3ded13f89fe73e11b5b
size 4806799144
```
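The safetensors shards are stored as Git LFS pointers: the repository records only the expected SHA-256 and byte size, and the actual weights are downloaded separately. A minimal sketch for checking a downloaded shard against its pointer; the local path is a placeholder for wherever the file ended up on disk:

```python
import hashlib
import os

# Values copied from the LFS pointer above; the path is a placeholder for the
# locally downloaded shard.
path = "model-00058-of-00059.safetensors"
expected_oid = "4e2de705aefc7b98a4394b9b691fd733d19633370ec8c3ded13f89fe73e11b5b"
expected_size = 4806799144

assert os.path.getsize(path) == expected_size, "size mismatch"

sha = hashlib.sha256()
with open(path, "rb") as f:
    # Hash in chunks so the ~4.8 GB file never has to fit in memory at once.
    for chunk in iter(lambda: f.read(1 << 20), b""):
        sha.update(chunk)

assert sha.hexdigest() == expected_oid, "checksum mismatch"
print("shard OK")
```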
model-00059-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
```
version https://git-lfs.github.com/spec/v1
oid sha256:700482c2a697bd67ae38b25ddbd81babb83c77ebce91b5f61761409eb55e4ae0
size 1207997392
```
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
```json
{
  "bos_token": "<s>",
  "eos_token": "</s>",
  "unk_token": "<unk>",
  "b_inst": "[INST]",
  "e_inst": "[/INST]"
}
```
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
tokenizer_config.json
ADDED
@@ -0,0 +1,52 @@
```json
{
  "add_bos_token": false,
  "add_eos_token": false,
  "added_tokens_decoder": {
    "0": {
      "content": "<unk>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "1": {
      "content": "<s>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "2": {
      "content": "</s>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    }
  },
  "additional_special_tokens": [],
  "bos_token": "<s>",
  "chat_template": [
    {
      "name": "default",
      "template": "{{bos_token}}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ ' [INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + message['content'] + ' ' + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}"
    },
    {
      "name": "tool_use",
      "template": "{{bos_token}}{% set user_messages = messages | selectattr('role', 'equalto', 'user') | list %}{% for message in messages %}{% if message['role'] == 'user' %}{% if message == user_messages[-1] %}{{ '[AVAILABLE_TOOLS]'}}{% for tool in tools %}{{ tool }}{% endfor %}{{ '[/AVAILABLE_TOOLS]'}}{{ '[INST]' + message['content'] + '[/INST]' }}{% else %}{{ '[INST]' + message['content'] + '[/INST]' }}{% endif %}{% elif message['role'] == 'assistant' %}{{ ' ' + message['content'] + ' ' + eos_token}}{% elif message['role'] == 'tool_results' %}{{'[TOOL_RESULTS]' + message['content']|string + '[/TOOL_RESULTS]'}}{% elif message['role'] == 'tool_calls' %}{{'[TOOL_CALLS]' + message['content']|string + eos_token}}{% endif %}{% endfor %}"
    }
  ],
  "clean_up_tokenization_spaces": false,
  "eos_token": "</s>",
  "legacy": true,
  "model_max_length": 1000000000000000019884624838656,
  "pad_token": null,
  "sp_model_kwargs": {},
  "spaces_between_special_tokens": false,
  "tokenizer_class": "LlamaTokenizer",
  "unk_token": "<unk>",
  "use_default_system_prompt": false
}
```
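The `default` template above renders a conversation as `<s> [INST] ... [/INST] answer </s>`, turn by turn, and raises an exception if roles do not strictly alternate user/assistant or if any other role appears. A quick way to inspect the rendered prompt; the example messages mirror the comparison snippet in the README:

```python
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("mistralai/Mixtral-8x22B-Instruct-v0.1")

messages = [
    {"role": "user", "content": "How many experts ?"},
    {"role": "assistant", "content": "8"},
    {"role": "user", "content": "How big ?"},
]

# tokenize=False returns the rendered string, so the [INST]/[/INST] markers and
# the </s> placed after each assistant turn are easy to see.
print(tokenizer.apply_chat_template(messages, tokenize=False))
# A non-alternating conversation, or a system message, would make the template raise.
```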