TheDrummer
committed on
Commit
•
a118836
1
Parent(s):
3c0ec92
Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +33 -0
- config.json +27 -0
- mergekit_config.yml +4 -0
- model-00001-of-00051.safetensors +3 -0
- model-00002-of-00051.safetensors +3 -0
- model-00003-of-00051.safetensors +3 -0
- model-00004-of-00051.safetensors +3 -0
- model-00005-of-00051.safetensors +3 -0
- model-00006-of-00051.safetensors +3 -0
- model-00007-of-00051.safetensors +3 -0
- model-00008-of-00051.safetensors +3 -0
- model-00009-of-00051.safetensors +3 -0
- model-00010-of-00051.safetensors +3 -0
- model-00011-of-00051.safetensors +3 -0
- model-00012-of-00051.safetensors +3 -0
- model-00013-of-00051.safetensors +3 -0
- model-00014-of-00051.safetensors +3 -0
- model-00015-of-00051.safetensors +3 -0
- model-00016-of-00051.safetensors +3 -0
- model-00017-of-00051.safetensors +3 -0
- model-00018-of-00051.safetensors +3 -0
- model-00019-of-00051.safetensors +3 -0
- model-00020-of-00051.safetensors +3 -0
- model-00021-of-00051.safetensors +3 -0
- model-00022-of-00051.safetensors +3 -0
- model-00023-of-00051.safetensors +3 -0
- model-00024-of-00051.safetensors +3 -0
- model-00025-of-00051.safetensors +3 -0
- model-00026-of-00051.safetensors +3 -0
- model-00027-of-00051.safetensors +3 -0
- model-00028-of-00051.safetensors +3 -0
- model-00029-of-00051.safetensors +3 -0
- model-00030-of-00051.safetensors +3 -0
- model-00031-of-00051.safetensors +3 -0
- model-00032-of-00051.safetensors +3 -0
- model-00033-of-00051.safetensors +3 -0
- model-00034-of-00051.safetensors +3 -0
- model-00035-of-00051.safetensors +3 -0
- model-00036-of-00051.safetensors +3 -0
- model-00037-of-00051.safetensors +3 -0
- model-00038-of-00051.safetensors +3 -0
- model-00039-of-00051.safetensors +3 -0
- model-00040-of-00051.safetensors +3 -0
- model-00041-of-00051.safetensors +3 -0
- model-00042-of-00051.safetensors +3 -0
- model-00043-of-00051.safetensors +3 -0
- model-00044-of-00051.safetensors +3 -0
- model-00045-of-00051.safetensors +3 -0
- model-00046-of-00051.safetensors +3 -0
- model-00047-of-00051.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model:
|
3 |
+
- mistralai/Mistral-Large-Instruct-2411
|
4 |
+
library_name: transformers
|
5 |
+
tags:
|
6 |
+
- mergekit
|
7 |
+
- merge
|
8 |
+
|
9 |
+
---
|
10 |
+
# merged
|
11 |
+
|
12 |
+
This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
|
13 |
+
|
14 |
+
## Merge Details
|
15 |
+
### Merge Method
|
16 |
+
|
17 |
+
This model was merged using the passthrough merge method.
|
18 |
+
|
19 |
+
### Models Merged
|
20 |
+
|
21 |
+
The following models were included in the merge:
|
22 |
+
* [mistralai/Mistral-Large-Instruct-2411](https://huggingface.co/mistralai/Mistral-Large-Instruct-2411) + ./adapter
|
23 |
+
|
24 |
+
### Configuration
|
25 |
+
|
26 |
+
The following YAML configuration was used to produce this model:
|
27 |
+
|
28 |
+
```yaml
|
29 |
+
models:
|
30 |
+
- model: mistralai/Mistral-Large-Instruct-2411+./adapter
|
31 |
+
merge_method: passthrough
|
32 |
+
dtype: bfloat16
|
33 |
+
```
|
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "mistralai/Mistral-Large-Instruct-2411",
|
3 |
+
"architectures": [
|
4 |
+
"MistralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"head_dim": 128,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 12288,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 131072,
|
15 |
+
"model_type": "mistral",
|
16 |
+
"num_attention_heads": 96,
|
17 |
+
"num_hidden_layers": 88,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"rms_norm_eps": 1e-05,
|
20 |
+
"rope_theta": 1000000.0,
|
21 |
+
"sliding_window": null,
|
22 |
+
"tie_word_embeddings": false,
|
23 |
+
"torch_dtype": "bfloat16",
|
24 |
+
"transformers_version": "4.46.3",
|
25 |
+
"use_cache": true,
|
26 |
+
"vocab_size": 32768
|
27 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
models:
|
2 |
+
- model: mistralai/Mistral-Large-Instruct-2411+./adapter
|
3 |
+
merge_method: passthrough
|
4 |
+
dtype: bfloat16
|
model-00001-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e9dd8e22bded91b53e752bebceafee487c6ce1d1596709f071b33dccf792f04
|
3 |
+
size 4378928504
|
model-00002-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79b0a1c68ee379ad49c740be95bdf4c44d34841d00ecb0307f4ef2acc00b294f
|
3 |
+
size 4907411088
|
model-00003-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:893d88c62c082ab1bb453ae3e164c339962967d3a389d5b31b1956a853989639
|
3 |
+
size 4806747904
|
model-00004-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:050147b492637872c86bd4c17f3516e022dda7ad244ea9107e8c4e5917060e2f
|
3 |
+
size 4831938544
|
model-00005-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:958ba05ebea4c2f4d91f4d251ac96336da6b4e779bea5cfec1051c60912f98cf
|
3 |
+
size 4831938552
|
model-00006-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe171ff7591808d8daaf28a1ea98b2f0e313b580e923e058e492d9a7ddf5fb0f
|
3 |
+
size 4907411096
|
model-00007-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:265e0638d782d0eec3978f6a1754e5411a3e2bdc2f69a6f35fd6640f6b750101
|
3 |
+
size 4806747904
|
model-00008-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4e11293bd5241829a571f9c3ec498dfa04c5fe4c50391db1e2272a5cfd97ae4
|
3 |
+
size 4831938536
|
model-00009-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32c76acd32a1876ab1496edd84d37bd8cef979d6f7696b5c446f326212457ad0
|
3 |
+
size 4831938552
|
model-00010-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa3e64d4961a1633582a9af668502e7c71a1a265537b9fe3c6fe735e2f762d6f
|
3 |
+
size 4907411096
|
model-00011-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af62dc84254f23f4e70aff059f98d421be65440775bb03dbe242504860351745
|
3 |
+
size 4806747904
|
model-00012-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:863fe3f5b0bf8d4501632d194ad6af31d000d89ac6e149b5cc5914c7a817b7fb
|
3 |
+
size 4831938544
|
model-00013-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d96431b2f55b071aed9a0fc07493c11ab7b8c5415e0e3a70057635a416ca64b9
|
3 |
+
size 4831938552
|
model-00014-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b5130f370db016d8c2b05fe326299d033e16189a5e92e10d21645b096f4cbf2
|
3 |
+
size 4907411088
|
model-00015-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d6ce6cf9e4ed1f307de4830a4fcc30ebb22d4c5f5724e2e80a4bd33dcd2c99f
|
3 |
+
size 4806747904
|
model-00016-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9a02fabe09d3d9c446e1d8980a95eed03fa12a715e315c0fd803168bf9ca621
|
3 |
+
size 4831938544
|
model-00017-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddc3de7fb14112acfbc5750f383c19bc2072c6049dfb2458b50c2dede842ccf9
|
3 |
+
size 4831938552
|
model-00018-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fde01c9bbbfce74b1c18ef0071717080d12d21ec56060a86a397f28d3eec5a07
|
3 |
+
size 4907411096
|
model-00019-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d75d07d265c076ee36cda1ea7923e1ace571e1c2a443812e0bebb6312af61d1f
|
3 |
+
size 4806747904
|
model-00020-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0008e0edf02680e80ea510d62aefd0d937fee705157984ccfa4687963ab5762d
|
3 |
+
size 4831938544
|
model-00021-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6744ccdb8550a6b5fb6070a27df6263ae29ab000af8fe701cde23dad383460b0
|
3 |
+
size 4831938544
|
model-00022-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1465cc3a877334f2aca2781646c3067812b92c399b74655287521b1eb1612c9
|
3 |
+
size 4907411096
|
model-00023-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43697afd0726c1c513c23343ebae92eef561d6090bb586a1ffd5543ee120a02b
|
3 |
+
size 4806747904
|
model-00024-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83cf65a30e965f1b0ebd4ea3a361be13e0ab4afa6fd375fade8281d8618c8924
|
3 |
+
size 4831938544
|
model-00025-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cf097902e862ba3548e649c53d8bfc4e7b94ff3d2fe87b3788d1a9c1a0313f9
|
3 |
+
size 4831938552
|
model-00026-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:250c4cfde5f358c099396121ae59f8e4effd1d9e2a34835c7c47fa0e589ecdf0
|
3 |
+
size 4907411096
|
model-00027-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72cdccf46edc9c4217c7b5b74d4fb77bf9b94a2f464875d00bf4b4b2415e0484
|
3 |
+
size 4806747896
|
model-00028-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df6f487cb8aadf8ba3caf35cc6f58925fad1df12cbe3c13d81d239ed6def84d2
|
3 |
+
size 4831938544
|
model-00029-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3f90523e9cf74b92c834c852d3dfb704045af167d4bfd3c5c9b533efc1d0f8b
|
3 |
+
size 4831938552
|
model-00030-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a973efe2bcba332a80904d106b9e74df437acd2b9af78f7a836f5744727a9850
|
3 |
+
size 4907411096
|
model-00031-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2498dfa1e7015504e0e18be91deba210bdd83d75d468173186fb0a8b4b292990
|
3 |
+
size 4806747904
|
model-00032-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf876b5bd3c8ea3b35c43563484a200af763e9f39711086571a5e389ca6ca8c8
|
3 |
+
size 4831938544
|
model-00033-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05e73855403d79babb901ffdd5ddc39683976f01a1fc12556c1983e8b9e6fcae
|
3 |
+
size 4831938544
|
model-00034-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac61a66a740d8a7d61bdd560f282731c628f7b764398366d19030c94bc88806b
|
3 |
+
size 4907411096
|
model-00035-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1602293965d283235e91af497ab0ddf15a065c5251b1be60f56004e67decd1ba
|
3 |
+
size 4806747904
|
model-00036-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aefa4749b1ecb23ff9134477a7d371e3b39331e9ee448f5467fcb760af3148ab
|
3 |
+
size 4831938544
|
model-00037-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f978c9f3e94a0021f740475f0d38662c6fc2e1bd7ed86037db05bc938f9f5fb
|
3 |
+
size 4831938552
|
model-00038-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93186609b5a1975519b97e6251b23adc21a5203007c085b82a56a3e3f905fcc6
|
3 |
+
size 4907411096
|
model-00039-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffcf6acb20072fb7f9861fce8b25382407ac3e277d21856268a033441f7ae7d3
|
3 |
+
size 4806747904
|
model-00040-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e69886f4cb71419895fbcb2a0d0fd53384c55f245f21d2470c489c500df0270
|
3 |
+
size 4831938544
|
model-00041-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6391c8d1de0652ba7a3e9f15c42a883e048e20c344b3928405479ef1b646655f
|
3 |
+
size 4831938552
|
model-00042-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:003485f2d7cf48510cd8d50e8834613d72ff3bef0cad0a68b81036cd28ea36c1
|
3 |
+
size 4907411096
|
model-00043-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5abf1526d8c2707e34508643ffc36bfcf0181df223b0a5f86933e05d31646ee
|
3 |
+
size 4806747904
|
model-00044-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1f28e5ddb68fea71248c1e8e05e4f9dcdf4058e8c5e2b3976a56051763a23fb
|
3 |
+
size 4831938544
|
model-00045-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4b0820563305321e259406cdf3e16d5f1c735098bc2b130ba8a9292e69bd9fe
|
3 |
+
size 4831938552
|
model-00046-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14581f0c8a156ba44933d7117f838b553ee095d4a2ba82eb7293a02cf784c4ba
|
3 |
+
size 4907411088
|
model-00047-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3288e48b55bbf81979e4e30b1eedf02b744acd7e0fba2e9ebab66cb9fa8000df
|
3 |
+
size 4806747904
|