Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +30 -0
- generation_config.json +6 -0
- model-00001-of-00059.safetensors +3 -0
- model-00002-of-00059.safetensors +3 -0
- model-00003-of-00059.safetensors +3 -0
- model-00004-of-00059.safetensors +3 -0
- model-00005-of-00059.safetensors +3 -0
- model-00006-of-00059.safetensors +3 -0
- model-00007-of-00059.safetensors +3 -0
- model-00008-of-00059.safetensors +3 -0
- model-00009-of-00059.safetensors +3 -0
- model-00010-of-00059.safetensors +3 -0
- model-00011-of-00059.safetensors +3 -0
- model-00012-of-00059.safetensors +3 -0
- model-00013-of-00059.safetensors +3 -0
- model-00014-of-00059.safetensors +3 -0
- model-00015-of-00059.safetensors +3 -0
- model-00016-of-00059.safetensors +3 -0
- model-00017-of-00059.safetensors +3 -0
- model-00018-of-00059.safetensors +3 -0
- model-00019-of-00059.safetensors +3 -0
- model-00020-of-00059.safetensors +3 -0
- model-00021-of-00059.safetensors +3 -0
- model-00022-of-00059.safetensors +3 -0
- model-00023-of-00059.safetensors +3 -0
- model-00024-of-00059.safetensors +3 -0
- model-00025-of-00059.safetensors +3 -0
- model-00026-of-00059.safetensors +3 -0
- model-00027-of-00059.safetensors +3 -0
- model-00028-of-00059.safetensors +3 -0
- model-00029-of-00059.safetensors +3 -0
- model-00030-of-00059.safetensors +3 -0
- model-00031-of-00059.safetensors +3 -0
- model-00032-of-00059.safetensors +3 -0
- model-00033-of-00059.safetensors +3 -0
- model-00034-of-00059.safetensors +3 -0
- model-00035-of-00059.safetensors +3 -0
- model-00036-of-00059.safetensors +3 -0
- model-00037-of-00059.safetensors +3 -0
- model-00038-of-00059.safetensors +3 -0
- model-00039-of-00059.safetensors +3 -0
- model-00040-of-00059.safetensors +3 -0
- model-00041-of-00059.safetensors +3 -0
- model-00042-of-00059.safetensors +3 -0
- model-00043-of-00059.safetensors +3 -0
- model-00044-of-00059.safetensors +3 -0
- model-00045-of-00059.safetensors +3 -0
- model-00046-of-00059.safetensors +3 -0
- model-00047-of-00059.safetensors +3 -0
- model-00048-of-00059.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"MixtralForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_dropout": 0.0,
|
6 |
+
"bos_token_id": 1,
|
7 |
+
"eos_token_id": 2,
|
8 |
+
"hidden_act": "silu",
|
9 |
+
"hidden_size": 6144,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"intermediate_size": 16384,
|
12 |
+
"max_position_embeddings": 65536,
|
13 |
+
"model_type": "mixtral",
|
14 |
+
"num_attention_heads": 48,
|
15 |
+
"num_experts_per_tok": 2,
|
16 |
+
"num_hidden_layers": 56,
|
17 |
+
"num_key_value_heads": 8,
|
18 |
+
"num_local_experts": 8,
|
19 |
+
"output_router_logits": false,
|
20 |
+
"rms_norm_eps": 1e-05,
|
21 |
+
"rope_theta": 1000000,
|
22 |
+
"router_aux_loss_coef": 0.001,
|
23 |
+
"router_jitter_noise": 0.0,
|
24 |
+
"sliding_window": null,
|
25 |
+
"tie_word_embeddings": false,
|
26 |
+
"torch_dtype": "bfloat16",
|
27 |
+
"transformers_version": "4.40.0.dev0",
|
28 |
+
"use_cache": true,
|
29 |
+
"vocab_size": 32000
|
30 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"transformers_version": "4.40.0.dev0"
|
6 |
+
}
|
model-00001-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b039c0a113de62272bace9f5c48c70503ad3290bb0c65abbdb9ace27ca565cfd
|
3 |
+
size 4998663696
|
model-00002-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a83771f7731be5a4e216fbd8efe7c4c4733a556c3c72124cea3f5f7963a95eed
|
3 |
+
size 4806799120
|
model-00003-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7bd17848981fb13c16c1a850a5ae1492af74c79088fe1e60bbd9591aff42354
|
3 |
+
size 4806799120
|
model-00004-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51783101334dfaa9d62e05c47adc95f1695754e1b3cdecc5a324db51f0ac4fd4
|
3 |
+
size 4806799120
|
model-00005-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:884dda6f0757f11ea3366cbc5b1d961cbffa65c826f95295a296b481b2b69e75
|
3 |
+
size 4806799120
|
model-00006-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bc1bd6bfcf7e0c91488f0c07f8a8e50b3596e8cd7ed862ce8d4e6292ed34935
|
3 |
+
size 4806799120
|
model-00007-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e463627c8cfcacb6d6be922384f4484c4085df0fe6e3da8b8bcad631ee6c650
|
3 |
+
size 4806799120
|
model-00008-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1147ec45481fa3ef9a917d08a78865ef42ecb7c4c538a4edc498609ec678b221
|
3 |
+
size 4806799120
|
model-00009-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcf912f23bad0f9692c58c76c93d361876d6a61e6b6372b40eae51422ecb5457
|
3 |
+
size 4806799120
|
model-00010-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b635201338d2a2911a035f05023c94e60c14920e731be6652b9b89c6b05cf938
|
3 |
+
size 4806799120
|
model-00011-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ee35393493b397e5d6c556b938b6c836c945a430ccadd1947c03a0f67921023
|
3 |
+
size 4806799136
|
model-00012-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94f67175581edbcd500caa4cb4edc1f362d020e85fc022c4f0e3e6f9ab69ce2d
|
3 |
+
size 4806799152
|
model-00013-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47ae57ed917b0d0ed903839e9dc22bdb0f0590ebb9e867a98b5b4f9aff1d3515
|
3 |
+
size 4806799152
|
model-00014-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d5d5156330ec725b6c89877fea2eef67038846d0afec96dab2bc2531e604ac4
|
3 |
+
size 4806799152
|
model-00015-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76ac8d1c058daaed35d2add3b9e4b17173b43d2a125a3da5fa45e1658e8878fd
|
3 |
+
size 4806799152
|
model-00016-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7a478c73e34122bf98ca7dcbdc5acd3e7c6f8d8aa60529c272e832875d5216f
|
3 |
+
size 4806799152
|
model-00017-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dca496a9d0cc2a323b9cb8ff5a8ce05aacee3795c0698acaabc13e5ad052a77d
|
3 |
+
size 4806799152
|
model-00018-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b4d36cd8cd6d5004fe197d2971c2d735ae95d0a7fca3d5b9764ba5ff9dc777c
|
3 |
+
size 4806799152
|
model-00019-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f21e8856c1bf685b87bdac2c54d0c4e7247757a98c6d5b43880759a9c14c8b1
|
3 |
+
size 4806799152
|
model-00020-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:933dda96b69cdef0440e7e77b96d0286e8a00a2fc45234e3f5096a7150ef02a9
|
3 |
+
size 4806799152
|
model-00021-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:616211f8ed279b2c133e9863bfb01c6bf061397dc879fa06676ab1c7a1bfeb0a
|
3 |
+
size 4806799152
|
model-00022-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a127eae5266dd1fe645a45b425482d5c8052c5374f6e386e614a6733c6226bb
|
3 |
+
size 4806799152
|
model-00023-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4f29da3532e4937b99d1a5ece5457a97c846276c8ec4ef514281f90f4a9506e
|
3 |
+
size 4806799152
|
model-00024-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:063e0bbb5f2d783f2ce20cfaa014b234c81b370afe49587399386d99b50e3aae
|
3 |
+
size 4932529864
|
model-00025-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:040b7d741425ae5676099d9431dbbb55929159d33a8afd5feaf4b5c50f9d2800
|
3 |
+
size 4995542848
|
model-00026-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06a45ea1f0841e8f214683fdabf89cec183f7e844849bf633b898bab8aa740e6
|
3 |
+
size 4995542848
|
model-00027-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c6f5e468564e403a7cb3a97b84f778451ab92937e684b75122f90950df27849
|
3 |
+
size 4932628288
|
model-00028-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b9a5ce26370f37727dc78305dc8dcfea7f3b102e9a894e2a8a5f3dde2f7ab89
|
3 |
+
size 4806774344
|
model-00029-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0458c20683be80e6c814f17b233f7e3b651f461fa616079fa22542b2abff59f
|
3 |
+
size 4806799144
|
model-00030-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:790b0203791f80500dd1d3d15796ff4c72ab3cf78ea00dd96e51872d1722f585
|
3 |
+
size 4806799144
|
model-00031-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eed11f4e9fe8b3f582ccf57245dba278c0b996042228a4c0ccd080f31bfd334d
|
3 |
+
size 4806799144
|
model-00032-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e70e6bc0591fc8bec66d8756d2ffd04b59b4fd57ae93cdd441a76429884f1c83
|
3 |
+
size 4806799144
|
model-00033-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afc00641c7de6181c059c414230046263b20ffce2807037a79ec467dcca8d201
|
3 |
+
size 4806799152
|
model-00034-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd7fcaa9f411b23bd1f5d0e6d25a7fab18aa420f64a2e4160550cb92c7f8bff6
|
3 |
+
size 4806799152
|
model-00035-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d65513f09da03f27cac48b3d87dbfb1e98929a31630deb9ab954405e735d3775
|
3 |
+
size 4806799152
|
model-00036-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59c7f0a00e9d1d32899c8f9a85c2bab3f03b061a1d3f25466de8cf7cb6ee2dba
|
3 |
+
size 4806799152
|
model-00037-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9414dcc7522d4cc765458ce6697aeb5286aa03de6d1204f42a470ff2f81a59ec
|
3 |
+
size 4806799152
|
model-00038-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f40497204a3f340f8894bda0df9bc65873c97f68cf91e68c9d42370bd4a457d
|
3 |
+
size 4806799152
|
model-00039-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5adf314c52d78bf6ddc2778eb5bafceefcd25069cf6710f75c6770633a438a0c
|
3 |
+
size 4806799152
|
model-00040-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3916f7db00d69d8aecb6d2597ca3b488a2829d3bd4d21fa4ed21dde311f0df8
|
3 |
+
size 4806799152
|
model-00041-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4556f1b7c3599f3a904dfe1e61dd22e655d29ed1eae614118078e216662c8650
|
3 |
+
size 4806799152
|
model-00042-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef1fcc735bbf26a61623185ac500161757d4854a3b8b05c9826bba4a6633859e
|
3 |
+
size 4806799152
|
model-00043-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d51d71c5598283092b9eebd69169d6002d08fabb92eb1de2e11d2f504c83f6d4
|
3 |
+
size 4806799152
|
model-00044-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21d280cf85760838c2108fa750401d271c5a5fa112c3a79dfaef1f61e81bf42e
|
3 |
+
size 4806799152
|
model-00045-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d291e6ad3383c50c6897a67a88050da4aa8fd78eca3fbbe46e65d9ff0e818cce
|
3 |
+
size 4806799152
|
model-00046-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa610e393ffb4182a6e6dda2115d54d297fb7ad721d96920644bc0942b753e8e
|
3 |
+
size 4806799152
|
model-00047-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b0069d8246eb8933fbd678fec8db10485c25ce399dce0bc8931a943657da3d3
|
3 |
+
size 4806799152
|
model-00048-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31204ed829f496213dfe6a02bcfcab65ed9f663f7b4b22e8535c60cfc929924f
|
3 |
+
size 4806799152
|