dataautogpt3 committed on Feb 1

Commit

2251a6a

•

1 Parent(s): c2cd618

Upload 36 files

Browse files

Files changed (36) hide show

README.md +38 -0
config.json +29 -0
mergekit_config.yml +9 -0
model-00001-of-00028.safetensors +3 -0
model-00002-of-00028.safetensors +3 -0
model-00003-of-00028.safetensors +3 -0
model-00004-of-00028.safetensors +3 -0
model-00005-of-00028.safetensors +3 -0
model-00006-of-00028.safetensors +3 -0
model-00007-of-00028.safetensors +3 -0
model-00008-of-00028.safetensors +3 -0
model-00009-of-00028.safetensors +3 -0
model-00010-of-00028.safetensors +3 -0
model-00011-of-00028.safetensors +3 -0
model-00012-of-00028.safetensors +3 -0
model-00013-of-00028.safetensors +3 -0
model-00014-of-00028.safetensors +3 -0
model-00015-of-00028.safetensors +3 -0
model-00016-of-00028.safetensors +3 -0
model-00017-of-00028.safetensors +3 -0
model-00018-of-00028.safetensors +3 -0
model-00019-of-00028.safetensors +3 -0
model-00020-of-00028.safetensors +3 -0
model-00021-of-00028.safetensors +3 -0
model-00022-of-00028.safetensors +3 -0
model-00023-of-00028.safetensors +3 -0
model-00024-of-00028.safetensors +3 -0
model-00025-of-00028.safetensors +3 -0
model-00026-of-00028.safetensors +3 -0
model-00027-of-00028.safetensors +3 -0
model-00028-of-00028.safetensors +3 -0
model.safetensors.index.json +0 -0
special_tokens_map.json +30 -0
tokenizer.json +0 -0
tokenizer.model +3 -0
tokenizer_config.json +41 -0

README.md ADDED Viewed

	@@ -0,0 +1,38 @@

+---
+base_model:
+- 152334H/miqu-1-70b-sf
+tags:
+- mergekit
+- merge
+---
+# miqu-big-fix
+This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
+## Merge Details
+### Merge Method
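+This model was merged using the passthrough merge method, which concatenates the configured layer slices without altering their weights. Here the 80 layers of the single base model are stacked twice, yielding a 160-layer model.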
+### Models Merged
+The following models were included in the merge:
+* [152334H/miqu-1-70b-sf](https://huggingface.co/152334H/miqu-1-70b-sf)
+### Configuration
+The following YAML configuration was used to produce this model:
+```yaml
+slices:
+  - sources:
+    - model: 152334H/miqu-1-70b-sf
+      layer_range: [0, 80]
+  - sources:
+    - model: 152334H/miqu-1-70b-sf
+      layer_range: [0, 80]
+merge_method: passthrough
+dtype: float16
+```

config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "_name_or_path": "152334H/miqu-1-70b-sf",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 8192,
+  "initializer_range": 0.02,
+  "intermediate_size": 28672,
+  "max_position_embeddings": 32764,
+  "model_type": "llama",
+  "num_attention_heads": 64,
+  "num_hidden_layers": 160,
+  "num_key_value_heads": 8,
+  "pad_token_id": 0,
+  "pretraining_tp": 1,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 1000000,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float16",
+  "transformers_version": "4.37.2",
+  "use_cache": true,
+  "vocab_size": 32000
+}

mergekit_config.yml ADDED Viewed

	@@ -0,0 +1,9 @@

+slices:
+  - sources:
+    - model: 152334H/miqu-1-70b-sf
+      layer_range: [0, 80]
+  - sources:
+    - model: 152334H/miqu-1-70b-sf
+      layer_range: [0, 80]
+merge_method: passthrough
+dtype: float16

model-00001-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3537c0411f97fc512a65f3229c840c29e83c3195e426952924d5684c7509436d
+size 9986776088

model-00002-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:092b0e7b6d22f1bea454bedbf72870614a41e44e3e1d4b054dbb390ab7e939b8
+size 9663912040

model-00003-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:20c645dd18d2bb1e41083ca91e7021f3b46ecc711883c0286847a2cdca1dbb89
+size 9663878336

model-00004-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d66902945d9f339a7110675640e6324454cc3ccbb8a22f4d34ac560a336503f
+size 9932281024

model-00005-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d727097276e23a9feec14746a5e8664139f0b3da9dd0d98a04c59051e9b2f3be
+size 9932248760

model-00006-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1b983a2a502be54a7d6b6120880654daca454763e986eea044697d0e5a69dc14
+size 9798130624

model-00007-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f3ad8854e6fc125f2785574ae18ddcaae4bdd38ffc7e14502038696201c4e8f7
+size 9999423400

model-00008-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b1b505a334dd7526faa2a1079ad270a5d9a4c4b17234bf9d6252d0b7381236f
+size 9663878376

model-00009-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1fe0f7fe38b7800509c3baa8e28acefebc1581e4d08ced0242651aed1899a071
+size 9932281064

model-00010-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:483d70c64be34b248b6403e22f7a306b7e7a839dce68590131f2d1dcecddbe2e
+size 9932282504

model-00011-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6cbf51160352804c622e219675c7db47a12f53100440b151e70addd536d0b78
+size 9798096936

model-00012-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:52d6a7110bfcb3e5c5866920e8a9287d21bad136a538a2f5913bf11922f35106
+size 9999457104

model-00013-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d1866e4d9f75ec3690cd9f99f41150b9512f0c44e37e9c26146636a30234b7e6
+size 9798129240

model-00014-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f18278fbf5780d437868c9e45f7a6d4e13cba4b99fac3ed604c7f4535fbe4fb0
+size 9932248072

model-00015-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:731e3c8e8cbd0d92b61f8588b0d4f920cf6dda46d64257f271fa1ae423dd64cf
+size 9798030936

model-00016-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b5042626ad2863dad905f0ed36f465aacd579fb0f9e645b910f3aa9360f20a5
+size 9932381488

model-00017-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ae14a1739261f6541faf9569dddd4b239855c8b553015bef0e5740d0b467a965
+size 9999423408

model-00018-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:07ad3450b51dfb64c471fabbc92e4832500eeafa1ba27cdfe1fc191e48e01b0c
+size 9663878384

model-00019-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:56487d4d72cb058c43196c3d916660ba76ff7d125d33d2e7fc291206d0b2ff3a
+size 9932248072

model-00020-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a364fcaacf2b1ac52f9bb04fb03bd97739ea4c3123b68dbe852f38330fc28901
+size 9932315488

model-00021-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9dddb428ed53e9397cccf19f2d1bd64bd87ee98c96e85735e067ee0d6459dcce
+size 9798096936

model-00022-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7cf66be88d0117a50c3a3845c4b1a4b085158231fe7e9c79a5e635adcaeb47f9
+size 9999489400

model-00023-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:86106c0b7e9c00179820bcdf2beecc28e9a8c6940874e6ca3a3ead34b72237f8
+size 9932314072

model-00024-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e008bed8e008d5fd4d38f86d52274ae50fb4b1d6098ef7a5b6278b669ab071d6
+size 9798030936

model-00025-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:280723ca1fac0ec1b0d05ed4ace04706e35c4b0a2d36ea6b48ba557ec53b875e
+size 9798030936

model-00026-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:24653ea6fc75cd137e53154c674b078233f51988c073316f2db24a3734f74fcc
+size 9798162936

model-00027-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ec71790b6f60f64270991b15ebf53231ea9e9bfa1fd9a6086443467310ec7ff
+size 9999423408

model-00028-of-00028.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1fafeca3f066a7632877e7dc5f9cb3d4769e15762cb102b6f6ff02dd5474abef
+size 8443318432

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
+size 499723

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,41 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "legacy": false,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<unk>",
+  "sp_model_kwargs": {},
+  "spaces_between_special_tokens": false,
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": "<unk>",
+  "use_default_system_prompt": false
+}