deltanym committed 4 days ago

Commit

041b299

•

1 Parent(s): 952a501

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +1 -0
README.md +55 -0
config.json +40 -0
mergekit_config.yml +24 -0
model-00001-of-00050.safetensors +3 -0
model-00002-of-00050.safetensors +3 -0
model-00003-of-00050.safetensors +3 -0
model-00004-of-00050.safetensors +3 -0
model-00005-of-00050.safetensors +3 -0
model-00006-of-00050.safetensors +3 -0
model-00007-of-00050.safetensors +3 -0
model-00008-of-00050.safetensors +3 -0
model-00009-of-00050.safetensors +3 -0
model-00010-of-00050.safetensors +3 -0
model-00011-of-00050.safetensors +3 -0
model-00012-of-00050.safetensors +3 -0
model-00013-of-00050.safetensors +3 -0
model-00014-of-00050.safetensors +3 -0
model-00015-of-00050.safetensors +3 -0
model-00016-of-00050.safetensors +3 -0
model-00017-of-00050.safetensors +3 -0
model-00018-of-00050.safetensors +3 -0
model-00019-of-00050.safetensors +3 -0
model-00020-of-00050.safetensors +3 -0
model-00021-of-00050.safetensors +3 -0
model-00022-of-00050.safetensors +3 -0
model-00023-of-00050.safetensors +3 -0
model-00024-of-00050.safetensors +3 -0
model-00025-of-00050.safetensors +3 -0
model-00026-of-00050.safetensors +3 -0
model-00027-of-00050.safetensors +3 -0
model-00028-of-00050.safetensors +3 -0
model-00029-of-00050.safetensors +3 -0
model-00030-of-00050.safetensors +3 -0
model-00031-of-00050.safetensors +3 -0
model-00032-of-00050.safetensors +3 -0
model-00033-of-00050.safetensors +3 -0
model-00034-of-00050.safetensors +3 -0
model-00035-of-00050.safetensors +3 -0
model-00036-of-00050.safetensors +3 -0
model-00037-of-00050.safetensors +3 -0
model-00038-of-00050.safetensors +3 -0
model-00039-of-00050.safetensors +3 -0
model-00040-of-00050.safetensors +3 -0
model-00041-of-00050.safetensors +3 -0
model-00042-of-00050.safetensors +3 -0
model-00043-of-00050.safetensors +3 -0
model-00044-of-00050.safetensors +3 -0
model-00045-of-00050.safetensors +3 -0
model-00046-of-00050.safetensors +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,55 @@

+---
+base_model:
+- meta-llama/Llama-3.1-70B-Instruct
+library_name: transformers
+tags:
+- mergekit
+- merge
+---
+# llama-3.1-120b-instruct
+This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
+It's a recreation of [mlabonne/Meta-Llama-3-120B-Instruct](https://huggingface.co/mlabonne/Meta-Llama-3-120B-Instruct), built from Llama 3.1 70B Instruct instead of Llama 3 and using the same merge configuration.
+## Merge Details
+### Merge Method
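+This model was merged using the passthrough merge method: seven overlapping 20-layer slices of the same base model are stacked, giving the 140 hidden layers recorded in `config.json`.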
+### Models Merged
+The following models were included in the merge:
+* [meta-llama/Llama-3.1-70B-Instruct](https://huggingface.co/meta-llama/Llama-3.1-70B-Instruct)
+### Configuration
+The following YAML configuration was used to produce this model:
+```yaml
+slices:
+- sources:
+  - layer_range: [0, 20]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [10, 30]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [20, 40]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [30, 50]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [40, 60]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [50, 70]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [60, 80]
+    model: meta-llama/Llama-3.1-70B-Instruct
+merge_method: passthrough
+dtype: float16
+```

config.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "_name_or_path": "meta-llama/Llama-3.1-70B-Instruct",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 128000,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
+  "head_dim": 128,
+  "hidden_act": "silu",
+  "hidden_size": 8192,
+  "initializer_range": 0.02,
+  "intermediate_size": 28672,
+  "max_position_embeddings": 131072,
+  "mlp_bias": false,
+  "model_type": "llama",
+  "num_attention_heads": 64,
+  "num_hidden_layers": 140,
+  "num_key_value_heads": 8,
+  "pretraining_tp": 1,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": {
+    "factor": 8.0,
+    "high_freq_factor": 4.0,
+    "low_freq_factor": 1.0,
+    "original_max_position_embeddings": 8192,
+    "rope_type": "llama3"
+  },
+  "rope_theta": 500000.0,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float16",
+  "transformers_version": "4.46.0",
+  "use_cache": true,
+  "vocab_size": 128256
+}

mergekit_config.yml ADDED Viewed

	@@ -0,0 +1,24 @@

+slices:
+- sources:
+  - layer_range: [0, 20]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [10, 30]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [20, 40]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [30, 50]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [40, 60]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [50, 70]
+    model: meta-llama/Llama-3.1-70B-Instruct
+- sources:
+  - layer_range: [60, 80]
+    model: meta-llama/Llama-3.1-70B-Instruct
+merge_method: passthrough
+dtype: float16

model-00001-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2d6b2b03306e00c0e70d58598d4911b587f7f7537c7e33137aed53858092bf8e
+size 4672471496

model-00002-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:daf2022d1fc8804e5fd01c9dcc15a2ba9807c42d06cf5066de5505a6c5c1ca6d
+size 4831922680

model-00003-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bb14258180ae65798f4c1d09f55d793f81d8563e8831a1ea6b8ea4799848208
+size 4966190736

model-00004-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b2264e94f6b4bffb614e6733922771b07b2537bf24f67ed5ff4fe0e7b11b5203
+size 4831906200

model-00005-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:520e6206ce7e53029587bae3f2fd1bb7c6c3471635677750853186493da1f23f
+size 4999711712

model-00006-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2859ef4d85f9704d9cee7d8ff64e994b164cdaa5b56d0e110d12c9ca9522abad
+size 4798385224

model-00007-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:595043aa527c3c44346348e59ecf0aeb83d070ca8fa2be54e6a3551be0d76130
+size 4831906200

model-00008-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a9f3551f16c072dba382dac464a5d906df452b2350e098adbf0f007265448e40
+size 4966190736

model-00009-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4a49fba98efd43aa2b1ad873f12a9d9046e61b8c9606b26e54daacefb596fb0d
+size 4664167384

model-00010-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:34884dbc8c6dcf962212f69c74f872c5797f89833fddb70b120b497ce4c3bcc3
+size 4831906200

model-00011-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35252e9be0ce4f80e3c2d6ff8d2701be1572903d99269d87112f08aa6f3a4ff7
+size 4999711712

model-00012-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9d30389aaf95e80ae5b1c93bcf62d499a18ce68da09ccaf1ca0a67582bff7261
+size 4798385224

model-00013-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd2e6aaa1024646476eb7c97ca032bcea82b0559b1ea7683e88b862decaa9fd3
+size 4831906200

model-00014-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2d4e77a1583a7bdfc25680bc08372b58cb87c885f0264036f6c4082b5dd54af2
+size 4966190736

model-00015-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:76416e5634cadbaa71222241610194bc69f38c70334183b0456181421ac1efd9
+size 4831906200

model-00016-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff44e489e7cc25b0f45fc91ec702df1108ed9844bbf1fe8090965b20445ba60a
+size 4966174232

model-00017-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5568d1a7d9287079145ed0878780056904c1ba64c0fa7cd3a5aae6f502272681
+size 4966140544

model-00018-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ebdeccc43575e6a538ddae18085ea6879ff429654d07290e377de5276a7fe471
+size 4999711704

model-00019-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:345b97b98f0fad656d8062288dc1e6db353c60f478114d07ae394908ff84d432
+size 4999711712

model-00020-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a16747f24d34d3e19b263f41a92e94e6bde4f0a7ec778e95dbfc4fa041b6ebae
+size 4798385224

model-00021-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d4fdbdad88200c43381bfe67f589c3c70e0d59c4e0eb2b9c7ede06238f82c363
+size 4831906200

model-00022-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:32c8e0dfa125ecfffb762fdcda09a64097125c6987887b79517f7ba806c37a82
+size 4966190736

model-00023-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e4da4c885e4a3b4dcd0c659619be30ae37a65856aa566b6be9117ae66e4fcf32
+size 4831906200

model-00024-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9f1b0dfd73ab6865f400ec295fde62f00ff6c3ef045d922d2c34391fedb5d2b2
+size 4664167376

model-00025-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:57e1c679cd658852974773b35a7f7ae14beda6096528d29e62d8a40b0f9264a1
+size 4999711712

model-00026-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3240e649c292d905f0698ca896f1dfac4844a9e48c0d2474a3dfe9d0d2412bbe
+size 4798385224

model-00027-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff438d7da66ed3049d08ed6c501e011dbfbbf1f57085903f42ed4d875dbbda3e
+size 4831906200

model-00028-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8ac89613cd93016b780dbff0290bbbc614e9f7610e42f238e37420661631bae2
+size 4966190736

model-00029-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0dbd77d2ee348362ac012aba2eef2a0fd54b256ffb40ccf9e6d6d9146cab0d2
+size 4831906200

model-00030-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:715f6e63ffca34def2a8e271c7fa6d30345fd99147c86991f7d9249b95849803
+size 4966190736

model-00031-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:168bab91302186fc04b8e87ae389f5ee6e63cb220cfb273b1b2873c90fcab20b
+size 4982901368

model-00032-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d3db5ed93d9902bef4b3c5014433ff8258f3aa2f5a5619b42dedb8814f4474a8
+size 4982934368

model-00033-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f548efaa6c8fc1ad7e54e010e88d166f2a0555062cfe8bd7ea4d972d277c3301
+size 4999711720

model-00034-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:62475c0bac2a8fd6f7ec6bdf8eb9655857c88f06183384beca3297031c5b5366
+size 4798385240

model-00035-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4b73824be4668f7487d5eb249445dd30450e05e083dced0687b8734078bfb91
+size 4831906208

model-00036-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6fef95f1be960bf78af29cf1aeb5dad16fdb62813ebf2b75ced025c0d46ea8f1
+size 4966190744

model-00037-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:72a9a30521d09c8f5e417621b08e89d266075382743c047d418951b9594eeb82
+size 4831906208

model-00038-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:56b3568aafcb4a3d302619ca3f2f8ad6b32dada5c637a666c1aa577b04e58fe1
+size 4966174256

model-00039-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a81a33c36ee2a2553537fea5714b020061a5b1e5f0201a6c4e622adef8d484a8
+size 4966140544

model-00040-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b86c3ebdee6c199c413afed34e453399bec1befde451f9568933e166d56e3a54
+size 4999711728

model-00041-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fe048112581f18ab2b711f986330edcc00f4f90ce5ca870e187aab437b1a689c
+size 4999711744

model-00042-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a907a87e173ab30cb6d7856626e210f23f01eac564bd4696d274abf9dac60f8e
+size 4798385256

model-00043-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4ec7ccb8b8564bab41b16cb34808c73d331c5759a640d0102cd5416fe25d66f8
+size 4831906216

model-00044-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2eadae2b8bf98f2c17505931c54bbaab78530eadf17ffff588ab125992b2b2b3
+size 4966190768

model-00045-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d132c7cb3612a6ade0c2e3406d1bbb18d277df83a00ee4023249899ac86db6c
+size 4831906224

model-00046-of-00050.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:685b0145bd48929b1dacdae3e7c807541ec003e81bd10c55152806939d1b28ea
+size 4966174256