init
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +28 -0
- dpo-adapter/adapter_config.json +37 -0
- generation_config.json +7 -0
- model-00002-of-00291.safetensors +3 -0
- model-00003-of-00291.safetensors +3 -0
- model-00004-of-00291.safetensors +3 -0
- model-00005-of-00291.safetensors +3 -0
- model-00006-of-00291.safetensors +3 -0
- model-00007-of-00291.safetensors +3 -0
- model-00008-of-00291.safetensors +3 -0
- model-00009-of-00291.safetensors +3 -0
- model-00010-of-00291.safetensors +3 -0
- model-00011-of-00291.safetensors +3 -0
- model-00012-of-00291.safetensors +3 -0
- model-00013-of-00291.safetensors +3 -0
- model-00014-of-00291.safetensors +3 -0
- model-00015-of-00291.safetensors +3 -0
- model-00016-of-00291.safetensors +3 -0
- model-00017-of-00291.safetensors +3 -0
- model-00018-of-00291.safetensors +3 -0
- model-00019-of-00291.safetensors +3 -0
- model-00020-of-00291.safetensors +3 -0
- model-00021-of-00291.safetensors +3 -0
- model-00022-of-00291.safetensors +3 -0
- model-00023-of-00291.safetensors +3 -0
- model-00024-of-00291.safetensors +3 -0
- model-00025-of-00291.safetensors +3 -0
- model-00026-of-00291.safetensors +3 -0
- model-00027-of-00291.safetensors +3 -0
- model-00028-of-00291.safetensors +3 -0
- model-00029-of-00291.safetensors +3 -0
- model-00030-of-00291.safetensors +3 -0
- model-00031-of-00291.safetensors +3 -0
- model-00032-of-00291.safetensors +3 -0
- model-00033-of-00291.safetensors +3 -0
- model-00034-of-00291.safetensors +3 -0
- model-00035-of-00291.safetensors +3 -0
- model-00036-of-00291.safetensors +3 -0
- model-00037-of-00291.safetensors +3 -0
- model-00038-of-00291.safetensors +3 -0
- model-00039-of-00291.safetensors +3 -0
- model-00040-of-00291.safetensors +3 -0
- model-00041-of-00291.safetensors +3 -0
- model-00042-of-00291.safetensors +3 -0
- model-00043-of-00291.safetensors +3 -0
- model-00044-of-00291.safetensors +3 -0
- model-00045-of-00291.safetensors +3 -0
- model-00046-of-00291.safetensors +3 -0
- model-00047-of-00291.safetensors +3 -0
- model-00048-of-00291.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./hermes-2-pro-llama-3-8b-DPO",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": 128003,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 4096,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 14336,
|
14 |
+
"max_position_embeddings": 8192,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 32,
|
17 |
+
"num_hidden_layers": 32,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"pretraining_tp": 1,
|
20 |
+
"rms_norm_eps": 1e-05,
|
21 |
+
"rope_scaling": null,
|
22 |
+
"rope_theta": 500000.0,
|
23 |
+
"tie_word_embeddings": false,
|
24 |
+
"torch_dtype": "float16",
|
25 |
+
"transformers_version": "4.40.1",
|
26 |
+
"use_cache": true,
|
27 |
+
"vocab_size": 128288
|
28 |
+
}
|
dpo-adapter/adapter_config.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"alpha_pattern": {},
|
3 |
+
"auto_mapping": null,
|
4 |
+
"base_model_name_or_path": "/workspace/axolotl/hermes-2-pro-llama-3-8b-dpo-split-2",
|
5 |
+
"bias": "none",
|
6 |
+
"fan_in_fan_out": null,
|
7 |
+
"inference_mode": true,
|
8 |
+
"init_lora_weights": true,
|
9 |
+
"layer_replication": null,
|
10 |
+
"layers_pattern": null,
|
11 |
+
"layers_to_transform": null,
|
12 |
+
"loftq_config": {},
|
13 |
+
"lora_alpha": 16,
|
14 |
+
"lora_dropout": 0.05,
|
15 |
+
"megatron_config": null,
|
16 |
+
"megatron_core": "megatron.core",
|
17 |
+
"modules_to_save": [
|
18 |
+
"embed_tokens",
|
19 |
+
"lm_head"
|
20 |
+
],
|
21 |
+
"peft_type": "LORA",
|
22 |
+
"r": 32,
|
23 |
+
"rank_pattern": {},
|
24 |
+
"revision": null,
|
25 |
+
"target_modules": [
|
26 |
+
"v_proj",
|
27 |
+
"up_proj",
|
28 |
+
"o_proj",
|
29 |
+
"k_proj",
|
30 |
+
"gate_proj",
|
31 |
+
"q_proj",
|
32 |
+
"down_proj"
|
33 |
+
],
|
34 |
+
"task_type": "CAUSAL_LM",
|
35 |
+
"use_dora": false,
|
36 |
+
"use_rslora": false
|
37 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 128000,
|
4 |
+
"do_sample": true,
|
5 |
+
"eos_token_id": 128003,
|
6 |
+
"transformers_version": "4.40.1"
|
7 |
+
}
|
model-00002-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24552d1e6d6052ead2c070190507fb9d48ec508d0dedc3823a4364f7b78bbac0
|
3 |
+
size 1050935440
|
model-00003-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:846ca1ce27d38aff82568ace21f4fe9896b8ce0280ed184f116c4b7fb02615d6
|
3 |
+
size 8328
|
model-00004-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78af5e278ece63631e0fd51e842e873c2e67ecc0760d5f1c29145c17424b0b4f
|
3 |
+
size 117440664
|
model-00005-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:467aad1f458b395e4a80e3906c7ac9f4c92021228210f2e3fd3976c19365b300
|
3 |
+
size 117440664
|
model-00006-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bf7cae68e59b6b4e50a924c0080fb7e9cc64a33274c2aebb9dfe2adc4601ef8
|
3 |
+
size 117440656
|
model-00007-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c962f39377822f59e0dd13e386fe8c1ebf677d0b8c9232ed16345670582a3847
|
3 |
+
size 8344
|
model-00008-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a6d8645191188f21a6ca664d20dac70884642ab5f91ced665d4140a2a01dd73
|
3 |
+
size 8388760
|
model-00009-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20f2d8bfc782b9e171c64d62b464c407b5ec8e195a7298865cc54ee882abc713
|
3 |
+
size 33554584
|
model-00010-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a97689d83877b08f7de787f800779db799377bfd9b4ddf5bc506435c3605879
|
3 |
+
size 33554584
|
model-00011-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07c922a158c2ef774a6be06b38db5282f4400e5865c84451a34b2edb5cbcee93
|
3 |
+
size 8388760
|
model-00012-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8983028bc1ad6c1dab49535d874e24cc320cba2460110e30fb531b09e2fc0f08
|
3 |
+
size 8328
|
model-00013-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04e46088235994852e13caf9158c8517c7c553090c14ed696caffac044dc769b
|
3 |
+
size 117440664
|
model-00014-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa8130ab75fb8a04cc80aaa4c028e516b2be024b5176539b384a4860d13d94ab
|
3 |
+
size 117440664
|
model-00015-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0475145714ae8c747d76ddc349a416811e4ed1f93ecb1152f568e3ecd270c704
|
3 |
+
size 117440656
|
model-00016-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e39832d18c9e16c0ad04798f38100874628d3589c3aadd179ea66240ed3466aa
|
3 |
+
size 8344
|
model-00017-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7fbb0fd3816122198136749aba5b4e133a4549ffe48f836bda11be5096552646
|
3 |
+
size 8388760
|
model-00018-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41061ea464cbe84ecc20effc1ac388cee57888fb4fd4af297f693325bd3e1c37
|
3 |
+
size 33554584
|
model-00019-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ae025687ca74c331cc5c67006c0fcba6ca858f3180cf439422b8c8b74a2e48d
|
3 |
+
size 33554584
|
model-00020-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79753bc658d351b69c11ac657d0feb29edd59b942414a896f4b8befcb3d2ea41
|
3 |
+
size 8388760
|
model-00021-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:145266d5b6af1a5cbb502bfd7ff7c167960a088dcf05787eddfe89af3ca2fd32
|
3 |
+
size 8328
|
model-00022-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79817449923dfede8afef28211abe854f6c5de18a3f7388a82431941b686ee87
|
3 |
+
size 117440664
|
model-00023-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7838fa5112156244eba5f5d44f8bf2c76396857c4f23fc213c31cb31495d5e6
|
3 |
+
size 117440664
|
model-00024-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7a47c30373f159fa6c745f5641a1be5921697b3fb10c4809ddfb99f61b02b35
|
3 |
+
size 117440656
|
model-00025-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b219f83795a10ed825ab18a607ee442b2ffc1b42bbec0def50b1487550ead037
|
3 |
+
size 8344
|
model-00026-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4373ae351de6eb043da589457ca52a0e0facd3d3221d2624bbfe11335d616856
|
3 |
+
size 8388760
|
model-00027-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a65e567f2634ad308e6f6f520e7c7101ad98ed03f095acecba7ac44f10b04c0
|
3 |
+
size 33554584
|
model-00028-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f411737043de5ce3052797e900e86047a13a4f804701abf74e1898b36dac1bdd
|
3 |
+
size 33554584
|
model-00029-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28e5f14788cb93b81a5a01377895f9ff21d10cb9bdb022338643e18d6ec3d3e1
|
3 |
+
size 8388760
|
model-00030-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c59eebe6bbdf99ad5cd1ac7f5a3e7fb50007d81be9d98b691ba9f370705117c7
|
3 |
+
size 8328
|
model-00031-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:778a511c311f11d35c263a0fb20ce8e797a202257290d737b1e92105b483e7df
|
3 |
+
size 117440664
|
model-00032-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b5c14a6ea6d7ca004b0e3ccafb389367869671dce4cde5c431ca899fc6fd32b
|
3 |
+
size 117440664
|
model-00033-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bdfb259143e05797d22e2e2d9639d897b1204661303e93a3657ebbda71b7ab5
|
3 |
+
size 117440656
|
model-00034-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:edf13cd86249045a162ef2159372ec8ac54dca9ca5e3607001781f687d4bd971
|
3 |
+
size 8344
|
model-00035-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8344f93f075e94fdae7d4c0b06333336d0ee940599aae80ac85a67b2e42fa29
|
3 |
+
size 8388760
|
model-00036-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8f6b2911c3c3029ee2403fc7b223fe6bc8cb3d587bdb96f21d08c24c771ea43
|
3 |
+
size 33554584
|
model-00037-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45292fade1cb7acc51ac5feb0271db645104b5dacb6cdd9624c26534974afd79
|
3 |
+
size 33554584
|
model-00038-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9cb0ff7e383d75cd1575131f4712535bdcf4d0e12cb51664db27c2fe1948113
|
3 |
+
size 8388760
|
model-00039-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dda2944f210c72003ffa5eb5e88c5feef641182c94601434d357afbf2a12e5f
|
3 |
+
size 8328
|
model-00040-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3957c5f871f3b3c02e0430bcd4a81a0485fd1120544d61b93223da272d5ace69
|
3 |
+
size 117440664
|
model-00041-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5113b79de71d90e87c4972dee99ea1a556370729673825db0000d2f5b25c187
|
3 |
+
size 117440664
|
model-00042-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:403273c3a08447f55a2e10cc185671c8283906d3f48e2b6c1f3323e7f12cc6cd
|
3 |
+
size 117440656
|
model-00043-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d55d56b67fcda633bfc97a68eb1a0f29b25058c678961354e090a7d255e3615
|
3 |
+
size 8344
|
model-00044-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ba0d6f335d206262c3789ef7aa4bd260d56d0100c39d2fbb57929d51d374b4c
|
3 |
+
size 8388760
|
model-00045-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9ccb4a00554f6870ee20cba233110ee1d2f2fec9a5abc94f8f09db320e9c67d
|
3 |
+
size 33554584
|
model-00046-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eba400eb104aca976807b7743476e0d7e1df7fad024cee6b12043e4cb939901
|
3 |
+
size 33554584
|
model-00047-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1671d3d380b7c0ef3eed36bf565800c3158fda9462df93691cd1eca6f90f2ff7
|
3 |
+
size 8388760
|
model-00048-of-00291.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddbdb3cc7247dc10eb70ab278310e583855aeec5833da0e15a0f741622a3c53f
|
3 |
+
size 8328
|