danielhanchen committed on
Commit
c1b23fe
1 Parent(s): b3c4a0d

Upload LlamaForCausalLM

Browse files
config.json CHANGED
@@ -1,21 +1,17 @@
1
  {
2
- "_name_or_path": "mattshumer/Reflection-70B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
- "eos_token_id": [
10
- 128001,
11
- 128008,
12
- 128009
13
- ],
14
  "hidden_act": "silu",
15
  "hidden_size": 8192,
16
  "initializer_range": 0.02,
17
  "intermediate_size": 28672,
18
- "max_position_embeddings": 131072,
19
  "mlp_bias": false,
20
  "model_type": "llama",
21
  "num_attention_heads": 64,
@@ -23,17 +19,11 @@
23
  "num_key_value_heads": 8,
24
  "pretraining_tp": 1,
25
  "rms_norm_eps": 1e-05,
26
- "rope_scaling": {
27
- "factor": 8.0,
28
- "high_freq_factor": 4.0,
29
- "low_freq_factor": 1.0,
30
- "original_max_position_embeddings": 8192,
31
- "rope_type": "llama3"
32
- },
33
  "rope_theta": 500000.0,
34
  "tie_word_embeddings": false,
35
  "torch_dtype": "bfloat16",
36
  "transformers_version": "4.44.2",
37
  "use_cache": true,
38
- "vocab_size": 128256
39
  }
 
1
  {
2
+ "_name_or_path": "mattshumer/Reflection-Llama-3.1-70B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
+ "eos_token_id": 128009,
 
 
 
 
10
  "hidden_act": "silu",
11
  "hidden_size": 8192,
12
  "initializer_range": 0.02,
13
  "intermediate_size": 28672,
14
+ "max_position_embeddings": 8192,
15
  "mlp_bias": false,
16
  "model_type": "llama",
17
  "num_attention_heads": 64,
 
19
  "num_key_value_heads": 8,
20
  "pretraining_tp": 1,
21
  "rms_norm_eps": 1e-05,
22
+ "rope_scaling": null,
 
 
 
 
 
 
23
  "rope_theta": 500000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
  "transformers_version": "4.44.2",
27
  "use_cache": true,
28
+ "vocab_size": 128262
29
  }
generation_config.json CHANGED
@@ -3,10 +3,10 @@
3
  "do_sample": true,
4
  "eos_token_id": [
5
  128001,
6
- 128008,
7
  128009
8
  ],
9
- "temperature": 0.7,
10
- "top_p": 0.95,
 
11
  "transformers_version": "4.44.2"
12
  }
 
3
  "do_sample": true,
4
  "eos_token_id": [
5
  128001,
 
6
  128009
7
  ],
8
+ "max_length": 4096,
9
+ "temperature": 0.6,
10
+ "top_p": 0.9,
11
  "transformers_version": "4.44.2"
12
  }
model-00001-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3c208883511816be018b3d5c4e90a8c27d9b7d828cbb97d36c05d24d20ada8c
3
- size 4584408808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:644f054373639c20fba9270749c25b9e91ecaf538fd3ddd48268578ea920c4ef
3
+ size 4584507112
model-00002-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4642126f1113a1c3eb42e0b83e965d5b85f12b39931767dba1642cb5630bbce9
3
  size 4664167376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1222b2ef9549c6fd5d104ed973df737c06c17fc9c7592336fdd6e048605ed25
3
  size 4664167376
model-00003-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c06765cd8c5e838d61284885c48d14286d44f5ecc2aa34d08be2c1f1b63b59ba
3
  size 4999711704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86191b3774de93e70b405ab5f485bcd9adbf73d47043e747cc823b27d419db31
3
  size 4999711704
model-00004-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2a985e4dcd7538433b512fa14ff23499856a1f925fd947d5b7101ea1f673380
3
  size 4966157032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6253872ad9d98cbc79110974734a719240e3d4a2c2fc914d1a319d679a377e43
3
  size 4966157032
model-00005-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8051a0d2e07c7e9fa368a582f6d91d228135fa0c11bdc941a8955fec6a8ba4c
3
  size 4664134408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:023d5918deb9095bfb2c4d0bd316f2db0abecd4509ddce643fa9526638ea646d
3
  size 4664134408
model-00006-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:348cd98f65a4b29af25330445841428a9a16e41569c067e63b7f44af9ea19329
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:798b92d3c8b878af625420583f746f7055e444e8daca99496303497ec54ec3da
3
  size 4664167408
model-00007-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2e52303706b73fca20c1f4137dcdd16929487b432b805d32e6a0a4967d518d2
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8293f5521baf1f314d63104bf821e52c9aad1a1d9eb9987e3d8bd39fe6e903f7
3
  size 4664167408
model-00008-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6240b8784a4236a01656e9af27d09b122417ee83eb2d1a35e46f31456230059f
3
  size 4999711728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:454249979a0b1c25a0eb72b5ac5222da0a9b11eab459d207aaa189afaf6e01b3
3
  size 4999711728
model-00009-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78da3c0b496a2bdd3864f463b9fd9fe24f5f30cee40c1c12467587ffba498723
3
  size 4966157056
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e54f6ac1e9ad1843b756445e8bc41790a72a0731d6d05871ae3e7bd5fb804cd6
3
  size 4966157056
model-00010-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f67b273c0dca38ef6bcc917de3d8e3a7be85ba1d98b0047770aa86978d12dfc
3
  size 4664134408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06628e1b8b130140ecfd154db7a2b16189d7616870d7fc63b5ae760286b798c2
3
  size 4664134408
model-00011-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de754821593679bfc4997c7d0ddcabdbe7bf8346611f0b87be13939295e82fe5
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c726cfc07ba932d8f31eb91f749385c87aaccb8d6a8fb05f39b67d619d3a8d21
3
  size 4664167408
model-00012-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:187129aacbd18ed1fcc6041feed73385124d470bb65f93e50ef1a0013eeb96d0
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3e601196392560b3ac31fa1f839c472e852872ec3b23e8fff5427dd6360c81f
3
  size 4664167408
model-00013-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18d9997b7062b00f7b81b9b58f9b684cdbc4368c7d57d14b593be66f6af4a8ce
3
  size 4999711728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad8782aa3ab097eba3f8233efce781d8d0cabb45f26d56a917c7dcb097a332af
3
  size 4999711728
model-00014-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aaf6000cdc614cb1a47c959d22822cf544ab623cfda9928596d855af66b4bedc
3
  size 4966157056
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b012d4e9a88fdfd7856cc8af28af2971ec325693b3e18457ad899257cec8610c
3
  size 4966157056
model-00015-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef1808b365e913e1370dce52bf05af99e8bbc5f98a74388534be35b18929a96d
3
  size 4664134408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8c63e46229d67c88e9e2b9ad4497f779fe922b3c21d79ff7c04d04e5786df37
3
  size 4664134408
model-00016-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:828e905d43c18ef497ec02b5a36760703329e45551816600787e749496587966
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46e76a2cd2b2aaa7524b1187db6e7d2aa7c873e2dd3c2ce89c022e061acace37
3
  size 4664167408
model-00017-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:987d4be2093e5815c8ec6364c04000187ddcc59a71c156a818d271eab06a7436
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6b39ca86411851783a21aca3e109c276bae894359b6e4021d4c26a73f291a9c
3
  size 4664167408
model-00018-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:538c62f520e233931bc01ae177279d6b97b30642e959e0fd5c78bfdef25833a9
3
  size 4999711728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e17f135838f01e5d1d45970cef560d258b5fe1b3f87c5c5574d6c1ae02c2a07f
3
  size 4999711728
model-00019-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a8f8b0e48b2d624654f5658d647ac3eca2106227f54ee7696a973e41deaddde
3
  size 4966157056
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6124d9e0abfdfcd3b98250288c430fb394e6b129c8edac63e25c1e5b1d0aa30
3
  size 4966157056
model-00020-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd8f2458bad38f36b78fe3838f99557f7f6fdc33c33ba993e358c306dd142fa3
3
  size 4664134408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0092e30f1301d56465c8071274a1df95bc5c48edcda088282fc4e91ddef3b6d
3
  size 4664134408
model-00021-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f20782804ccf1ba667befb0a14087c9bbdca67f6061981fc9e4a6ed7b268142d
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8d42721d3ac63fff254f875048733de3aa2b80fad2e8581c76cc939245a59e6
3
  size 4664167408
model-00022-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb06374d1398a27d9393c8b55b92b4ce5afd534dc4c53a5fb71520f4723b5638
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c23771b5cddf9dff11f23ee7e76dafc2b7f3215ff0f5baf3ec69a5a85a2b5eb5
3
  size 4664167408
model-00023-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ee25d8e38062b3017b78dcfd762f52d49b3fd2d6d80de360fb409d9c779af23
3
  size 4999711728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ceba963387003ba076d69cf86b0b0135ee80de64087a6029060c56435ebf0644
3
  size 4999711728
model-00024-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7bcab62f5a6681e654f756d29b908ca87561ced1b94fa93d755b9b1ea77eee68
3
  size 4966157056
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68644ff8c2e5dbffe0b70334ee575f70919db332f53e6e08c7ffcb930655c4c7
3
  size 4966157056
model-00025-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35a194168043a2ab06e9bacfa2d4dceff17bf631497926eafad2b573d7b8184f
3
  size 4664134408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f75fe67d2db6f5568bb83d295ba515ab83010cf94a98da2feeea32f13afa6923
3
  size 4664134408
model-00026-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffe73aea7bd94fd6ec76bf5b7d3b09da5c9fc6bc6456916d21ddc94cdc98ef66
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7637913f3caa0aa2cd1a0cc736deb5640e872ae174c87d7c6b5ccdde2d2bc521
3
  size 4664167408
model-00027-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17943ef6837f63a13ae796f84265ab99a3766a38357f515f975ac432c2a8e4e3
3
  size 4664167408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b239e31cf5c45ba683183ea5008030ddcd2580b151870bb928780a03158312e3
3
  size 4664167408
model-00028-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:031f4e3f72548c41f382ae155605729f7a05359b24721ee99da6893939f78cbe
3
  size 4999711728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e6c5da91457037e4cb0a473b59d61ceb07ca0205fd98d7dd187b711d231b98f
3
  size 4999711728
model-00029-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8054984696ef858ada3875536f41471f4a890b340d60095e281fd7fc813e6ffa
3
  size 4966173536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18673cfa947ea640738188442beb37dadb25525c0d7a950ff45b6e633ce7329d
3
  size 4966173536
model-00030-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c845d7ccba30e2e0eb8ab20aa313d5ed45dca6634e214a62ed323b70462fa828
3
- size 2101346432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4999d998507a81d54650a71bd15cb4fbb42d6eb7ada1e1a3fec4eedbefcca93f
3
+ size 2101444736
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "metadata": {
3
- "total_size": 141107412992
4
  },
5
  "weight_map": {
6
  "lm_head.weight": "model-00030-of-00030.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_size": 141107609600
4
  },
5
  "weight_map": {
6
  "lm_head.weight": "model-00030-of-00030.safetensors",