stardust-coder committed on
Commit
c4ad639
1 Parent(s): f687be8

Training in progress, step 16000

Browse files
Files changed (4) hide show
  1. config.json +2 -1
  2. model.safetensors +1 -1
  3. tokenizer.json +7 -16
  4. training_args.bin +2 -2
config.json CHANGED
@@ -16,6 +16,7 @@
16
  "initializer_range": 0.02,
17
  "intermediate_size": 1536,
18
  "max_position_embeddings": 1024,
 
19
  "model_type": "bit_llama",
20
  "n_ctx": 128,
21
  "num_attention_heads": 12,
@@ -27,7 +28,7 @@
27
  "rope_theta": 10000.0,
28
  "tie_word_embeddings": false,
29
  "torch_dtype": "float32",
30
- "transformers_version": "4.38.2",
31
  "use_cache": true,
32
  "vocab_size": 43176
33
  }
 
16
  "initializer_range": 0.02,
17
  "intermediate_size": 1536,
18
  "max_position_embeddings": 1024,
19
+ "mlp_bias": false,
20
  "model_type": "bit_llama",
21
  "n_ctx": 128,
22
  "num_attention_heads": 12,
 
28
  "rope_theta": 10000.0,
29
  "tie_word_embeddings": false,
30
  "torch_dtype": "float32",
31
+ "transformers_version": "4.43.1",
32
  "use_cache": true,
33
  "vocab_size": 43176
34
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9bfe194e198fef3b80b9aad762a114d4a07d86af744fd7100f4700f0b77eedbe
3
  size 510960712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b54db5c0bd7c16b81d205546b0424371ca6c7f3921aff82b21fe49bc3a0f7a2
3
  size 510960712
tokenizer.json CHANGED
@@ -36,23 +36,13 @@
36
  "special": true
37
  }
38
  ],
39
- "normalizer": {
40
- "type": "Sequence",
41
- "normalizers": [
42
- {
43
- "type": "Prepend",
44
- "prepend": "▁"
45
- },
46
- {
47
- "type": "Replace",
48
- "pattern": {
49
- "String": " "
50
- },
51
- "content": "▁"
52
- }
53
- ]
54
  },
55
- "pre_tokenizer": null,
56
  "post_processor": {
57
  "type": "TemplateProcessing",
58
  "single": [
@@ -139,6 +129,7 @@
139
  "end_of_word_suffix": null,
140
  "fuse_unk": true,
141
  "byte_fallback": true,
 
142
  "vocab": {
143
  "<unk>": 0,
144
  "<s>": 1,
 
36
  "special": true
37
  }
38
  ],
39
+ "normalizer": null,
40
+ "pre_tokenizer": {
41
+ "type": "Metaspace",
42
+ "replacement": "▁",
43
+ "prepend_scheme": "first",
44
+ "split": false
 
 
 
 
 
 
 
 
 
45
  },
 
46
  "post_processor": {
47
  "type": "TemplateProcessing",
48
  "single": [
 
129
  "end_of_word_suffix": null,
130
  "fuse_unk": true,
131
  "byte_fallback": true,
132
+ "ignore_merges": false,
133
  "vocab": {
134
  "<unk>": 0,
135
  "<s>": 1,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d1245ad5795253debe58bcbfdd83b24f66ab3036e63cd3b66d342f5ad8f590c
3
- size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b424b2667b6ff1f95ac264726f10142e36ba9a36e85dd23b84f435ef94b9cc29
3
+ size 5176