jtatman committed on
Commit
eda5870
1 Parent(s): c9f5d08

Update tokenizer_config.json

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +3 -50
tokenizer_config.json CHANGED
@@ -26,60 +26,13 @@
26
  "single_word": false,
27
  "special": true
28
  },
29
- "32000": {
30
- "content": "<|im_end|>",
31
- "lstrip": false,
32
- "normalized": false,
33
- "rstrip": false,
34
- "single_word": false,
35
- "special": true
36
- },
37
- "32001": {
38
- "content": "<|im_start|>",
39
- "lstrip": false,
40
- "normalized": false,
41
- "rstrip": false,
42
- "single_word": false,
43
- "special": true
44
- },
45
- "32002": {
46
- "content": "<|im_start|>user",
47
- "lstrip": false,
48
- "normalized": false,
49
- "rstrip": false,
50
- "single_word": false,
51
- "special": true
52
- },
53
- "32003": {
54
- "content": "<|im_start|>assistant",
55
- "lstrip": false,
56
- "normalized": false,
57
- "rstrip": false,
58
- "single_word": false,
59
- "special": true
60
- },
61
- "32004": {
62
- "content": "<|endoftext|>",
63
- "lstrip": false,
64
- "normalized": false,
65
- "rstrip": false,
66
- "single_word": false,
67
- "special": true
68
- }
69
- },
70
- "additional_special_tokens": [
71
- "<|im_start|>user",
72
- "<|im_end|>",
73
- "<|im_start|>assistant",
74
- "<|endoftext|>",
75
- "<|im_start|>"
76
- ],
77
  "bos_token": "<s>",
78
  "clean_up_tokenization_spaces": false,
79
- "eos_token": "<|im_end|>",
80
  "legacy": false,
81
  "model_max_length": 1000000000000000019884624838656,
82
- "pad_token": "<|im_end|>",
83
  "padding_side": "left",
84
  "sp_model_kwargs": {},
85
  "spaces_between_special_tokens": false,
 
26
  "single_word": false,
27
  "special": true
28
  },
29
+ }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
30
  "bos_token": "<s>",
31
  "clean_up_tokenization_spaces": false,
32
+ "eos_token": "</s>",
33
  "legacy": false,
34
  "model_max_length": 1000000000000000019884624838656,
35
+ "pad_token": "</s>",
36
  "padding_side": "left",
37
  "sp_model_kwargs": {},
38
  "spaces_between_special_tokens": false,