BAAI
/

hyxmmm committed on
Commit
171ab28
1 Parent(s): e738e43

Update tokenizer_config.json

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +3 -3
tokenizer_config.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "add_prefix_space": false,
3
- "bos_token": "<|endoftext|>",
4
  "clean_up_tokenization_spaces": true,
5
- "eos_token": "<|endoftext|>",
6
- "model_max_length": 2048,
7
  "padding_side": "right",
8
  "tokenizer_class": "GPT2Tokenizer",
9
  "unk_token": "<|endoftext|>"
 
1
  {
2
  "add_prefix_space": false,
3
+ "bos_token": "[CLS]",
4
  "clean_up_tokenization_spaces": true,
5
+ "eos_token": "</s>",
6
+ "model_max_length": 4096,
7
  "padding_side": "right",
8
  "tokenizer_class": "GPT2Tokenizer",
9
  "unk_token": "<|endoftext|>"