thenlper michaelfeil committed on
Commit
8fdde9c
1 Parent(s): 3276994

undo PR 20 (#22)

Browse files

- undo PR 20 (ebaf4f3e76c91ca9e67751c5eb088b71842ccd25)
- Update sentence_bert_config.json (64c8869ce5bf1876b0cd88e4039cbc32ae52c3dc)
- Update tokenizer_config.json (dde01c7ef2499209ac7da7f5c572b15197f74187)


Co-authored-by: Michael <michaelfeil@users.noreply.huggingface.co>

config.json CHANGED
@@ -14,7 +14,7 @@
14
  "hidden_size": 1536,
15
  "initializer_range": 0.02,
16
  "intermediate_size": 8960,
17
- "max_position_embeddings": 2048,
18
  "max_window_layers": 21,
19
  "model_type": "qwen2",
20
  "num_attention_heads": 12,
@@ -22,7 +22,7 @@
22
  "num_key_value_heads": 2,
23
  "rms_norm_eps": 1e-06,
24
  "rope_theta": 1000000.0,
25
- "sliding_window": 2048,
26
  "tie_word_embeddings": false,
27
  "torch_dtype": "float32",
28
  "transformers_version": "4.41.2",
 
14
  "hidden_size": 1536,
15
  "initializer_range": 0.02,
16
  "intermediate_size": 8960,
17
+ "max_position_embeddings": 131072,
18
  "max_window_layers": 21,
19
  "model_type": "qwen2",
20
  "num_attention_heads": 12,
 
22
  "num_key_value_heads": 2,
23
  "rms_norm_eps": 1e-06,
24
  "rope_theta": 1000000.0,
25
+ "sliding_window": 131072,
26
  "tie_word_embeddings": false,
27
  "torch_dtype": "float32",
28
  "transformers_version": "4.41.2",
sentence_bert_config.json CHANGED
@@ -1,4 +1,4 @@
1
  {
2
- "max_seq_length": 2048,
3
  "do_lower_case": false
4
  }
 
1
  {
2
+ "max_seq_length": 32768,
3
  "do_lower_case": false
4
  }
tokenizer_config.json CHANGED
@@ -39,7 +39,7 @@
39
  "clean_up_tokenization_spaces": false,
40
  "eos_token": "<|endoftext|>",
41
  "errors": "replace",
42
- "model_max_length": 2048,
43
  "pad_token": "<|endoftext|>",
44
  "split_special_tokens": false,
45
  "tokenizer_class": "Qwen2Tokenizer",
 
39
  "clean_up_tokenization_spaces": false,
40
  "eos_token": "<|endoftext|>",
41
  "errors": "replace",
42
+ "model_max_length": 32768,
43
  "pad_token": "<|endoftext|>",
44
  "split_special_tokens": false,
45
  "tokenizer_class": "Qwen2Tokenizer",