Hemanth-thunder committed on
Commit
3296d70
1 Parent(s): e925584

Upload tokenizer

Browse files
README.md CHANGED
@@ -1,15 +1,15 @@
1
  ---
2
- license: apache-2.0
3
- pipeline_tag: text-generation
4
  language:
5
  - ta
 
6
  tags:
7
  - pretrained
 
 
 
8
  inference:
9
  parameters:
10
  temperature: 0.7
11
- datasets:
12
- - Hemanth-thunder/tamil-madlad-400
13
  ---
14
  # Model Card for Tamil-Mistral-7B-v0.1
15
 
 
1
  ---
 
 
2
  language:
3
  - ta
4
+ license: apache-2.0
5
  tags:
6
  - pretrained
7
+ datasets:
8
+ - Hemanth-thunder/tamil-madlad-400
9
+ pipeline_tag: text-generation
10
  inference:
11
  parameters:
12
  temperature: 0.7
 
 
13
  ---
14
  # Model Card for Tamil-Mistral-7B-v0.1
15
 
special_tokens_map.json CHANGED
@@ -13,13 +13,7 @@
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
- "pad_token": {
17
- "content": "</s>",
18
- "lstrip": false,
19
- "normalized": false,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
  "unk_token": {
24
  "content": "<unk>",
25
  "lstrip": false,
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "pad_token": "</s>",
 
 
 
 
 
 
17
  "unk_token": {
18
  "content": "<unk>",
19
  "lstrip": false,
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 200,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
tokenizer_config.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
  "add_bos_token": true,
3
  "add_eos_token": false,
 
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",
 
1
  {
2
  "add_bos_token": true,
3
  "add_eos_token": false,
4
+ "add_prefix_space": true,
5
  "added_tokens_decoder": {
6
  "0": {
7
  "content": "<unk>",