Shaltiel committed on
Commit
bcdfa14
•
1 Parent(s): 143edb2

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +29 -15
README.md CHANGED
@@ -22,7 +22,7 @@ oracle = pipeline('ner', model='dicta-il/dictabert-ner', aggregation_strategy='s
22
  from tokenizers.decoders import WordPiece
23
  oracle.tokenizer.backend_tokenizer.decoder = WordPiece()
24
 
25
- sentence = 'הכי דרמטי שיש: שער של סדריק המחליף העניק לזיו אריה ניצחון שני בשלושה משחקים ועלייה מעל הקו האדום.'
26
  oracle(sentence)
27
  ```
28
 
@@ -31,24 +31,38 @@ Output:
31
  [
32
  {
33
  "entity_group": "PER",
34
- "score": 0.99978834,
35
- "word": "סדריק",
36
- "start": 22,
37
- "end": 27
38
  },
39
  {
40
- "entity_group": "PER",
41
- "score": 0.99994457,
42
- "word": "לזי",
43
- "start": 41,
44
- "end": 44
45
  },
46
  {
47
- "entity_group": "PER",
48
- "score": 0.99993944,
49
- "word": "אריה",
50
- "start": 46,
51
- "end": 50
 
 
 
 
 
 
 
 
 
 
 
 
 
 
52
  }
53
  ]
54
  ```
 
22
  from tokenizers.decoders import WordPiece
23
  oracle.tokenizer.backend_tokenizer.decoder = WordPiece()
24
 
25
+ sentence = '''דוד בן-גוריון (16 באוקטובר 1886 - ו' בכסלו תשל"ד) היה מדינאי ישראלי וראש הממשלה הראשון של מדינת ישראל.'''
26
  oracle(sentence)
27
  ```
28
 
 
31
  [
32
  {
33
  "entity_group": "PER",
34
+ "score": 0.9999443,
35
+ "word": "דוד בן - גוריון",
36
+ "start": 0,
37
+ "end": 13
38
  },
39
  {
40
+ "entity_group": "TIMEX",
41
+ "score": 0.99987966,
42
+ "word": "16 באוקטובר 1886",
43
+ "start": 15,
44
+ "end": 31
45
  },
46
  {
47
+ "entity_group": "TIMEX",
48
+ "score": 0.9998579,
49
+ "word": "ו' בכסלו תשל\"ד",
50
+ "start": 34,
51
+ "end": 48
52
+ },
53
+ {
54
+ "entity_group": "TTL",
55
+ "score": 0.99963045,
56
+ "word": "וראש הממשלה",
57
+ "start": 68,
58
+ "end": 79
59
+ },
60
+ {
61
+ "entity_group": "GPE",
62
+ "score": 0.9997943,
63
+ "word": "ישראל",
64
+ "start": 96,
65
+ "end": 101
66
  }
67
  ]
68
  ```