dicta-il
/

dictabert-ner

Token Classification

Inference Endpoints

Model card | Files and versions | Community

Shaltiel committed on Dec 29, 2023

Commit

bcdfa14

•

1 Parent(s): 143edb2

Update README.md

Files changed (1) hide show

README.md +29 -15

README.md CHANGED Viewed

@@ -22,7 +22,7 @@ oracle = pipeline('ner', model='dicta-il/dictabert-ner', aggregation_strategy='s
 from tokenizers.decoders import WordPiece
 oracle.tokenizer.backend_tokenizer.decoder = WordPiece()
-sentence = 'הכי דרמטי שיש: שער של סדריק המחליף העניק לזיו אריה ניצחון שני בשלושה משחקים ועלייה מעל הקו האדום.'
 oracle(sentence)
 ```
@@ -31,24 +31,38 @@ Output:
 [
   {
     "entity_group": "PER",
-    "score": 0.99978834,
-    "word": "סדריק",
-    "start": 22,
-    "end": 27
   },
   {
-    "entity_group": "PER",
-    "score": 0.99994457,
-    "word": "לזי",
-    "start": 41,
-    "end": 44
   },
   {
-    "entity_group": "PER",
-    "score": 0.99993944,
-    "word": "אריה",
-    "start": 46,
-    "end": 50
   }
 ]
 ```

 from tokenizers.decoders import WordPiece
 oracle.tokenizer.backend_tokenizer.decoder = WordPiece()
+sentence = '''דוד בן-גוריון (16 באוקטובר 1886 - ו' בכסלו תשל"ד) היה מדינאי ישראלי וראש הממשלה הראשון של מדינת ישראל.'''
 oracle(sentence)
 ```
 [
   {
     "entity_group": "PER",
+    "score": 0.9999443,
+    "word": "דוד בן - גוריון",
+    "start": 0,
+    "end": 13
   },
   {
+    "entity_group": "TIMEX",
+    "score": 0.99987966,
+    "word": "16 באוקטובר 1886",
+    "start": 15,
+    "end": 31
   },
   {
+    "entity_group": "TIMEX",
+    "score": 0.9998579,
+    "word": "ו' בכסלו תשל\"ד",
+    "start": 34,
+    "end": 48
+  },
+  {
+    "entity_group": "TTL",
+    "score": 0.99963045,
+    "word": "וראש הממשלה",
+    "start": 68,
+    "end": 79
+  },
+  {
+    "entity_group": "GPE",
+    "score": 0.9997943,
+    "word": "ישראל",
+    "start": 96,
+    "end": 101
   }
 ]
 ```