dicta-il
/

dictabert-large-ner

Token Classification

Inference Endpoints

Model card Files Files and versions Community

Shaltiel committed on Dec 29, 2023

Commit

1d09167

•

1 Parent(s): b39e253

Update README.md

Files changed (1) hide show

README.md +29 -15

README.md CHANGED Viewed

@@ -25,7 +25,7 @@ oracle = pipeline('ner', model='dicta-il/dictabert-large-ner', aggregation_strat
 from tokenizers.decoders import WordPiece
 oracle.tokenizer.backend_tokenizer.decoder = WordPiece()
-sentence = 'הכי דרמטי שיש: שער של סדריק המחליף העניק לזיו אריה ניצחון שני בשלושה משחקים ועלייה מעל הקו האדום.'
 oracle(sentence)
 ```
@@ -34,24 +34,38 @@ Output:
 [
   {
     "entity_group": "PER",
-    "score": 0.9998621,
-    "word": "סדריק",
-    "start": 22,
-    "end": 27
   },
   {
-    "entity_group": "PER",
-    "score": 0.9999503,
-    "word": "לזי",
-    "start": 41,
-    "end": 44
   },
   {
-    "entity_group": "PER",
-    "score": 0.9998287,
-    "word": "אריה",
-    "start": 46,
-    "end": 50
   }
 ]
 ```

 from tokenizers.decoders import WordPiece
 oracle.tokenizer.backend_tokenizer.decoder = WordPiece()
+sentence = '''דוד בן-גוריון (16 באוקטובר 1886 - ו' בכסלו תשל"ד) היה מדינאי ישראלי וראש הממשלה הראשון של מדינת ישראל.'''
 oracle(sentence)
 ```
 [
   {
     "entity_group": "PER",
+    "score": 0.9998988,
+    "word": "דוד בן - גוריון",
+    "start": 0,
+    "end": 13
   },
   {
+    "entity_group": "TIMEX",
+    "score": 0.99989706,
+    "word": "16 באוקטובר 1886",
+    "start": 15,
+    "end": 31
   },
   {
+    "entity_group": "TIMEX",
+    "score": 0.99991614,
+    "word": "ו' בכסלו תשל\"ד",
+    "start": 34,
+    "end": 48
+  },
+  {
+    "entity_group": "TTL",
+    "score": 0.9931756,
+    "word": "וראש הממשלה",
+    "start": 68,
+    "end": 79
+  },
+  {
+    "entity_group": "GPE",
+    "score": 0.9995702,
+    "word": "ישראל",
+    "start": 96,
+    "end": 101
   }
 ]
 ```