Named_Entity_Recognition

Sleeping

AyushDey committed on Jul 28, 2023

Commit

518c7d9

1 Parent(s): 9c0109a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,21 +3,24 @@ from transformers import pipeline
 ner = pipeline('ner')
-def merged_words(tokens):
-    m = []
     for token in tokens:
-        if m and token['entity'].startswith('I-') and m[-1]['entity'].endswith(token['entity'][2:]):
-            last_token = m[-1]
             last_token['word'] += token['word'].replace('##', '')
             last_token['end'] = token['end']
-            last_token['score'] = (last_token['score'] + token[score]) / 2
         else:
-            m.append(token)
-    return m
 def named(input):
     output = ner(input)
-    merged_word = merged_words(output)
     return {'text': input, 'entities': merged_word}
 a = gr.Interface(fn=named,

 ner = pipeline('ner')
+def merge_tokens(tokens):
+    """Merge consecutive token predictions that belong to the same entity.
+
+    Each element of ``tokens`` is read as a dict with ``'entity'``,
+    ``'word'``, ``'end'`` and ``'score'`` keys (presumably the raw output
+    of the ``ner`` pipeline -- confirm against the caller).
+
+    Returns a list in which every ``I-`` continuation token has been folded
+    into the entry before it. The entries are the same dict objects that
+    were passed in, so merged entries are modified in place.
+    """
+    merged_tokens = []
     for token in tokens:
+        if merged_tokens and token['entity'].startswith('I-') and merged_tokens[-1]['entity'].endswith(token['entity'][2:]):
+            # If current token continues the entity of the last one, merge them
+            # NOTE(review): only the entity tags are compared, not the
+            # positions, so two same-type entries that are not adjacent in
+            # the text would also be merged -- confirm this is intended.
+            last_token = merged_tokens[-1]
+            # Drop any '##' from the piece before appending it (presumably
+            # the tokenizer's sub-word marker -- confirm).
             last_token['word'] += token['word'].replace('##', '')
             last_token['end'] = token['end']
+            # Running pairwise average: later pieces weigh more than earlier
+            # ones; this is not the mean over all merged pieces.
+            last_token['score'] = (last_token['score'] + token['score']) / 2
         else:
+            # Otherwise, add the token to the list
+            merged_tokens.append(token)
+    return merged_tokens
 def named(input):
+    """Run NER on ``input`` and return the text with its merged entities.
+
+    Returns a dict holding the original string under ``'text'`` and the
+    list produced by ``merge_tokens`` under ``'entities'``.
+    """
     output = ner(input)
+    # The helper is named merge_tokens; 'merged_tokens' is only a local
+    # variable inside it and is not defined at this scope.
+    merged_word = merge_tokens(output)
     return {'text': input, 'entities': merged_word}
 a = gr.Interface(fn=named,