DD0101 committed on
Commit
e7a0f80
1 Parent(s): 41bca58

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -2
app.py CHANGED
@@ -107,7 +107,7 @@ def ner(text):
107
  text = " ".join(rdrsegmenter.word_segment(text))
108
 
109
  # Some words in lowercase like "đà nẵng" will get error (due to vncorenlp)
110
- text = text.replace("đà ", " đà ")
111
 
112
  output = my_classifier(text)
113
  for entity in output:
@@ -124,7 +124,10 @@ def ner(text):
124
 
125
  slot_tokens = []
126
 
127
- for word, pred in zip(words, slot_preds):
 
 
 
128
  if pred == 'O':
129
  slot_tokens.extend([(word, None), (" ", None)])
130
  elif pred[0] == 'I':
 
107
  text = " ".join(rdrsegmenter.word_segment(text))
108
 
109
  # Some words in lowercase like "đà nẵng" will get error (due to vncorenlp)
110
+ text = text.replace("_đà ", " đà_").replace("_Đà ", " Đà_")
111
 
112
  output = my_classifier(text)
113
  for entity in output:
 
124
 
125
  slot_tokens = []
126
 
127
+ words[0].capitalize()
128
+ for i, word in enumerate(words):
129
+ word = word.replace("_", " ")
130
+
131
  if pred == 'O':
132
  slot_tokens.extend([(word, None), (" ", None)])
133
  elif pred[0] == 'I':