toxic_test

Running

HMPhuoc committed on May 25

Commit

5a9d314

•

1 Parent(s): 3ff429e

bert option

The `bert` parameter indicates whether to use the BERT model.

Files changed (1) hide show

app.py CHANGED Viewed

@@ -14,7 +14,7 @@ import unicodedata as ud
 from underthesea import word_tokenize
-#from phoBERT import BERT_predict
 # Load tokenizer
 # fp = Path(__file__).with_name('tokenizer.pkl')
@@ -76,7 +76,7 @@ def plot(result):
   return p
   pass
-def judge(x):
   label = ['độc hại', 'cực kì độc hại', 'tục tĩu', 'đe dọa', 'xúc phạm', 'thù ghét cá nhân']
   result = []
@@ -93,7 +93,13 @@ def judge(x):
   result_lstm = np.round(lstm_pred, 2)
   result_gru = np.round(gru_pred, 2)
   #result_bert = np.round(bert_pred, 2)
-  for i in range(6):
-    result.append((result_lstm[i]+result_gru[i])/2)
   return (result)

 from underthesea import word_tokenize
+from phoBERT import BERT_predict
 # Load tokenizer
 # fp = Path(__file__).with_name('tokenizer.pkl')
   return p
   pass
+def judge(x, bert=False):
   label = ['độc hại', 'cực kì độc hại', 'tục tĩu', 'đe dọa', 'xúc phạm', 'thù ghét cá nhân']
   result = []
   result_lstm = np.round(lstm_pred, 2)
   result_gru = np.round(gru_pred, 2)
   #result_bert = np.round(bert_pred, 2)
+  if bert == True:
+    bert_pred = BERT_predict(x)
+    result_bert = np.round(bert_pred, 2)
+    for i in range(6):
+      result.append((result_lstm[i]+result_gru[i]+result_bert[i])/3)
+  else:
+    for i in range(6):
+      result.append((result_lstm[i]+result_gru[i])/2)
   return (result)