Spaces:

larkkin
/

perin

Runtime error

Larisa Kolesnichenko committed on Sep 11, 2022

Commit

099a2f3

•

1 Parent(s): a0be2a1

Make processing of punctuation consistent with train data: frame each symbol with spaces

Files changed (1) hide show

model_wrapper.py CHANGED Viewed

@@ -4,6 +4,7 @@ import tempfile
 import sys
 import datetime
 import re
 sys.path.append('mtool')
 import torch
@@ -78,7 +79,10 @@ class PredictionModel:
     def clean_texts(self, texts):
-        return [re.sub(r' +', ' ', t) for t in texts]
     def _predict_to_mrp(self, texts, graph_mode='labeled-edge'):

 import sys
 import datetime
 import re
+import string
 sys.path.append('mtool')
 import torch
     def clean_texts(self, texts):
+        punctuation = ''.join([f'\\{s}' for s in string.punctuation])
+        texts = [re.sub(f'([{punctuation}])', ' \\1 ', t) for t in texts]
+        texts = [re.sub(r' +', ' ', t) for t in texts]
+        return texts
     def _predict_to_mrp(self, texts, graph_mode='labeled-edge'):