File size: 980 Bytes
7bbae49
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
# Tokens that, once upper-cased, are accepted verbatim as a gender value.
gender_labels = ["M","MALE", "F", "FEMALE", "V/F","N/F","FEMENINO","MASCULINA"]

# Substring fallbacks for tokens that are not exact labels (e.g. "FEMALE," or
# "SEX:MALE"). Order matters: "FEMALE" must be tested before "MALE" because
# the latter is a substring of the former.
# NOTE(review): "MASCULINO" is not recognised by either path -- confirm
# whether "MASCULINA" is really the intended spelling.
_GENDER_SUBSTRINGS = (
    ("FEMALE", "F"),
    ("MALE", "M"),
    ("FEMENINO", "F"),
    ("MASCULINA", "M"),
)


def gender_extract(ocr_list):
    """Find the first gender token in a sequence of OCR text lines.

    Each string in ``ocr_list`` is split on whitespace and every token is
    upper-cased. A token that equals an entry of ``gender_labels`` is
    returned as-is (so ``"male"`` yields ``"MALE"``); otherwise a token that
    merely contains one of the known gender words yields the normalised
    code ``"F"`` or ``"M"``.

    Entries of ``ocr_list`` that are not strings (for example ``None``) are
    skipped, so one bad entry does not hide a gender found on a later line.

    Args:
        ocr_list: Iterable of text lines; handed back unchanged.

    Returns:
        A 3-tuple ``(status, gender, ocr_list)``:
        ``(True, <token or "F"/"M">, ocr_list)`` on the first match,
        ``(False, None, ocr_list)`` when nothing matches, and
        ``(None, None, ocr_list)`` when scanning raised an exception
        (e.g. ``ocr_list`` is ``None``); the error is printed, not raised.
    """
    try:
        for line in ocr_list:
            if not isinstance(line, str):
                # Non-text OCR entries cannot contain a gender token.
                continue
            for token in line.split():
                token = token.upper()
                if token in gender_labels:
                    # Exact label: returned verbatim, not normalised.
                    return True, token, ocr_list
                for needle, code in _GENDER_SUBSTRINGS:
                    if needle in token:
                        return True, code, ocr_list
        return False, None, ocr_list
    except Exception as e:
        # Best-effort boundary: report the problem and signal it with a
        # ``None`` status instead of propagating.
        print("[Exception in gender_extract] ", str(e))
        return None, None, ocr_list