File size: 1,894 Bytes
3155660
584eeb2
 
 
 
3155660
d40170e
 
3155660
f48f009
 
584eeb2
 
d77da02
584eeb2
 
 
d77da02
 
584eeb2
 
 
 
 
 
12e78de
e59c5eb
584eeb2
 
 
12e78de
 
 
82056e7
 
584eeb2
b54bba3
46a8feb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
import gradio as gr
import pandas as pd
import torch
import numpy as np
from transformers import AutoTokenizer, AutoModelForSequenceClassification

tokenizer = AutoTokenizer.from_pretrained("model")
model = AutoModelForSequenceClassification.from_pretrained("model")

cpv = pd.read_csv("cpv.csv", sep=";")
df = pd.read_csv("code-desc.csv", sep=";")

labels = df.columns[1:]
cpv = cpv.code

id2label = {idx:label for idx, label in enumerate(labels)}
label2id = {label:idx for idx, label in enumerate(labels)}
codeDesc = dict(zip(df.code, df.desc))
   
def askcpv(description):
    
    encoding = tokenizer(description, return_tensors="pt")
    encoding = {k: v.to(model.device) for k,v in encoding.items()}
    outputs = model(**encoding)
    sigmoid = torch.nn.Sigmoid()
    probs = sigmoid(outputs.logits.squeeze().cpu())
    values, indices = torch.topk(probs, k=5)
    # turn predicted id's into actual label names
    # predicted_labels = [id2label[idx] for idx, label in enumerate(predictions) if label == 1.0]
    # return predicted_labels
    print("probs: ", probs.detach().numpy())
    print("values: ", values.detach().numpy())
    print("indices: ", indices.detach().numpy())
    # print({i: v.item() for i, v in zip(indices, values)})
    return {cpv[i]: v.item() for i, v in zip(indices.detach().numpy(), values.detach().numpy())}

gr.Interface(fn=askcpv, inputs="textbox", outputs="label", description = "Devuelve los dos primeros d铆gitos m谩s probables dada la descripci贸n de una licitaci贸n en espa帽ol.",
title = "Clasificador de c贸digos CPV",  examples=[["Nuevo edificio de acceso en piscinas de Binaced."], ["Servicio de ambulancias y personal sanitario para el servicio de salvamento y socorrismo de las playas de C谩diz"]], css=".text-2xl{font-size:1.2rem !important; line-height: 0.5rem;} .text-sm{font-size:0.7rem !important} .mb-2{margin-bottom: 0.1rem};" ).launch()