File size: 2,296 Bytes
424c175
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
44adb4d
452e8f6
44adb4d
452e8f6
44adb4d
424c175
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59

import logging
import os
from supabase import create_client, Client
from fuzzywuzzy import fuzz
from config import SUPABASE_URL, SUPABASE_KEY
import json
import logging

url: str = SUPABASE_URL
key: str = SUPABASE_KEY
supabase: Client = create_client(url, key)

def insert_papers_data(data,author_name ,table_name: str = 'papers'):
    if data == []:
        print("No data to insert")
        return
    formatted_data = []
    for entry in data:
        entry = json.loads(entry)
        data_db = {
            'doi_no': entry.get('doi'),
            'title': entry.get('title'),
            'summary': entry.get('summary'),
            'authors': ", ".join(entry.get('authors',[])),
            'year': entry.get('year'),
            'pdf_link': entry.get('pdf_link'),
            'references': ", ".join(entry.get('references')),
            'categories': ", ".join(entry.get('categories')),
            'comment': entry.get('comment'),
            'journal_ref': entry.get('journal_ref'),
            'source': entry.get('source'),
            'primary_category': entry.get('primary_category'),
            'published': entry.get('published'),
            'author_name' : author_name,
        }
        formatted_data.append(data_db)
    data, count = supabase.table(table_name).insert(formatted_data).execute()


def get_correct_author_name(user_input_author):
    authors_name_data = supabase.table('papers').select('author_name').execute()
    unique_authors = set(author_dict['author_name'] for author_dict in authors_name_data.data)
    unique_authors_list = list(unique_authors)
    similar_authors = [author for author in unique_authors_list if fuzz.ratio(user_input_author, author) > 60]
    if similar_authors:
        return similar_authors[0]
    else:
        print(f"No similar author found for '{user_input_author}'")
        return None
    

def fetch_papers_data(author_name, fields_to_query = ["doi_no"],table_name: str = 'papers', all=False):
    author_name = get_correct_author_name(author_name)
    if all:
        data, count = supabase.table(table_name).select("*").eq('author_name', author_name).execute()
        return data
    data, count = supabase.table(table_name).select(",".join(fields_to_query)).eq('author_name', author_name).execute()
    return data[1]