Spaces:

TeresaK
/

cpv_test

Runtime error

App Files Files Community

cpv_test / app.py

leavoigt

Update app.py

27a4df7 over 1 year ago

raw

history blame

2.9 kB

	import streamlit as st
	from setfit import SetFitModel


	####################################### Dashboard ######################################################

	# App
	st.title("Identify references to vulnerable groups.")

	st.write("""Vulnerable groups encompass various communities and individuals who are disproportionately affected by the impacts of climate change
	due to their socioeconomic status, geographical location, or inherent characteristics. By incorporating the needs and perspectives of these groups
	into national climate policies, governments can ensure equitable outcomes, promote social justice, and strive to build resilience within the most marginalized populations,
	fostering a more sustainable and inclusive society as we navigate the challenges posed by climate change.This app allows you to identify whether a text contains any
	references to vulnerable groups, for example when talking about policy documents.""")

	# Document upload
	uploaded_file = st.file_uploader(label, type=None, accept_multiple_files=False, key=None, help=None, on_change=None, args=None, kwargs=None, *, disabled=False, label_visibility="visible")

	# Create text input box
	#input_text = st.text_area(label='Please enter your text here', value="This policy has been implemented to support women.")

	#st.write('Prediction:', model(input_text))

	######################################### Model #########################################################

	# Load the model
	model = SetFitModel.from_pretrained("leavoigt/vulnerable_groups")

	# Define the classes
	id2label = {
	0: 'Agricultural communities',
	1: 'Children and Youth',
	2: 'Coastal communities',
	3: 'Drought-prone regions',
	4: 'Economically disadvantaged communities',
	5: 'Elderly population',
	6: 'Ethnic minorities and indigenous people',
	7: 'Informal sector workers',
	8: 'Migrants and Refugees',
	9: 'Other',
	10: 'People with Disabilities',
	11: 'Rural populations',
	12: 'Sexual minorities (LGBTQI+)',
	13: 'Urban populations',
	14: 'Women'}

	# Import the file_processing function
	from file_processing.py import get_paragraphs

	# Process document to paragraphs
	par_list = process_documents(uploaded_file)

	# Make predictions
	preds = vg_model(par_list)

	# Get label names
	preds_list = preds.tolist()

	predictions_names=[]

	# loop through each prediction
	for ele in preds_list:
	try:
	index_of_one = ele.index(1)
	except ValueError:
	index_of_one = "NA"
	if index_of_one != "NA":
	name = id2label[index_of_one]
	else:
	name = "NA"
	predictions_names.append(name)

	# Combine the paragraphs and labels to a dataframe
	df_predictions = pd.DataFrame({'Paragraph': par_list, 'Prediction': predictions_names})

	# Drop all "Other" and "NA" predictions
	filtered_df = df[df['Prediction'].isin(['Other', 'NA'])]


	#####################################
	st.write(df)