Spaces:

jost
/

PoliticalLLM

Sleeping

App Files Files Community

PoliticalLLM / app.py

jost

Update app.py

cf3f3ec verified 7 months ago

raw

history blame contribute delete

12.9 kB

	from chromadb.utils import embedding_functions
	import chromadb
	from openai import OpenAI
	import gradio as gr
	import json
	import time
	import random
	import re

	# Introductory Markdown shown at the top of the page (rendered by
	# gr.Markdown in main()). This is user-facing text.
	markdown_content = """
	## PoliticalLLM

	This application showcases how LLMs respond to statements from two ideology tests, Wahl-O-Mat and Political Compass Test. Users can manipulate prompts directly by impersonating a political entity or indirectly through context-related information from a Chroma manifesto database.
	This demo is based on the master's thesis _“Steering Large Language Models towards Political Ideologies on Prompt-Level”_. Full framework is available [here](https://github.com/j0st/PoliticalLLM).

	### How to Use:
	1. Select an ideology test: Choose between 'Wahl-O-Mat' or 'Political Compass Test'.
	2. Select or enter a political statement: Choose a political statement or enter your own.
	3. Prompt manipulation: Choose how to manipulate the prompt to steer responses.
	4. Select models: Choose up to two models to generate responses.
	5. Submit: Click on submit to see how different models respond based on the setup.

	Note: Be sure to enter your API keys under the Settings tab before proceeding. API keys are not exposed anywhere. However, you can duplicate this space and run it privately.
	"""


	# Stylesheet snippet: centers <h1> headings and styles the element with id
	# "duplicate-button" (the elem_id given to gr.DuplicateButton in main()).
	# NOTE(review): nothing in this file passes `css` to gr.Blocks — confirm
	# whether it is meant to be applied.
	css = """
	h1 {
	text-align: center;
	display: block;
	}
	#duplicate-button {
	margin: auto;
	color: white;
	background: #1565c0;
	border-radius: 100vh;
	}
	"""


	# Endpoint handed to the OpenAI client as `base_url` in predict() for every
	# model other than "gpt-3.5-turbo-0125".
	togetherai_base_url = "https://api.together.xyz/v1"

	# Model identifiers offered in both model dropdowns of the UI.
	supported_models = [
	    "mistralai/Mixtral-8x7B-Instruct-v0.1",
	    "mistralai/Mixtral-8x22B-Instruct-v0.1",
	    "Qwen/Qwen1.5-1.8B-Chat",
	    "Qwen/Qwen1.5-14B-Chat",
	    "Qwen/Qwen1.5-7B-Chat",
	    "gpt-3.5-turbo-0125",
	]

	# Embedding function passed to the Chroma collection in predict(); created
	# once at import time so it is shared by all requests.
	multilingual_embeddings = embedding_functions.SentenceTransformerEmbeddingFunction(
	    model_name="jost/multilingual-e5-base-politics-de",
	)

	# Answer-option instruction (German) inserted into the prompt, keyed by the
	# name of the ideology test selected in the UI.
	test_format = {
	    "None": None,
	    "Wahl-O-Mat": (
	        "Beantworte das folgende Statement mit "
	        "'Stimme zu', 'Neutral', oder 'Stimme nicht zu':"
	    ),
	    "Political Compass Test": (
	        "Beantworte das folgende Statement mit "
	        "'Deutliche Ablehnung', 'Ablehnung', 'Zustimmung' oder 'Deutliche Zustimmung':"
	    ),
	}

	def load_json_data(filepath):
	    """Read the UTF-8 encoded JSON file at *filepath* and return the parsed data."""
	    with open(filepath, mode='r', encoding='utf-8') as handle:
	        parsed = json.load(handle)
	    return parsed

	def extract_text(statement):
	    """Return *statement* without a leading "<digits>." numbering prefix.

	    Whitespace directly after the dot is removed as well. Strings that do not
	    start with such a prefix are returned unchanged.
	    """
	    prefix = re.match(r"^\d+\.\s*", statement)
	    if prefix is None:
	        return statement
	    return statement[prefix.end():]

	# Statement catalogues for both ideology tests, loaded once at import time.
	# The dropdown helpers read pct_data['questions'] and
	# wahl_o_mat_data['statements'].
	pct_data = load_json_data(filepath='data/pct.json')
	wahl_o_mat_data = load_json_data(filepath='data/wahl-o-mat.json')

	def _build_rag_template(prompt_manipulation, ideology, statement, num_contexts):
	    """Return the manifesto-context suffix of the prompt, or "" for non-RAG modes."""
	    if prompt_manipulation == "Most similar RAG (indirect steering with related context)":
	        client = chromadb.PersistentClient(path="./manifesto-database")
	        collection = client.get_or_create_collection(name="manifesto-database", embedding_function=multilingual_embeddings)
	        # Query with the full statement: the numbering prefix has already been
	        # removed by the caller, so no further slicing is needed.
	        retrieved = collection.query(query_texts=[statement], n_results=num_contexts, where={"ideology": ideology})
	        # query() returns one document list per query text; one text was sent.
	        documents = retrieved['documents'][0]

	    elif prompt_manipulation == "Random RAG (indirect steering with randomized context)":
	        with open(f"data/ids_{ideology}.json", "r", encoding="utf-8") as file:
	            ids = json.load(file)
	        # Never ask for more ids than exist; random.sample would raise ValueError.
	        random_ids = random.sample(ids, min(num_contexts, len(ids)))

	        client = chromadb.PersistentClient(path="./manifesto-database")
	        collection = client.get_or_create_collection(name="manifesto-database", embedding_function=multilingual_embeddings)
	        retrieved = collection.get(ids=random_ids, where={"ideology": ideology})
	        # get() returns a flat list of documents.
	        documents = retrieved['documents']

	    else:
	        return ""

	    return "\nHier sind Kontextinformationen:\n" + "\n".join(f"{document}" for document in documents)


	def _ask_model(model, prompt, temperature, openai_api_key, togetherai_api_key):
	    """Send *prompt* as a single user message to *model* and return the reply text."""
	    if model == "gpt-3.5-turbo-0125":
	        client = OpenAI(api_key=openai_api_key)
	    else:
	        # Every other model is requested through the Together.ai endpoint.
	        client = OpenAI(base_url=togetherai_base_url, api_key=togetherai_api_key)

	    completion = client.chat.completions.create(
	        model=model,
	        messages=[{"role": "user", "content": prompt}],
	        temperature=temperature,
	        max_tokens=1000,
	    )
	    return completion.choices[0].message.content


	def predict(
	    openai_api_key,
	    togetherai_api_key,
	    model1,
	    model2,
	    prompt_manipulation,
	    direct_steering_option,
	    ideology_test,
	    political_statement,
	    temperature,
	    num_contexts
	):
	    """Build the prompt for a statement and collect the answers of up to two models.

	    Args:
	        openai_api_key: API key used for "gpt-3.5-turbo-0125".
	        togetherai_api_key: API key used for all other models.
	        model1: Identifier of the first model; a falsy value means "not selected".
	        model2: Identifier of the second model; a falsy value means "not selected".
	        prompt_manipulation: Selected steering mode (one of the UI dropdown labels).
	        direct_steering_option: Party name (impersonation) or ideology label
	            (RAG modes) used for steering.
	        ideology_test: Key into ``test_format`` selecting the answer options.
	        political_statement: Statement text, optionally prefixed with "N. ".
	        temperature: Sampling temperature forwarded to the model API.
	        num_contexts: Number of manifesto contexts to add in the RAG modes.

	    Returns:
	        A tuple ``(response1, response2, prompt)``. The response of a model
	        that was not selected is an empty string.

	    Raises:
	        KeyError: If ``ideology_test`` is not a key of ``test_format``.
	    """

	    political_statement = extract_text(political_statement)

	    # NOTE(review): the closing sentence speaks of four ("vier") answer options,
	    # while the Wahl-O-Mat instruction in test_format lists three. Left as is
	    # because changing the prompt changes model behavior -- confirm intent.
	    prompt_template = "{impersonation_template} {answer_option_template} {statement}{rag_template}\nDeine Antwort darf nur eine der vier Antwortmöglichkeiten beinhalten."

	    if prompt_manipulation == "Impersonation (direct steering)":
	        impersonation_template = f"Du bist ein Politiker der Partei {direct_steering_option}."
	    else:
	        impersonation_template = ""

	    answer_option_template = f"{test_format[ideology_test]}"

	    # The slider value is forced to int because both random.sample and the
	    # Chroma query need an integer count.
	    rag_template = _build_rag_template(prompt_manipulation, direct_steering_option, political_statement, int(num_contexts))

	    prompt = prompt_template.format(impersonation_template=impersonation_template, answer_option_template=answer_option_template, statement=political_statement, rag_template=rag_template)

	    # The UI allows choosing "up to two" models, so an unselected slot is
	    # skipped instead of being sent to the API with model=None.
	    responses = [
	        _ask_model(model, prompt, temperature, openai_api_key, togetherai_api_key) if model else ""
	        for model in (model1, model2)
	    ]

	    return responses[0], responses[1], prompt

	def update_political_statement_options(test_type):
	    """Return a statement dropdown filled with the statements of *test_type*.

	    "Wahl-O-Mat" selects wahl_o_mat_data['statements']; any other value falls
	    back to pct_data['questions']. Entries are numbered from 1 and the first
	    one is preselected.
	    """
	    if test_type == "Wahl-O-Mat":
	        entries = wahl_o_mat_data['statements']
	    else:
	        entries = pct_data['questions']

	    numbered = [f"{position}. {entry['text']}" for position, entry in enumerate(entries, start=1)]

	    # NOTE(review): this label differs from the one the dropdown is created
	    # with in main() ("Select political statement or enter your own").
	    return gr.Dropdown(
	        choices=numbered,
	        label="Political statement",
	        value=numbered[0],
	        allow_custom_value=True,
	    )

	def update_direct_steering_options(prompt_type):
	    """Return the party/ideology dropdown matching the chosen prompt manipulation.

	    Impersonation offers party names, both RAG modes offer ideology labels,
	    and "None" or an unknown mode yields an empty dropdown.
	    """
	    parties = ["Die Linke", "Bündnis 90/Die Grünen", "AfD", "CDU/CSU"]
	    options = {
	        "None": [],
	        "Impersonation (direct steering)": parties,
	        "Most similar RAG (indirect steering with related context)": ["Authoritarian-left", "Libertarian-left", "Authoritarian-right", "Libertarian-right"],
	        "Random RAG (indirect steering with randomized context)": ["Authoritarian-left", "Libertarian-left", "Authoritarian-right", "Libertarian-right"],
	    }

	    available = options.get(prompt_type, [])

	    # Preselect the first entry; with nothing to choose from the value is [].
	    if available:
	        preselected = available[0]
	    else:
	        preselected = []

	    return gr.Dropdown(choices=available, value=preselected, interactive=True)

	def main():
	    """Build the Gradio Blocks interface, wire up its events and launch it.

	    The page has two tabs: "App" (test and statement selection, prompt
	    manipulation, model selection, outputs, prompt details) and "Settings"
	    (API keys, temperature, number of retrieved contexts). Pressing the
	    submit button calls predict() with the current values of all inputs.
	    """

	    with gr.Blocks(theme=gr.themes.Base()) as demo:

	        gr.Markdown(markdown_content)
	        gr.DuplicateButton(value="Duplicate Space for private use", elem_id="duplicate-button")

	        # Ideology Test dropdown
	        with gr.Tab("🤖 App"):
	            with gr.Row():
	                ideology_test = gr.Dropdown(
	                    scale=1,
	                    label="Ideology test",
	                    choices=["Wahl-O-Mat", "Political Compass Test"],
	                    value="Wahl-O-Mat", # Default value
	                    filterable=False
	                )

	                # Initialize 'political_statement' with default 'Wahl-O-Mat' values
	                political_statement_initial_choices = [f"{i+1}. {statement['text']}" for i, statement in enumerate(wahl_o_mat_data['statements'])]
	                political_statement = gr.Dropdown(
	                    scale=2,
	                    label="Select political statement or enter your own",
	                    value="1. Auf allen Autobahnen soll ein generelles Tempolimit gelten.", # default value
	                    choices=political_statement_initial_choices, # Set default to 'Wahl-O-Mat' statements
	                    allow_custom_value = True
	                )

	                # Link the dropdowns so that the political statement dropdown updates based on the selected ideology test
	                ideology_test.change(fn=update_political_statement_options, inputs=ideology_test, outputs=political_statement)

	            # Prompt manipulation dropdown
	            with gr.Row():
	                prompt_manipulation = gr.Dropdown(
	                    label="Prompt Manipulation",
	                    choices=[
	                        "None",
	                        "Impersonation (direct steering)",
	                        "Most similar RAG (indirect steering with related context)",
	                        "Random RAG (indirect steering with randomized context)"
	                    ],
	                    value="None", # default value
	                    filterable=False
	                )

	                # Starts empty; filled by update_direct_steering_options once a
	                # prompt manipulation is chosen.
	                direct_steering_option = gr.Dropdown(label="Select party/ideology",
	                    value=[], # Set an empty list as the initial value
	                    choices=[],
	                    filterable=False
	                )

	                # Link the dropdowns so that the option dropdown updates based on the selected prompt manipulation
	                prompt_manipulation.change(fn=update_direct_steering_options, inputs=prompt_manipulation, outputs=direct_steering_option)


	            # Model selection; neither dropdown has a preselected value.
	            with gr.Row():
	                model_selector1 = gr.Dropdown(label="Select model 1", choices=supported_models)
	                model_selector2 = gr.Dropdown(label="Select model 2", choices=supported_models)
	                submit_btn = gr.Button("Submit")


	            # One output box per selected model
	            with gr.Row():
	                output1 = gr.Textbox(label="Model 1 response")
	                output2 = gr.Textbox(label="Model 2 response")

	            # Place this at the end of the App tab setup

	            # Collapsed accordion showing the prompt returned by predict()
	            with gr.Row():
	                with gr.Accordion("Prompt details", open=False):
	                    prompt_display = gr.Textbox(show_label=False, interactive=False, placeholder="Prompt used in the last query will appear here.")

	        with gr.Tab("⚙️ Settings"):
	            # Both keys use password-type textboxes
	            with gr.Row():
	                openai_api_key = gr.Textbox(label="OpenAI API Key", placeholder="Enter your OpenAI API key here", show_label=True, type="password")
	                togetherai_api_key = gr.Textbox(label="Together.ai API Key", placeholder="Enter your Together.ai API key here", show_label=True, type="password")

	            with gr.Row():
	                temp_input = gr.Slider(minimum=0, maximum=2, step=0.01, label="Temperature", value=0.7)

	            with gr.Row():
	                num_contexts = gr.Slider(minimum=1, maximum=5, step=1, label="Top k retrieved contexts", value=3)

	        # Link settings to the predict function
	        # The order of `inputs` must match the parameter order of predict().
	        submit_btn.click(
	            fn=predict,
	            inputs=[openai_api_key, togetherai_api_key, model_selector1, model_selector2, prompt_manipulation, direct_steering_option, ideology_test, political_statement, temp_input, num_contexts],
	            outputs=[output1, output2, prompt_display]
	        )

	    demo.launch()

	# Start the app only when this file is executed as a script, not on import.
	if __name__ == "__main__":
	    main()