# PoliticalLLM demo: Gradio application entry point.
from chromadb.utils import embedding_functions | |
import chromadb | |
from openai import OpenAI | |
import gradio as gr | |
import json | |
import time | |
import random | |
import re | |
# Introductory Markdown rendered at the top of the UI via gr.Markdown.
# Blank lines separate the paragraphs so that the description, the numbered
# list and the closing note render as distinct Markdown blocks.
markdown_content = """
## PoliticalLLM

This application showcases how LLMs respond to statements from two ideology tests, Wahl-O-Mat and Political Compass Test. Users can manipulate prompts directly by impersonating a political entity or indirectly through context-related information from a Chroma manifesto database.

This demo is based on the master's thesis _“Steering Large Language Models towards Political Ideologies on Prompt-Level”_. Full framework is available [here](https://github.com/j0st/PoliticalLLM).

### How to Use:

1. **Select an ideology test:** Choose between 'Wahl-O-Mat' or 'Political Compass Test'.
2. **Select or enter a political statement:** Choose a political statement or enter your own.
3. **Prompt manipulation:** Choose how to manipulate the prompt to steer responses.
4. **Select models:** Choose up to two models to generate responses.
5. **Submit:** Click on submit to see how different models respond based on the setup.

**Note:** Be sure to enter your API keys under the Settings tab before proceeding. API keys are not exposed anywhere. However, you can duplicate this space and run it privately.
"""
# Custom stylesheet for the Gradio UI: centers h1 headings and styles the
# element whose id is "duplicate-button" (white text on a blue pill shape).
css = """
h1 {
text-align: center;
display: block;
}
#duplicate-button {
margin: auto;
color: white;
background: #1565c0;
border-radius: 100vh;
}
"""
# Base URL handed to the OpenAI client for models served by Together.ai.
togetherai_base_url = "https://api.together.xyz/v1"

# Model identifiers offered in the two model dropdowns.
supported_models = [
    "mistralai/Mixtral-8x7B-Instruct-v0.1",
    "mistralai/Mixtral-8x22B-Instruct-v0.1",
    "Qwen/Qwen1.5-1.8B-Chat",
    "Qwen/Qwen1.5-14B-Chat",
    "Qwen/Qwen1.5-7B-Chat",
    "gpt-3.5-turbo-0125",
]
# Sentence-transformer embedding function supplied to the Chroma manifesto
# collection whenever it is opened.
multilingual_embeddings = embedding_functions.SentenceTransformerEmbeddingFunction(
    model_name="jost/multilingual-e5-base-politics-de",
)
# Answer-format instruction (German) inserted into the prompt, keyed by the
# selected ideology test. "None" maps to no instruction at all.
test_format = {
    "None": None,
    "Wahl-O-Mat": (
        "Beantworte das folgende Statement mit "
        "'Stimme zu', 'Neutral', oder 'Stimme nicht zu':"
    ),
    "Political Compass Test": (
        "Beantworte das folgende Statement mit "
        "'Deutliche Ablehnung', 'Ablehnung', 'Zustimmung' oder 'Deutliche Zustimmung':"
    ),
}
def load_json_data(filepath):
    """Read the UTF-8 encoded JSON file at *filepath* and return the parsed data."""
    with open(filepath, mode="r", encoding="utf-8") as handle:
        parsed = json.load(handle)
    return parsed
def extract_text(statement):
    """Return *statement* without a leading "<digits>." numbering prefix.

    Whitespace directly after the dot is removed as well. Statements that
    do not start with such a prefix are returned unchanged.
    """
    numbering = re.match(r"^\d+\.\s*", statement)
    if numbering is None:
        return statement
    return statement[numbering.end():]
# Test statements loaded once at import time. The dropdown builders read
# pct_data["questions"] and wahl_o_mat_data["statements"].
pct_data = load_json_data("data/pct.json")
wahl_o_mat_data = load_json_data("data/wahl-o-mat.json")
def _get_manifesto_collection():
    """Open the persistent Chroma collection that stores the manifesto passages."""
    client = chromadb.PersistentClient(path="./manifesto-database")
    return client.get_or_create_collection(
        name="manifesto-database",
        embedding_function=multilingual_embeddings,
    )


def _retrieve_contexts(prompt_manipulation, ideology, statement, num_contexts):
    """Return the manifesto passages for a RAG mode, or None for non-RAG modes."""
    if prompt_manipulation == "Most similar RAG (indirect steering with related context)":
        result = _get_manifesto_collection().query(
            query_texts=[statement],
            n_results=num_contexts,
            where={"ideology": ideology},
        )
        # query() yields one document list per query text; only one was sent.
        return result["documents"][0]

    if prompt_manipulation == "Random RAG (indirect steering with randomized context)":
        ids = load_json_data(f"data/ids_{ideology}.json")
        # Never ask for more ids than exist; random.sample would raise otherwise.
        random_ids = random.sample(ids, min(num_contexts, len(ids)))
        result = _get_manifesto_collection().get(
            ids=random_ids,
            where={"ideology": ideology},
        )
        return result["documents"]

    return None


def _generate_response(model, prompt, temperature, openai_api_key, togetherai_api_key):
    """Send *prompt* to *model* as a single user message and return the reply text."""
    if model == "gpt-3.5-turbo-0125":
        client = OpenAI(api_key=openai_api_key)
    else:
        # Every other supported model is served through Together.ai.
        client = OpenAI(base_url=togetherai_base_url, api_key=togetherai_api_key)
    completion = client.chat.completions.create(
        model=model,
        messages=[{"role": "user", "content": prompt}],
        temperature=temperature,
        max_tokens=1000,
    )
    return completion.choices[0].message.content


def predict(
    openai_api_key,
    togetherai_api_key,
    model1,
    model2,
    prompt_manipulation,
    direct_steering_option,
    ideology_test,
    political_statement,
    temperature,
    num_contexts
):
    """Build the steering prompt and collect one response per selected model.

    Args:
        openai_api_key: API key used for "gpt-3.5-turbo-0125".
        togetherai_api_key: API key used for all other models.
        model1: Identifier of the first model; a falsy value skips the call.
        model2: Identifier of the second model; a falsy value skips the call.
        prompt_manipulation: Selected manipulation mode (impersonation, one of
            the two RAG modes, or anything else for an unmodified prompt).
        direct_steering_option: Party name (impersonation) or ideology label
            (RAG modes) used for steering.
        ideology_test: Key into ``test_format`` selecting the answer options.
        political_statement: Statement text, optionally prefixed with "N. ".
        temperature: Sampling temperature forwarded to the model API.
        num_contexts: Number of manifesto passages to retrieve in RAG modes.

    Returns:
        A tuple ``(response1, response2, prompt)``. The response of a model
        that was not selected is an empty string.
    """
    # The dropdown entries carry a "N. " numbering prefix; remove it once here.
    political_statement = extract_text(political_statement)
    # Slider values may arrive as floats; the retrieval APIs need an int.
    num_contexts = int(num_contexts)

    # NOTE(review): the closing sentence says "vier" (four) answer options,
    # while the Wahl-O-Mat format lists three. Left unchanged on purpose so the
    # prompt wording stays as it is; confirm whether this is intended.
    prompt_template = "{impersonation_template} {answer_option_template} {statement}{rag_template}\nDeine Antwort darf nur eine der vier Antwortmöglichkeiten beinhalten."

    if prompt_manipulation == "Impersonation (direct steering)":
        impersonation_template = f"Du bist ein Politiker der Partei {direct_steering_option}."
    else:
        impersonation_template = ""

    # The statement is already free of its numbering prefix, so it is passed
    # to retrieval unmodified (slicing it again would cut off real text).
    contexts = _retrieve_contexts(
        prompt_manipulation,
        direct_steering_option,
        political_statement,
        num_contexts,
    )
    if contexts is None:
        rag_template = ""
    else:
        rag_template = "\nHier sind Kontextinformationen:\n" + "\n".join(
            f"{context}" for context in contexts
        )

    prompt = prompt_template.format(
        impersonation_template=impersonation_template,
        answer_option_template=f"{test_format[ideology_test]}",
        statement=political_statement,
        rag_template=rag_template,
    )

    # The UI allows selecting fewer than two models; skip empty selections
    # instead of sending a request without a model name.
    responses = [
        _generate_response(model, prompt, temperature, openai_api_key, togetherai_api_key)
        if model
        else ""
        for model in (model1, model2)
    ]
    return responses[0], responses[1], prompt
def update_political_statement_options(test_type):
    """Return a statement dropdown filled with the statements of *test_type*.

    "Wahl-O-Mat" selects the Wahl-O-Mat statements; any other value selects
    the Political Compass Test questions. Entries are numbered from 1 and the
    first entry is preselected.
    """
    if test_type == "Wahl-O-Mat":
        entries = wahl_o_mat_data['statements']
    else:
        entries = pct_data['questions']

    numbered = [
        f"{position}. {entry['text']}"
        for position, entry in enumerate(entries, start=1)
    ]
    return gr.Dropdown(
        choices=numbered,
        label="Political statement",
        value=numbered[0],
        allow_custom_value=True,
    )
def update_direct_steering_options(prompt_type):
    """Return the party/ideology dropdown matching the chosen prompt manipulation.

    Impersonation offers party names, both RAG modes offer ideology labels,
    and "None" or any unknown mode offers no choices. The first choice is
    preselected; with no choices the value is an empty list.
    """
    rag_ideologies = ["Authoritarian-left", "Libertarian-left", "Authoritarian-right", "Libertarian-right"]
    choices_by_mode = {
        "None": [],
        "Impersonation (direct steering)": ["Die Linke", "Bündnis 90/Die Grünen", "AfD", "CDU/CSU"],
        "Most similar RAG (indirect steering with related context)": rag_ideologies,
        "Random RAG (indirect steering with randomized context)": list(rag_ideologies),
    }

    try:
        choices = choices_by_mode[prompt_type]
    except KeyError:
        choices = []

    if choices:
        default_value = choices[0]
    else:
        default_value = []
    return gr.Dropdown(choices=choices, value=default_value, interactive=True)
def main():
    """Build the Gradio interface, wire up its callbacks and launch the app.

    The "App" tab holds the test, statement, manipulation and model selectors
    plus the outputs; the "Settings" tab holds API keys, temperature and the
    number of retrieved contexts. The module-level ``css`` is passed to
    ``gr.Blocks`` so that its rules (including the one for the element id
    "duplicate-button") are actually applied.
    """
    with gr.Blocks(theme=gr.themes.Base(), css=css) as demo:
        gr.Markdown(markdown_content)
        gr.DuplicateButton(value="Duplicate Space for private use", elem_id="duplicate-button")

        with gr.Tab("🤖 App"):
            with gr.Row():
                # Ideology test dropdown
                ideology_test = gr.Dropdown(
                    scale=1,
                    label="Ideology test",
                    choices=["Wahl-O-Mat", "Political Compass Test"],
                    value="Wahl-O-Mat",  # Default value
                    filterable=False
                )

                # Initialize 'political_statement' with default 'Wahl-O-Mat' values
                political_statement_initial_choices = [f"{i+1}. {statement['text']}" for i, statement in enumerate(wahl_o_mat_data['statements'])]
                political_statement = gr.Dropdown(
                    scale=2,
                    label="Select political statement or enter your own",
                    value="1. Auf allen Autobahnen soll ein generelles Tempolimit gelten.",  # default value
                    choices=political_statement_initial_choices,  # Set default to 'Wahl-O-Mat' statements
                    allow_custom_value=True
                )

                # Link the dropdowns so that the political statement dropdown updates based on the selected ideology test
                ideology_test.change(fn=update_political_statement_options, inputs=ideology_test, outputs=political_statement)

            with gr.Row():
                # Prompt manipulation dropdown
                prompt_manipulation = gr.Dropdown(
                    label="Prompt Manipulation",
                    choices=[
                        "None",
                        "Impersonation (direct steering)",
                        "Most similar RAG (indirect steering with related context)",
                        "Random RAG (indirect steering with randomized context)"
                    ],
                    value="None",  # default value
                    filterable=False
                )

                direct_steering_option = gr.Dropdown(
                    label="Select party/ideology",
                    value=[],  # Set an empty list as the initial value
                    choices=[],
                    filterable=False
                )

                # Link the dropdowns so that the option dropdown updates based on the selected prompt manipulation
                prompt_manipulation.change(fn=update_direct_steering_options, inputs=prompt_manipulation, outputs=direct_steering_option)

            with gr.Row():
                model_selector1 = gr.Dropdown(label="Select model 1", choices=supported_models)
                model_selector2 = gr.Dropdown(label="Select model 2", choices=supported_models)

            # NOTE(review): nesting was reconstructed from a flattened source;
            # confirm whether the button belongs inside the model row above.
            submit_btn = gr.Button("Submit")

            with gr.Row():
                output1 = gr.Textbox(label="Model 1 response")
                output2 = gr.Textbox(label="Model 2 response")

            # Collapsed panel showing the prompt of the most recent request
            with gr.Row():
                with gr.Accordion("Prompt details", open=False):
                    prompt_display = gr.Textbox(show_label=False, interactive=False, placeholder="Prompt used in the last query will appear here.")

        with gr.Tab("⚙️ Settings"):
            with gr.Row():
                openai_api_key = gr.Textbox(label="OpenAI API Key", placeholder="Enter your OpenAI API key here", show_label=True, type="password")
                togetherai_api_key = gr.Textbox(label="Together.ai API Key", placeholder="Enter your Together.ai API key here", show_label=True, type="password")

            with gr.Row():
                temp_input = gr.Slider(minimum=0, maximum=2, step=0.01, label="Temperature", value=0.7)

            with gr.Row():
                num_contexts = gr.Slider(minimum=1, maximum=5, step=1, label="Top k retrieved contexts", value=3)

        # Link settings to the predict function; the input order must match
        # the parameter order of predict().
        submit_btn.click(
            fn=predict,
            inputs=[openai_api_key, togetherai_api_key, model_selector1, model_selector2, prompt_manipulation, direct_steering_option, ideology_test, political_statement, temp_input, num_contexts],
            outputs=[output1, output2, prompt_display]
        )

    demo.launch()
# Start the app only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()