40point12

Running

App Files Community

Émile committed 23 days ago

Commit

88d4118

1 Parent(s): 17b81f2

Adding example, simpler model for anonymization

Browse files

Files changed (1) hide show

app.py +25 -32

app.py CHANGED Viewed

@@ -8,6 +8,8 @@ from haystack_integrations.document_stores.chroma import ChromaDocumentStore
 from haystack_integrations.components.retrievers.chroma import ChromaEmbeddingRetriever
 import rsa
 from cryptography.fernet import Fernet
 import gradio as gr
@@ -145,39 +147,20 @@ answer_query.warm_up()
 ####### Logging ##########
 ##########################
-prompt_template_hide_info = """You are a privacy robot that specialise in hiding sensitive information in a text.
-Your help will ensure that no user information gets leaked, so you are always happy to help.
-You will be given a text, and your task is to remove any sensitive information, and replacing it with a descriptive marker.
-Here are a few examples, but you should not restrict yourself to only those:
-If the text contains an email address, you should replace it with a marker "<email>".
-If the text contains a phone number, you should replace it with a marker "<phone>".
-If the text contains the name of the user, you should replace it with a marker "<name>".
-Ensure you distinguish when a name, email, etc is actually that of a public figure or company and is provided by the assistant and not the user: inthis case you should not hide it, as it it not sensible information.
-The rest of the text should be copied IDENTICALLY, including the punctuation and formatting, and the beginning and end of the text in capital letters. Do not add or remove any other character.
-BEGINNING OF TEXT
-{{ message }}
-END OF TEXT
-Your response:
-"""
-prompt_builder_hide_info = PromptBuilder(template=prompt_template_hide_info)
-llm_hide_info = setup_generator("gpt-4o-mini")
-pipe_hide_sensitive_info = Pipeline()
-pipe_hide_sensitive_info.add_component("prompt_builder_hide_info", prompt_builder_hide_info)
-pipe_hide_sensitive_info.add_component("llm_hide_info", llm_hide_info)
-pipe_hide_sensitive_info.connect("prompt_builder_hide_info", "llm_hide_info")
-def hide_sensitive_info(message):
-    for tries in range(3):
-        answer = pipe_hide_sensitive_info.run({"message": message})["llm_hide_info"]["replies"][0]
-        if "BEGINNING OF TEXT" in answer and "END OF TEXT" in answer:
-            text = answer[answer.find("BEGINNING OF TEXT") + len("BEGINNING OF TEXT"):answer.find("END OF TEXT")].strip()
-            return text
-        return "[Error when hiding user info, no log generated]"
 def log_QA(question, answer):
     message = f"User: {question}\nAssistant: {answer}"
@@ -207,11 +190,21 @@ def chat(message, history):
     log_QA(message, answer)
     return answer
 if __name__ == "__main__":
     interface = gr.ChatInterface(
         fn=chat,
         type="messages",
         title="40.12 Chatbot",
-        description="Ask me anything about social media APIs, the Digital Services Act (DSA), or online platform regulations.")
     interface.launch()

 from haystack_integrations.components.retrievers.chroma import ChromaEmbeddingRetriever
 import rsa
 from cryptography.fernet import Fernet
+from presidio_analyzer import AnalyzerEngine
+from presidio_anonymizer import AnonymizerEngine
 import gradio as gr
 ####### Logging ##########
 ##########################
+analyzer = AnalyzerEngine()
+anonymizer = AnonymizerEngine()
+def hide_sensitive_info(text):
+    analysis = analyzer.analyze(
+        text=text,
+        language="en",
+    )
+    result = anonymizer.anonymize(
+        text=text,
+        analyzer_results=analysis
+    )
+    return result.text
 def log_QA(question, answer):
     message = f"User: {question}\nAssistant: {answer}"
     log_QA(message, answer)
     return answer
+examples = [
+    "What is Article 40.12 of the Digital Services Act, and how does it help researchers?",
+    "How can I start the process of requesting platform data for research?",
+    "How do I submit a data access request for Meta’s API under the DSA?",
+    "What are the authentication and setup steps for Youtube’s API?",
+    "What specific types of data can I access through Snapchat’s API?"
+]
 if __name__ == "__main__":
     interface = gr.ChatInterface(
         fn=chat,
         type="messages",
         title="40.12 Chatbot",
+        description="Ask me anything about social media APIs, the Digital Services Act (DSA), or online platform regulations.",
+        examples=examples
+    )
     interface.launch()