Spaces:

protectai
/

prompt-injection-benchmark

Running

App Files Files Community

asofter committed on Dec 11, 2023

Commit

0ccf7ba

•

1 Parent(s): 6aa9546

* upgrade transformers

Browse files

* make dataset private
* support azure benchmarks

Files changed (2) hide show

app.py +21 -3
requirements.txt +1 -1

app.py CHANGED Viewed

@@ -27,6 +27,8 @@ num_processes = 2  # mp.cpu_count()
 lakera_api_key = os.getenv("LAKERA_API_KEY")
 automorphic_api_key = os.getenv("AUTOMORPHIC_API_KEY")
 rebuff_api_key = os.getenv("REBUFF_API_KEY")
 @lru_cache(maxsize=2)
@@ -134,6 +136,22 @@ def detect_rebuff(prompt: str) -> (bool, bool):
         return False, False
 detection_providers = {
     "Laiyer (HF model)": detect_hf_laiyer,
     "Deepset (HF model)": detect_hf_deepset,
@@ -141,6 +159,7 @@ detection_providers = {
     "Lakera Guard": detect_lakera,
     "Automorphic Aegis": detect_automorphic,
     "Rebuff": detect_rebuff,
 }
@@ -210,9 +229,8 @@ if __name__ == "__main__":
         ],
         title="Prompt Injection Benchmark",
         description="This interface aims to benchmark the prompt injection detection providers. "
-        "The results are <strong>stored in the public dataset</strong> "
-        '<a href="https://huggingface.co/datasets/laiyer/prompt-injection-benchmark" target="_blank">laiyer/prompt-injection-benchmark</a> '
-        "for fairness of all sides.<br /><br />"
         "HuggingFace (HF) models are hosted on Spaces while other providers are called as APIs.<br /><br />"
         "<b>Disclaimer</b>: This interface is for research purposes only.",
         examples=[

 lakera_api_key = os.getenv("LAKERA_API_KEY")
 automorphic_api_key = os.getenv("AUTOMORPHIC_API_KEY")
 rebuff_api_key = os.getenv("REBUFF_API_KEY")
+azure_content_safety_endpoint = os.getenv("AZURE_CONTENT_SAFETY_ENDPOINT")
+azure_content_safety_key = os.getenv("AZURE_CONTENT_SAFETY_KEY")
 @lru_cache(maxsize=2)
         return False, False
+def detect_azure(prompt: str) -> (bool, bool):
+    try:
+        response = requests.post(
+            f"{azure_content_safety_endpoint}contentsafety/text:detectJailbreak?api-version=2023-10-15-preview",
+            json={"text": prompt},
+            headers={"Ocp-Apim-Subscription-Key": azure_content_safety_key},
+        )
+        response_json = response.json()
+        logger.info(f"Prompt injection result from Azure: {response.json()}")
+        return True, response_json["jailbreakAnalysis"]["detected"]
+    except requests.RequestException as err:
+        logger.error(f"Failed to call Azure API: {err}")
+        return False, False
 detection_providers = {
     "Laiyer (HF model)": detect_hf_laiyer,
     "Deepset (HF model)": detect_hf_deepset,
     "Lakera Guard": detect_lakera,
     "Automorphic Aegis": detect_automorphic,
     "Rebuff": detect_rebuff,
+    "Azure Content Safety": detect_azure,
 }
         ],
         title="Prompt Injection Benchmark",
         description="This interface aims to benchmark the prompt injection detection providers. "
+        "The results are <strong>stored in the private dataset</strong> for further analysis and improvements."
+        "<br /><br />"
         "HuggingFace (HF) models are hosted on Spaces while other providers are called as APIs.<br /><br />"
         "<b>Disclaimer</b>: This interface is for research purposes only.",
         examples=[

requirements.txt CHANGED Viewed

@@ -5,4 +5,4 @@ onnxruntime==1.16.3
 optimum[onnxruntime]==1.15.0
 rebuff==0.0.5
 requests==2.31.0
-transformers==4.35.2

 optimum[onnxruntime]==1.15.0
 rebuff==0.0.5
 requests==2.31.0
+transformers==4.36.0