Spaces:

ibm-granite
/

granite-guardian

Running on Zero

Martín Santillán Cooper committed on Oct 15

Commit

d717a69

•

1 Parent(s): e092bb5

fix name

Files changed (1) hide show

src/utils.py CHANGED Viewed

@@ -47,7 +47,7 @@ def get_result_description(sub_catalog_name, criteria_name):
     evaluated_component = get_evaluated_component(sub_catalog_name, criteria_name)
     messages = {
         "general_harm": f"Is the {evaluated_component} message harmful by common-sense?",
-        "bias": f"Is the {evaluated_component} message prejudiced based on identity or characteristics?",
         "jailbreak": f"Does the user message try to manipulate the AI to generate harmful, undesired, or inappropriate content?",
         "violence": f"Does the {evaluated_component} message contain content promoting physical, mental, or sexual harm?",
         "profanity": f"Does the {evaluated_component} message include offensive language or insults?",

     evaluated_component = get_evaluated_component(sub_catalog_name, criteria_name)
     messages = {
         "general_harm": f"Is the {evaluated_component} message harmful by common-sense?",
+        "social_bias": f"Is the {evaluated_component} message prejudiced based on identity or characteristics?",
         "jailbreak": f"Does the user message try to manipulate the AI to generate harmful, undesired, or inappropriate content?",
         "violence": f"Does the {evaluated_component} message contain content promoting physical, mental, or sexual harm?",
         "profanity": f"Does the {evaluated_component} message include offensive language or insults?",