Martín Santillán Cooper committed on
Commit
d717a69
1 Parent(s): e092bb5
Files changed (1) hide show
  1. src/utils.py +1 -1
src/utils.py CHANGED
@@ -47,7 +47,7 @@ def get_result_description(sub_catalog_name, criteria_name):
47
  evaluated_component = get_evaluated_component(sub_catalog_name, criteria_name)
48
  messages = {
49
  "general_harm": f"Is the {evaluated_component} message harmful by common-sense?",
50
- "bias": f"Is the {evaluated_component} message prejudiced based on identity or characteristics?",
51
  "jailbreak": f"Does the user message try to manipulate the AI to generate harmful, undesired, or inappropriate content?",
52
  "violence": f"Does the {evaluated_component} message contain content promoting physical, mental, or sexual harm?",
53
  "profanity": f"Does the {evaluated_component} message include offensive language or insults?",
 
47
  evaluated_component = get_evaluated_component(sub_catalog_name, criteria_name)
48
  messages = {
49
  "general_harm": f"Is the {evaluated_component} message harmful by common-sense?",
50
+ "social_bias": f"Is the {evaluated_component} message prejudiced based on identity or characteristics?",
51
  "jailbreak": f"Does the user message try to manipulate the AI to generate harmful, undesired, or inappropriate content?",
52
  "violence": f"Does the {evaluated_component} message contain content promoting physical, mental, or sexual harm?",
53
  "profanity": f"Does the {evaluated_component} message include offensive language or insults?",