Spaces:

GEM
/

DatasetCardForm

Runtime error

App Files Community

Yacine Jernite committed on Nov 16, 2021

Commit

969e2c4

•

1 Parent(s): fcb0120

social-previous-underserved

Browse files

Files changed (2) hide show

datacards/considerations.py +1 -1
datacards/context.py +44 -37

datacards/considerations.py CHANGED Viewed

@@ -101,7 +101,7 @@ def considerations_summary():
     ):
         completion_markdown = ""
         completion_markdown += (
-            f"- **Overall competion:**\n  - {total_filled} of {N_FIELDS} fields\n"
         )
         completion_markdown += f"- **Sub-section - PII Risks and Liability:**\n  - {len(st.session_state.card_dict.get('considerations', {}).get('pii', {}))} of {N_FIELDS_PII} fields\n"
         completion_markdown += f"- **Sub-section - Licenses:**\n  - {len(st.session_state.card_dict.get('considerations', {}).get('licenses', {}))} of {N_FIELDS_LICENSES} fields\n"

     ):
         completion_markdown = ""
         completion_markdown += (
+            f"- **Overall completion:**\n  - {total_filled} of {N_FIELDS} fields\n"
         )
         completion_markdown += f"- **Sub-section - PII Risks and Liability:**\n  - {len(st.session_state.card_dict.get('considerations', {}).get('pii', {}))} of {N_FIELDS_PII} fields\n"
         completion_markdown += f"- **Sub-section - Licenses:**\n  - {len(st.session_state.card_dict.get('considerations', {}).get('licenses', {}))} of {N_FIELDS_LICENSES} fields\n"

datacards/context.py CHANGED Viewed

@@ -8,58 +8,65 @@ from .streamlit_utils import (
     make_radio,
 )
-N_FIELDS_SOCIAL_IMPACT = 9
-N_FIELDS_UNDERSERVED_COMMUNITIES = 8
 N_FIELDS_BIASES= 3
-N_FIELDS = N_FIELDS_SOCIAL_IMPACT + N_FIELDS_UNDERSERVED_COMMUNITIES + N_FIELDS_BIASES
 def context_page():
     st.session_state.card_dict["context"] = st.session_state.card_dict.get(
         "context", {}
     )
-    with st.expander("Social Impact of the Dataset", expanded=False):
-        key_pref = ["context", "social-impact"]
-        st.session_state.card_dict["context"]["social-impact"] = st.session_state.card_dict[
             "context"
-        ].get("social-impact", {})
-        make_text_area(
-            label="What tasks has this dataset been used for previously?",
-            key_list=key_pref + [""],
-            help="",
-        )
-        make_text_area(
-            label="Did any of these previous uses result in observations about the dataset?",
-            key_list=key_pref + [""],
-            help="",
-        )
-        make_text_area(
-            label="Have any changes been made to the dataset as a result of these observations?",
-            key_list=key_pref + [""],
             help="",
         )
-        make_text_area(
-            label="Task",
-            key_list=key_pref + [""],
-            help="",
-        )
-        make_text_area(
-            label="Dataset-specific",
-            key_list=key_pref + [""],
-            help="",
-        )
     with st.expander("Impact on Under-Served Communities", expanded=False):
         key_pref = ["context", "underserved"]
         st.session_state.card_dict["context"]["underserved"] = st.session_state.card_dict[
             "context"
         ].get("underserved", {})
     with st.expander("Discussion of Biases", expanded=False):
         key_pref = ["context", "biases"]
@@ -101,9 +108,9 @@ def context_summary():
     ):
         completion_markdown = ""
         completion_markdown += (
-            f"- **Overall competion:**\n  - {total_filled} of {N_FIELDS} fields\n"
         )
-        completion_markdown += f"- **Sub-section - Social Impact of the Dataset:**\n  - {len(st.session_state.card_dict.get('context', {}).get('social-impact', {}))} of {N_FIELDS_SOCIAL_IMPACT} fields\n"
         completion_markdown += f"- **Sub-section - Impact on Under-Served Communities:**\n  - {len(st.session_state.card_dict.get('context', {}).get('underserved', {}))} of {N_FIELDS_UNDERSERVED_COMMUNITIES} fields\n"
         completion_markdown += f"- **Sub-section - Discussion of Biases:**\n  - {len(st.session_state.card_dict.get('context', {}).get('biases', {}))} of {N_FIELDS_BIASES} fields\n"
         st.markdown(completion_markdown)

     make_radio,
 )
+N_FIELDS_PREVIOUS = 3
+N_FIELDS_UNDERSERVED_COMMUNITIES = 2
 N_FIELDS_BIASES= 3
+N_FIELDS = N_FIELDS_PREVIOUS + N_FIELDS_UNDERSERVED_COMMUNITIES + N_FIELDS_BIASES
 def context_page():
     st.session_state.card_dict["context"] = st.session_state.card_dict.get(
         "context", {}
     )
+    with st.expander("Previous Work on the Social Impact of the Dataset", expanded=False):
+        key_pref = ["context", "previous"]
+        st.session_state.card_dict["context"]["previous"] = st.session_state.card_dict[
             "context"
+        ].get("previous", {})
+        make_radio(
+            label="Are you aware of cases where models trained on the task featured in this dataset ore related tasks have been used in automated systems?",
+            options=["no", "yes - related tasks", "yes - other datasets featuring the same task", "yes - models trained on this dataset"],
+            key_list=key_pref + ["is-deployed"],
             help="",
         )
+        if "yes" in st.session_state.card_dict["context"]["previous"]["is-deployed"]:
+            make_text_area(
+                label="Did any of these previous uses result in observations about the social impact of the systems? " + \
+                "In particular, has there been work outlining the risks and limitations of the system? Provide links and descriptions here:",
+                key_list=key_pref + ["described-risks"],
+                help="",
+            )
+            if st.session_state.card_dict["context"]["previous"]["is-deployed"] == "yes - models trained on this dataset":
+                make_text_area(
+                    label="Have any changes been made to the dataset as a result of these observations?",
+                    key_list=key_pref + ["changes-from-observation"],
+                    help="",
+                )
+            else:
+                st.session_state.card_dict["context"]["previous"]["changes-from-observation"] = "N/A"
+        else:
+            st.session_state.card_dict["context"]["previous"]["described-risks"] = "N/A"
+            st.session_state.card_dict["context"]["previous"]["changes-from-observation"] = "N/A"
     with st.expander("Impact on Under-Served Communities", expanded=False):
         key_pref = ["context", "underserved"]
         st.session_state.card_dict["context"]["underserved"] = st.session_state.card_dict[
             "context"
         ].get("underserved", {})
+        make_radio(
+            label="Does this dataset address the needs of communities that are traditionally underserved in language technology, and particularly language generation technology?" + \
+                "Communities may be underserved for exemple because their language, language variety, or social or geographical context is underepresented in NLP and NLG resources (datasets and models).",
+            options=["no", "yes"],
+            key_list=key_pref+["helps-underserved"],
+        )
+        if st.session_state.card_dict["context"]["underserved"]["helps-underserved"] == "yes":
+            make_text_area(
+                label="Describe how this dataset addresses the needs of underserved communities",
+                key_list=key_pref+["underserved-description"],
+            )
+        else:
+            st.session_state.card_dict["context"]["underserved"]["underserved-description"] = "N/A"
     with st.expander("Discussion of Biases", expanded=False):
         key_pref = ["context", "biases"]
     ):
         completion_markdown = ""
         completion_markdown += (
+            f"- **Overall completion:**\n  - {total_filled} of {N_FIELDS} fields\n"
         )
+        completion_markdown += f"- **Sub-section - Social Impact of the Dataset:**\n  - {len(st.session_state.card_dict.get('context', {}).get('previous', {}))} of {N_FIELDS_PREVIOUS} fields\n"
         completion_markdown += f"- **Sub-section - Impact on Under-Served Communities:**\n  - {len(st.session_state.card_dict.get('context', {}).get('underserved', {}))} of {N_FIELDS_UNDERSERVED_COMMUNITIES} fields\n"
         completion_markdown += f"- **Sub-section - Discussion of Biases:**\n  - {len(st.session_state.card_dict.get('context', {}).get('biases', {}))} of {N_FIELDS_BIASES} fields\n"
         st.markdown(completion_markdown)