Spaces:
Runtime error
Runtime error
Sebastian Gehrmann
committed on
Commit
•
b03f385
1
Parent(s):
37b8c09
Continue
Browse files
- datacards/curation.py +28 -1
- datacards/gem.py +1 -1
- datacards/overview.py +7 -4
datacards/curation.py
CHANGED
@@ -7,7 +7,34 @@ from .streamlit_utils import (
|
|
7 |
N_FIELDS = 1
|
8 |
|
9 |
def curation_page():
|
10 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
11 |
|
12 |
def curation_summary():
|
13 |
return None
|
|
|
7 |
N_FIELDS = 1
|
8 |
|
9 |
def curation_page():
|
10 |
+
st.session_state.card_dict["curation"] = st.session_state.card_dict.get("curation", {})
|
11 |
+
with st.expander("Original Curation", expanded=False):
|
12 |
+
key_pref = ["curation", "original"]
|
13 |
+
st.session_state.card_dict["curation"]["original"] = st.session_state.card_dict["curation"].get("original", {})
|
14 |
+
|
15 |
+
with st.expander("Language Data", expanded=False):
|
16 |
+
key_pref = ["curation", "language"]
|
17 |
+
st.session_state.card_dict["curation"]["language"] = st.session_state.card_dict["curation"].get("language", {})
|
18 |
+
|
19 |
+
with st.expander("Structured Annotations", expanded=False):
|
20 |
+
key_pref = ["curation", "annotations"]
|
21 |
+
st.session_state.card_dict["curation"]["annotations"] = st.session_state.card_dict["curation"].get("annotations", {})
|
22 |
+
|
23 |
+
with st.expander("Consent", expanded=False):
|
24 |
+
key_pref = ["curation", "consent"]
|
25 |
+
st.session_state.card_dict["curation"]["consent"] = st.session_state.card_dict["curation"].get("consent", {})
|
26 |
+
|
27 |
+
with st.expander("Personal and Sensitive information", expanded=False):
|
28 |
+
key_pref = ["curation", "pii"]
|
29 |
+
st.session_state.card_dict["curation"]["pii"] = st.session_state.card_dict["curation"].get("pii", {})
|
30 |
+
|
31 |
+
with st.expander("Maintenance", expanded=False):
|
32 |
+
key_pref = ["curation", "maintenance"]
|
33 |
+
st.session_state.card_dict["curation"]["maintenance"] = st.session_state.card_dict["curation"].get("maintenance", {})
|
34 |
+
|
35 |
+
with st.expander("GEM Curation", expanded=False):
|
36 |
+
key_pref = ["curation", "gem"]
|
37 |
+
st.session_state.card_dict["curation"]["gem"] = st.session_state.card_dict["curation"].get("gem", {})
|
38 |
|
39 |
def curation_summary():
|
40 |
return None
|
datacards/gem.py
CHANGED
@@ -25,7 +25,7 @@ def gem_page():
|
|
25 |
key_pref = ["gem", "rationale"]
|
26 |
st.session_state.card_dict["gem"]["rationale"] = st.session_state.card_dict["gem"].get("rationale", {})
|
27 |
make_text_area(
|
28 |
-
label="
|
29 |
key_list=key_pref + ["contribution"],
|
30 |
help="Describe briefly what makes this dataset an interesting target for NLG evaluations and why it is part of GEM",
|
31 |
)
|
|
|
25 |
key_pref = ["gem", "rationale"]
|
26 |
st.session_state.card_dict["gem"]["rationale"] = st.session_state.card_dict["gem"].get("rationale", {})
|
27 |
make_text_area(
|
28 |
+
label="What does this dataset contribute toward better generation evaluation and why is it part of GEM?",
|
29 |
key_list=key_pref + ["contribution"],
|
30 |
help="Describe briefly what makes this dataset an interesting target for NLG evaluations and why it is part of GEM",
|
31 |
)
|
datacards/overview.py
CHANGED
@@ -32,7 +32,7 @@ license_list = json.load(open(pjoin("resources", "licenses.json"), encoding="utf
|
|
32 |
|
33 |
def overview_page():
|
34 |
st.session_state.card_dict["overview"] = st.session_state.card_dict.get("overview", {})
|
35 |
-
with st.expander("Where to find", expanded=False):
|
36 |
key_pref = ["overview", "where"]
|
37 |
st.session_state.card_dict["overview"]["where"] = st.session_state.card_dict["overview"].get("where", {})
|
38 |
make_text_input(
|
@@ -107,12 +107,15 @@ def overview_page():
|
|
107 |
label="What is the license of the dataset?",
|
108 |
key_list=key_pref + ["license"],
|
109 |
options=license_list,
|
110 |
-
help="select `other` if missing from list, `unkown` if not provided"
|
111 |
)
|
112 |
-
|
113 |
label="What primary task does the dataset support?",
|
114 |
key_list=key_pref + ["task"],
|
115 |
-
|
|
|
|
|
|
|
116 |
)
|
117 |
make_text_area(
|
118 |
label="Provide a short description of the communicative goal of a model trained for this task on this dataset.",
|
|
|
32 |
|
33 |
def overview_page():
|
34 |
st.session_state.card_dict["overview"] = st.session_state.card_dict.get("overview", {})
|
35 |
+
with st.expander("Where to find the data and its documentation", expanded=False):
|
36 |
key_pref = ["overview", "where"]
|
37 |
st.session_state.card_dict["overview"]["where"] = st.session_state.card_dict["overview"].get("where", {})
|
38 |
make_text_input(
|
|
|
107 |
label="What is the license of the dataset?",
|
108 |
key_list=key_pref + ["license"],
|
109 |
options=license_list,
|
110 |
+
help="select `other` if missing from list, `unkown` if not provided."
|
111 |
)
|
112 |
+
make_selectbox(
|
113 |
label="What primary task does the dataset support?",
|
114 |
key_list=key_pref + ["task"],
|
115 |
+
options=["Simplification", "Summarization", "Paraphrasing", "Dialog",
|
116 |
+
"Data-to-Text", "Style Transfer", "Text-to-Slide",
|
117 |
+
"Question Generation", "Reasoning", "Content Transfer"],
|
118 |
+
help="Select `other` if the task is not included in the list.",
|
119 |
)
|
120 |
make_text_area(
|
121 |
label="Provide a short description of the communicative goal of a model trained for this task on this dataset.",
|