Spaces:
Running
Running
Zekun Wu
commited on
Commit
•
f0d28e4
1
Parent(s):
08a5da2
update
Browse files- pages/1_Generation.py +14 -12
- pages/2_Evaluation.py +1 -0
pages/1_Generation.py
CHANGED
@@ -9,15 +9,19 @@ from util.analysis import statistical_tests, result_evaluation
|
|
9 |
st.title('JobFair: A Benchmark for Fairness in LLM Employment Decision')
|
10 |
st.sidebar.title('Model Settings')
|
11 |
|
|
|
12 |
# Define a function to manage state initialization
|
13 |
def initialize_state():
|
14 |
keys = ["model_submitted", "api_key", "endpoint_url", "deployment_name", "temperature", "max_tokens",
|
15 |
-
"data_processed", "group_name","occupation", "privilege_label", "protect_label", "num_run",
|
16 |
-
|
|
|
|
|
17 |
for key, default in zip(keys, defaults):
|
18 |
if key not in st.session_state:
|
19 |
st.session_state[key] = default
|
20 |
|
|
|
21 |
initialize_state()
|
22 |
|
23 |
# Model selection and configuration
|
@@ -62,17 +66,20 @@ if st.session_state.model_submitted:
|
|
62 |
if st.button('Process Data') and not st.session_state.data_processed:
|
63 |
# Initialize the correct agent based on model type
|
64 |
if model_type == 'AzureAgent':
|
65 |
-
agent = AzureAgent(st.session_state.api_key, st.session_state.endpoint_url,
|
|
|
66 |
else:
|
67 |
-
agent = GPTAgent(st.session_state.api_key, st.session_state.endpoint_url,
|
|
|
68 |
|
69 |
# Process data and display results
|
70 |
with st.spinner('Processing data...'):
|
71 |
parameters = {"temperature": st.session_state.temperature, "max_tokens": st.session_state.max_tokens}
|
72 |
-
df = process_scores(df, st.session_state.num_run, parameters, st.session_state.privilege_label,
|
|
|
|
|
73 |
st.session_state.data_processed = True # Mark as processed
|
74 |
|
75 |
-
|
76 |
st.write('Processed Data:', df)
|
77 |
|
78 |
# Allow downloading of the evaluation results
|
@@ -83,11 +90,6 @@ if st.session_state.model_submitted:
|
|
83 |
mime='text/csv',
|
84 |
)
|
85 |
|
86 |
-
|
87 |
-
|
88 |
-
|
89 |
-
|
90 |
-
|
91 |
if st.button("Reset Experiment Settings"):
|
92 |
st.session_state.occupation = "Programmer"
|
93 |
st.session_state.group_name = "Gender"
|
@@ -95,4 +97,4 @@ if st.session_state.model_submitted:
|
|
95 |
st.session_state.protect_label = "Female"
|
96 |
st.session_state.num_run = 1
|
97 |
st.session_state.data_processed = False
|
98 |
-
st.session_state.uploaded_file = None
|
|
|
9 |
st.title('JobFair: A Benchmark for Fairness in LLM Employment Decision')
|
10 |
st.sidebar.title('Model Settings')
|
11 |
|
12 |
+
|
13 |
# Define a function to manage state initialization
|
14 |
def initialize_state():
|
15 |
keys = ["model_submitted", "api_key", "endpoint_url", "deployment_name", "temperature", "max_tokens",
|
16 |
+
"data_processed", "group_name", "occupation", "privilege_label", "protect_label", "num_run",
|
17 |
+
"uploaded_file"]
|
18 |
+
defaults = [False, "", "https://safeguard-monitor.openai.azure.com/", "gpt35-1106", 0.5, 150, False, "Gender",
|
19 |
+
"Programmer", "Male", "Female", 1, None]
|
20 |
for key, default in zip(keys, defaults):
|
21 |
if key not in st.session_state:
|
22 |
st.session_state[key] = default
|
23 |
|
24 |
+
|
25 |
initialize_state()
|
26 |
|
27 |
# Model selection and configuration
|
|
|
66 |
if st.button('Process Data') and not st.session_state.data_processed:
|
67 |
# Initialize the correct agent based on model type
|
68 |
if model_type == 'AzureAgent':
|
69 |
+
agent = AzureAgent(st.session_state.api_key, st.session_state.endpoint_url,
|
70 |
+
st.session_state.deployment_name)
|
71 |
else:
|
72 |
+
agent = GPTAgent(st.session_state.api_key, st.session_state.endpoint_url,
|
73 |
+
st.session_state.deployment_name, api_version)
|
74 |
|
75 |
# Process data and display results
|
76 |
with st.spinner('Processing data...'):
|
77 |
parameters = {"temperature": st.session_state.temperature, "max_tokens": st.session_state.max_tokens}
|
78 |
+
df = process_scores(df, st.session_state.num_run, parameters, st.session_state.privilege_label,
|
79 |
+
st.session_state.protect_label, agent, st.session_state.group_name,
|
80 |
+
st.session_state.occupation)
|
81 |
st.session_state.data_processed = True # Mark as processed
|
82 |
|
|
|
83 |
st.write('Processed Data:', df)
|
84 |
|
85 |
# Allow downloading of the evaluation results
|
|
|
90 |
mime='text/csv',
|
91 |
)
|
92 |
|
|
|
|
|
|
|
|
|
|
|
93 |
if st.button("Reset Experiment Settings"):
|
94 |
st.session_state.occupation = "Programmer"
|
95 |
st.session_state.group_name = "Gender"
|
|
|
97 |
st.session_state.protect_label = "Female"
|
98 |
st.session_state.num_run = 1
|
99 |
st.session_state.data_processed = False
|
100 |
+
st.session_state.uploaded_file = None
|
pages/2_Evaluation.py
CHANGED
@@ -25,6 +25,7 @@ def app():
|
|
25 |
if st.button('Evaluate Data'):
|
26 |
with st.spinner('Evaluating data...'):
|
27 |
test_results = statistical_tests(df)
|
|
|
28 |
evaluation_results = result_evaluation(test_results)
|
29 |
st.write('Evaluation Results:', evaluation_results)
|
30 |
|
|
|
25 |
if st.button('Evaluate Data'):
|
26 |
with st.spinner('Evaluating data...'):
|
27 |
test_results = statistical_tests(df)
|
28 |
+
st.write('Test Results:', test_results)
|
29 |
evaluation_results = result_evaluation(test_results)
|
30 |
st.write('Evaluation Results:', evaluation_results)
|
31 |
|