Spaces:
Runtime error
Runtime error
Fix column references to make TXT file analysis work
Browse files
app.py
CHANGED
@@ -17,14 +17,14 @@ def compatison1(selected_column):
|
|
17 |
# type_of_comparison 1
|
18 |
row2_col1, row2_col2 = st.columns(2)
|
19 |
with row2_col1:
|
20 |
-
first_source = st.selectbox("Choose First Source", df[
|
21 |
with row2_col2:
|
22 |
-
second_source = st.selectbox("Choose Second Source", df[
|
23 |
key='second_source_select')
|
24 |
|
25 |
# filter data
|
26 |
-
first_data = df[df[
|
27 |
-
second_data = df[df[
|
28 |
filtered_data = pd.concat([first_data, second_data])
|
29 |
st.write(filtered_data)
|
30 |
|
@@ -50,12 +50,12 @@ def compatison1(selected_column):
|
|
50 |
|
51 |
# type_of_comparison 2
|
52 |
def comparison2(selected_column):
|
53 |
-
df[
|
54 |
-
df.dropna(subset=[
|
55 |
-
df[
|
56 |
|
57 |
-
min_year = int(df[
|
58 |
-
max_year = int(df[
|
59 |
# layout row2
|
60 |
row2_col1, row2_col2 = st.columns(2)
|
61 |
with row2_col1:
|
@@ -64,10 +64,10 @@ def comparison2(selected_column):
|
|
64 |
second_range = st.slider("Second range", min_value = min_year, max_value= max_year, step = 1, value= (min_year, max_year))
|
65 |
|
66 |
# filter data
|
67 |
-
first_range_filter_df = df[(df[
|
68 |
first_range_filter_df['Topic Range'] = 'First range'
|
69 |
|
70 |
-
second_range_filter_df = df[(df[
|
71 |
second_range_filter_df['Topic Range'] = 'Second range'
|
72 |
|
73 |
filtered_df = pd.concat([first_range_filter_df, second_range_filter_df])
|
@@ -101,11 +101,15 @@ if __name__ == '__main__':
|
|
101 |
df = pd.read_csv(uploaded_file)
|
102 |
abstract_col = 'Abstract'
|
103 |
title_col = 'Title'
|
|
|
|
|
104 |
# preview the uploaded file
|
105 |
elif uploaded_file.name.endswith(".txt"):
|
106 |
df = pd.read_table(uploaded_file, sep='\t') # Doc: assume contents are separated by Tabs.
|
107 |
abstract_col = 'AB'
|
108 |
title_col = 'TI'
|
|
|
|
|
109 |
# preview the uploaded file
|
110 |
else:
|
111 |
st.error("Unsupported file format.")
|
|
|
17 |
# type_of_comparison 1
|
18 |
row2_col1, row2_col2 = st.columns(2)
|
19 |
with row2_col1:
|
20 |
+
first_source = st.selectbox("Choose First Source", df[source_title_col].unique(), key='first_source_select')
|
21 |
with row2_col2:
|
22 |
+
second_source = st.selectbox("Choose Second Source", df[source_title_col].unique(),
|
23 |
key='second_source_select')
|
24 |
|
25 |
# filter data
|
26 |
+
first_data = df[df[source_title_col] == first_source].copy()
|
27 |
+
second_data = df[df[source_title_col] == second_source].copy()
|
28 |
filtered_data = pd.concat([first_data, second_data])
|
29 |
st.write(filtered_data)
|
30 |
|
|
|
50 |
|
51 |
# type_of_comparison 2
|
52 |
def comparison2(selected_column):
|
53 |
+
df[year_col] = pd.to_numeric(df[year_col], errors='coerce')
|
54 |
+
df.dropna(subset=[year_col], inplace=True)
|
55 |
+
df[year_col] = df[year_col].astype(int)
|
56 |
|
57 |
+
min_year = int(df[year_col].min())
|
58 |
+
max_year = int(df[year_col].max())
|
59 |
# layout row2
|
60 |
row2_col1, row2_col2 = st.columns(2)
|
61 |
with row2_col1:
|
|
|
64 |
second_range = st.slider("Second range", min_value = min_year, max_value= max_year, step = 1, value= (min_year, max_year))
|
65 |
|
66 |
# filter data
|
67 |
+
first_range_filter_df = df[(df[year_col] >= first_range[0]) & (df[year_col] <= first_range[1])].copy()
|
68 |
first_range_filter_df['Topic Range'] = 'First range'
|
69 |
|
70 |
+
second_range_filter_df = df[(df[year_col] >= second_range[0]) & (df[year_col] <= second_range[1])].copy()
|
71 |
second_range_filter_df['Topic Range'] = 'Second range'
|
72 |
|
73 |
filtered_df = pd.concat([first_range_filter_df, second_range_filter_df])
|
|
|
101 |
df = pd.read_csv(uploaded_file)
|
102 |
abstract_col = 'Abstract'
|
103 |
title_col = 'Title'
|
104 |
+
source_title_col = 'Source Title'
|
105 |
+
year_col = 'Year'
|
106 |
# preview the uploaded file
|
107 |
elif uploaded_file.name.endswith(".txt"):
|
108 |
df = pd.read_table(uploaded_file, sep='\t') # Doc: assume contents are separated by Tabs.
|
109 |
abstract_col = 'AB'
|
110 |
title_col = 'TI'
|
111 |
+
source_title_col = 'SO'
|
112 |
+
year_col = 'PY'
|
113 |
# preview the uploaded file
|
114 |
else:
|
115 |
st.error("Unsupported file format.")
|