Oliviayc committed on
Commit
765bd01
·
1 Parent(s): 3096aed

Fix column references so that TXT file analysis works

Browse files
Files changed (1) hide show
  1. app.py +15 -11
app.py CHANGED
@@ -17,14 +17,14 @@ def compatison1(selected_column):
17
  # type_of_comparison 1
18
  row2_col1, row2_col2 = st.columns(2)
19
  with row2_col1:
20
- first_source = st.selectbox("Choose First Source", df['Source title'].unique(), key='first_source_select')
21
  with row2_col2:
22
- second_source = st.selectbox("Choose Second Source", df['Source title'].unique(),
23
  key='second_source_select')
24
 
25
  # filter data
26
- first_data = df[df['Source title'] == first_source].copy()
27
- second_data = df[df['Source title'] == second_source].copy()
28
  filtered_data = pd.concat([first_data, second_data])
29
  st.write(filtered_data)
30
 
@@ -50,12 +50,12 @@ def compatison1(selected_column):
50
 
51
  # type_of_comparison 2
52
  def comparison2(selected_column):
53
- df['Year'] = pd.to_numeric(df['Year'], errors='coerce')
54
- df.dropna(subset=['Year'], inplace=True)
55
- df['Year'] = df['Year'].astype(int)
56
 
57
- min_year = int(df['Year'].min())
58
- max_year = int(df['Year'].max())
59
  # layout row2
60
  row2_col1, row2_col2 = st.columns(2)
61
  with row2_col1:
@@ -64,10 +64,10 @@ def comparison2(selected_column):
64
  second_range = st.slider("Second range", min_value = min_year, max_value= max_year, step = 1, value= (min_year, max_year))
65
 
66
  # filter data
67
- first_range_filter_df = df[(df['Year'] >= first_range[0]) & (df['Year'] <= first_range[1])].copy()
68
  first_range_filter_df['Topic Range'] = 'First range'
69
 
70
- second_range_filter_df = df[(df['Year'] >= second_range[0]) & (df['Year'] <= second_range[1])].copy()
71
  second_range_filter_df['Topic Range'] = 'Second range'
72
 
73
  filtered_df = pd.concat([first_range_filter_df, second_range_filter_df])
@@ -101,11 +101,15 @@ if __name__ == '__main__':
101
  df = pd.read_csv(uploaded_file)
102
  abstract_col = 'Abstract'
103
  title_col = 'Title'
 
 
104
  # preview the uploaded file
105
  elif uploaded_file.name.endswith(".txt"):
106
  df = pd.read_table(uploaded_file, sep='\t') # Doc: assume contents are separated by tabs.
107
  abstract_col = 'AB'
108
  title_col = 'TI'
 
 
109
  # preview the uploaded file
110
  else:
111
  st.error("Unsupported file format.")
 
17
  # type_of_comparison 1
18
  row2_col1, row2_col2 = st.columns(2)
19
  with row2_col1:
20
+ first_source = st.selectbox("Choose First Source", df[source_title_col].unique(), key='first_source_select')
21
  with row2_col2:
22
+ second_source = st.selectbox("Choose Second Source", df[source_title_col].unique(),
23
  key='second_source_select')
24
 
25
  # filter data
26
+ first_data = df[df[source_title_col] == first_source].copy()
27
+ second_data = df[df[source_title_col] == second_source].copy()
28
  filtered_data = pd.concat([first_data, second_data])
29
  st.write(filtered_data)
30
 
 
50
 
51
  # type_of_comparison 2
52
  def comparison2(selected_column):
53
+ df[year_col] = pd.to_numeric(df[year_col], errors='coerce')
54
+ df.dropna(subset=[year_col], inplace=True)
55
+ df[year_col] = df[year_col].astype(int)
56
 
57
+ min_year = int(df[year_col].min())
58
+ max_year = int(df[year_col].max())
59
  # layout row2
60
  row2_col1, row2_col2 = st.columns(2)
61
  with row2_col1:
 
64
  second_range = st.slider("Second range", min_value = min_year, max_value= max_year, step = 1, value= (min_year, max_year))
65
 
66
  # filter data
67
+ first_range_filter_df = df[(df[year_col] >= first_range[0]) & (df[year_col] <= first_range[1])].copy()
68
  first_range_filter_df['Topic Range'] = 'First range'
69
 
70
+ second_range_filter_df = df[(df[year_col] >= second_range[0]) & (df[year_col] <= second_range[1])].copy()
71
  second_range_filter_df['Topic Range'] = 'Second range'
72
 
73
  filtered_df = pd.concat([first_range_filter_df, second_range_filter_df])
 
101
  df = pd.read_csv(uploaded_file)
102
  abstract_col = 'Abstract'
103
  title_col = 'Title'
104
+ source_title_col = 'Source Title'
105
+ year_col = 'Year'
106
  # preview the uploaded file
107
  elif uploaded_file.name.endswith(".txt"):
108
  df = pd.read_table(uploaded_file, sep='\t') # Doc: assume contents are separated by tabs.
109
  abstract_col = 'AB'
110
  title_col = 'TI'
111
+ source_title_col = 'SO'
112
+ year_col = 'PY'
113
  # preview the uploaded file
114
  else:
115
  st.error("Unsupported file format.")