Spaces:

SR05
/

Delhi_Irish_visa_decisions

Running

SR05 committed on Nov 20, 2024

Commit

62f4c5f

verified ·

1 Parent(s): 82e2987

Update dataframe.py (#8)

Files changed (1) hide show

dataframe.py CHANGED Viewed

@@ -1,27 +1,28 @@
 import pandas as pd
 import streamlit as st
-def process_dataframe(ods_file):
     try:
         # Read the .ods file into a DataFrame
-        df = pd.read_excel(ods_file, engine='odf')
-        # Clean up unnecessary columns and rows
         df.drop(columns=["Unnamed: 0", "Unnamed: 1"], inplace=True, errors='ignore')
         df.dropna(how='all', inplace=True)
         df.reset_index(drop=True, inplace=True)
-        # Identify and set the header row
         for idx, row in df.iterrows():
             if row['Unnamed: 2'] == 'Application Number' and row['Unnamed: 3'] == 'Decision':
                 df.columns = ['Application Number', 'Decision']
-                df = df.iloc[idx + 1:]
                 break
-        # Convert application numbers to strings
         df.reset_index(drop=True, inplace=True)
-        df['Application Number'] = df['Application Number'].astype(str)
         return df
     except Exception as e:
-        st.error(f"Error processing the data: {e}")
-        return pd.DataFrame()  # Return an empty DataFrame on failure

 import pandas as pd
 import streamlit as st
+def prepare_dataframe(file):
     try:
         # Read the .ods file into a DataFrame
+        df = pd.read_excel(file, engine='odf')
+        # Clean the DataFrame
         df.drop(columns=["Unnamed: 0", "Unnamed: 1"], inplace=True, errors='ignore')
         df.dropna(how='all', inplace=True)
         df.reset_index(drop=True, inplace=True)
+        # Identify the header row and reformat the DataFrame
         for idx, row in df.iterrows():
             if row['Unnamed: 2'] == 'Application Number' and row['Unnamed: 3'] == 'Decision':
                 df.columns = ['Application Number', 'Decision']
+                df = df.iloc[idx + 1:]  # Skip the header row
                 break
+        # Reset the index and convert the Application Number to whitespace-stripped strings
         df.reset_index(drop=True, inplace=True)
+        df['Application Number'] = df['Application Number'].astype(str).str.strip()
         return df
     except Exception as e:
+        st.error(f"Error preparing the DataFrame: {e}")
+        return None