Spaces:
Sleeping
Sleeping
######################################## IMPORTING REQUIRED LIBRARIES #################################### | |
import os | |
import sys | |
import pandas as pd | |
import streamlit as st | |
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))) | |
data_folder = os.path.join(os.path.dirname(os.path.dirname(os.path.abspath(__file__))), 'data') | |
from utilities import get_data, input_filter, clean_data, autogenerate_labels | |
def data_sourcing(left_lat, left_lon, dist, loc_name): | |
lat, lon = input_filter(lat = left_lat, lon=left_lon) | |
df = get_data(lat, lon, dist) | |
df.to_csv(f'{data_folder}/LOCATION_{loc_name}_DATA.csv', index=False) | |
return df | |
def data_clean_for_training(df): | |
df = clean_data(df) | |
df.to_csv(f'{data_folder}/MMR_DATA_CLEAN.csv', index=False) | |
return df | |
st.title("Map Data Analysis - ETL Pipeline") | |
left_lat = st.number_input("Enter the left latitude", value=18.889833) | |
left_lon = st.number_input("Enter the left longitude", value=72.779844) | |
print(left_lat, left_lon) | |
loc_name = st.text_input("Enter the location name", value="Mumbai") | |
dist = st.number_input("Enter the distance", value=35) | |
if st.button("Run ETL Pipeline"): | |
df = data_sourcing(left_lat, left_lon, dist, loc_name) | |
if df: | |
st.write("Data loaded successfully !!") | |
df = clean_data(df) | |
labelled_df, embeddings_df = autogenerate_labels(df) | |
labelled_df.to_csv(f'{data_folder}/DATA_{loc_name}_CLEAN_LABELLED.csv', index=False) | |
embeddings_df.to_csv(f'{data_folder}/DATA_{loc_name}_CLEAN_EMBEDDINGS.csv', index=False) | |
st.write("ETL Pipeline executed successfully !!") |