import streamlit as st # type: ignore
import numpy as np
import pandas as pd
import seaborn as sns # type: ignore
import matplotlib.pyplot as plt
import base64
import pickle
import time
@st.cache_data
def load_data(dataset):
df = pd.read_csv(dataset)
return df
def filedownload(df):
csv = df.to_csv(index=False)
b64 = base64.b64encode(csv.encode()).decode() # strings <-> bytes conversions
href = f'Download CSV File'
href2 = f''
return href,href2
data = load_data('dataset/brain_stroke.csv')
meanGlucose = data['avg_glucose_level'].mean()
meanBmi = data['bmi'].mean()
meanAge = data['age'].mean()
st.sidebar.image('images/ahat.png',width=280)
def main():
st.markdown("
Streamlit Brain Stroke Prediction App
",unsafe_allow_html=True)
st.markdown("Brain Stroke study in USA
",unsafe_allow_html=True)
menu = ['Home','Analysis','Data Visualization','Machine Learning']
choice = st.sidebar.selectbox('Select Menu', menu)
if choice == 'Home':
left,middle,right = st.columns((2,3,2))
with middle:
col4, col5, col6 = st.columns(3)
with col4:
temp = st.metric(label="Average Glucose Level", value=meanGlucose, delta="From 5010 To 2012")
with col5:
temp = st.metric(label="Average BMI", value=meanBmi, delta="From 2010 To 2012")
with col6:
temp = st.metric(label="Average Age", value=meanAge, delta="From 2010 To 2012")
st.image('images/ahat.png',width=280)
if choice == 'Analysis':
st.subheader('Brain Stroke Dataset')
st.write(data.head())
if st.checkbox('Summary'):
st.write(data.describe())
elif st.checkbox('Correlation'):
fig = plt.figure(figsize=(15,5))
st.write(sns.heatmap(data.corr(),annot=True))
st.pyplot(fig)
elif choice == 'Data Visualization':
if st.checkbox('Countplot'):
fig = plt.figure(figsize=(15,5))
sns.countplot(x='age',data=data)
st.pyplot(fig)
elif st.checkbox('Scatterplot'):
fig = plt.figure(figsize=(15,5))
sns.scatterplot(x='avg_glucose_level',y='age',data=data,hue='stroke')
st.pyplot(fig)
elif choice == 'Machine Learning':
tab1, tab2, tab3 = st.tabs([":clipboard: Data",":bar_chart:✅ Visualisation", "📈🎯 Prediction"])
uploaded_file = st.sidebar.file_uploader('Upload your Dataset(.csv file)',
type=['csv'])
if uploaded_file:
df = load_data(uploaded_file)
with tab1:
st.subheader('Loaded Dataset')
st.write(df)
with tab2:
st.subheader("Heart Disease's Histogram")
fig = plt.figure(figsize=(8,8))
sns.histplot(x='heart_disease',data=data)
st.pyplot(fig)
with tab3:
model = pickle.load(open('./models/gbc_dump.pkl', 'rb')) # Load the trained model from disk
prediction = model.predict(df)
pp = pd.DataFrame(prediction, columns=['Prediction'])
ndf = pd.concat([df, pp], axis=1)
ndf['Prediction'].replace(0, 'No Stroke Risk', inplace=True)
ndf['Prediction'].replace(1, 'Stroke Risk', inplace=True)
st.header("📈🎯 Stroke Risk Prediction")
st.subheader("Predictions")
st.write(ndf)
if st.button(' 💾 Download csv file'):
st.markdown(filedownload(ndf), unsafe_allow_html=True)
if __name__ == '__main__':
main()