Spaces:

Penguni
/

Analyze-and-predict-student-performance

Running

App Files Files Community

Analyze-and-predict-student-performance / app.py

Penguni

Rename main.py to app.py

d9a2d12 over 1 year ago

raw

history blame

10.3 kB

	import pandas as pd
	import streamlit as st
	import plotly.express as px
	import numpy as np
	import plotly.graph_objs as go
	from function import process_data,predict_late_student, predict_rank,predict_one_student
	from datetime import datetime
	from PIL import Image
	import base64
	from io import BytesIO


	# Module-level placeholder frame; the Dashboard branch further down rebinds
	# `df` to the output of process_data(raw_data) before it is used.
	df = pd.DataFrame()


	def color_cell(val):
	    """Return the CSS ``color`` declaration used to style one table cell.

	    The script passes this function to ``Styler.applymap``, so it is called
	    once per cell with that cell's value.

	    Args:
	        val: The cell value. Only the exact strings ``"not late"``,
	            ``"may late"`` and ``"late"`` get a dedicated colour.

	    Returns:
	        A string of the form ``"color: <name>"``. Any other value (numbers,
	        other text, missing values) maps to ``"color: black"``.
	    """
	    status_colors = {
	        "not late": "green",
	        "may late": "yellow",
	        "late": "red",
	    }
	    # Only strings can match a status label; the isinstance guard also keeps
	    # unhashable or NA-like cell values away from the dict lookup.
	    color = status_colors.get(val, "black") if isinstance(val, str) else "black"
	    return f"color: {color}"


	def get_year(student_id):
	    """Extract the two-digit number stored at positions 6-7 of a student ID.

	    The Predict branch of the script adds 2000 to the result and treats it
	    as a year.

	    Args:
	        student_id: The student ID. It is converted with ``str`` first so
	            that IDs parsed as numbers can still be sliced.

	    Returns:
	        ``int`` value of characters 6 and 7 (0-based) of the ID.

	    Raises:
	        ValueError: If that slice is empty (ID too short) or not numeric.
	    """
	    return int(str(student_id)[6:8])


	def generate_comment(median, course=None):
	    """Build the one-sentence remark shown above the course charts.

	    Args:
	        median: Median score of the selected course. A NaN median (which
	            ``Series.median()`` returns for an empty series) yields a
	            "no scores" message instead of being ranked.
	        course: Course name to mention. When omitted, the module-level
	            ``course`` variable set by the Dashboard selector is used, which
	            is what the original single-argument call relied on.

	    Returns:
	        The comment string. Thresholds: below 30 "quite low", below 50
	        "below average", below 80 "solid", otherwise "outstanding".
	    """
	    import math

	    if course is None:
	        # Backward compatibility: existing callers pass only the median and
	        # expect the globally selected course name to be picked up.
	        course = globals().get("course", "this course")

	    # Every `<` comparison with NaN is False, so without this guard an empty
	    # course would be reported as "outstanding at nan".
	    if isinstance(median, float) and math.isnan(median):
	        return f"No scores are available for {course}."

	    if median < 30:
	        comment = f"The median score for {course} is quite low at {median}. Students may need to work harder to improve their performance."
	    elif median < 50:
	        comment = f"The median score for {course} is below average at {median}. Students should work on improving their understanding of the material."
	    elif median < 80:
	        comment = f"The median score for {course} is solid at {median}. Students are making good progress but could still work on improving their skills."
	    else:
	        comment = f"The median score for {course} is outstanding at {median}. Students are doing an excellent job in this course."
	    return comment

	# Logo file, used both as the browser-tab icon and as the header image.
	favicon = 'R.png'

	# Streamlit requires the page configuration to be set before other
	# Streamlit commands are issued.
	st.set_page_config(
	    page_title='Student System',
	    page_icon=favicon,
	    layout='wide',
	)
	# Read later by the Predict branch when filtering cohorts by year.
	currentYear = datetime.now().year
	im1 = Image.open(favicon)

	# Two-column header with a 1:3 width ratio: logo on the left, title on the
	# right.
	col1, col2 = st.columns([1, 3])

	with col1:
	    st.image(im1, width=150)

	with col2:
	    st.title("Student Performance Prediction System")


	# Raw score data is read from a CSV file that ships next to the script.
	#
	# A file-uploader variant is kept here, disabled, for reference:
	#
	#     uploaded_file = st.file_uploader("Choose a score file", type=["xlsx", "csv"])
	#
	#     if uploaded_file is not None:
	#         file_contents = uploaded_file.read()
	#         file_ext = uploaded_file.name.split(".")[-1].lower()  # Get the file extension
	#
	#         if file_ext == "csv":
	#             df = pd.read_csv(BytesIO(file_contents))
	#         elif file_ext in ["xls", "xlsx"]:
	#             df = pd.read_excel(BytesIO(file_contents))
	#         else:
	#             st.error("Invalid file format. Please upload a CSV or Excel file.")
	#
	#     raw_data = df.copy()
	raw_data = pd.read_csv("All_major.csv")

	# Sidebar: a heading plus a select box that picks which page of the app
	# ("Dashboard" or "Predict") the rest of the script renders.
	option = ["Dashboard", "Predict"]
	st.sidebar.title("Analysis Tool")
	tabs = st.sidebar.selectbox(label="Select an option", options=option)


	# Render the page chosen in the sidebar.
	#
	# "Dashboard": narrow the processed score table by major, school and year,
	#              then show a comment, a histogram, a box plot and a per-term
	#              mean line chart for one selected course.
	# "Predict":   run the prediction helpers on dataScore.csv and show either a
	#              single student's result or a per-year cohort summary.
	if tabs == "Dashboard":
	    df = process_data(raw_data)

	    # --- Filter 1: major -------------------------------------------------
	    unique_values_major = df["Major"].unique()
	    major = st.selectbox("Select a major:", unique_values_major)
	    if major == "All":
	        # If so, display the entire DataFrame
	        filtered_df = df.copy()
	    else:
	        # Otherwise, filter the DataFrame based on the selected value and
	        # drop course columns that are empty for that selection.
	        # NOTE(review): the source lost its indentation; dropna is assumed
	        # to belong to this branch (same for the two filters below).
	        filtered_df = df[df["Major"] == major]
	        filtered_df = filtered_df.dropna(axis=1, how="all")

	    # --- Filter 2: school ------------------------------------------------
	    df = filtered_df
	    unique_values = df["MaSV_school"].unique()
	    all_values = np.concatenate([["All"], unique_values])
	    school = st.selectbox("Select a school:", all_values)
	    if school == "All":
	        filtered_df = df.copy()
	    else:
	        filtered_df = df[df["MaSV_school"] == school]
	        filtered_df = filtered_df.dropna(axis=1, how="all")

	    # --- Filter 3: year --------------------------------------------------
	    df = filtered_df
	    unique_values_year = df["Year"].unique()
	    all_values_year = np.concatenate([["All"], unique_values_year])
	    year = st.selectbox("Select a year:", all_values_year)

	    if year == "All":
	        filtered_df = df.copy()
	    else:
	        # Concatenating with "All" turns the options into strings, so the
	        # comparison is done on the string form of the column.
	        # NOTE(review): this keeps the filter working if "Year" is numeric;
	        # confirm the dtype produced by process_data.
	        filtered_df = df[df["Year"].astype(str) == str(year)]
	        filtered_df = filtered_df.dropna(axis=1, how="all")

	    df = filtered_df

	    # Every column except the last three is offered as a course.
	    # NOTE(review): presumably the last three are Major / MaSV_school /
	    # Year; verify against process_data.
	    options = df.columns[:-3]
	    course = st.selectbox("Select a course:", options)

	    # Scores of the selected course, without missing values.
	    course_data = df[course].dropna()

	    # generate_comment reads the module-level `course` set just above.
	    st.write(generate_comment(course_data.median()))

	    st.write("Course:", course, " of ", school," student" )

	    col1, col2, col3 = st.columns(3)

	    with col1:
	        fig = go.Figure()
	        fig.add_trace(
	            go.Histogram(
	                x=course_data, nbinsx=40, name="Histogram"
	            )
	        )
	        fig.update_layout(
	            title="Histogram of Scores for {}".format(course),
	            xaxis_title="Score",
	            yaxis_title="Count",
	            height=400,
	            width=400
	        )
	        st.plotly_chart(fig)

	    with col2:
	        fig = go.Figure()
	        fig.add_trace(
	            go.Box(
	                y=course_data, name="Box plot"
	            )
	        )
	        fig.update_layout(
	            title="Box plot of Scores for {}".format(course),
	            yaxis_title="Score",
	            height=400,
	            width=400
	        )
	        st.plotly_chart(fig)

	    with col3:
	        # This chart is built from the raw rows and applies only the school
	        # filter (not major or year).
	        raw_data['MaSV_school'] = raw_data['MaSV'].str.slice(2, 4)
	        if school == "All":
	            data = raw_data.copy()
	        else:
	            data = raw_data[raw_data["MaSV_school"] == school]
	        df1 = data[['TenMH','NHHK','DiemHP']].copy()
	        # Non-numeric scores become NaN and are ignored by the mean.
	        df1['DiemHP'] = pd.to_numeric(df1['DiemHP'], errors='coerce')
	        # Split the NHHK code after its first four characters: "<4 chars> S <rest>".
	        df1['NHHK'] = df1['NHHK'].apply(lambda x: str(x)[:4] + ' S ' + str(x)[4:])
	        # The raw 'TenMH' values are matched with a leading space.
	        selected_TenMH = " " + course
	        filtered_df1 = df1[df1['TenMH'] == selected_TenMH]
	        mean_DiemHP = filtered_df1.groupby('NHHK')['DiemHP'].mean().round(1).reset_index(name='Mean')
	        # Create Plotly line graph
	        fig = px.line(mean_DiemHP, x='NHHK', y='Mean', title=f"Mean DiemHP for{selected_TenMH} thought period")
	        fig.update_layout(
	            height=400,
	            width=400)
	        st.plotly_chart(fig)

	# predict student
	elif tabs == "Predict":
	    try:
	        raw_data = pd.read_csv("dataScore.csv")
	        predict = predict_late_student(raw_data)
	        rank = predict_rank(raw_data)

	        predict = pd.merge(predict, rank, on="MaSV")
	        # Translate the predicted rank labels to English for display.
	        rank_mapping = {
	            "Khá": "Good",
	            "Trung Bình Khá": "Average good",
	            "Giỏi": "Very good",
	            "Kém": "Very weak",
	            "Trung Bình": "Ordinary",
	            "Yếu": "Weak",
	            "Xuất Sắc": "Excellent",
	        }
	        # Assign the result back instead of calling replace(inplace=True) on
	        # the selected column: the chained in-place form is deprecated and
	        # does not update the frame under pandas Copy-on-Write.
	        predict["Pred Rank"] = predict["Pred Rank"].replace(rank_mapping)

	        MaSV = st.text_input("Enter Student ID:")
	        if MaSV:
	            # Single-student view.
	            df_filtered = predict[predict["MaSV"] == MaSV]
	            styled_table = (
	                df_filtered[["MaSV", "GPA", "Mean_Cre", "Pred Rank", "Result", "Period"]]
	                .style.applymap(color_cell)
	                .format({"GPA": "{:.2f}", "Mean_Cre": "{:.1f}", "Period": "{:.1f}"})
	            )

	            with st.container():
	                st.write(styled_table)
	                # NOTE(review): assumed to render inside the container;
	                # the original nesting was lost with the indentation.
	                predict_one_student(raw_data, MaSV)
	        else:
	            # Cohort view: derive the year from the student ID without
	            # mutating `predict`.
	            # Previously considered filter, kept for reference:
	            # df_late = predict[(predict['Pred Rank'] == 'Yếu') | (predict['Pred Rank'] == 'Kém')]
	            df_late = predict.assign(Year=2000 + predict["MaSV"].apply(get_year))
	            # Exclude the cohorts whose year is one or two years before the
	            # current year.
	            df_late = df_late[
	                (df_late["Year"] != currentYear - 1) & (df_late["Year"] != currentYear - 2)
	            ]
	            year = st.selectbox("Select Year", options=df_late["Year"].unique())
	            df_filtered = df_late[df_late["Year"] == year]
	            styled_table = (
	                df_filtered[["MaSV", "GPA", "Mean_Cre", "Pred Rank", "Result", "Period"]]
	                .style.applymap(color_cell)
	                .format({"GPA": "{:.2f}", "Mean_Cre": "{:.2f}", "Period": "{:.2f}"})
	            )

	            # Offer the filtered rows as a CSV download through a data URI.
	            csv = df_filtered.to_csv(index=False)
	            b64 = base64.b64encode(csv.encode()).decode()
	            href = f'<a href="data:file/csv;base64,{b64}" download="Preidct data.csv">Download CSV</a>'
	            st.markdown(href, unsafe_allow_html=True)

	            fig1 = px.pie(
	                df_filtered,
	                names="Pred Rank",
	                title="Pred Rank",
	                color_discrete_sequence=px.colors.sequential.Mint,
	                height=400,
	                width=400,
	            )
	            fig2 = px.pie(
	                df_filtered,
	                names="Result",
	                title="Result",
	                color_discrete_sequence=px.colors.sequential.Peach,
	                height=400,
	                width=400,
	            )
	            # Centre both chart titles.
	            fig1.update_layout(
	                title={
	                    "text": "Pred Rank",
	                    "y": 0.95,
	                    "x": 0.5,
	                    "xanchor": "center",
	                    "yanchor": "top",
	                }
	            )
	            fig2.update_layout(
	                title={
	                    "text": "Result",
	                    "y": 0.95,
	                    "x": 0.5,
	                    "xanchor": "center",
	                    "yanchor": "top",
	                }
	            )
	            st.dataframe(styled_table)

	            # display the two pie charts side by side
	            col1, col2 = st.columns([1, 1])
	            with col1:
	                st.plotly_chart(fig1)
	            with col2:
	                st.plotly_chart(fig2)

	    except Exception:
	        # `except Exception` instead of a bare `except:` so that
	        # BaseException-derived control-flow signals (KeyboardInterrupt,
	        # SystemExit, ...) are no longer swallowed.
	        st.write('Add CSV to analysis')