Spaces:

omdenalagos
/

job_skill_cat

Runtime error

App Files Community

Basanth committed on Jul 15, 2023

Commit

b544d86

1 Parent(s): e5d2c3b

file check added,spinner added

Browse files

Files changed (2) hide show

apps/demo.py +28 -17
src/file_uploader.py +5 -4

apps/demo.py CHANGED Viewed

@@ -13,8 +13,12 @@ model = load_model()
 skill_extractor = load_skill_extractor()
 def app():
-    if 'input_text' not in st.session_state:
-        st.session_state['input_text'] = ''
     st.markdown(f"""<h1
                 style= "text-align:-webkit-center;
@@ -32,15 +36,18 @@ def app():
         identify skill gaps, and prioritize development
         </h1>""",unsafe_allow_html=True)
-    uploaded_file = st.file_uploader("Choose a file",type =['pdf','docx'],label_visibility = "collapsed")
     if uploaded_file is not None:
-            st.session_state['input_text'] = extract_text_from_file(uploaded_file)
     else:
-            st.session_state['input_text'] = ''
     # st.title("Uploaded resume ")
@@ -50,20 +57,24 @@ def app():
         # # input_text = st.text_area('', value=default_text, height=200)
         # submit_button = st.form_submit_button(label="Submit")
-    cls_text = clean_text(st.session_state['input_text'])
-    prob,job_cat = predict_cat(model, cls_text)
-    annotations = skill_extractor.annotate(cls_text,tresh=1)
-    text = annotations['text']
-    annotations = annotations['results']
-    df = create_dfs(annotations)
-    match = get_match(job_cat,df)
     col1, col2,= st.columns(2)
     gaugeData,option = gauge(value=0)
     with st.form(key='result'):
-        if st.session_state['input_text']:
-            gaugeData[0]['value']=match
             with col1:
                 st.markdown(f"""<h1 style= "text-align: -webkit-center;font-family: sans-serif;">Job Category</h1>""", unsafe_allow_html=True)
                 html_str = f"""
@@ -73,7 +84,7 @@ def app():
                                     color: #ff4d4f;
                                     font-family: sans-serif;
                                     font-weight: bold;">
-                                    {job_cat}
                             </div>
                             """
@@ -97,7 +108,7 @@ def app():
                 # st.markdown('-----------')
                 df = create_dfs(annotations)
                 st.markdown(f"""<h1 style= "text-align: -webkit-center;font-family: sans-serif;">Extracted Skill</h1>""",unsafe_allow_html=True)
-                st.write(", \n".join(df))

 skill_extractor = load_skill_extractor()
 def app():
+    session_items = ['input_text','match','job_cat','rerun']
+    if any(session_items) not in st.session_state:
+        st.session_state.input_text = ''
+        st.session_state.job_cat = ''
+        st.session_state.match = 0
+        st.session_state.rerun = False
     st.markdown(f"""<h1
                 style= "text-align:-webkit-center;
         identify skill gaps, and prioritize development
         </h1>""",unsafe_allow_html=True)
+    uploaded_file = st.file_uploader("Choose a file",label_visibility = "collapsed")
     if uploaded_file is not None:
+            st.session_state.input_text,st.session_state.rerun = extract_text_from_file(uploaded_file)
     else:
+        st.session_state.rerun = False
     # st.title("Uploaded resume ")
         # # input_text = st.text_area('', value=default_text, height=200)
         # submit_button = st.form_submit_button(label="Submit")
+    if st.session_state.rerun:
+        with st.spinner('Processing.....'):
+            cls_text = clean_text(st.session_state.input_text)
+            prob,st.session_state.job_cat  = predict_cat(model, cls_text)
+            annotations = skill_extractor.annotate(cls_text,tresh=1)
+            text = annotations['text']
+            annotations = annotations['results']
+            df = create_dfs(annotations)
+            st.session_state.match = get_match(st.session_state.job_cat ,df)
     col1, col2,= st.columns(2)
     gaugeData,option = gauge(value=0)
     with st.form(key='result'):
+        if st.session_state.rerun:
+            gaugeData[0]['value']=st.session_state.match
             with col1:
                 st.markdown(f"""<h1 style= "text-align: -webkit-center;font-family: sans-serif;">Job Category</h1>""", unsafe_allow_html=True)
                 html_str = f"""
                                     color: #ff4d4f;
                                     font-family: sans-serif;
                                     font-weight: bold;">
+                                    {st.session_state.job_cat }
                             </div>
                             """
                 # st.markdown('-----------')
                 df = create_dfs(annotations)
                 st.markdown(f"""<h1 style= "text-align: -webkit-center;font-family: sans-serif;">Extracted Skill</h1>""",unsafe_allow_html=True)
+                st.write(", \n".join(df))

src/file_uploader.py CHANGED Viewed

@@ -25,17 +25,18 @@ def get_file_type(uploaded_file):
     return file_type
 def extract_text_from_file(uploaded_file):
     file_type = get_file_type(uploaded_file)
     # st.write("File type: ", file_type)
     if file_type == 'pdf':
-        return pdf2text(io.BytesIO(uploaded_file.read()))
     elif file_type == 'vnd.openxmlformats-officedocument.wordprocessingml.document':
-        return doc2text(io.BytesIO(uploaded_file.read()))
     else:
-        st.warning("plese upload the correct file type")
-        return ""
 def main():
     uploaded_file = st.file_uploader("Choose a file", type=['pdf', 'docx', 'doc'])

     return file_type
 def extract_text_from_file(uploaded_file):
+    rerun_state = False
     file_type = get_file_type(uploaded_file)
     # st.write("File type: ", file_type)
     if file_type == 'pdf':
+        return pdf2text(io.BytesIO(uploaded_file.read())), True
     elif file_type == 'vnd.openxmlformats-officedocument.wordprocessingml.document':
+        return doc2text(io.BytesIO(uploaded_file.read())),True
     else:
+        st.info("Only PDF and DOCX files are supported.", icon="ℹ️")
+        return "",False
 def main():
     uploaded_file = st.file_uploader("Choose a file", type=['pdf', 'docx', 'doc'])