The_Music_Of_New_Orleans_MoE

Running

awacke1 committed on Apr 26

Commit

47ed41d

•

1 Parent(s): 5a42dc4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -96,33 +96,37 @@ def parse_to_markdown(text):
 import re
 def extract_urls(text):
-    # Regular expression patterns to find the required fields
-    date_pattern = re.compile(r'### (\d{2} \w{3} \d{4})')
-    abs_link_pattern = re.compile(r'\[(.*?)\]\((https://arxiv\.org/abs/\d+\.\d+)\)')
-    pdf_link_pattern = re.compile(r'\[⬇️\]\((https://arxiv\.org/pdf/\d+\.\d+)\)')
-    title_pattern = re.compile(r'### \d{2} \w{3} \d{4} \| \[(.*?)\]')
-    # Find all occurrences of the required fields using the regular expression patterns
-    date_matches = date_pattern.findall(text)
-    abs_link_matches = abs_link_pattern.findall(text)
-    pdf_link_matches = pdf_link_pattern.findall(text)
-    title_matches = title_pattern.findall(text)
-    # Generate markdown string with the extracted fields
-    markdown_text = ""
-    for i in range(len(date_matches)):
-        date = date_matches[i]
-        title = title_matches[i]
-        abs_link = abs_link_matches[i][1]
-        pdf_link = pdf_link_matches[i]
-        markdown_text += f"**Date:** {date}\n\n"
-        markdown_text += f"**Title:** {title}\n\n"
-        markdown_text += f"**Abstract Link:** [{abs_link}]({abs_link})\n\n"
-        markdown_text += f"**PDF Link:** [{pdf_link}]({pdf_link})\n\n"
-        markdown_text += "---\n\n"
-    return markdown_text

 import re
 def extract_urls(text):
     """Summarise the arXiv entries found in ``text`` as a Markdown string.

     An entry starts at a heading of the form ``### DD Mon YYYY | [Title]``
     and runs until the next such heading (or the end of ``text``). Within
     that span the first ``[...](https://arxiv.org/abs/N.N)`` link is used as
     the abstract link and the first download-arrow link to
     ``https://arxiv.org/pdf/N.N`` is used as the PDF link.

     Each field is looked up inside its own entry rather than by position in
     four independent match lists, so a heading that lacks a link, or an
     extra arXiv link in the body text, cannot shift later entries onto the
     wrong link or discard the whole result.

     Args:
         text: The text to scan.

     Returns:
         One Markdown section per complete entry (date, title, abstract
         link, PDF link, then a ``---`` rule), concatenated in input order.
         Entries missing any of the fields are skipped. Returns ``''`` when
         nothing matches, or when ``text`` is not a string (in which case a
         ``'.'`` is also written via ``st.write``).
     """
     # Regular expression patterns to find the required fields
     date_pattern = re.compile(r'### (\d{2} \w{3} \d{4})')
     abs_link_pattern = re.compile(r'\[(.*?)\]\((https://arxiv\.org/abs/\d+\.\d+)\)')
     pdf_link_pattern = re.compile(r'\[⬇️\]\((https://arxiv\.org/pdf/\d+\.\d+)\)')
     title_pattern = re.compile(r'### \d{2} \w{3} \d{4} \| \[(.*?)\]')

     try:
         headings = list(date_pattern.finditer(text))
     except TypeError:
         # Non-string input: keep the best-effort fallback instead of raising.
         st.write('.')
         return ''

     # Each entry ends where the next heading begins; the last one ends at EOF.
     starts = [heading.start() for heading in headings]
     ends = starts[1:] + [len(text)]

     sections = []
     for heading, start, end in zip(headings, starts, ends):
         # pos/endpos keep every lookup inside this entry's own span.
         title = title_pattern.match(text, start, end)
         abs_link = abs_link_pattern.search(text, start, end)
         pdf_link = pdf_link_pattern.search(text, start, end)
         if title is None or abs_link is None or pdf_link is None:
             # Incomplete entry: skip it rather than misalign the others.
             continue
         abs_url = abs_link.group(2)
         pdf_url = pdf_link.group(1)
         sections.append(
             f"**Date:** {heading.group(1)}\n\n"
             f"**Title:** {title.group(1)}\n\n"
             f"**Abstract Link:** [{abs_url}]({abs_url})\n\n"
             f"**PDF Link:** [{pdf_url}]({pdf_url})\n\n"
             "---\n\n"
         )
     return "".join(sections)