Standard_Intelligence_Dev

Sleeping

YchKhan committed on Mar 5, 2024

Commit

079e255

verified ·

1 Parent(s): 9ce5b88

move browse_folder to scrape_3gpp.py

Files changed (1) hide show

scrape_3gpp.py CHANGED Viewed

@@ -8,6 +8,20 @@ import zipfile
 import textract
 import gradio as gr
 def scrape(url, excel_file, folder_name,progress=gr.Progress()):
     filenames = []
     # Check if the excel_file argument is provided and if the file exists.

 import textract
 import gradio as gr
+def browse_folder(url):
+    if url.lower().endswith(('docs', 'docs/')):
+      return gr.update(choices=[])
+    response = requests.get(url)
+    response.raise_for_status()  # This will raise an exception if there's an error
+    soup = BeautifulSoup(response.text, 'html.parser')
+    excel_links = [a['href'] + '/' for a in soup.find_all('a', href=True) if a['href'].startswith(url)]
+    return gr.update(choices=excel_links)
 def scrape(url, excel_file, folder_name,progress=gr.Progress()):
     filenames = []
     # Check if the excel_file argument is provided and if the file exists.