Spaces:
Building
Building
Update app.py
Browse files
app.py
CHANGED
@@ -49,7 +49,7 @@ def fetch_sitemap_urls_from_xml(sitemap_url, domain, recursive=False):
|
|
49 |
try:
|
50 |
response = requests.get(sitemap_url, headers={"User-Agent": "SiteFocusTool/1.0"}, timeout=10)
|
51 |
response.raise_for_status()
|
52 |
-
soup = BeautifulSoup(response.content, "xml")
|
53 |
if soup.find_all("sitemap"):
|
54 |
for sitemap in soup.find_all("sitemap"):
|
55 |
loc = sitemap.find("loc").text
|
|
|
49 |
try:
|
50 |
response = requests.get(sitemap_url, headers={"User-Agent": "SiteFocusTool/1.0"}, timeout=10)
|
51 |
response.raise_for_status()
|
52 |
+
soup = BeautifulSoup(response.content, "lxml-xml") # Use lxml parser
|
53 |
if soup.find_all("sitemap"):
|
54 |
for sitemap in soup.find_all("sitemap"):
|
55 |
loc = sitemap.find("loc").text
|