Spaces:
Running
Running
Update trend_crawl2.py
Browse files
- trend_crawl2.py +8 -3
trend_crawl2.py
CHANGED
@@ -161,20 +161,25 @@ def process_li_element(index, li_data, url):
|
|
161 |
"""Process a single li element."""
|
162 |
driver = setup_driver()
|
163 |
try:
|
|
|
164 |
driver.get(url)
|
165 |
WebDriverWait(driver, 20).until(
|
166 |
EC.presence_of_element_located((By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]"))
|
167 |
)
|
168 |
-
|
169 |
ul_element = driver.find_element(By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]")
|
|
|
170 |
li_elements = ul_element.find_elements(By.TAG_NAME, "li")
|
|
|
171 |
selected_li = li_elements[li_data['index']]
|
172 |
-
|
173 |
driver.execute_script("arguments[0].scrollIntoView();", selected_li)
|
|
|
174 |
driver.execute_script("arguments[0].click();", selected_li)
|
175 |
time.sleep(2)
|
176 |
|
177 |
span_content = selected_li.find_element(By.CLASS_NAME, "W7g1Rb-rymPhb-fpDzbe-fmcmS").get_attribute("innerText")
|
|
|
178 |
print(f"LI {li_data['index']} clicked: {span_content}")
|
179 |
|
180 |
data = scrape_google_trends(driver)
|
@@ -190,7 +195,7 @@ def crawl_url(url):
|
|
190 |
driver = setup_driver()
|
191 |
result_dict = {}
|
192 |
try:
|
193 |
-
|
194 |
driver.get(url)
|
195 |
WebDriverWait(driver, 20).until(
|
196 |
EC.presence_of_element_located((By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]"))
|
|
|
161 |
"""Process a single li element."""
|
162 |
driver = setup_driver()
|
163 |
try:
|
164 |
+
print("driver.get")
|
165 |
driver.get(url)
|
166 |
WebDriverWait(driver, 20).until(
|
167 |
EC.presence_of_element_located((By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]"))
|
168 |
)
|
169 |
+
print("1")
|
170 |
ul_element = driver.find_element(By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]")
|
171 |
+
print("2")
|
172 |
li_elements = ul_element.find_elements(By.TAG_NAME, "li")
|
173 |
+
print("2")
|
174 |
selected_li = li_elements[li_data['index']]
|
175 |
+
print("2")
|
176 |
driver.execute_script("arguments[0].scrollIntoView();", selected_li)
|
177 |
+
print("3")
|
178 |
driver.execute_script("arguments[0].click();", selected_li)
|
179 |
time.sleep(2)
|
180 |
|
181 |
span_content = selected_li.find_element(By.CLASS_NAME, "W7g1Rb-rymPhb-fpDzbe-fmcmS").get_attribute("innerText")
|
182 |
+
print("4")
|
183 |
print(f"LI {li_data['index']} clicked: {span_content}")
|
184 |
|
185 |
data = scrape_google_trends(driver)
|
|
|
195 |
driver = setup_driver()
|
196 |
result_dict = {}
|
197 |
try:
|
198 |
+
|
199 |
driver.get(url)
|
200 |
WebDriverWait(driver, 20).until(
|
201 |
EC.presence_of_element_located((By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]"))
|