Add1E committed on
Commit
c63c43e
·
verified ·
1 Parent(s): b7c50f4

Update trend_crawl2.py

Browse files
Files changed (1) hide show
  1. trend_crawl2.py +8 -3
trend_crawl2.py CHANGED
@@ -161,20 +161,25 @@ def process_li_element(index, li_data, url):
161
  """Process a single li element."""
162
  driver = setup_driver()
163
  try:
 
164
  driver.get(url)
165
  WebDriverWait(driver, 20).until(
166
  EC.presence_of_element_located((By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]"))
167
  )
168
-
169
  ul_element = driver.find_element(By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]")
 
170
  li_elements = ul_element.find_elements(By.TAG_NAME, "li")
 
171
  selected_li = li_elements[li_data['index']]
172
-
173
  driver.execute_script("arguments[0].scrollIntoView();", selected_li)
 
174
  driver.execute_script("arguments[0].click();", selected_li)
175
  time.sleep(2)
176
 
177
  span_content = selected_li.find_element(By.CLASS_NAME, "W7g1Rb-rymPhb-fpDzbe-fmcmS").get_attribute("innerText")
 
178
  print(f"LI {li_data['index']} clicked: {span_content}")
179
 
180
  data = scrape_google_trends(driver)
@@ -190,7 +195,7 @@ def crawl_url(url):
190
  driver = setup_driver()
191
  result_dict = {}
192
  try:
193
- print("driver.get")
194
  driver.get(url)
195
  WebDriverWait(driver, 20).until(
196
  EC.presence_of_element_located((By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]"))
 
161
  """Process a single li element."""
162
  driver = setup_driver()
163
  try:
164
+ print("driver.get")
165
  driver.get(url)
166
  WebDriverWait(driver, 20).until(
167
  EC.presence_of_element_located((By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]"))
168
  )
169
+ print("1")
170
  ul_element = driver.find_element(By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]")
171
+ print("2")
172
  li_elements = ul_element.find_elements(By.TAG_NAME, "li")
173
+ print("2")
174
  selected_li = li_elements[li_data['index']]
175
+ print("2")
176
  driver.execute_script("arguments[0].scrollIntoView();", selected_li)
177
+ print("3")
178
  driver.execute_script("arguments[0].click();", selected_li)
179
  time.sleep(2)
180
 
181
  span_content = selected_li.find_element(By.CLASS_NAME, "W7g1Rb-rymPhb-fpDzbe-fmcmS").get_attribute("innerText")
182
+ print("4")
183
  print(f"LI {li_data['index']} clicked: {span_content}")
184
 
185
  data = scrape_google_trends(driver)
 
195
  driver = setup_driver()
196
  result_dict = {}
197
  try:
198
+
199
  driver.get(url)
200
  WebDriverWait(driver, 20).until(
201
  EC.presence_of_element_located((By.XPATH, "//ul[contains(@aria-label, 'Kategorie') or contains(@aria-label, 'Category')]"))