forked from iCON/CrawlerEngines
bug fix
parent
36353926de
commit
3d0e534375
|
|
@@ -161,11 +161,18 @@ class Crawler_NewsCN:
|
||||||
WebDriverWait(self.driver, 10).until(EC.title_contains("Xinhua"))
|
WebDriverWait(self.driver, 10).until(EC.title_contains("Xinhua"))
|
||||||
# time.sleep(1)
|
# time.sleep(1)
|
||||||
|
|
||||||
region_code = urllib.parse.urlparse(url).path.split("/")[1]
|
# 特殊情况:https://german.news.cn/20241016/93ca92839e1b44dc8f6dca21f9c80902/c.html
|
||||||
if region_code in XINHUA_OVERSEAS_REGIONS:
|
# region_code = urllib.parse.urlparse(url).path.split("/")[1]
|
||||||
blog = self.__retrieve_overseas_blog()
|
# if region_code in XINHUA_OVERSEAS_REGIONS:
|
||||||
else:
|
# blog = self.__retrieve_overseas_blog()
|
||||||
|
# else:
|
||||||
|
# blog = self.__retrieve_china_blog()
|
||||||
|
|
||||||
|
if self.driver.find_elements(By.CLASS_NAME, "conBox"):
|
||||||
blog = self.__retrieve_china_blog()
|
blog = self.__retrieve_china_blog()
|
||||||
|
else:
|
||||||
|
if self.driver.find_elements(By.CLASS_NAME, "main.clearfix"):
|
||||||
|
blog = self.__retrieve_overseas_blog()
|
||||||
|
|
||||||
# div = WebDriverWait(self.driver, 10).until(
|
# div = WebDriverWait(self.driver, 10).until(
|
||||||
# EC.presence_of_element_located((By.CLASS_NAME, "detailContent"))
|
# EC.presence_of_element_located((By.CLASS_NAME, "detailContent"))
|
||||||
|
|
|
||||||
|
|
@@ -20,8 +20,8 @@ class submit_test:
|
||||||
# # # 创建一个测试队列:10000 / BBCSearch
|
# # # 创建一个测试队列:10000 / BBCSearch
|
||||||
submit_test.submit(10000, {"keyword": "习近平"})
|
submit_test.submit(10000, {"keyword": "习近平"})
|
||||||
submit_test.submit(10000, {"keyword": "US election"})
|
submit_test.submit(10000, {"keyword": "US election"})
|
||||||
# submit_test.submit(10000, {"keyword": "US election"})
|
submit_test.submit(10000, {"keyword": "Yahya Sinwar"})
|
||||||
# submit_test.submit(10000, {"keyword": "US election"})
|
submit_test.submit(10000, {"keyword": "Bin Laden"})
|
||||||
|
|
||||||
# # 创建一个测试队列:11000 / Wikipedia
|
# # 创建一个测试队列:11000 / Wikipedia
|
||||||
# submit_test.submit(11000, {"keyword": keyword})
|
# submit_test.submit(11000, {"keyword": keyword})
|
||||||
|
|
@@ -31,4 +31,8 @@ submit_test.submit(10000, {"keyword": "US election"})
|
||||||
|
|
||||||
# 创建一个测试队列:13000 / Crawler_NewsCN 新华网英文站在线搜索
|
# 创建一个测试队列:13000 / Crawler_NewsCN 新华网英文站在线搜索
|
||||||
submit_test.submit(13000, {"keyword": "china", "lang": "en"})
|
submit_test.submit(13000, {"keyword": "china", "lang": "en"})
|
||||||
|
submit_test.submit(13000, {"keyword": "fujian", "lang": "en"})
|
||||||
|
submit_test.submit(13000, {"keyword": "shenzhen", "lang": "en"})
|
||||||
submit_test.submit(13000, {"keyword": "中国", "lang": "cn"})
|
submit_test.submit(13000, {"keyword": "中国", "lang": "cn"})
|
||||||
|
submit_test.submit(13000, {"keyword": "吴邦国", "lang": "cn"})
|
||||||
|
submit_test.submit(13000, {"keyword": "李强", "lang": "cn"})
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue