|
@@ -137,8 +137,7 @@ class Spider(BaseParser, Thread):
|
|
self._heartbeat_buffer.stop() # 关闭 heartbeat_buffer
|
|
self._heartbeat_buffer.stop() # 关闭 heartbeat_buffer
|
|
|
|
|
|
# 关闭 webdriver
|
|
# 关闭 webdriver
|
|
- if Request.webdriver_pool:
|
|
|
|
- Request.webdriver_pool.close()
|
|
|
|
|
|
+ Request.render_downloader and Request.render_downloader.close_all()
|
|
|
|
|
|
log.info("无任务,爬虫结束")
|
|
log.info("无任务,爬虫结束")
|
|
break
|
|
break
|
|
@@ -214,6 +213,7 @@ class BaseBusinessDetailSpider(Spider):
|
|
yield failed_item
|
|
yield failed_item
|
|
|
|
|
|
def get_tasks(self, limit=None, **kwargs):
|
|
def get_tasks(self, limit=None, **kwargs):
|
|
|
|
+ show_log = kwargs.pop("show_log", False)
|
|
timeout = kwargs.pop("timeout", 10)
|
|
timeout = kwargs.pop("timeout", 10)
|
|
queue = setting.TAB_ITEMS.format(redis_key=self._redis_key.replace("_detailc", ""))
|
|
queue = setting.TAB_ITEMS.format(redis_key=self._redis_key.replace("_detailc", ""))
|
|
|
|
|
|
@@ -221,8 +221,8 @@ class BaseBusinessDetailSpider(Spider):
|
|
url = f"{setting.JY_TASK_URL}/tasks/fd?qn={queue}&limit={limit}"
|
|
url = f"{setting.JY_TASK_URL}/tasks/fd?qn={queue}&limit={limit}"
|
|
headers = {"Authorization": self.task_api_auth_token}
|
|
headers = {"Authorization": self.task_api_auth_token}
|
|
params = dict(headers=headers, timeout=timeout, proxies=False)
|
|
params = dict(headers=headers, timeout=timeout, proxies=False)
|
|
- response = Request(method="GET", url=url, **params).get_response()
|
|
|
|
- ret = response.json["task"]
|
|
|
|
|
|
+ r = Request(method="GET", url=url, **params).get_response(show_log=show_log)
|
|
|
|
+ ret = r.json["task"]
|
|
self.tasks_dict = {
|
|
self.tasks_dict = {
|
|
"token": self.task_api_auth_token,
|
|
"token": self.task_api_auth_token,
|
|
"data": {t["pyuuid"]: {"tid": t["tid"], "queue": queue} for t in ret}
|
|
"data": {t["pyuuid"]: {"tid": t["tid"], "queue": queue} for t in ret}
|