lizongze hai 1 ano
pai
achega
7df8b6e20b
Modificáronse 4 ficheiros con 1 adición e 4 borrados
  1. 0 1
      ybw/config/conf.yaml
  2. 0 2
      ybw/detail_spider.py
  3. 0 1
      ybw/list_spider.py
  4. 1 0
      ybw/utils/title_participle.py

+ 0 - 1
ybw/config/conf.yaml

@@ -16,7 +16,6 @@ redis:
 
 es:
   host: 172.17.4.184
-#  host: 127.0.0.1
   usename: "jybid"
   pwd: "Top2023_JEB01i@31"
   port: !!int 19905

+ 0 - 2
ybw/detail_spider.py

@@ -4,7 +4,6 @@ import time
 import requests.exceptions
 from lxml.html import fromstring, HtmlElement, tostring
 from lxml.html.clean import Cleaner
-from pymongo.errors import DuplicateKeyError
 
 from crawler.check_utils import CheckText, CheckTask
 from crawler.clean_html import cleaner
@@ -13,7 +12,6 @@ from crawler.login import login, load_login_cookies, login_check
 from utils.databases import mongo_table, int2long
 from utils.execptions import YbwCrawlError
 from utils.log import logger
-from utils.socks5 import Proxy
 
 
 def iter_node(element: HtmlElement):

+ 0 - 1
ybw/list_spider.py

@@ -13,7 +13,6 @@ from crawler.login import login, load_login_cookies, login_session_check
 from utils.databases import mongo_table, int2long, es_query, redis_client
 from utils.execptions import CrawlError, YbwCrawlError
 from utils.log import logger
-from utils.socks5 import Proxy
 from utils.tools import sha1,clean_title
 
 CrawlMenu = namedtuple('CrawlMenu', ['channel', 'spidercode', 'table_type'])

+ 1 - 0
ybw/utils/title_participle.py

@@ -13,6 +13,7 @@ import json
 
 def get_should(title):
 
+    # url = "http://192.168.3.149:9201/_analyze"  # 测试
     url = "http://172.17.4.184:19905/_analyze"  # 线上
     username = "jybid"
     password = "Top2023_JEB01i@31"