# __init__.py (551 B)

import threading

from crawler.spiders import DataExcavate, SearchEngine, SyncData
  3. class BreadthCrawler:
  4. def __init__(self, engines=None, **kwargs):
  5. SyncData(**kwargs)
  6. self._engines = SearchEngine(engines, **kwargs)
  7. self._excavator = DataExcavate(**kwargs)
  8. def start(self):
  9. threading.Thread(
  10. target=self._engines.start,
  11. name='MainSearchEngine'
  12. ).start()
  13. threading.Thread(
  14. target=self._excavator.start,
  15. name='MainSearchVisit'
  16. ).start()