dongzhaorui 3 年之前
父節點
當前提交
72332bccd9
共有 1 個文件被更改,包括 4 次插入和 1 次删除
  1. 4 1
      find_source/crawler/analysis/DomAnalysis.py

+ 4 - 1
find_source/crawler/analysis/DomAnalysis.py

@@ -50,7 +50,10 @@ class DomAnalysis(FilterUrl):
                 name = "{:.50s}".format(name)
             if tag.get('href') is None:
                 return
-            href = self.filter(tag.get('href'))
+            try:
+                href = self.filter(tag.get('href'))
+            except ValueError:
+                return
             data = {'name': name, 'host': href}
             if data not in items:
                 items.append(data)