|
@@ -105,13 +105,17 @@ class TitleChecker(object):
|
|
|
return True
|
|
|
#标题以异常字符结尾
|
|
|
#re.search()匹配整个字符串,并返回第一个成功的匹配,如果匹配失败,则返回None
|
|
|
- with open(abnormal_config["table_field_config"]["path5"], "r") as f:
|
|
|
- reads = csv.reader(f)
|
|
|
- for w in reads:
|
|
|
- ret=re.search(f"{w[0]}$", title)
|
|
|
- if ret != None:
|
|
|
- return True
|
|
|
+ # with open(abnormal_config["table_field_config"]["path5"], "r") as f:
|
|
|
+ # reads = csv.reader(f)
|
|
|
+ # for w in reads:
|
|
|
+ # ret=re.search(f"{w[0]}$", title)
|
|
|
+ # if (ret!= None) or (ret.group() == w[0]):
|
|
|
+ # return True
|
|
|
+ p2 = re.search("[nbsp\..\...\.]$",title)
|
|
|
+ #re.search():匹配整个字符串,并返回第一个成功的匹配,如果匹配失败,则返回None
|
|
|
+ if p2!=None:
|
|
|
+ return True
|
|
|
#标题以异常字符开始
|
|
|
- p1 = re.compile(r"^[3|6|7|8|0|\.]")
|
|
|
- if p1.match(title):
|
|
|
+ p1 = re.search("^[36780\.]",title)
|
|
|
+ if p1!=None:
|
|
|
return True
|