1 rok temu · e4fd28c25d
--- a/a2s-0.0.2-py3-none-any.whl
+++ b/a2s-0.0.2-py3-none-any.whl
--- a/client.py
+++ b/client.py
--- a/docs/config.py
+++ b/docs/config.py
@@ -27,6 +27,8 @@ abnormal_config = {
 
				         "path2": "./docs/table_head_doc/abnormal_buyer_contain.csv",
			
 
				         "path3": "./docs/table_head_doc/abnormal_buyer_end.csv",
			
 
				         "path4": "./docs/table_head_doc/projectcode.csv",
			
 
				+        "path5": "./docs/table_head_doc/title_abnormal.csv",
			
 
				+        "path6": "./docs/table_head_doc/title_abnormal_contain.csv",
			
 
				     }}
			
 
				 
			
 
				 # 调试
			
--- a/docs/table_head_doc/general_label.csv
+++ b/docs/table_head_doc/general_label.csv
@@ -1,128 +1,126 @@
 
				-"采购计划任务"
			
 
				-"采购公告"
			
 
				-"招标文件预公示"
			
 
				-"招标预公告"
			
 
				-"计划招标公告"
			
 
				-"调研公告"
			
 
				-"预申公告"
			
 
				-"预审文件"
			
 
				-"预审公告更正公告"
			
 
				-"预审结果"
			
 
				-"预审结果公示"
			
 
				-"预审结果"
			
 
				-"预审结果的公示"
			
 
				-"预审结果变更"
			
 
				-"论证意见公示"
			
 
				-"需求论证公示"
			
 
				-"征求意见公告"
			
 
				-"进口产品公示"
			
 
				-"需求公告"
			
 
				-"直接采购公告"
			
 
				-"需求公示"
			
 
				-"采购公告"
			
 
				-"采购项目"
			
 
				-"项目公告"
			
 
				-"招标公告"
			
 
				-"意向公开"
			
 
				-"比选公告"
			
 
				-"邀请公告"
			
 
				-"采购邀请"
			
 
				-"邀请书"
			
 
				-"邀请函"
			
 
				-"询价采购"
			
 
				-"询价公告"
			
 
				-"比价公告"
			
 
				-"比价项目公告"
			
 
				-"建设项目"
			
 
				-"中标（成交）公告"
			
 
				-"服务"
			
 
				-"项目"
			
 
				-"合同公告"
			
 
				-"比价项目公告"
			
 
				-"比质比价"
			
 
				-"比质比价公告"
			
 
				-"询价采购公告"
			
 
				-"询价书"
			
 
				-"询价单"
			
 
				-"询价采购"
			
 
				-"公开询价"
			
 
				-"询价邀请书"
			
 
				-"竞价交易公告"
			
 
				-"竞价公告"
			
 
				-"竞价项目"
			
 
				-"竞价的公告"
			
 
				-"竞价采购公告"
			
 
				-"变更公告"
			
 
				-"更正公告"
			
 
				-"暂停公告"
			
 
				-"候选人公示"
			
 
				-"候选人公示"
			
 
				-"结果公告"
			
 
				-"结果公示"
			
 
				-"服务项目"
			
 
				-"成交公告"
			
 
				-"中选人公示"
			
 
				-"中选结果公示"
			
 
				-"中标公示"
			
 
				-"中标公告"
			
 
				-"成交公示"
			
 
				-"废标公告"
			
 
				-"终止公告"
			
 
				-"异常公告"
			
 
				-"流标公告"
			
 
				-"失败公告"
			
 
				-"合同公告"
			
 
				-"合同信息"
			
 
				-"采购合同"
			
 
				-"销售合同"
			
 
				-"集成合同"
			
 
				-"项目合同"
			
 
				-"合同公示"
			
 
				-"服务合同"
			
 
				-"验收公告"
			
 
				-"验收单公示"
			
 
				-"标段"
			
 
				-"单一来源采购公示"
			
 
				-"考试培训"
			
 
				-"比价单"
			
 
				-"项目询价"
			
 
				-"采购项目"
			
 
				-"询价"
			
 
				-"竞争性谈判"
			
 
				-"竞争性磋商"
			
 
				-"单一来源"
			
 
				-"竞价处置公告"
			
 
				-"网上竞价"
			
 
				-"结果公告"
			
 
				-"结果公示"
			
 
				-"中标公示"
			
 
				-"中标公告"
			
 
				-"公告"
			
 
				-"合同"
			
 
				-"评审失败"
			
 
				-"招标失败"
			
 
				-"比选失败"
			
 
				-"采购失败"
			
 
				-"流标公示"
			
 
				-"项目合同"
			
 
				-"验收结果"
			
 
				-"验收公告"
			
 
				-"行政处罚"
			
 
				-"违约行为"
			
 
				-"投诉"
			
 
				-"不良行为"
			
 
				-"协议书"
			
 
				-"候选人"
			
 
				-"购置"
			
 
				-"公示"
			
 
				-"建设"
			
 
				-"中标"
			
 
				-"招标"
			
 
				-"工程"
			
 
				-"采购"
			
 
				-"成交通知书"
			
 
				-"公告公告"
			
 
				-"项目项目"
			
 
				-"合同合同"
			
 
				-"nbsp"
			
 
				-"..."
			
 
				+采购计划任务
			
 
				+采购公告
			
 
				+招标文件预公示
			
 
				+招标预公告
			
 
				+计划招标公告
			
 
				+调研公告
			
 
				+预申公告
			
 
				+预审文件
			
 
				+预审公告更正公告
			
 
				+预审结果
			
 
				+预审结果公示
			
 
				+预审结果
			
 
				+预审结果的公示
			
 
				+预审结果变更
			
 
				+论证意见公示
			
 
				+需求论证公示
			
 
				+征求意见公告
			
 
				+进口产品公示
			
 
				+需求公告
			
 
				+直接采购公告
			
 
				+需求公示
			
 
				+采购公告
			
 
				+采购项目
			
 
				+项目公告
			
 
				+招标公告
			
 
				+意向公开
			
 
				+比选公告
			
 
				+邀请公告
			
 
				+采购邀请
			
 
				+邀请书
			
 
				+邀请函
			
 
				+询价采购
			
 
				+询价公告
			
 
				+比价公告
			
 
				+比价项目公告
			
 
				+建设项目
			
 
				+中标（成交）公告
			
 
				+服务
			
 
				+项目
			
 
				+合同公告
			
 
				+比价项目公告
			
 
				+比质比价
			
 
				+比质比价公告
			
 
				+询价采购公告
			
 
				+询价书
			
 
				+询价单
			
 
				+询价采购
			
 
				+公开询价
			
 
				+询价邀请书
			
 
				+竞价交易公告
			
 
				+竞价公告
			
 
				+竞价项目
			
 
				+竞价的公告
			
 
				+竞价采购公告
			
 
				+变更公告
			
 
				+更正公告
			
 
				+暂停公告
			
 
				+候选人公示
			
 
				+候选人公示
			
 
				+结果公告
			
 
				+结果公示
			
 
				+服务项目
			
 
				+成交公告
			
 
				+中选人公示
			
 
				+中选结果公示
			
 
				+中标公示
			
 
				+中标公告
			
 
				+成交公示
			
 
				+废标公告
			
 
				+终止公告
			
 
				+异常公告
			
 
				+流标公告
			
 
				+失败公告
			
 
				+合同公告
			
 
				+合同信息
			
 
				+采购合同
			
 
				+销售合同
			
 
				+集成合同
			
 
				+项目合同
			
 
				+合同公示
			
 
				+服务合同
			
 
				+验收公告
			
 
				+验收单公示
			
 
				+标段
			
 
				+单一来源采购公示
			
 
				+考试培训
			
 
				+比价单
			
 
				+项目询价
			
 
				+采购项目
			
 
				+询价
			
 
				+竞争性谈判
			
 
				+竞争性磋商
			
 
				+单一来源
			
 
				+竞价处置公告
			
 
				+网上竞价
			
 
				+结果公告
			
 
				+结果公示
			
 
				+中标公示
			
 
				+中标公告
			
 
				+公告
			
 
				+合同
			
 
				+评审失败
			
 
				+招标失败
			
 
				+比选失败
			
 
				+采购失败
			
 
				+流标公示
			
 
				+项目合同
			
 
				+验收结果
			
 
				+验收公告
			
 
				+行政处罚
			
 
				+违约行为
			
 
				+投诉
			
 
				+不良行为
			
 
				+协议书
			
 
				+候选人
			
 
				+购置
			
 
				+公示
			
 
				+建设
			
 
				+中标
			
 
				+招标
			
 
				+工程
			
 
				+采购
			
 
				+成交通知书
			
 
				+公告公告
			
 
				+项目项目
			
 
				+合同合同
			
--- a/docs/table_head_doc/title_abnormal.csv
+++ b/docs/table_head_doc/title_abnormal.csv
@@ -0,0 +1 @@
 
				+nbsp
			
--- a/docs/table_head_doc/title_abnormal_contain.csv
+++ b/docs/table_head_doc/title_abnormal_contain.csv
@@ -0,0 +1,4 @@
 
				+nbsp
			
 
				+...
			
 
				+.
			
 
				+..
			
--- a/tables/fields/NoField.py
+++ b/tables/fields/NoField.py
@@ -31,44 +31,13 @@ class NoFieldChecker(object):
 
				         :param obj:代表一个item
			
 
				         :return:返回true 代表异常
			
 
				         """
			
 
				-        self.check_bidamount_ac = AcAutomation()
			
 
				-        with open(amount_config["table_field_config"]["path"], "r") as f:
			
 
				-            reads = csv.reader(f)
			
 
				-            [self.check_bidamount_ac.add_word(w[0]) for w in reads]
			
 
				-
			
 
				-        detail = obj.get("detail", "")
			
 
				-        attach_text = obj.get("attach_text", {})
			
 
				         subtype = obj.get("subtype", "")
			
 
				         if subtype in ["中标", "成交","合同","验收"]:
			
 
				-            contents = catch_content.public_attachment_catch(detail, platform="html", document_id="公告") #返回值是字典
			
 
				-            content = "\n".join(contents) #字典处理成字符串
			
 
				-            if self.check_bidamount_ac.search(content):
			
 
				-                return True
			
 
				-
			
 
				-            for attach_index, attach_content in attach_text.items():
			
 
				-                if attach_content:
			
 
				-                    for topic_index, topic_detail in attach_content.items():
			
 
				-                        # oss地址
			
 
				-                        attach_url = topic_detail.get("attach_url", "")
			
 
				-                        if attach_url:
			
 
				-                            # 获取附件内容
			
 
				-                            st, content = fsc.download_text_content(attach_url)
			
 
				-
			
 
				-                            # 下载成功
			
 
				-                            # 超长文本不处理，暂定30万字
			
 
				-                            if st and content.strip():
			
 
				-                                if len(content) > 300000:
			
 
				-                                    continue
			
 
				-                            # 开始检测
			
 
				-                            contents = catch_content.public_attachment_catch(content, platform="attach",document_id=attach_url)
			
 
				-                            content = "\n".join(contents)
			
 
				-                            if self.check_bidamount_ac.search(content):
			
 
				-                                    return True
			
 
				-            return False
			
 
				+            bidamount = obj.get("bidamount", "")
			
 
				+            if bidamount:
			
 
				+                return False
			
 
				+            return True
			
 
				         return False
			
 
				-        # 处理正文
			
 
				-        # 检查因素
			
 
				-        # 是否返回 0000
			
 
				 
			
 
				     def check_winner(self,obj, catch_content: CatchContentObject) -> bool:
			
 
				         """
			
@@ -83,9 +52,7 @@ class NoFieldChecker(object):
 
				                 return False
			
 
				             return True
			
 
				         return  False
			
 
				-        # 处理正文
			
 
				-        # 检查因素
			
 
				-        # 是否返回 0000
			
 
				+
			
 
				 
			
 
				     def check_buyer(self,obj,catch_content: CatchContentObject) -> bool:
			
 
				         """
			
@@ -99,55 +66,19 @@ class NoFieldChecker(object):
 
				             return False
			
 
				         return True
			
 
				 
			
 
				-        # 处理正文
			
 
				-        # 检查因素
			
 
				-        # 是否返回 0000
			
 
				-
			
 
				     def check_budget(self,obj, catch_content: CatchContentObject) -> bool:
			
 
				         """
			
 
				         预算为空检测
			
 
				         :param obj:代表一个item
			
 
				         :return:返回true 代表异常
			
 
				         """
			
 
				-        self.check_budget_ac = AcAutomation()
			
 
				-        with open(budget_config["table_field_config"]["path"],"r") as f :
			
 
				-            reads=csv.reader(f)
			
 
				-            [self.check_budget_ac.add_word(w[0]) for w in reads ]
			
 
				-
			
 
				-        detail = obj.get("detail", "")
			
 
				-        attach_text = obj.get("attach_text", {})
			
 
				         subtype = obj.get("subtype", "")
			
 
				         if subtype not in ["中标", "成交", "合同", "验收"]:
			
 
				-            contents = catch_content.public_attachment_catch(detail, platform="html", document_id="公告")  # 返回值是字典
			
 
				-            content = "\n".join(contents)  # 字典处理成字符串
			
 
				-            if self.check_budget_ac.search(content):
			
 
				-                return True
			
 
				-
			
 
				-            for attach_index, attach_content in attach_text.items():
			
 
				-                if attach_content:
			
 
				-                    for topic_index, topic_detail in attach_content.items():
			
 
				-                        # oss地址
			
 
				-                        attach_url = topic_detail.get("attach_url", "")
			
 
				-                        if attach_url:
			
 
				-                            # 获取附件内容
			
 
				-                            st, content = fsc.download_text_content(attach_url)
			
 
				-
			
 
				-                            # 下载成功
			
 
				-                            # 超长文本不处理，暂定30万字
			
 
				-                            if st and content.strip():
			
 
				-                                if len(content) > 300000:
			
 
				-                                    continue
			
 
				-                            # 开始检测
			
 
				-                            contents = catch_content.public_attachment_catch(content, platform="attach",
			
 
				-                                                                             document_id=attach_url)
			
 
				-                            content = "\n".join(contents)
			
 
				-                            if self.check_budget_ac.search(content):
			
 
				-                                return True
			
 
				-            return False
			
 
				+            budget = obj.get("budget", "")
			
 
				+            if budget:
			
 
				+                return False
			
 
				+            return True
			
 
				         return False
			
 
				-        # 处理正文
			
 
				-        # 检查因素
			
 
				-        # 是否返回 0000
			
 
				 
			
 
				     def check_region(self,obj, catch_content: CatchContentObject) -> bool:
			
 
				         """
			
@@ -169,9 +100,6 @@ class NoFieldChecker(object):
 
				         if title :
			
 
				             return False
			
 
				         return True
			
 
				-        # 处理正文
			
 
				-        # 检查因素
			
 
				-        # 是否返回 0000
			
 
				 
			
 
				     def check_projectname(self,obj, catch_content: CatchContentObject) -> bool:
			
 
				         """
			
@@ -182,9 +110,7 @@ class NoFieldChecker(object):
 
				         if projectname :
			
 
				             return False
			
 
				         return True
			
 
				-        # 处理正文
			
 
				-        # 检查因素
			
 
				-        # 是否返回 0000
			
 
				+
			
 
				 
			
 
				     def check_projectcode(self,obj, catch_content: CatchContentObject) -> bool:
			
 
				         """
			
@@ -192,44 +118,11 @@ class NoFieldChecker(object):
 
				         :param obj:代表一个item
			
 
				         :return:返回true 代表异常
			
 
				         """
			
 
				-        self.check_projectcode_ac = AcAutomation()
			
 
				-        with open(abnormal_config["table_field_config"]["path4"], "r") as f:
			
 
				-            reads = csv.reader(f)
			
 
				-            [self.check_projectcode_ac.add_word(w[0]) for w in reads]
			
 
				-
			
 
				         projectcode = obj.get("projectcode", "")
			
 
				-        detail = obj.get("detail", "")
			
 
				-        attach_text = obj.get("attach_text", {})
			
 
				-        if projectcode == "":
			
 
				-            contents = catch_content.public_attachment_catch(detail, platform="html", document_id="公告") #返回值是字典
			
 
				-            content = "\n".join(contents) #字典处理成字符串
			
 
				-            if self.check_projectcode_ac.search(content):
			
 
				-                return True
			
 
				-
			
 
				-            for attach_index, attach_content in attach_text.items():
			
 
				-                if attach_content:
			
 
				-                    for topic_index, topic_detail in attach_content.items():
			
 
				-                        # oss地址
			
 
				-                        attach_url = topic_detail.get("attach_url", "")
			
 
				-                        if attach_url:
			
 
				-                            # 获取附件内容
			
 
				-                            st, content = fsc.download_text_content(attach_url)
			
 
				-
			
 
				-                            # 下载成功
			
 
				-                            # 超长文本不处理，暂定30万字
			
 
				-                            if st and content.strip():
			
 
				-                                if len(content) > 300000:
			
 
				-                                    continue
			
 
				-                            # 开始检测
			
 
				-                            contents = catch_content.public_attachment_catch(content, platform="attach",document_id=attach_url)
			
 
				-                            content = "\n".join(contents)
			
 
				-                            if self.check_projectcode_ac.search(content):
			
 
				-                                    return True
			
 
				+        if projectcode:
			
 
				             return False
			
 
				-        return False
			
 
				-        # 处理正文
			
 
				-        # 检查因素
			
 
				-        # 是否返回 0000
			
 
				+        return True
			
 
				+
			
 
				     def check_subpackage(self,obj, catch_content: CatchContentObject) -> bool:
			
 
				         """
			
 
				         公司名称检测
			
--- a/tables/fields/buyer.py
+++ b/tables/fields/buyer.py
@@ -26,18 +26,18 @@ class BuyerChecker(object):
 
				         采购单位0101判断不准确，备用
			
 
				         """
			
 
				         self.errors_tables = {
			
 
				-            "0101": {
			
 
				-                "name": "实体识别",
			
 
				-                "parent_name": "名称错误",
			
 
				-                "parent_code": "01",
			
 
				-                "checkFn": self.check0101
			
 
				-            },
			
 
				-            "0201": {
			
 
				-                "name": "看数据的标签是不是采购单位",
			
 
				-                "parent_name": "数据标签错误",
			
 
				-                "parent_code": "02",
			
 
				-                "checkFn": self.check0201
			
 
				-            },
			
 
				+            # "0101": {
			
 
				+            #     "name": "实体识别",
			
 
				+            #     "parent_name": "名称错误",
			
 
				+            #     "parent_code": "01",
			
 
				+            #     "checkFn": self.check0101
			
 
				+            # },
			
 
				+            # "0201": {
			
 
				+            #     "name": "看数据的标签是不是采购单位",
			
 
				+            #     "parent_name": "数据标签错误",
			
 
				+            #     "parent_code": "02",
			
 
				+            #     "checkFn": self.check0201
			
 
				+            # },
			
 
				             "0103": {
			
 
				                 "name": "包含叠词，异常词汇，特殊词汇",
			
 
				                 "parent_name": "名称错误",
			
@@ -281,7 +281,10 @@ class BuyerChecker(object):
 
				         return True
			
 
				 
			
 
				     def check0103(self, buyer: str):
			
 
				-
			
 
				+        """
			
 
				+        return  True 代表异常
			
 
				+        """
			
 
				+        # 采购单位名称以异常词开始
			
 
				         with open(abnormal_config["table_field_config"]["path1"], "r") as f:
			
 
				             reads = csv.reader(f)
			
 
				             for n in reads:
			
@@ -289,24 +292,27 @@ class BuyerChecker(object):
 
				                 if p1.match(buyer):
			
 
				                     return True
			
 
				 
			
 
				-        # 包含词 使用敏感词检验方法
			
 
				+        # 采购单位名称中包含异常词
			
 
				         self.check_abnormal_ac = AcAutomation()
			
 
				         with open(abnormal_config["table_field_config"]["path2"], "r") as f:
			
 
				             reads = csv.reader(f)
			
 
				-            [self.check_abnormal_ac.add_word(w[0]) for w in reads]
			
 
				-        if self.check_abnormal_ac.search(buyer):
			
 
				-            return True
			
 
				+            for k in reads:
			
 
				+                if k[0] in (buyer):
			
 
				+                    return True
			
 
				 
			
 
				+        # 采购单位名称以异常词结尾
			
 
				         with open(abnormal_config["table_field_config"]["path3"], "r") as f:
			
 
				             reads = csv.reader(f)
			
 
				             for m in reads:
			
 
				-                p2 = re.compile(".*$" + m[0])
			
 
				-                if p2.match(buyer):
			
 
				+                p2 = re.compile(f"{m[0]}$")
			
 
				+                if p2.search(buyer):
			
 
				                     return True
			
 
				         return False
			
 
				+        # 如果采购单位类型in ("学校","教育","卫健委","医疗","政府办","政务中心")，则采购单位名称中一般都含有地名
			
 
				 
			
 
				     def check0104(self, buyer: str, buyerclass: str):
			
 
				         if buyerclass in ("学校", "教育", "卫健委", "医疗", "政府办", "政务中心"):
			
 
				-            if get_city_info(buyer) == [None, None, None]:
			
 
				+            province, city, district = get_city_info(buyer)
			
 
				+            if province == None and city == None and district == None:
			
 
				                 return True
			
 
				         return False
			
--- a/tables/fields/projectname.py
+++ b/tables/fields/projectname.py
@@ -5,6 +5,8 @@ import re
 
				 from docs.config import general_config
			
 
				 from util.sensitive_word import AcAutomation
			
 
				 import csv
			
 
				+from docs.config import abnormal_config
			
 
				+
			
 
				 class ProjectnameChecker(object):
			
 
				     """
			
 
				         项目名称字段检查
			
@@ -70,21 +72,32 @@ class ProjectnameChecker(object):
 
				     def check0302(self,projectname: str) -> bool:
			
 
				         """
			
 
				         没有通用后缀
			
 
				-        :param title:
			
 
				+        :param projectname:
			
 
				         :return:返回true 代表异常
			
 
				         """
			
 
				-        self.check_general_ac = AcAutomation()
			
 
				-        with open(general_config["table_field_config"]["path"], "r") as f:
			
 
				+        #标题中包含异常字符
			
 
				+        with open(abnormal_config["table_field_config"]["path6"], "r") as f:
			
 
				+            reads = csv.reader(f)
			
 
				+            for w in reads:
			
 
				+                if w[0] in projectname:
			
 
				+                    return True
			
 
				+        #项目名称以异常字符结尾
			
 
				+        with open(abnormal_config["table_field_config"]["path5"], "r") as f:
			
 
				             reads = csv.reader(f)
			
 
				-            [self.check_general_ac.add_word(w[0]) for w in reads]
			
 
				+            for w in reads:
			
 
				+                if re.search(f"{w[0]}$", projectname) !=None:
			
 
				+                    return True
			
 
				+        # 项目名称以异常字符开始
			
 
				         p1 = re.compile(r"^[3|6|7|8|0|\.]")
			
 
				-        p2 = re.compile(".*--")
			
 
				         if p1.match(projectname):
			
 
				-            # print(11111)
			
 
				             return True
			
 
				-        if p2.match(projectname):
			
 
				-            # print(2222)
			
 
				-            return True
			
 
				-        if self.check_general_ac.search(projectname):
			
 
				-            return False
			
 
				+        # 放在最后判断
			
 
				+        # 项目名称必须以通用词汇结尾
			
 
				+        with open(general_config["table_field_config"]["path"], "r") as f:
			
 
				+            reads = csv.reader(f)
			
 
				+            for w in reads:
			
 
				+                if re.search(f"{w[0]}$", projectname) != None:
			
 
				+                    return False
			
 
				+                else:
			
 
				+                    return True
			
 
				         return True
			
--- a/tables/fields/purchasing.py
+++ b/tables/fields/purchasing.py
@@ -363,6 +363,7 @@ class PurchasingChecker(object):
 
				         """
			
 
				         purchasing_evaluate_list, score = purchasing_evaluate_start(purchasinglist, purchasingsource)
			
 
				         print(score)
			
 
				+        #大于0.85的通过验证的
			
 
				         if score < 0.85:
			
 
				             return True
			
 
				         else:
			
--- a/tables/fields/title.py
+++ b/tables/fields/title.py
@@ -4,7 +4,7 @@
 
				 import re
			
 
				 
			
 
				 from docs.config import general_config
			
 
				-from util.sensitive_word import AcAutomation
			
 
				+from docs.config import abnormal_config
			
 
				 import csv
			
 
				 class TitleChecker(object):
			
 
				     """
			
@@ -75,18 +75,32 @@ class TitleChecker(object):
 
				         :param title:
			
 
				         :return:返回true 代表异常
			
 
				         """
			
 
				-        self.check_general_ac = AcAutomation()
			
 
				-        with open(general_config["table_field_config"]["path"], "r") as f:
			
 
				+        #标题中包含异常字符
			
 
				+        with open(abnormal_config["table_field_config"]["path6"], "r") as f:
			
 
				+            reads = csv.reader(f)
			
 
				+            for w in reads:
			
 
				+                if w[0] in title:
			
 
				+                    return True
			
 
				+        #标题以异常字符结尾
			
 
				+        #re.search()匹配整个字符串，并返回第一个成功的匹配，如果匹配失败，则返回None
			
 
				+        with open(abnormal_config["table_field_config"]["path5"], "r") as f:
			
 
				             reads = csv.reader(f)
			
 
				-            [self.check_general_ac.add_word(w[0]) for w in reads]
			
 
				+            for w in reads:
			
 
				+                ret=re.search(f"{w[0]}$", title)
			
 
				+                if  ret != None:
			
 
				+                    return True
			
 
				+        #标题以异常字符开始
			
 
				         p1 = re.compile(r"^[3|6|7|8|0|\.]")
			
 
				-        p2 = re.compile(".*--")
			
 
				         if p1.match(title):
			
 
				-            print(11111)
			
 
				-            return True
			
 
				-        if p2.match(title):
			
 
				-            print(2222)
			
 
				             return True
			
 
				-        if self.check_general_ac.search(title):
			
 
				-            return False
			
 
				-        return True
			
 
				+
			
 
				+        #放在最后判断
			
 
				+        #标题必须以通用词汇结尾
			
 
				+        with open(general_config["table_field_config"]["path"], "r") as f:
			
 
				+            reads = csv.reader(f)
			
 
				+            for w in reads:
			
 
				+                if re.search(f"{w[0]}$", title) !=None:
			
 
				+                    return False
			
 
				+                else:
			
 
				+                    return True
			
 
				+        return False
			
--- a/tables/fields/winner.py
+++ b/tables/fields/winner.py
@@ -21,18 +21,18 @@ class WinnerChecker(object):
 
				 
			
 
				     def __init__(self):
			
 
				         self.errors_tables = {
			
 
				-            "0101": {
			
 
				-                "name": "实体识别",
			
 
				-                "parent_name": "名称错误",
			
 
				-                "parent_code": "01",
			
 
				-                "checkFn": self.check0101
			
 
				-            },
			
 
				-            "0201": {
			
 
				-                "name": "看数据的标签是不是之中标单位",
			
 
				-                "parent_name": "数据标签错误",
			
 
				-                "parent_code": "02",
			
 
				-                "checkFn": self.check0201
			
 
				-            },
			
 
				+            # "0101": {
			
 
				+            #     "name": "实体识别",
			
 
				+            #     "parent_name": "名称错误",
			
 
				+            #     "parent_code": "01",
			
 
				+            #     "checkFn": self.check0101
			
 
				+            # },
			
 
				+            # "0201": {
			
 
				+            #     "name": "看数据的标签是不是之中标单位",
			
 
				+            #     "parent_name": "数据标签错误",
			
 
				+            #     "parent_code": "02",
			
 
				+            #     "checkFn": self.check0201
			
 
				+            # },
			
 
				             "0103": {
			
 
				                 "name": "包含叠词，异常词汇，特殊词汇",
			
 
				                 "parent_name": "名称错误",
			
@@ -265,26 +265,25 @@ class WinnerChecker(object):
 
				                             return False
			
 
				         return True
			
 
				 
			
 
				-    def check0103(self, winner: str):
			
 
				+    def check0103(self,winner:str):
			
 
				+        #中标单位名称以异常词开始
			
 
				         with open(abnormal_config["table_field_config"]["path1"], "r") as f:
			
 
				             reads = csv.reader(f)
			
 
				-            for n in reads:
			
 
				-                p1 = re.compile("^" + n[0])
			
 
				+            for n in  reads:
			
 
				+                p1 = re.compile("^"+n[0])
			
 
				                 if p1.match(winner):
			
 
				                     return True
			
 
				 
			
 
				-        # 包含词 使用敏感词检验方法
			
 
				-        self.check_abnormal_ac = AcAutomation()
			
 
				+        # 中标单位名称包含异常词
			
 
				         with open(abnormal_config["table_field_config"]["path2"], "r") as f:
			
 
				             reads = csv.reader(f)
			
 
				-            [self.check_abnormal_ac.add_word(w[0]) for w in reads]
			
 
				-        if self.check_abnormal_ac.search(winner):
			
 
				-            return True
			
 
				-
			
 
				+            for n in  reads:
			
 
				+                if n[0] in winner:
			
 
				+                    return True
			
 
				+        # 中标单位名称以异常词结尾
			
 
				         with open(abnormal_config["table_field_config"]["path3"], "r") as f:
			
 
				             reads = csv.reader(f)
			
 
				-            for m in reads:
			
 
				-                p2 = re.compile(".*$" + m[0])
			
 
				-                if p2.match(winner):
			
 
				+            for w in reads:
			
 
				+                if re.search(f"{w[0]}$", winner):
			
 
				                     return True
			
 
				         return False