|
@@ -11,6 +11,8 @@ ReluClient = MongoDBInterface(ReluMongodb)
|
|
|
# 评估服务配置
|
|
|
a2s_ip = "192.168.3.240:9090"
|
|
|
topic = "quality_bid"
|
|
|
+#本地测试用的主题
|
|
|
+topic_test = "test_quality_bid"
|
|
|
timeout = 120
|
|
|
|
|
|
# 开始评估
|
|
@@ -20,7 +22,7 @@ def start_quality(data: dict, rules_id: int, a2s_ip, topic, timeout, retry=3):
|
|
|
bytes_data = json_serialize(row)
|
|
|
for t in range(retry):
|
|
|
try:
|
|
|
- resp_data = a2s_execute(a2s_ip, topic, timeout, bytes_data)
|
|
|
+ resp_data = a2s_execute(a2s_ip, topic_test, timeout, bytes_data)
|
|
|
if resp_data is None:
|
|
|
continue
|
|
|
result = json_deserialize(resp_data)
|
|
@@ -44,7 +46,7 @@ def batch_load_purchasinglist():
|
|
|
print(rules_id)
|
|
|
|
|
|
# max_id = ObjectId("0" * 24)
|
|
|
- max_id = ObjectId("5f164bf552c1d9fbf8437ce0")
|
|
|
+ max_id = ObjectId("5f8e5e1650cded0641ae3f7e")
|
|
|
while True:
|
|
|
# db = MongoClient('192.168.3.71', 29099, unicode_decode_error_handler="ignore").re4art
|
|
|
# coll_user = db["zc_classify_test"]
|
|
@@ -52,8 +54,8 @@ def batch_load_purchasinglist():
|
|
|
coll_user = db["update_data"]
|
|
|
num=0
|
|
|
try:
|
|
|
- for item in coll_user.find({"_id":{"$gte":max_id}}).sort("_id",1):
|
|
|
- # for item in coll_user.find({"_id":ObjectId("652526dfe17a7c80fb06658a")}):
|
|
|
+ # for item in coll_user.find({"_id":{"$gte":max_id}}).sort("_id",1):
|
|
|
+ for item in coll_user.find({"_id":ObjectId("60f84adf1a75b8f4460ead47")}):
|
|
|
# for item in coll_user.find().sort("_id",1):
|
|
|
max_id = item["_id"]
|
|
|
print(max_id)
|
|
@@ -70,6 +72,7 @@ def batch_load_purchasinglist():
|
|
|
code=result.get("code")
|
|
|
if code!=200:
|
|
|
#数据出错
|
|
|
+ coll_user.update_one({"_id": max_id}, {"$set": {"flag": 1}})
|
|
|
continue
|
|
|
data=result.get("data",{})
|
|
|
# coll_user.update_one({"_id":max_id},{"$set":{"data":data}})
|
|
@@ -85,20 +88,19 @@ def batch_load_data():
|
|
|
批量数据质量检查
|
|
|
"""
|
|
|
# 规则查询,根据必要条件 公司名称(用户ID)、版本号
|
|
|
- rules_id = get_rule("北京剑鱼信息技术有限公司", "v1.1")
|
|
|
+ rules_id = get_rule("北京剑鱼信息技术有限公司", "v1.2")
|
|
|
print(rules_id)
|
|
|
|
|
|
# max_id = ObjectId("0" * 24)
|
|
|
- max_id = ObjectId("65409048dd24231d52d9e89c")
|
|
|
+ max_id = ObjectId("655ec5609aed6eb2ffa654ca")
|
|
|
while True:
|
|
|
- # db = MongoClient('192.168.3.71', 29099, unicode_decode_error_handler="ignore").re4art
|
|
|
- # coll_user = db["zc_classify_test"]
|
|
|
- db = MongoClient('192.168.3.166', 27082, unicode_decode_error_handler="ignore").zhengluming
|
|
|
- coll_user = db["f_sourceinfo_HP_channel_succes_data"]
|
|
|
- num=0
|
|
|
+ db = MongoClient('192.168.3.206', 27080, unicode_decode_error_handler="ignore").data_quality
|
|
|
+ coll_user = db["bidding_20231122"]
|
|
|
+ # db = MongoClient('192.168.3.166', 27082, unicode_decode_error_handler="ignore").zhengluming_27082
|
|
|
+ # coll_user = db["update_data"]
|
|
|
try:
|
|
|
for item in coll_user.find({"_id":{"$gte":max_id}}).sort("_id",1):
|
|
|
- # for item in coll_user.find({"_id":ObjectId("652526dfe17a7c80fb06658a")}):
|
|
|
+ # for item in coll_user.find({"_id":ObjectId("65485a930023f3bdb1621a1d")}):
|
|
|
# for item in coll_user.find().sort("_id",1):
|
|
|
max_id = item["_id"]
|
|
|
print(max_id)
|
|
@@ -110,6 +112,7 @@ def batch_load_data():
|
|
|
code=result.get("code")
|
|
|
if code!=200:
|
|
|
#数据出错
|
|
|
+ coll_user.update_one({"_id":max_id},{"$set":{"flag":1}})
|
|
|
continue
|
|
|
data=result.get("data",{})
|
|
|
# coll_user.update_one({"_id":max_id},{"$set":{"data":data}})
|
|
@@ -126,7 +129,7 @@ def batch_load_data_test():
|
|
|
:return:
|
|
|
"""
|
|
|
row_data = {
|
|
|
- "title":"你好周杰伦成交通知书采购计划任务",
|
|
|
+ "title":"你好周杰伦成交通知书...采购计划任务",
|
|
|
"winner": "第一峡江县文化广电新闻出版旅游局",
|
|
|
"detail": "一、采购人名称: 峡江县文化广电新闻出版旅游局 <br/> 二、供应商名称: 中国广电江西网络有限公司峡江县分公司 <br/> 四、中标金额: 140万 <br/> 三、采购项目名称: 峡江县文化广电新闻出版旅游局服务工程项目 <br/> 四、采购项目编号: 2881401000001829192 <br/> 五、合同编号: 2023M0816360823000201 <br/> 六、合同内容:<br/> <table> <tbody><tr> <td>序号</td> <td>标项名称</td> <td>规格型号</td> <td>单位</td> <td>数量</td> <td>单价(元)</td> <td colspan=\"1\">总123价(元)</td> </tr> <tr> <td>1</td> <td>有线电视 宽带网络安装 通信系统工程</td> <td></td> <td>项</td> <td>1.00</td> <td>30416</td> <td colspan=\"1\">30416</td> </tr> </tbody></table><br/> <br/> 服务要求或标的基本概况: <br/> 七、其它事项:<br/> / <br/> 八、联系方式<br/> 1、 采购人名称: 峡江县文化广电新闻出版旅游局 <br/> 联系人: 傅昕尧 <br/> 联系电话: 1569022**** <br/> 传真: <br/> 地址: 玉华路71号 <br/> 2、供应商名称: 中国广电江西网络有限公司峡江县分公司 <br/> 地址: 江西省吉安市峡江县江西省吉安市峡江县文化广播电视局 <br/>附件信息:<br/>关于通信系统工程的服务工程合同(2023M0816360823000201).pdf",
|
|
|
"buyer": "文化广电新闻出版旅游局",
|
|
@@ -144,11 +147,11 @@ def batch_load_data_test():
|
|
|
|
|
|
def batch_load_data_debug():
|
|
|
# 规则查询,根据必要条件 公司名称(用户ID)、版本号
|
|
|
- rules_id = get_rule("北京剑鱼信息技术有限公司", "v1.0")
|
|
|
+ rules_id = get_rule("北京剑鱼信息技术有限公司", "v1.2")
|
|
|
print(rules_id)
|
|
|
- db = MongoClient('192.168.3.71', 29099, unicode_decode_error_handler="ignore").re4art
|
|
|
- coll_user = db["zc_classify_test"]
|
|
|
- for item in coll_user.find({"_id": ObjectId("654862420023f3bdb1624a82")}):
|
|
|
+ db = MongoClient('192.168.3.206', 27080, unicode_decode_error_handler="ignore").data_quality
|
|
|
+ coll_user = db["bidding_20231122"]
|
|
|
+ for item in coll_user.find({"_id": ObjectId("655ec5319aed6eb2ffa5d7ce")}):
|
|
|
# item['detail'] = item['details'].replace("\\\"", "\"")
|
|
|
item["_id"] = str(item["_id"])
|
|
|
result = start_quality(item, rules_id, a2s_ip, topic, timeout)
|
|
@@ -156,7 +159,7 @@ def batch_load_data_debug():
|
|
|
|
|
|
|
|
|
if __name__ == '__main__':
|
|
|
- # batch_load_data()
|
|
|
+ batch_load_data()
|
|
|
# batch_load_data_test()
|
|
|
# batch_load_data_debug()
|
|
|
- batch_load_purchasinglist()#标的物检查函数
|
|
|
+ # batch_load_purchasinglist()#标的物检查函数
|