|
@@ -66,7 +66,18 @@ func quickHeavyMethodOne(v *Info, info *Info, reason string) (bool, string) {
|
|
|
//判重方法2
|
|
|
func quickHeavyMethodTwo(v *Info, info *Info, reason string) (bool, string) {
|
|
|
isMeet := false
|
|
|
- if v.agency == info.agency && v.agency != "" && info.agency != "" {
|
|
|
+ isAgency :=false
|
|
|
+ //招标类-代理机构不同-广泛前后缀比较
|
|
|
+ if v.agency != info.agency && v.agency != "" && info.agency != "" {
|
|
|
+ //新增一层判断
|
|
|
+ if strings.Contains(v.agency, info.agency) || strings.Contains(info.agency, v.agency) {
|
|
|
+ isAgency = true
|
|
|
+ }else {
|
|
|
+ return false, reason
|
|
|
+ }
|
|
|
+ }
|
|
|
+
|
|
|
+ if (v.agency == info.agency && v.agency != "" && info.agency != "")|| isAgency {
|
|
|
if info.subtype == "招标" || info.subtype == "邀标" || info.subtype == "询价" ||
|
|
|
info.subtype == "竞谈" || info.subtype == "单一" || info.subtype == "竞价" ||
|
|
|
info.subtype == "变更" || info.subtype == "其他" {
|
|
@@ -122,11 +133,7 @@ func quickHeavyMethodTwo(v *Info, info *Info, reason string) (bool, string) {
|
|
|
}
|
|
|
}
|
|
|
|
|
|
- //不同
|
|
|
- if v.agency != info.agency && v.agency != "" && info.agency != "" {
|
|
|
- return false, reason
|
|
|
- }
|
|
|
- //机构最少一个为空
|
|
|
+ //机构最2少一个为空
|
|
|
if v.agency == "" || info.agency == "" {
|
|
|
var repeat = false
|
|
|
if repeat, reason = quickHeavyMethodOne(v, info, reason); repeat {
|
|
@@ -409,9 +416,16 @@ func contractRepeat_C(v *Info, info *Info) bool {
|
|
|
|
|
|
//快速低质量数据判重
|
|
|
func fastLowQualityHeavy(v *Info, info *Info, reason string) (bool, string) {
|
|
|
- if !isTheSameDay(v.publishtime,info.publishtime) {
|
|
|
+ //if !isTheSameDay(v.publishtime,info.publishtime) {
|
|
|
+ // return false,reason
|
|
|
+ //}
|
|
|
+
|
|
|
+ //区间间隔24小时
|
|
|
+ if !isTimeIntervalPeriod(v.publishtime,info.publishtime) {
|
|
|
return false,reason
|
|
|
}
|
|
|
+
|
|
|
+
|
|
|
//首先判定是否为低质量数据 info目标数据
|
|
|
if info.title!=""&&(info.agency==""||v.agency=="")&&
|
|
|
info.title==v.title&&info.projectcode==""&&info.contractnumber==""&&info.buyer=="" {
|