Selaa lähdekoodia

完善~标题判重模式

zhengkun 2 vuotta sitten
vanhempi
commit
6b68143f71
1 muutettu tiedosto, jossa 7 lisäystä ja 3 poistoa
  1. 7 3
      src/dataMethod.go

+ 7 - 3
src/dataMethod.go

@@ -9,8 +9,10 @@ import (
 
 var cleanNameReg_0 = regexp.MustCompile("([(())::\\s ])")
 var cleanNameReg_1 = regexp.MustCompile("(项目)(.{0,5})(招标|中标|中标结果|成交|候选人|竞谈|竞争性磋商)(公告)?$")
-var cleanNameReg_2 = regexp.MustCompile("(公告|公告公告)$")
-var cleanNameReg_3 = regexp.MustCompile("(公开)(比选|招标)")
+var cleanNameReg_2 = regexp.MustCompile("(公告|公示|公告公告)$")
+var cleanNameReg_3 = regexp.MustCompile("(公开|的)(比选|招标|单一来源)")
+
+var un_cleanNameReg_1 = regexp.MustCompile("(项目[一二三四五六七八九1-9][次](招标|中标|中标结果|成交|候选人|竞谈|竞争性磋商)(公告)?)$")
 
 //完善判重数据检测-前置条件
 func convertArabicNumeralsAndLetters(data string) string {
@@ -407,7 +409,9 @@ func confirmJingPinIsRepeatData(v *Info, info *Info) bool {
 func cleanNameFilterRedundant(name string) string {
 	new_name := name
 	new_name = cleanNameReg_0.ReplaceAllString(new_name, "")
-	new_name = cleanNameReg_1.ReplaceAllString(new_name, "${1}${3}")
+	if !un_cleanNameReg_1.MatchString(new_name) {
+		new_name = cleanNameReg_1.ReplaceAllString(new_name, "${1}${3}")
+	}
 	new_name = cleanNameReg_2.ReplaceAllString(new_name, "")
 	new_name = cleanNameReg_3.ReplaceAllString(new_name, "${2}")