|
@@ -19,7 +19,7 @@ var (
|
|
|
regReplKV = regexp.MustCompile("(.+?[\u4e00-\u9fa5))][\\s\u3000\u2003\u00a0]*[::].*[((]?[^\r\n\\s\u3000\u2003\u00a0]+?[))]?)[\\s\u3000\u2003\u00a0,。;;][((]?(.+?[\u4e00-\u9fa5))][\\s\u3000\u2003\u00a0]*[::].+)[))]?")
|
|
|
regReplKV2 = regexp.MustCompile("(.+?[\u4e00-\u9fa5))][\\s\u3000\u2003\u00a0]*[::].*[((]?[^\r\n\\s\u3000\u2003\u00a0标段包]+?[))]?)([一二三四五六七八九十]+[、..][^一二三四五六七八九十]+?)")
|
|
|
regKV = regexp.MustCompile("([\\p{Han}][^,,。、.;;\r\n]{1,30}?)[::](.*)")
|
|
|
- filterK = regexp.MustCompile("[((\\[【].*?[))\\]】]|<[^>].+?>|[①②③¥·;;‘“'’”,*<>((\\[【、))/\\]】??,。.\".\\s\u3000\u2003\u00a0]+|^[一二三四五六七八九十0-91234567890]+")
|
|
|
+ filterK = regexp.MustCompile("[((\\[【].*?[))\\]】]|<[^>].+?>|[①②③¥·;;‘“'’”,*<>((\\[【、))/\\]】??,。.\".\\s\u3000\u2003\u00a0\u001c]+|^[一二三四五六七八九十0-91234567890]+")
|
|
|
filterValue = regexp.MustCompile("(^(无)$|.+%.*|^[\r\n\\s\u3000\u2003\u00a0]+$|^<.*>)")
|
|
|
regReplKey = regexp.MustCompile("^(包(.+[A-Za-z\\d])?|本项目|推荐|的|本次)|([约为元万亿]+|[大小]写|人民币|[全]称|姓名)$")
|
|
|
buyerAndAgency = regexp.MustCompile("(代理(机构|人)|采购(人|单位))")
|
|
@@ -569,7 +569,14 @@ func FormatContactKv(kvs *[]*Kv, title string, buyers []string, contactFormat *C
|
|
|
continue
|
|
|
}
|
|
|
//qutil.Debug("ContactInfoMustReg.MatchString(k)+++", !ContactInfoMustReg.MatchString(k))
|
|
|
- if !ContactInfoMustReg.MatchString(k) { //判断是否是电话、邮箱、地址等信息
|
|
|
+ matchMust := ContactInfoMustReg.MatchString(k)
|
|
|
+ matchHas := ContactInfoVagueReg.MatchString(k)
|
|
|
+ qutil.Debug("matchMust:", matchMust, "matchHas:", matchHas)
|
|
|
+ if !matchMust && matchHas {
|
|
|
+ k = ContactInfoVagueReg.FindString(k)
|
|
|
+ }
|
|
|
+ //qutil.Debug("kkkkkkkkkkkk", k)
|
|
|
+ if !matchMust && !matchHas { //判断是否是电话、邮箱、地址等信息
|
|
|
if DoubtReg.MatchString(k) { //匹配到投诉和监督 5bc9683ea5cb26b9b72b2302 5c35f3e8a5cb26b9b72dcdbd
|
|
|
startIndex = 0
|
|
|
//notmatchCount = 0
|