|
@@ -44,14 +44,14 @@ var (
|
|
winnerReg9 = regexp.MustCompile("(第[一二三四五六七八九十]中[选|标]?候选人|中标人[1-9])[::\\s]+投标人名称([\\s]+)?([\u4E00-\u9FA5]{4,25})[\\s]+(投标报价)([\\s]+)?([0-9\\.\\s万元]+)")
|
|
winnerReg9 = regexp.MustCompile("(第[一二三四五六七八九十]中[选|标]?候选人|中标人[1-9])[::\\s]+投标人名称([\\s]+)?([\u4E00-\u9FA5]{4,25})[\\s]+(投标报价)([\\s]+)?([0-9\\.\\s万元]+)")
|
|
winnerReg10 = regexp.MustCompile("(第[一二三四五六七八九十]中标人)[::\\s]+?报价[¥]?([0-9\\.\\s万元]+)[;;]([\u4E00-\u9FA5]{4,20})")
|
|
winnerReg10 = regexp.MustCompile("(第[一二三四五六七八九十]中标人)[::\\s]+?报价[¥]?([0-9\\.\\s万元]+)[;;]([\u4E00-\u9FA5]{4,20})")
|
|
winnerReg11 = regexp.MustCompile("([弟|第][一二三四五六七八九十]中[标|选]候选人)[::\\s]+?(单位名称|投标人名称)[::]?(.*)[\\s]+?(参选报价|投标报价[((]含税[))]|投标报价[((]元[))])[::]?(.*)")
|
|
winnerReg11 = regexp.MustCompile("([弟|第][一二三四五六七八九十]中[标|选]候选人)[::\\s]+?(单位名称|投标人名称)[::]?(.*)[\\s]+?(参选报价|投标报价[((]含税[))]|投标报价[((]元[))])[::]?(.*)")
|
|
- winnerReg12 = regexp.MustCompile("(中[标|选]候选人[弟|第][一二三四五六七八九十0-9]名|[弟|第][一二三四五六七八九十0-9](中标)?候选人)[::\\s ]+?(.*)[ \\s,,]+?(投标报价|投标总报价|金额)[::]?([0-9\\.\\s万元]+)")
|
|
|
|
|
|
+ winnerReg12 = regexp.MustCompile("(中[标|选]候选人[弟|第][一二三四五六七八九十0-9]名|[弟|第][一二三四五六七八九十0-9](中标)?候选人)([::\\s ]+)?(.*)[ \\s,,]+?(投标报价|投标总报价|金额)[::]?([0-9\\.\\s万元]+)")
|
|
winnerReg13 = regexp.MustCompile("([弟|第][一二三四五六七八九十0-9])\n(成交候选人|成交供应商)\n(.*)\n([0-9\\.\\s万元]+)")
|
|
winnerReg13 = regexp.MustCompile("([弟|第][一二三四五六七八九十0-9])\n(成交候选人|成交供应商)\n(.*)\n([0-9\\.\\s万元]+)")
|
|
winnerReg14 = regexp.MustCompile("(中标候选人|成交候选人)\n.*\n.*\n第[1-9][\\s]+?名")
|
|
winnerReg14 = regexp.MustCompile("(中标候选人|成交候选人)\n.*\n.*\n第[1-9][\\s]+?名")
|
|
winnerReg14_1 = regexp.MustCompile("(第[1-9])[\\s]+?名[::](.{4,20}公司)[\\s]+中标价[::]([0-9\\.\\s万元]+)")
|
|
winnerReg14_1 = regexp.MustCompile("(第[1-9])[\\s]+?名[::](.{4,20}公司)[\\s]+中标价[::]([0-9\\.\\s万元]+)")
|
|
winnerReg15 = regexp.MustCompile("([弟|第][一二三四五六七八九十0-9](中标|中选)?候选人)[::](.*)[ \\s\\n,,]+(最终报价[::\\s]+不含税单价.*)?不含税总价[::]?([0-9\\.()\\s万元]+)")
|
|
winnerReg15 = regexp.MustCompile("([弟|第][一二三四五六七八九十0-9](中标|中选)?候选人)[::](.*)[ \\s\\n,,]+(最终报价[::\\s]+不含税单价.*)?不含税总价[::]?([0-9\\.()\\s万元]+)")
|
|
winnerReg16 = regexp.MustCompile("(中[标|选]候选人)排序[::]([1-9一二三四五六七])[\\s]+.{1,4}名称[::](.*公司)[\\s]+.{1,4}报价[::]([¥〇0-9\\.人民币零点壹贰叁肆伍陆柒捌玖拾佰仟万亿元圆角分整]+)")
|
|
winnerReg16 = regexp.MustCompile("(中[标|选]候选人)排序[::]([1-9一二三四五六七])[\\s]+.{1,4}名称[::](.*公司)[\\s]+.{1,4}报价[::]([¥〇0-9\\.人民币零点壹贰叁肆伍陆柒捌玖拾佰仟万亿元圆角分整]+)")
|
|
winnerReg17 = regexp.MustCompile("(报价金额|投标金额|应答含税总价|预期中标价格)[::]?[\n]?([¥〇0-9\\.人民币零点壹贰叁肆伍陆柒捌玖拾佰仟万亿元圆角分整]+)")
|
|
winnerReg17 = regexp.MustCompile("(报价金额|投标金额|应答含税总价|预期中标价格)[::]?[\n]?([¥〇0-9\\.人民币零点壹贰叁肆伍陆柒捌玖拾佰仟万亿元圆角分整]+)")
|
|
- winnerReg18 = regexp.MustCompile("([中|投]标候选人[弟|第])([1-9一二三四五])[\\s]?名[::]([\u4E00-\u9FA5]{4,20})([((].*公司[))])?[,,\\s]+投标报价[::]([0-9\\.\\s万元]+)")
|
|
|
|
|
|
+ winnerReg18 = regexp.MustCompile("([中|投]标候选人[弟|第])([1-9一二三四五])[\\s]?名[::]([\u4E00-\u9FA5]{4,20})([((].*公司[))])?[,,\\s]+投标报价[::]([0-9\\.\\s 万元]+)")
|
|
winnerReg19 = regexp.MustCompile("([弟|第][1-9一二三四五]名(中标候选人)?)[::]?([\u4E00-\u9FA5]{4,20}公司)[((]?[,,]?(报价|投标报价)[::]?([0-9\\.\\s万元]+)")
|
|
winnerReg19 = regexp.MustCompile("([弟|第][1-9一二三四五]名(中标候选人)?)[::]?([\u4E00-\u9FA5]{4,20}公司)[((]?[,,]?(报价|投标报价)[::]?([0-9\\.\\s万元]+)")
|
|
|
|
|
|
|
|
|
|
@@ -59,12 +59,23 @@ var (
|
|
winnerReg50 = regexp.MustCompile("(第[一二三]名)\n单位名称\n(.{4,20}公司)[\n\\s]+投标报价\n大写\n([\u4E00-\u9FA5]+)\n")
|
|
winnerReg50 = regexp.MustCompile("(第[一二三]名)\n单位名称\n(.{4,20}公司)[\n\\s]+投标报价\n大写\n([\u4E00-\u9FA5]+)\n")
|
|
winnerReg51 = regexp.MustCompile("(中标候选人第[1-9一二三四五])[\\s](名)")
|
|
winnerReg51 = regexp.MustCompile("(中标候选人第[1-9一二三四五])[\\s](名)")
|
|
winnerReg52 = regexp.MustCompile("(中标金额[::][0-9.]+)\n([万元]+)")
|
|
winnerReg52 = regexp.MustCompile("(中标金额[::][0-9.]+)\n([万元]+)")
|
|
|
|
+ winnerReg53 = regexp.MustCompile("中标候选人[\\s ](第一候选人)[\\s ](第二候选人)[\\s ]?(第三候选人)?\n单位名称[\\s ](.{4,20}公司)[\\s ](.{4,20}公司)[\\s ]?(.{4,20}公司)?\n投标价[((]万元[))]([\\s ]+)([0-9.]+)([\\s ]+)([0-9.]+)([\\s ]+)?([0-9.]+)?")
|
|
|
|
+ winnerReg54 = regexp.MustCompile("(第[一二三1-3]中标候选人)[ \\s]([\u4E00-\u9FA5,]{4,20}公司)[ \\s](人民币|¥)([0-9,,.万元]+)")
|
|
|
|
|
|
|
|
|
|
-
|
|
|
|
|
|
+ //特殊爬虫-特殊情况
|
|
|
|
+ winnerReg80 = regexp.MustCompile("投标报价\n投标人.*\n.*[((]万元[))]\n"+
|
|
|
|
+ "(.*)[\n]?(第[1一]中标候选人).*\\s([0-9]+[.][0-9]+|[0-9]+)\n(.*司)\n" +
|
|
|
|
+ "(.*)[\n]?(第[2二]中标候选人).*\\s([0-9]+[.][0-9]+|[0-9]+)[\n]?(.*司)?")
|
|
|
|
+ winnerReg81 = regexp.MustCompile("投标报价\n[((]万元[))]\n"+
|
|
|
|
+ "(.*)[\n]?(.*司)[\\s]+(第[1一]中标候选人).*\\s([0-9]+[.][0-9]+|[0-9]+)\n" +
|
|
|
|
+ "(.*)[\n]?(.*司)[\\s]+(第[2二]中标候选人).*\\s([0-9]+[.][0-9]+|[0-9]+)\n")
|
|
|
|
+ winnerReg82 = regexp.MustCompile("投标人.*\n.*[((]万元[))]\n元[))]\n"+
|
|
|
|
+ "(.*)\\s(第[1一]中标候)\n.*\\s([0-9]+[.][0-9]+|[0-9]+)\n(.*公司)\\s(选人)\n" +
|
|
|
|
+ "(.*)\\s(第[2二]中标候)\n.*\\s([0-9]+[.][0-9]+|[0-9]+)\n(.*公司)\\s(选人)\n")
|
|
|
|
|
|
//格式化中标金额换行
|
|
//格式化中标金额换行
|
|
- winnerReg100 = regexp.MustCompile("中标金额:[\\s]+([0-9\\.万元]+)")
|
|
|
|
|
|
+ winnerReg100 = regexp.MustCompile("中标金额:[\\s]+([0-9\\.万元]+)")
|
|
|
|
|
|
|
|
|
|
//不带金额
|
|
//不带金额
|
|
@@ -111,6 +122,13 @@ func (wo *WinnerOrderEntity) Find(text string, flag bool, from int, isSite bool,
|
|
if nswinnertabletag.MatchString(text) && !winnerReg0.MatchString(text){
|
|
if nswinnertabletag.MatchString(text) && !winnerReg0.MatchString(text){
|
|
return []map[string]interface{}{}
|
|
return []map[string]interface{}{}
|
|
}
|
|
}
|
|
|
|
+
|
|
|
|
+ if codeSite=="sh_shszfhcxjsglwyh_jsgc_zhbhxrgs" {
|
|
|
|
+ text = winnerReg80.ReplaceAllString(text,"\n$2:$1$4 中标金额:$3 万元\n$6:$5$8 中标金额:$7 万元\n")
|
|
|
|
+ text = winnerReg81.ReplaceAllString(text,"\n$3:$1$2 中标金额:$4 万元\n$7:$5$6 中标金额:$8 万元\n")
|
|
|
|
+ text = winnerReg82.ReplaceAllString(text,"\n$2$5:$1$4 中标金额:$3 万元\n$7$10:$6$9 中标金额:$8 万元\n")
|
|
|
|
+ }
|
|
|
|
+
|
|
text = winnerReg5.ReplaceAllString(text, "\n$3:$1\n")
|
|
text = winnerReg5.ReplaceAllString(text, "\n$3:$1\n")
|
|
text = winnerReg20.ReplaceAllString(text,"\n${4}:${2}\n")
|
|
text = winnerReg20.ReplaceAllString(text,"\n${4}:${2}\n")
|
|
text = winnerReg21.ReplaceAllString(text,"\n${3}成交候选人:${1}\n")
|
|
text = winnerReg21.ReplaceAllString(text,"\n${3}成交候选人:${1}\n")
|
|
@@ -124,7 +142,7 @@ func (wo *WinnerOrderEntity) Find(text string, flag bool, from int, isSite bool,
|
|
text = winnerReg9.ReplaceAllString(text,"\n${1}:${3}\n中标金额:${5}\n")
|
|
text = winnerReg9.ReplaceAllString(text,"\n${1}:${3}\n中标金额:${5}\n")
|
|
text = winnerReg10.ReplaceAllString(text,"\n${1}:${3}\n中标金额:${2}\n")
|
|
text = winnerReg10.ReplaceAllString(text,"\n${1}:${3}\n中标金额:${2}\n")
|
|
text = winnerReg11.ReplaceAllString(text,"\n${1}:${3}\n中标金额:${5}\n")
|
|
text = winnerReg11.ReplaceAllString(text,"\n${1}:${3}\n中标金额:${5}\n")
|
|
- text = winnerReg12.ReplaceAllString(text,"\n${1}:${3}\n中标金额:${5}\n")
|
|
|
|
|
|
+ text = winnerReg12.ReplaceAllString(text,"\n${1}:${4}\n中标金额:${6}\n")
|
|
text = winnerReg13.ReplaceAllString(text,"\n${1}${2}:${3}\n中标金额:${4}\n")
|
|
text = winnerReg13.ReplaceAllString(text,"\n${1}${2}:${3}\n中标金额:${4}\n")
|
|
text = winnerReg15.ReplaceAllString(text,"\n${1}:${3}\n中标金额:${5}\n")
|
|
text = winnerReg15.ReplaceAllString(text,"\n${1}:${3}\n中标金额:${5}\n")
|
|
text = winnerReg16.ReplaceAllString(text,"\n第${2}${1}:${3}\n中标金额:${4}\n")
|
|
text = winnerReg16.ReplaceAllString(text,"\n第${2}${1}:${3}\n中标金额:${4}\n")
|
|
@@ -137,9 +155,8 @@ func (wo *WinnerOrderEntity) Find(text string, flag bool, from int, isSite bool,
|
|
text = winnerReg100.ReplaceAllString(text,"中标金额:${1}")
|
|
text = winnerReg100.ReplaceAllString(text,"中标金额:${1}")
|
|
|
|
|
|
//特殊格式
|
|
//特殊格式
|
|
- if winnerReg14.MatchString(text) {
|
|
|
|
- text = winnerReg14_1.ReplaceAllString(text,"\n中标候选人${1}名:${2}\n中标金额:${3}\n")
|
|
|
|
- }
|
|
|
|
|
|
+ text = winnerReg14_1.ReplaceAllString(text,"\n中标候选人${1}名:${2}\n中标金额:${3}\n")
|
|
|
|
+
|
|
|
|
|
|
|
|
|
|
if winnerReg50.MatchString(text) && strings.Contains(text,"中标候选人公示") {
|
|
if winnerReg50.MatchString(text) && strings.Contains(text,"中标候选人公示") {
|
|
@@ -149,7 +166,8 @@ func (wo *WinnerOrderEntity) Find(text string, flag bool, from int, isSite bool,
|
|
text = winnerReg51.ReplaceAllString(text,"${1}${2}\n中标金额:${3}\n")
|
|
text = winnerReg51.ReplaceAllString(text,"${1}${2}\n中标金额:${3}\n")
|
|
text = winnerReg52.ReplaceAllString(text,"$1$2")
|
|
text = winnerReg52.ReplaceAllString(text,"$1$2")
|
|
|
|
|
|
-
|
|
|
|
|
|
+ text = winnerReg53.ReplaceAllString(text,"\n$1:$4 中标金额:$8 万元\n$2:$5 中标金额:$10 万元\n")
|
|
|
|
+ text = winnerReg54.ReplaceAllString(text,"\n$1:$2 中标金额:$4\n")
|
|
|
|
|
|
text = clearSpace1.ReplaceAllString(text, "") //清理(1) 单位名称:成都维诺信科技有限公司-->单位名称:成都维诺信科技有限公司
|
|
text = clearSpace1.ReplaceAllString(text, "") //清理(1) 单位名称:成都维诺信科技有限公司-->单位名称:成都维诺信科技有限公司
|
|
if strings.TrimSpace(text) == "" {
|
|
if strings.TrimSpace(text) == "" {
|