Pārlūkot izejas kodu

Merge branch 'dev3.4' of http://192.168.3.207:10080/qmx/jy-data-extract into dev3.4

maxiaoshan 5 gadi atpakaļ
vecāks
revīzija
73757d852e

+ 1 - 1
src/jy/clear/cutspace.go

@@ -107,7 +107,7 @@ func ClearEndSymblo(data []interface{}) []interface{} {
 //清理符号
 func CutSymbol(data []interface{}) []interface{} {
 	value := fmt.Sprint(CutSpace(data)[0])
-	symbol := ",,;;::'\"“”。.\\??、/+=\\_—*&……\\^%$¥@!!`~·"
+	symbol := ",,;;::'\"“”。.\\??、/+=\\_—\\-*&……\\^%$¥@!!`~·"
 	startSymbol := "^[" + ")\\)>》】\\]}}〕" + symbol + "]+"
 	endSymbol := "[" + "(\\(<《【\\[{{〔" + symbol + "]+$"
 	startReg := regexp.MustCompile(startSymbol)

+ 8 - 6
src/jy/extract/score_jsondata.go

@@ -146,9 +146,6 @@ func JsonDataMergeProcessing(j *util.Job, e *ExtractTask) map[string][]*util.Ext
 					extFields = append(extFields, &util.ExtField{Code: "JsonData_" + v + "_" + fmt.Sprint(jdextweight), Field: v, ExtFrom: "JsonData_" + v + "_" + fmt.Sprint(jdextweight), SourceValue: (*j.Jsondata)[v], Value: newNum[0], Score: oneScore, IsTrue: newNum[len(newNum)-1].(bool)})
 				}
 				j.Result[v] = append(j.Result[v], extFields...)
-				//AddExtLog("extract", j.SourceMid, nil, newNum[0], &RegLuaInfo{ "JsonData_"+v, "", v, "", false, nil, nil}, e.TaskInfo) //抽取日志
-				//AddExtLog("clear", j.SourceMid, (*j.Jsondata)[v], newNum[0], &RegLuaInfo{ "JsonData_"+v, "", v, "", false, nil, nil}, e.TaskInfo) //抽取日志
-				//}
 				continue
 			}
 
@@ -163,9 +160,14 @@ func JsonDataMergeProcessing(j *util.Job, e *ExtractTask) map[string][]*util.Ext
 				if jdextweight == 2 {
 					oneScore += 2
 				}
-				tmp = append(tmp, &util.ExtField{Code: "JsonData_" + v + "_" + fmt.Sprint(jdextweight), Field: v, ExtFrom: "JsonData_" + v + "_" + fmt.Sprint(jdextweight), SourceValue: (*j.Jsondata)[v], Value: strings.Trim(util2.ObjToString((*j.Jsondata)[v]), " "), Score: oneScore, ScoreItem: []*util.ScoreItem{}})
-				//AddExtLog("extract", j.SourceMid, j.Result[v], (*j.Jsondata)[v], &RegLuaInfo{ "JsonData_"+v, "", v, "", false, nil, nil}, e.TaskInfo) //抽取日志
-				//AddExtLog("clear", j.SourceMid, j.Result[v], (*j.Jsondata)[v], &RegLuaInfo{ "JsonData_"+v, "", v, "", false, nil, nil}, e.TaskInfo) //抽取日志
+				tmp = append(tmp, &util.ExtField{Code: "JsonData_" + v + "_" + fmt.Sprint(jdextweight), Field: v, ExtFrom: "JsonData_" + v + "_" + fmt.Sprint(jdextweight), SourceValue: (*j.Jsondata)[v], Value: strings.Trim(util2.ObjToString((*j.Jsondata)[v]), " "), Score: oneScore, ScoreItem: []*util.ScoreItem{&util.ScoreItem{
+					Des:       "jsondata初始化,取抽取分第一个",
+					Code:      "init_jsondata",
+					RuleText:  "init_jsondata",
+					ScoreFrom: "j.Result[0]",
+					Value:     strings.TrimSpace(util2.ObjToString((*j.Jsondata)[v])),
+					Score:     oneScore,
+				}}})
 				tmps[v] = tmp
 			}
 		}

+ 1 - 1
src/jy/pretreated/analytable.go

@@ -123,7 +123,7 @@ var (
 	jsonReg                     = regexp.MustCompile(`\{.+:[^}]*\} `) //  \{".*\":\".+\"}
 	regHz                       = regexp.MustCompile("[\u4e00-\u9fa5]")
 	winnerOrderAndBidResult     = regexp.MustCompile("((中标)?候选人|(中标|评标)结果)")
-	WinnerOrderStr              = regexp.MustCompile(`(集团|公司|学校|中心|家具城|门诊|\[大中小\]学|部|院|局|厂|店|所|队|社|室|厅|段|会|场|行)$`)
+	WinnerOrderStr              = regexp.MustCompile(`(集团|公司|学校|中心|家具城|门诊|[大中小]+学|部|院|局|厂|店|所|队|社|室|厅|段|会|场|行)$`)
 	DoubtReg                    = regexp.MustCompile("(我中心|有(疑问|质疑|异议|意见)|(书面)?提出|不再受理|投诉|质疑|书面形式|监督|公示期(限)?)")
 )