|
@@ -108,29 +108,22 @@ func ScoreFields(j *ju.Job) map[string][]*ju.ExtField {
|
|
|
//qz := TagConfig["其他"][field]
|
|
|
//tmps[tmpsindex].Score += 2 * qz //乘以权重系数
|
|
|
}
|
|
|
- if tmpsvalue.ExtFrom != "title" { //非标题抽取
|
|
|
- //是否有kv值
|
|
|
- if strings.Contains(tmpsvalue.Type, "colon") {
|
|
|
- tmps[tmpsindex].Score += qu.Float64All(SoreConfig["extractype"]["colon"])
|
|
|
- tmps[tmpsindex].ScoreItem = append(tmps[tmpsindex].ScoreItem, &ju.ScoreItem{Des: "colonkv", Code: "fieldscore.colon", RuleText: qu.ObjToString(SoreConfig["extractype"]["describe"]), Type: "colonkv", ExtFrom: "fieldscore.json", Value: tmpsvalue.Value, Score: qu.Float64All(SoreConfig["extractype"]["colon"])})
|
|
|
- } else if strings.Contains(tmpsvalue.Type, "space") {
|
|
|
- tmps[tmpsindex].Score += qu.Float64All(SoreConfig["extractype"]["space"])
|
|
|
- tmps[tmpsindex].ScoreItem = append(tmps[tmpsindex].ScoreItem, &ju.ScoreItem{Des: "spacekv", Code: "fieldscore.space", RuleText: qu.ObjToString(SoreConfig["extractype"]["describe"]), Type: "spacekv", ExtFrom: "fieldscore.json", Value: tmpsvalue.Value, Score: qu.Float64All(SoreConfig["extractype"]["space"])})
|
|
|
- } else if strings.Contains(tmpsvalue.Type, "table") {
|
|
|
- tmps[tmpsindex].Score += qu.Float64All(SoreConfig["extractype"]["table"])
|
|
|
- tmps[tmpsindex].ScoreItem = append(tmps[tmpsindex].ScoreItem, &ju.ScoreItem{Des: "tablekv", Code: "fieldscore.table", RuleText: qu.ObjToString(SoreConfig["extractype"]["describe"]), Type: "tablekv", ExtFrom: "fieldscore.json", Value: tmpsvalue.Value, Score: qu.Float64All(SoreConfig["extractype"]["table"])})
|
|
|
- }
|
|
|
+ //是否有kv值
|
|
|
+ if strings.Contains(tmpsvalue.Type, "colon") {
|
|
|
+ tmps[tmpsindex].Score += qu.Float64All(SoreConfig["extractype"]["colon"])
|
|
|
+ tmps[tmpsindex].ScoreItem = append(tmps[tmpsindex].ScoreItem, &ju.ScoreItem{Des: "colonkv", Code: "fieldscore.colon", RuleText: qu.ObjToString(SoreConfig["extractype"]["describe"]), Type: "colonkv", ExtFrom: "fieldscore.json", Value: tmpsvalue.Value, Score: qu.Float64All(SoreConfig["extractype"]["colon"])})
|
|
|
+ } else if strings.Contains(tmpsvalue.Type, "space") {
|
|
|
+ tmps[tmpsindex].Score += qu.Float64All(SoreConfig["extractype"]["space"])
|
|
|
+ tmps[tmpsindex].ScoreItem = append(tmps[tmpsindex].ScoreItem, &ju.ScoreItem{Des: "spacekv", Code: "fieldscore.space", RuleText: qu.ObjToString(SoreConfig["extractype"]["describe"]), Type: "spacekv", ExtFrom: "fieldscore.json", Value: tmpsvalue.Value, Score: qu.Float64All(SoreConfig["extractype"]["space"])})
|
|
|
+ } else if strings.Contains(tmpsvalue.Type, "table") {
|
|
|
+ tmps[tmpsindex].Score += qu.Float64All(SoreConfig["extractype"]["table"])
|
|
|
+ tmps[tmpsindex].ScoreItem = append(tmps[tmpsindex].ScoreItem, &ju.ScoreItem{Des: "tablekv", Code: "fieldscore.table", RuleText: qu.ObjToString(SoreConfig["extractype"]["describe"]), Type: "tablekv", ExtFrom: "fieldscore.json", Value: tmpsvalue.Value, Score: qu.Float64All(SoreConfig["extractype"]["table"])})
|
|
|
}
|
|
|
if tmpsvalue.ExtFrom != "title" { //非标题抽取
|
|
|
if strings.Contains(tmpsvalue.Type, "regexp") {
|
|
|
tmps[tmpsindex].Score += qu.Float64All(SoreConfig["extractype"]["regexp"])
|
|
|
tmps[tmpsindex].ScoreItem = append(tmps[tmpsindex].ScoreItem, &ju.ScoreItem{Des: "regexp", Code: "fieldscore.regexp", RuleText: qu.ObjToString(SoreConfig["extractype"]["describe"]), Type: "regexp", ExtFrom: "fieldscore.json", Value: tmpsvalue.Value, Score: qu.Float64All(SoreConfig["extractype"]["regexp"])})
|
|
|
}
|
|
|
- } else {
|
|
|
- if strings.Contains(tmpsvalue.Type, "regexp") {
|
|
|
- tmps[tmpsindex].Score += qu.Float64All(SoreConfig["extractype"]["regexp"]) + 1
|
|
|
- tmps[tmpsindex].ScoreItem = append(tmps[tmpsindex].ScoreItem, &ju.ScoreItem{Des: "regexp", Code: "fieldscore.regexp", RuleText: qu.ObjToString(SoreConfig["extractype"]["describe"]), Type: "regexp", ExtFrom: "fieldscore.json", Value: tmpsvalue.Value, Score: qu.Float64All(SoreConfig["extractype"]["regexp"]) + 1})
|
|
|
- }
|
|
|
}
|
|
|
scoreRule := SoreConfig[field]
|
|
|
if scoreRule == nil {
|