12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019 |
- package main
- import (
- "encoding/json"
- "field_sync/config"
- "field_sync/oss"
- "fmt"
- "net"
- "reflect"
- "regexp"
- "sort"
- "strconv"
- "strings"
- "time"
- "log"
- "go.mongodb.org/mongo-driver/bson"
- util "jygit.jydev.jianyu360.cn/data_processing/common_utils"
- "jygit.jydev.jianyu360.cn/data_processing/common_utils/mongodb"
- "jygit.jydev.jianyu360.cn/data_processing/common_utils/redis"
- "jygit.jydev.jianyu360.cn/data_processing/common_utils/udp"
- )
// regLetter matches runs of lowercase ASCII letters (including the empty
// run); fieldFun uses it to strip letters from topscopeclass entries.
var regLetter = regexp.MustCompile("[a-z]*")

// cityEndReg matches a trailing 区, 县 or 市 character.
var cityEndReg = regexp.MustCompile("(区|县|市)$")
// biddingTask handles one sync task: it loads the bidding documents selected
// by mapInfo, merges extract data into them through doIndex, notifies the
// downstream nodes and records the processed id range.
//
// mapInfo keys read here: "stype", "query", "bkey", "gtid" and "lteid". When
// "query" is absent the id range (gtid, lteid] is used; "gtid" and "lteid"
// must then be strings because the type assertions are unchecked.
// NOTE(review): a failed assertion panics; presumably util.Catch recovers it — confirm.
// The data parameter is not used in this function.
- func biddingTask(data []byte, mapInfo map[string]interface{}) {
- defer util.Catch()
- stype := util.ObjToString(mapInfo["stype"])
- q, _ := mapInfo["query"].(map[string]interface{})
- bkey, _ := mapInfo["bkey"].(string)
// No explicit query supplied: fall back to the _id range gtid < _id <= lteid.
- if q == nil {
- q = map[string]interface{}{
- "_id": map[string]interface{}{
- "$gt": mongodb.StringTOBsonId(mapInfo["gtid"].(string)),
- "$lte": mongodb.StringTOBsonId(mapInfo["lteid"].(string)),
- },
- }
- }
- // extract database (disabled: doIndex now looks up each extract record by id)
- // extractConn := MgoE.GetMgoConn()
- // defer MgoE.DestoryMongoConn(extractConn)
- // extractResult := extractConn.DB(MgoE.DbName).C(config.Conf.DB.MongoE.Coll).Find(q).Select(map[string]interface{}{
- // "field_source": 0,
- // "kvtext": 0,
- // }).Sort("_id").Iter()
- // eMap := map[string]map[string]interface{}{}
- // extCount, repeatCount := 0, 0
- // for tmp := make(map[string]interface{}); extractResult.Next(tmp); extCount++ {
- // if util.IntAll(tmp["repeat"]) == 1 {
- // repeatCount++
- // }
- // tid := mongodb.BsonIdToSId(tmp["_id"])
- // eMap[tid] = tmp
- // tmp = make(map[string]interface{})
- // }
- // log.Println("抽取表 数据量", extCount, "重复数据量", repeatCount)
- // bidding database
- biddingConn := MgoB.GetMgoConn()
// The Count error is discarded; count is only used for logging.
- count, _ := biddingConn.DB(MgoB.DbName).C(config.Conf.DB.MongoB.Coll).Find(&q).Count()
- log.Println("bidding表 同步总数:", count)
- c := 0
- // if count < 500000 {
// Load every matching document (without contenthtml) into memory so the
// connection can be released before doIndex runs.
- var res []map[string]interface{}
- result := biddingConn.DB(MgoB.DbName).C(config.Conf.DB.MongoB.Coll).Find(q).Select(map[string]interface{}{
- "contenthtml": 0,
- }).Iter()
- for tmp := make(map[string]interface{}); result.Next(tmp); {
- res = append(res, tmp)
- tmp = make(map[string]interface{})
- }
- MgoB.DestoryMongoConn(biddingConn)
- // log.Println("查询结果 bidding", count, "抽取:", extCount)
- c = doIndex(res, bkey, stype)
- // } else {
- // log.Println("查询结果 数据量太大,放弃", count)
- // MgoB.DestoryMongoConn(biddingConn)
- // }
- log.Println("bidding sync...over all", count, "extract sync ", c)
// Hand the task over to the downstream nodes.
- NextNode(mapInfo, stype)
- // NextNodePro(mapInfo, stype)
- NextNodeTidb(mapInfo, stype)
- if stype == "bidding_history" {
- NextNodeBidData(mapInfo) // bidding-data records
- NextNodeTidbQyxy(mapInfo) // tidb enterprise data
- NextNodeHn(mapInfo)
- }
// For incremental tasks, mark the covering rows in bidding_processing_ids
// with dataprocess=7 and the current time.
- if stype == "bidding" {
- uq := map[string]interface{}{
- "gtid": map[string]interface{}{
- "$gte": util.ObjToString(mapInfo["gtid"]),
- },
- "lteid": map[string]interface{}{
- "$lte": util.ObjToString(mapInfo["lteid"]),
- },
- }
- MgoB.Update("bidding_processing_ids", uq, bson.M{"$set": bson.M{"dataprocess": 7, "updatetime": time.Now().Unix()}}, false, true)
- }
- // record the id range whose data goes through domain-tag processing
- if stype == "bidding_history" {
- MgoB.Save("field_data_record", map[string]interface{}{"gtid": mapInfo["gtid"], "lteid": mapInfo["lteid"], "status": 0})
- }
- }
// biddingAllTask walks the bidding and extract collections side by side for
// the selected documents and queues per-document updates on updateBidPool
// (bidding collection) and updateExtPool (extract collection).
//
// The selection is mapInfo["query"] when present, otherwise the id range
// (gtid, lteid] built from mapInfo["gtid"] and mapInfo["lteid"], which must
// then be strings (unchecked assertions). The data parameter is not used.
- func biddingAllTask(data []byte, mapInfo map[string]interface{}) {
- defer util.Catch()
- q, _ := mapInfo["query"].(map[string]interface{})
- if q == nil {
- q = map[string]interface{}{
- "_id": map[string]interface{}{
- "$gt": mongodb.StringTOBsonId(mapInfo["gtid"].(string)),
- "$lte": mongodb.StringTOBsonId(mapInfo["lteid"].(string)),
- },
- }
- }
- // extract database: cursor sorted by _id descending
- extractConn := MgoE.GetMgoConn()
- defer MgoE.DestoryMongoConn(extractConn)
- extractResult := extractConn.DB(MgoE.DbName).C(config.Conf.DB.MongoE.Coll).Find(q).Select(map[string]interface{}{
- "field_source": 0,
- "kvtext": 0,
- }).Sort("-_id").Iter()
- // bidding database: cursor sorted by _id descending
- biddingConn := MgoB.GetMgoConn()
- defer MgoB.DestoryMongoConn(biddingConn)
- count := 0
// compare holds the extract record currently being matched; nil means the
// next extract record still has to be fetched.
- var compare map[string]interface{}
- result := biddingConn.DB(MgoB.DbName).C(config.Conf.DB.MongoB.Coll).Find(q).Select(map[string]interface{}{
- "contenthtml": 0,
- "field_source": 0,
- }).Sort("-_id").Iter()
- for tmp := make(map[string]interface{}); result.Next(tmp); count++ {
- update := map[string]interface{}{}
- del := map[string]interface{}{} // fields that have a value in bidding but none in extract
- // ---- comparison start ----
// NOTE(review): both cursors are sorted descending, yet the loop below
// advances the extract cursor when cid < tid and stops when cid > tid, which
// reads like ascending-order merge logic — confirm the intended direction.
- for {
- if compare == nil {
- compare = make(map[string]interface{})
// When the extract cursor is exhausted, compare stays an empty non-nil map.
- if !extractResult.Next(compare) {
- break
- }
- }
- if compare != nil {
- cid := mongodb.BsonIdToSId(compare["_id"])
- tid := mongodb.BsonIdToSId(tmp["_id"])
- if cid == tid {
- // update the bidding document; fields listed in its modifyinfo are not overwritten
- modifyinfo := make(map[string]bool)
- if tmpmodifyinfo, ok := tmp["modifyinfo"].(map[string]interface{}); ok && tmpmodifyinfo != nil {
- for k := range tmpmodifyinfo {
- modifyinfo[k] = true
- }
- }
// Per configured field: copy the extract value when present (unless the
// field is protected by modifyinfo); unset it when only bidding has a value.
- for _, k := range config.Conf.Serve.FieldS {
- v1 := compare[k] //extract
- v2 := tmp[k] //bidding
- if v2 == nil && v1 != nil {
- update[k] = v1
- } else if v2 != nil && v1 != nil && !modifyinfo[k] {
- update[k] = v1
- } else if v2 != nil && v1 == nil && !modifyinfo[k] {
// s_subscopeclass / s_topscopeclass are only unset when their source field
// was already marked for unset earlier in this loop.
- if k == "s_subscopeclass" && del["subscopeclass"] == nil {
- continue
- } else if k == "s_topscopeclass" && del["topscopeclass"] == nil {
- continue
- }
- del[k] = 1
- //util.Debug("抽取结果没有值,bidding有值:field--", k, del)
- }
- }
// repeat == 1 marks the extract record as a duplicate.
- if util.IntAll(compare["repeat"]) == 1 {
- update["extracttype"] = -1
- update["dataprocess"] = 7
- if compare["repeat_id"] != nil {
- update["repeat_id"] = compare["repeat_id"]
- }
- } else {
- update["extracttype"] = 1
- update["dataprocess"] = 8
- }
- break
- } else {
- if cid < tid {
- compare = nil
- continue
- } else {
- break
- }
- }
- } else {
- break
- }
- }
- // ---- comparison end ----
- // classification handling
// NOTE(review): compare is non-nil here even when the ids did not match or
// the extract cursor was exhausted, so fieldFun also runs in those cases and
// the record is then discarded — confirm this is intended.
- if compare != nil { //extract
- fieldFun(compare, update)
- compare = nil
- }
- // entidlist
- extractMap := make(map[string]interface{})
// This comparison is also true when s_winner is absent (nil != "").
- if update["s_winner"] != "" {
- cid := companyFun(update)
- if len(cid) > 0 {
- update["entidlist"] = cid
- extractMap["entidlist"] = cid
- }
- }
- if len(extractMap) > 0 {
- updateExtPool <- []map[string]interface{}{
- {"_id": tmp["_id"]},
- {"$set": extractMap},
- }
- }
- // attachment validity field
- if i := validFile(tmp); i != 0 {
- if i == -1 {
- update["isValidFile"] = false
- } else {
- update["isValidFile"] = true
- }
- }
- if len(update) > 0 {
- if len(del) > 0 { // there are fields to unset
- updateBidPool <- []map[string]interface{}{{
- "_id": tmp["_id"],
- },
- {"$set": update, "$unset": del},
- }
- } else {
- updateBidPool <- []map[string]interface{}{{
- "_id": tmp["_id"],
- },
- {"$set": update},
- }
- }
- }
- if count%50000 == 0 {
- log.Println("biddingTask current", count)
- }
// Fresh map so the queued update does not share state with the next document.
- tmp = make(map[string]interface{})
- }
- log.Println("biddingAll sync...over all", count)
- }
- func doIndex(infos []map[string]interface{}, bkey, stype string) int {
- syncNo := 0 //抽取表数据同步数量
- //对比两张表数据,减少查询次数
- var compare map[string]interface{}
- var bidUpdate [][]map[string]interface{}
- var extUpdate [][]map[string]interface{}
- //SaveEsLock := &sync.Mutex{}
- ygsiteArr := []map[string]interface{}{}
- sitedata, _ := MgoE.Find("bidding_yg_site", map[string]interface{}{}, nil, nil, false, -1, -1)
- if sitedata != nil && len(*sitedata) > 0 {
- ygsiteArr = *sitedata
- }
- log.Println("start ...")
- for n, tmp := range infos {
- tid := mongodb.BsonIdToSId(tmp["_id"])
- update := map[string]interface{}{} //要更新的mongo数据
- del := map[string]interface{}{}
- edata, _ := MgoE.FindById(config.Conf.DB.MongoE.Coll, tid, nil)
- //对比方法----------------
- if edata != nil && len(*edata) > 0 {
- compare = *edata
- if stype == "bidding" {
- // 增量id段 正常数据
- if dg := util.IntAll(compare["dataging"]); dg == 1 { //extract中dataging=1跳过
- tmp = make(map[string]interface{})
- compare = nil
- continue
- }
- // delete(eMap, tid)
- }
- if stype == "bidding_history" {
- //增量id段 历史数据
- if compare["history_updatetime"] == nil { //extract中history_updatetime不存在跳过
- tmp = make(map[string]interface{})
- compare = nil
- continue
- }
- // delete(eMap, tid)
- }
- syncNo++
- log.Println("抽取区域 省", compare["area"], " 市 ", compare["city"], " 区 ", compare["district"], " id ", tid)
- modifyinfo := make(map[string]bool)
- if tmp["modifyinfo"] != nil {
- if tmpmodifyinfo, ok := tmp["modifyinfo"].(map[string]interface{}); ok {
- for k := range tmpmodifyinfo {
- modifyinfo[k] = true
- }
- }
- }
- for _, k := range config.Conf.Serve.FieldS {
- v1 := compare[k] //extract
- v2 := tmp[k] //bidding
- if v2 == nil && v1 != nil {
- update[k] = v1
- } else if v2 != nil && v1 != nil && !modifyinfo[k] {
- update[k] = v1
- } else if v2 != nil && v1 == nil && !modifyinfo[k] {
- if k == "s_subscopeclass" && del["subscopeclass"] == nil {
- continue
- } else if k == "s_topscopeclass" && del["topscopeclass"] == nil {
- continue
- } else if k == "city" || k == "district" {
- update[k] = ""
- } else {
- del[k] = 1
- }
- }
- }
- // 附件重采,数据同步时不更新判重标识
- if util.IntAll(compare["repeat"]) == 1 {
- update["extracttype"] = -1
- update["dataprocess"] = 7
- if compare["repeat_id"] != nil {
- update["repeat_id"] = compare["repeat_id"]
- }
- } else {
- update["extracttype"] = 1
- update["dataprocess"] = 8
- }
- } else {
- compare = nil
- if util.IntAll(tmp["dataging"]) == 1 { //修改未抽取的bidding数据的dataging
- update["dataging"] = 0
- }
- update["dataprocess"] = 8
- }
- //下面可以多线程跑的--->
- //处理分类
- if compare != nil { //extract
- fieldFun(compare, update)
- // publishtime 20230523
- if util.IntAll(tmp["publishtime"]) == -1 {
- if pb := methodPb(compare); pb > 0 {
- update["publishtime"] = pb
- }
- }
- compare = nil
- }
- //------------------对比结束
- //处理key descript
- if bkey == "" {
- DealInfo(&tmp, &update)
- }
- // entidlist
- extractMap := make(map[string]interface{})
- if update["s_winner"] != "" {
- cid := companyFun(update)
- if len(cid) > 0 {
- tmp["entidlist"] = cid
- update["entidlist"] = cid
- extractMap["entidlist"] = cid
- }
- }
- //阳光采购
- spidercode := util.ObjToString(tmp["spidercode"])
- site := util.ObjToString(tmp["site"])
- infoAttribute := util.ObjToString(tmp["infoattribute"])
- if infoAttribute != "" {
- update["public_type"] = "用户发布"
- update["extracttype"] = -1
- MgoE.Save("bidding_yg", map[string]interface{}{"id": tid, "source": "user"})
- } else {
- for _, v := range ygsiteArr {
- spidercodes := util.ObjToString(v["spidercode"])
- sites := util.ObjToString(v["site"])
- datatype := util.ObjToString(v["datatype"])
- if datatype == "1" && spidercodes == spidercode {
- update["infoattribute"] = "zc_cgxx"
- update["public_type"] = "平台发布"
- MgoE.Save("bidding_yg", map[string]interface{}{"id": tid, "source": "spidercode"})
- } else if datatype == "2" && site == sites {
- update["infoattribute"] = "zc_cgxx"
- update["public_type"] = "平台发布"
- MgoE.Save("bidding_yg", map[string]interface{}{"id": tid, "source": "site"})
- }
- }
- }
- // 6.10 剑鱼发布信息分类处理, 写在这里是为了修改抽取表
- typeFunc(tmp, update, extractMap)
- if len(extractMap) > 0 {
- if extractMap["toptype"] != nil && extractMap["subtype"] == nil {
- extUpdate = append(extUpdate, []map[string]interface{}{
- {"_id": tmp["_id"]},
- {"$set": extractMap, "$unset": map[string]interface{}{"subtype": ""}},
- })
- } else {
- extUpdate = append(extUpdate, []map[string]interface{}{
- {"_id": tmp["_id"]},
- {"$set": extractMap},
- })
- }
- if len(extUpdate) >= MgoBulkSize {
- tmps := extUpdate
- MgoE.UpdateBulk(config.Conf.DB.MongoE.Coll, tmps...)
- extUpdate = [][]map[string]interface{}{}
- }
- }
- // 附件有效字段
- if i := validFile(tmp); i != 0 {
- if i == -1 {
- tmp["isValidFile"] = false
- update["isValidFile"] = false
- } else {
- tmp["isValidFile"] = true
- update["isValidFile"] = true
- }
- }
- // 2024-02-21 徐志恒 情报标签字段
- toptype := util.ObjToString(tmp["toptype"])
- subtype := util.ObjToString(tmp["subtype"])
- buyerclass := util.ObjToString(update["buyerclass"])
- if buyerclass != "" {
- update["buyer_type"] = getStr(buyerclass)
- }
- s_topscopeclass := util.ObjToString(update["s_topscopeclass"])
- if (tmp["tag_topinformation"] != nil && (subtype == "合同" || subtype == "中标" || subtype == "成交" || subtype == "采购意向" || toptype == "招标")) || (tmp["tag_topinformation"] == nil && toptype == "拟建" && strings.Contains(s_topscopeclass, "建筑工程")) {
- update["tag_set"] = getTagSet(tmp, compare)
- }
- if len(update) > 0 {
- log.Println("保存bidding区域 省", update["area"], " 市 ", update["city"], " 区 ", update["district"], " buyerclass ", update["buyerclass"], update["buyer_type"], " id ", tid)
- if len(del) > 0 {
- bidUpdate = append(bidUpdate, []map[string]interface{}{{
- "_id": tmp["_id"],
- },
- {"$set": update, "$unset": del},
- })
- } else {
- bidUpdate = append(bidUpdate, []map[string]interface{}{{
- "_id": tmp["_id"],
- },
- {"$set": update},
- })
- }
- if len(bidUpdate) >= MgoBulkSize {
- tmps := bidUpdate
- MgoB.UpdateBulk(config.Conf.DB.MongoB.Coll, tmps...)
- bidUpdate = [][]map[string]interface{}{}
- }
- }
- if n%500 == 0 {
- log.Println("biddingTask current ", n)
- }
- tmp = make(map[string]interface{})
- }
- //SaveEsLock.Lock()
- if len(bidUpdate) > 0 {
- tmps := bidUpdate
- MgoB.UpdateBulk(config.Conf.DB.MongoB.Coll, tmps...)
- bidUpdate = [][]map[string]interface{}{}
- }
- if len(extUpdate) > 0 {
- tmps := extUpdate
- MgoE.UpdateBulk(config.Conf.DB.MongoE.Coll, tmps...)
- extUpdate = [][]map[string]interface{}{}
- }
- //SaveEsLock.Unlock()
- return syncNo
- }
- // @Description subscopeclass、topscopeclass、package
- // 20230523 多包处理 subpackage = 1
- // @Author J 2022/6/7 5:54 PM
- func fieldFun(compare, update map[string]interface{}) {
- subscopeclass, _ := compare["subscopeclass"].([]interface{}) //subscopeclass
- if subscopeclass != nil {
- m1 := map[string]bool{}
- newclass := []string{}
- for _, sc := range subscopeclass {
- sclass, _ := sc.(string)
- if !m1[sclass] {
- m1[sclass] = true
- newclass = append(newclass, sclass)
- }
- }
- update["s_subscopeclass"] = strings.Join(newclass, ",")
- update["subscopeclass"] = newclass
- }
- topscopeclass, _ := compare["topscopeclass"].([]interface{}) //topscopeclass
- if topscopeclass != nil {
- m2 := map[string]bool{}
- newclass := []string{}
- for _, tc := range topscopeclass {
- tclass, _ := tc.(string)
- tclass = regLetter.ReplaceAllString(tclass, "") // 去除字母
- if !m2[tclass] {
- m2[tclass] = true
- newclass = append(newclass, tclass)
- }
- }
- update["topscopeclass"] = topscopeclass
- update["s_topscopeclass"] = strings.Join(newclass, ",")
- }
- if package1 := compare["package"]; package1 != nil {
- packageM, _ := package1.(map[string]interface{})
- update["package"] = packageM
- for _, p := range packageM {
- pm, _ := p.(map[string]interface{})
- if util.ObjToString(pm["winner"]) != "" || util.Float64All(pm["budget"]) > 0 ||
- util.Float64All(pm["bidamount"]) > 0 {
- update["multipackage"] = 1
- break
- }
- }
- } else {
- update["multipackage"] = 0
- }
- // subpackage
- if compare["package"] != nil && compare["s_winner"] != nil && compare["bidamount"] != nil {
- pg := compare["package"].(map[string]interface{})
- if len(pg) > 1 {
- var bmt []float64
- var swn []string
- for _, p := range pg {
- p1 := p.(map[string]interface{})
- if p1["bidamount"] != nil {
- bmt = append(bmt, util.Float64All(p1["bidamount"]))
- }
- if w := util.ObjToString(p1["winner"]); w != "" {
- swn = append(swn)
- }
- }
- if len(bmt) > 1 && len(swn) > 1 {
- sn := strings.Split(util.ObjToString(compare["s_winner"]), ",")
- sort.Strings(sn)
- sort.Strings(swn)
- swn1 := util.ObjArrToStringArr(Duplicate(swn)) // 去重
- if strings.Join(swn1, ",") == strings.Join(sn, ",") {
- bidamount := 0.0
- for _, f := range bmt {
- bidamount += f
- }
- if bidamount == util.Float64All(compare["bidamount"]) {
- update["subpackage"] = 1
- }
- }
- }
- }
- }
- }
- // @Description entidlist
- // @Author J 2022/6/7 2:36 PM
- func companyFun(tmp map[string]interface{}) (cid []string) {
- sWinnerarr := strings.Split(util.ObjToString(tmp["s_winner"]), ",")
- for _, w := range sWinnerarr {
- if w != "" {
- id := redis.GetStr("qyxy_id", w)
- if id == "" {
- ents, _ := MgoQ.Find(config.Conf.DB.MongoQ.Coll, map[string]interface{}{"company_name": w}, map[string]interface{}{"updatetime": -1}, map[string]interface{}{"company_name": 1}, false, -1, -1)
- if len(*ents) > 0 {
- id = util.ObjToString((*ents)[0]["_id"])
- redis.PutCKV("qyxy_id", w, id)
- } else {
- ent, _ := MgoP.FindOne(config.Conf.DB.MongoP.Coll, map[string]interface{}{"history_name": w})
- if len(*ent) > 0 {
- id = util.ObjToString((*ent)["company_id"])
- redis.PutCKV("qyxy_id", w, id)
- }
- }
- }
- if id == "" {
- id = "-"
- }
- cid = append(cid, id)
- }
- }
- return cid
- }
- // @Description update 修改bidding表,extractM修改抽取表
- // @Author J 2022/6/10 10:29 AM
- func typeFunc(tmp, update, extractM map[string]interface{}) {
- if jyData, ok := tmp["jyfb_data"].(map[string]interface{}); ok {
- if t := util.ObjToString(jyData["type"]); t != "" {
- switch t {
- //case "采购信息":
- case "招标公告":
- if util.ObjToString(tmp["toptype"]) != "招标" {
- update["toptype"] = "招标"
- extractM["toptype"] = "招标"
- delete(update, "subtype")
- }
- case "采购意向":
- if util.ObjToString(tmp["toptype"]) != "采购意向" {
- update["toptype"] = "采购意向"
- update["subtype"] = "采购意向"
- extractM["toptype"] = "采购意向"
- extractM["subtype"] = "采购意向"
- }
- case "招标预告":
- if util.ObjToString(tmp["toptype"]) != "预告" {
- update["toptype"] = "预告"
- extractM["toptype"] = "预告"
- delete(update, "subtype")
- }
- case "招标结果":
- if util.ObjToString(tmp["toptype"]) != "结果" {
- update["toptype"] = "结果"
- extractM["toptype"] = "结果"
- delete(update, "subtype")
- }
- }
- }
- }
- }
- // @Description attachment validity field (isValidFile)
- // @Author J 2022/7/8 14:41
// validFile inspects tmp["projectinfo"]["attachments"] and tmp["attach_text"]
// and returns 1 when a usable attachment was found, -1 when attachments with
// a fid exist but none is usable, and 0 when no decision can be made (no
// attachments map, or no attachment carries a fid). Callers in this file map
// 1 to isValidFile=true and -1 to isValidFile=false.
// NOTE(review): the map type assertions on att, at and at1[k] are unchecked,
// and reflect.TypeOf returns nil for a nil value — confirm the stored data
// can never trigger a panic here.
- func validFile(tmp map[string]interface{}) int {
- isContinue := false
- if pinfo, o := tmp["projectinfo"].(map[string]interface{}); o {
- if atts, o1 := pinfo["attachments"].(map[string]interface{}); o1 {
// First pass: is there at least one attachment with a non-empty fid?
- for _, att := range atts {
- if att == nil {
- continue
- }
- if reflect.TypeOf(att).String() == "string" {
- continue
- }
- att1 := att.(map[string]interface{})
- if fid := util.ObjToString(att1["fid"]); fid != "" {
- isContinue = true
- break
- }
- }
- if isContinue {
// Check the recognised attachment text. Both branches below end with break,
// so only one entry of attach_text is ever examined.
- if attachTxt, o := tmp["attach_text"].(map[string]interface{}); o {
- if len(attachTxt) > 0 {
- for _, at := range attachTxt {
- at1 := at.(map[string]interface{})
- if len(at1) > 0 {
- for k, _ := range at1 {
- if reflect.TypeOf(at1[k]).String() == "string" {
- continue
- }
- at2 := at1[k].(map[string]interface{})
- s := strings.ToLower(util.ObjToString(at2["file_name"]))
// NOTE(review): this condition parses as
// !jpg || ((!jpeg) != png) || pdf, which is true for every name that does
// not contain "jpg"; it looks like an image-file exclusion was intended —
// confirm.
- if !strings.Contains(s, "jpg") || !strings.Contains(s, "jpeg") != strings.Contains(s, "png") ||
- strings.Contains(s, "pdf") {
// swf/html file names count as invalid; otherwise the object fetched from
// attach_url is handed to AnalysisFile.
- if strings.Contains(s, "swf") || strings.Contains(s, "html") {
- return -1
- } else if AnalysisFile(oss.OssGetObject(util.ObjToString(at2["attach_url"]))) {
- return 1
- }
- }
- }
- break
- } else {
- break
- }
- }
- }
- }
// Fallback: check whether an attachment's fid exists in the "jy-datafile"
// bucket. ftype is read from tmp, not from the attachment.
- flag := false
- for _, att := range atts {
- if att == nil {
- continue
- }
- if reflect.TypeOf(att).String() == "string" {
- continue
- }
- att1 := att.(map[string]interface{})
- if fid := util.ObjToString(att1["fid"]); fid != "" {
- ftype := strings.ToLower(util.ObjToString(tmp["ftype"]))
- if ftype != "swf" && ftype != "html" && oss.OssObjExists("jy-datafile", fid) {
- return 1
- } else {
- flag = true
- }
- }
- }
- if flag {
- return -1
- }
- }
- }
- }
- return 0
- }
- // @Description the id is unchanged but the content changed: re-sync and re-index the document
- // @Author J 2022/8/10 13:29
// taskinfo re-syncs a single bidding document by id: it loads the bidding
// and extract records, copies the configured fields from extract to bidding,
// refreshes the derived fields and finally sends an "index-by-id" message
// over UDP to the configured next node. It returns early (after logging)
// when either record cannot be found.
- func taskinfo(id string) {
- tmp, _ := MgoB.FindById("bidding", id, nil)
- if tmp == nil || len(*tmp) == 0 {
- log.Println(fmt.Sprintf("taskinfo bidding id=%s 未查询到数据", id))
- return
- }
// The extract record is looked up in Coll first and in Coll1 as a fallback.
- extractM, _ := MgoE.FindById(config.Conf.DB.MongoE.Coll, id, nil)
- if extractM == nil || len(*extractM) == 0 {
- extractM, _ = MgoE.FindById(config.Conf.DB.MongoE.Coll1, id, nil)
- if extractM == nil || len(*extractM) == 0 {
- log.Println(fmt.Sprintf("taskinfo extract id=%s 未查询到数据", id))
- return
- }
- }
- update := map[string]interface{}{} // fields to $set on the bidding document
- // copy the configured fields onto the bidding document
// Unlike doIndex, modifyinfo is not consulted here and nothing is unset;
// only city/district are blanked when extract has no value.
- for _, k := range config.Conf.Serve.FieldS {
- v1 := (*extractM)[k] //extract
- v2 := (*tmp)[k] //bidding
- if v2 == nil && v1 != nil {
- update[k] = v1
- } else if v2 != nil && v1 != nil {
- update[k] = v1
- } else if v2 != nil && v1 == nil {
- if k == "city" || k == "district" {
- update[k] = ""
- }
- }
- }
// repeat == 1 marks the extract record as a duplicate.
- if util.IntAll((*extractM)["repeat"]) == 1 {
- update["extracttype"] = -1
- update["dataprocess"] = 7
- if (*extractM)["repeat_id"] != nil {
- update["repeat_id"] = (*extractM)["repeat_id"]
- }
- } else {
- update["extracttype"] = 1
- update["dataprocess"] = 8
- }
- // classification handling
- fieldFun(*extractM, update)
- extractMap := make(map[string]interface{})
// The winner names are read from the stored bidding document, not from update.
- if util.ObjToString((*tmp)["s_winner"]) != "" {
- cid := companyFun(*tmp)
- if len(cid) > 0 {
- update["entidlist"] = cid
- extractMap["entidlist"] = cid
- }
// NOTE(review): this update always targets Coll (even when the record was
// found in Coll1) and is issued even when extractMap is empty — confirm.
- MgoE.UpdateById(config.Conf.DB.MongoE.Coll, id, map[string]interface{}{"$set": extractMap})
- }
- // attachment validity field
- if i := validFile(*tmp); i != 0 {
- if i == -1 {
- update["isValidFile"] = false
- } else {
- update["isValidFile"] = true
- }
- }
- if len(update) > 0 {
- MgoB.UpdateById(config.Conf.DB.MongoB.Coll, id, map[string]interface{}{"$set": update})
- }
// Notify the next node so that it re-indexes this id.
- mapinfo := map[string]interface{}{
- "infoid": id,
- "stype": "index-by-id",
- }
- datas, _ := json.Marshal(mapinfo)
- var next = &net.UDPAddr{
- IP: net.ParseIP(config.Conf.Udp.Next.Addr),
- Port: util.IntAll(config.Conf.Udp.Next.Port),
- }
- log.Println("nsq data over es ", next, " mapinfo ", string(datas))
- _ = UdpClient.WriteUdp(datas, udp.OP_TYPE_DATA, next)
- }
- var DateTimeSelect = []string{"bidopentime", "bidendtime", "signaturedate", "comeintime"}
- // @Description 发布时间处理
- // @Author J 2023/5/23 14:32
- func methodPb(tmp map[string]interface{}) int64 {
- if tmp["ext_publishtime"] != nil {
- if newPb := util.Int64All(tmp["ext_publishtime"]); newPb < time.Now().Unix() && newPb > 1420041600 {
- return newPb
- }
- }
- for _, d := range DateTimeSelect {
- if tmp[d] != nil && util.Int64All(tmp[d]) < time.Now().Unix() {
- return util.Int64All(tmp[d])
- }
- }
- return 0
- }
// Duplicate returns the elements of a with consecutive duplicates collapsed
// into one, compared with reflect.DeepEqual. Only adjacent equal elements are
// merged, so the input must be sorted to obtain a fully de-duplicated result.
//
// a must be a slice, array or string; for any other value (including nil)
// the function returns nil instead of panicking. An empty input yields nil.
//
// @Author J 2023/5/24 09:53
func Duplicate(a interface{}) (ret []interface{}) {
	va := reflect.ValueOf(a)
	switch va.Kind() {
	case reflect.Slice, reflect.Array, reflect.String:
	default:
		// reflect.Value.Len/Index would panic on anything else.
		return nil
	}
	for i := 0; i < va.Len(); i++ {
		cur := va.Index(i).Interface()
		if i > 0 && reflect.DeepEqual(va.Index(i-1).Interface(), cur) {
			continue
		}
		ret = append(ret, cur)
	}
	return ret
}
- // @Description 获取情报标签
- // @Author 徐志恒 2024/2/21 09:53
- func getTagSet(tmp, compare map[string]interface{}) map[string]map[string]interface{} {
- tagSet := map[string]map[string]interface{}{}
- wuye := map[string]interface{}{}
- buyer := util.ObjToString(compare["buyer"])
- publishtime := util.Int64All(tmp["publishtime"])
- bidamount := util.Float64All(compare["bidamount"])
- toptype := util.ObjToString(tmp["toptype"])
- subtype := util.ObjToString(tmp["subtype"])
- if subtype == "合同" {
- wuye["isfirsthand"] = 62
- if buyer != "" {
- sql := `{
- "query": {
- "bool": {
- "must": [
- {
- "term": {
- "buyer": "` + buyer + `"
- }
- },
- {
- "term": {
- "tag_topinformation": "情报_物业"
- }
- },
- {
- "term": {
- "subtype": "合同"
- }
- },
- {
- "range": {
- "publishtime": {
- "lte": ` + fmt.Sprint(publishtime) + `
- }
- }
- }
- ]
- }
- },
- "sort": {
- "publishtime": "asc"
- },
- "_source": [
- "s_winner"
- ],
- "size": 10000
- }`
- data := Es.Get("bidding", "bidding", sql)
- if data != nil && len(*data) > 0 {
- count := 0
- first := util.ObjToString((*data)[0]["s_winner"])
- for k, v := range *data {
- winner := util.ObjToString(v["s_winner"])
- if k > 0 && first != winner {
- first = winner
- count++
- }
- }
- changehand := fmt.Sprintf("%.2f", float64(count)/float64(len(*data)))
- changehands, _ := strconv.ParseFloat(changehand, 64)
- wuye["changehand"] = changehands
- if changehands > 0.3 {
- wuye["changehandindex"] = 61
- }
- if len(*data) > 1 {
- wuye["isfirsthand"] = 0
- }
- }
- }
- wuye["period"] = getperiod(compare)
- } else if toptype == "招标" || toptype == "采购意向" {
- bidamount = util.Float64All(compare["budget"])
- }
- if tmp["projectinfo"] != nil {
- projectInfo := util.ObjToMap(tmp["projectinfo"])
- if projectInfo != nil && len(*projectInfo) > 0 {
- if (*projectInfo)["attachments"] != nil {
- wuye["isfile"] = 63
- }
- }
- }
- wuye["scale"] = getBidamountRange(bidamount)
- if tmp["property_form"] != nil {
- property_form := util.ObjArrToStringArr(tmp["property_form"].([]interface{}))
- wuye["property_form"] = getpropertyform(property_form)
- }
- tagSet["wuye"] = wuye
- return tagSet
- }
// getBidamountRange maps an amount to its scale bucket:
// below 500000 -> 1, below 1000000 -> 2, below 2000000 -> 3,
// below 5000000 -> 4, everything else -> 5.
func getBidamountRange(value float64) int {
	if value < 500000 {
		return 1
	}
	if value < 1000000 {
		return 2
	}
	if value < 2000000 {
		return 3
	}
	if value < 5000000 {
		return 4
	}
	return 5
}
// getpropertyform translates property-form names into their numeric codes
// and joins the codes with commas, keeping the input order. Names without a
// code are dropped; the result is "" when nothing matches.
func getpropertyform(value []string) string {
	codeOf := map[string]string{
		"住宅":    "21",
		"政府办公楼": "22",
		"学校":    "23",
		"医院":    "24",
		"产业园区":  "25",
		"旅游景区":  "26",
		"交通运输":  "27",
		"商务办公楼": "28",
		"酒店":    "29",
	}
	codes := []string{}
	for _, name := range value {
		code, known := codeOf[name]
		if !known {
			continue
		}
		codes = append(codes, code)
	}
	return strings.Join(codes, ",")
}
- func getperiod(data map[string]interface{}) int {
- res := 16
- signaturedate := util.Int64All(data["signaturedate"]) //合同签订日期
- expiredate := util.Int64All(data["expiredate"]) //合同截止日期
- // contractperiod := util.ObjToString(data["contractperiod"]) //合同期限
- project_duration := util.IntAll(data["project_duration"]) //工期时长
- project_timeunit := util.ObjToString(data["project_timeunit"]) //工期单位
- result := float64(0)
- if expiredate > 0 && signaturedate > 0 {
- result = calculateYearDifference(signaturedate, expiredate)
- } else if project_duration > 0 && project_timeunit != "" {
- if strings.Contains(project_timeunit, "年") {
- if project_duration == 1 {
- res = 12
- } else if project_duration == 2 {
- res = 13
- } else if project_duration == 3 {
- res = 14
- } else if project_duration == 5 {
- res = 15
- }
- return res
- } else if strings.Contains(project_timeunit, "月") {
- result = float64(project_duration) / 12
- } else if strings.Contains(project_timeunit, "周") {
- result = float64(project_duration) * 7 / 365
- } else if strings.Contains(project_timeunit, "日") || strings.Contains(project_timeunit, "天") {
- result = float64(project_duration) / 365
- }
- }
- if result == 0 {
- res = 16
- } else if result < 1 {
- res = 11
- } else if result >= 1 && result < 2 {
- res = 12
- } else if result >= 2 && result < 3 {
- res = 13
- } else if result >= 3 && result < 4 {
- res = 14
- } else if result >= 5 {
- res = 15
- }
- return res
- }
// calculateYearDifference returns the span from startTime to endTime (both
// unix seconds) in years, counting a year as 365 days of 24 hours. The result
// is negative when endTime precedes startTime.
func calculateYearDifference(startTime int64, endTime int64) float64 {
	elapsed := time.Unix(endTime, 0).Sub(time.Unix(startTime, 0))
	return elapsed.Hours() / 24 / 365
}
// getStr maps a buyer class to its buyer type: 政府机构, 医疗单位, 教育单位,
// 金融企业 or 商业公司. It returns 其它 for an empty or unknown class.
//
// A class matches a group when it is a substring of that group's list, so
// partial names such as "审计" still match. Input containing one of the list
// delimiters "(", ")" or "|" can never be a real class name and is rejected
// up front; previously such input (e.g. "|") matched the first group.
func getStr(b string) string {
	const other = "其它"
	if b == "" || strings.ContainsAny(b, "()|") {
		return other
	}
	a1 := "(交通|运输物流|工信|农业|住建|城管|市政|出版广电|检察院|科技|民政|生态环境|市场监管|水利|应急管理|自然资源|财政|档案|党委办|组织|发改|宣传|政府办|政务中心|人大|政协|法院|公安|国资委|海关|机关事务|纪委|军队|人社|商务|审计税务|司法|体育|统计|统战|文旅|民宗|银保监|证监|气象|社会团体|公共资源交易)"
	a2 := "(卫健委|医疗)"
	a3 := "(教育|学校)"
	a4 := "(人行|金融业)"
	a5 := "(信息技术|电信行业|农林牧渔|建筑业|传媒|制造业|住宿餐饮|采矿业|能源化工|批发零售)"
	switch {
	case strings.Contains(a1, b):
		return "政府机构"
	case strings.Contains(a2, b):
		return "医疗单位"
	case strings.Contains(a3, b):
		return "教育单位"
	case strings.Contains(a4, b):
		return "金融企业"
	case strings.Contains(a5, b):
		return "商业公司"
	}
	return other
}
|