main.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373
  1. package main
  2. import (
  3. "encoding/json"
  4. "fmt"
  5. "github.com/garyburd/redigo/redis"
  6. "go.mongodb.org/mongo-driver/bson"
  7. "go.mongodb.org/mongo-driver/bson/primitive"
  8. es "gopkg.in/olivere/elastic.v1"
  9. "log"
  10. mu "mfw/util"
  11. "net"
  12. "qfw/common/src/qfw/util/elastic"
  13. "qfw/util"
  14. "regexp"
  15. "strconv"
  16. "sort"
  17. "strings"
  18. "time"
  19. )
  20. var ( // package-level state shared by init, main and task
  21. Config = make(map[string]string) // key/value settings; filled by util.ReadConfig in init
  22. Fields []string // field-name list assigned in init; not read in the visible code
  23. SourceClient, FClient *MongodbSim // MongoDB handles set up in init: SourceClient is queried for bidding documents in task, FClient for the address and company collections
  24. RedisPool redis.Pool // Redis pool built in init; its Dial issues SELECT 1 on every new connection
  25. Addrs = make(map[string]interface{}, 0) // province/city/district rows from the "address" collection, keyed by their "code" value (loaded in init)
  26. udpclient mu.UdpClient // UDP client; assigned and started in main
  27. ElasticClientIndex, ElasticClientType string // not assigned anywhere in the visible code
  28. Reg_xing = regexp.MustCompile(`\*{1,}`) // matches one or more '*'; task uses it to reject person/phone values containing asterisks
  29. Reg_person = regexp.MustCompile("[\u4E00-\u9FA5\\s]+") // matches runs of characters in U+4E00..U+9FA5 and whitespace; not used in the visible code
  30. Reg_tel = regexp.MustCompile(`^[0-9\-\s]*$`) // whole string made only of digits, '-' and whitespace (the empty string also matches)
  31. EsConn *es.Client // Elasticsearch client obtained from elastic.GetEsConn in init
  32. Updport int // parsed from Config["port"] in main
  33. )
  34. /**
  35. 新增
  36. 初始化
  37. */
  38. func init() {
  39. log.SetFlags(log.Ldate | log.Ltime | log.Lshortfile)
  40. util.ReadConfig(&Config)
  41. log.Println(Config)
  42. Fields = []string{"_id", "contact", "partners", "business_scope", "company_address", "capital",
  43. "establish_date", "legal_person", "company_type", "district", "city", "province", "area_code", "credit_no",
  44. "company_name", "history_name", "topscopeclass", "wechat_accounts", "alias", "website", "report_websites"}
  45. var err error
  46. pool_size, _ := strconv.Atoi(Config["pool_size"])
  47. //mongo init
  48. SourceClient = new(MongodbSim)
  49. SourceClient.MongodbAddr = Config["mgoinit"]
  50. SourceClient.Size = pool_size
  51. //mongodbSim.DbName = "qfw"
  52. SourceClient.InitPool()
  53. SourceClientmgoConn := SourceClient.GetMgoConn()
  54. defer SourceClient.DestoryMongoConn(SourceClientmgoConn)
  55. FClient = new(MongodbSim)
  56. FClient.MongodbAddr = Config["mgourl"]
  57. FClient.Size = pool_size
  58. FClient.DbName =Config["mgodb_extract_kf"]
  59. //mongodbSim.DbName = "qfw"
  60. FClient.InitPool()
  61. FClientmgoConn := FClient.GetMgoConn()
  62. defer FClient.DestoryMongoConn(FClientmgoConn)
  63. //加载省市县代码
  64. cursor2 := FClientmgoConn.DB(Config["mgodb_extract_kf"]).C("address").Find(bson.M{}).Select(bson.M{"province": 1, "code": 1, "city": 1, "district": 1}).Iter()
  65. //defer FClient.Connect(cc)
  66. if cursor2 == nil {
  67. log.Fatalln(cursor2)
  68. }
  69. tmp := make(map[string]interface{})
  70. for cursor2.Next(&tmp) {
  71. code := tmp["code"]
  72. if code != nil && strings.TrimSpace(code.(string)) != "" {
  73. Addrs[fmt.Sprint(code)] = tmp
  74. }
  75. }
  76. log.Println(len(Addrs))
  77. //es.NewClient(es.SetURL(addrs...), es.SetMaxRetries(2), es.SetSniff(false))
  78. //es init
  79. elastic.InitElasticSize(Config["elasticsearch"], 50)
  80. EsConn = elastic.GetEsConn()
  81. defer elastic.DestoryEsConn(EsConn)
  82. //redis
  83. RedisPool = redis.Pool{
  84. MaxIdle: 50,
  85. IdleTimeout: 10 * time.Second,
  86. Dial: func() (redis.Conn, error) {
  87. conn, e := redis.Dial("tcp", Config["redis"])
  88. if e != nil {
  89. return conn, e
  90. }
  91. _, err = conn.Do("SELECT", "1")
  92. if err != nil {
  93. return nil, err
  94. }
  95. return conn, nil
  96. }}
  97. c := RedisPool.Get()
  98. if _, err := c.Do("PING"); err != nil {
  99. log.Fatalln("redis err:", err)
  100. }
  101. c.Close()
  102. }
  103. func main() {
  104. //udp
  105. updport := Config["udpport"]
  106. Updport, _ = strconv.Atoi(Config["port"])
  107. udpclient = mu.UdpClient{Local: updport, BufSize: 1024}
  108. udpclient.Listen(processUdpMsg)
  109. log.Println("Udp服务监听", updport)
  110. log.Println("发送端口port:", Updport)
  111. go TimedTask() //定时任务
  112. c := make(chan int, 1)
  113. <-c
  114. }
  115. func processUdpMsg(act byte, data []byte, ra *net.UDPAddr) {
  116. log.Println(act, string(data), ra)
  117. switch act {
  118. case mu.OP_TYPE_DATA: //上个节点的数据
  119. //从表中开始处理生成企业数据
  120. tmp := new(map[string]interface{})
  121. err := json.Unmarshal(data, &tmp)
  122. if err != nil {
  123. log.Println("err:", err)
  124. udpclient.WriteUdp([]byte("err:"+err.Error()), mu.OP_NOOP, ra)
  125. return
  126. } else if tmp != nil {
  127. if key,ok := (*tmp)["key"].(string);ok{
  128. udpclient.WriteUdp([]byte(key), mu.OP_NOOP, ra)
  129. }else {
  130. udpclient.WriteUdp([]byte("udpok"), mu.OP_NOOP, ra)
  131. }
  132. go task(tmp)
  133. }
  134. case mu.OP_NOOP: //下个节点回应
  135. log.Println("发送成功", string(data))
  136. }
  137. }
  138. func task(mapinfo *map[string]interface{}) {
  139. defer util.Catch()
  140. gtid, lteid := util.ObjToString((*mapinfo)["gtid"]), util.ObjToString((*mapinfo)["lteid"])
  141. if gtid == "" || lteid == "" {
  142. log.Println(gtid, lteid, "参数错误")
  143. return
  144. }
  145. GId, err := primitive.ObjectIDFromHex(gtid)
  146. LtId, err2 := primitive.ObjectIDFromHex(lteid)
  147. if err != nil || err2 != nil {
  148. log.Println(gtid, lteid, "转换_id错误")
  149. return
  150. }
  151. //udp的id区间查询bidding 中标人 中标联系人 中标联系电话
  152. // topscopeclass项目类型-industry行业类型&&topscopeclass联系人项目类型
  153. // (area地区-province省份 city城市-city城市 district区县-district区县)
  154. // winneraddr-company_address企业地址
  155. SourceClientcc := SourceClient.GetMgoConn()
  156. defer SourceClient.DestoryMongoConn(SourceClientcc)
  157. cursor := SourceClientcc.DB(Config["mgodb_bidding"]).C(Config["mgodb_mgoinit_c"]).Find(bson.M{
  158. "_id": bson.M{
  159. "$gte": GId,
  160. "$lte": LtId,
  161. },
  162. }).Select(bson.M{"winner": 1, "winnertel": 1, "winnerperson": 1,
  163. "topscopeclass": 1, "winneraddr": 1}).Iter()
  164. if cursor == nil {
  165. log.Println(cursor)
  166. return
  167. }
  168. overid := gtid
  169. tmp := map[string]interface{}{}
  170. for cursor.Next(&tmp) {
  171. overid = tmp["_id"].(primitive.ObjectID).Hex()
  172. log.Println(tmp["_id"])
  173. if tmp["winner"] == nil || tmp["winner"] == "" {
  174. continue
  175. }
  176. //redis查询是否存在
  177. rdb := RedisPool.Get()
  178. if reply, err := redis.String(rdb.Do("GET", tmp["winner"])); err != nil {
  179. //redis不存在存到临时表,定时任务处理
  180. FClient.DbName = Config["mgodb_extract_kf"]
  181. if tmpid := FClient.Save("winner_new", tmp) ;tmpid==nil{
  182. log.Println("FClient.Save err",tmpid)
  183. }
  184. //log.Println("get redis id err:定时任务处理", err, tmp)
  185. if err := rdb.Close(); err != nil {
  186. log.Println(err)
  187. }
  188. continue
  189. } else {
  190. //log.Println("redis get :", reply)
  191. //redis存在
  192. //log.Println(reply)
  193. //reply = "5e0316b998a9abaf6535df3d"
  194. //id, err := primitive.ObjectIDFromHex(reply)
  195. //if err != nil {
  196. // log.Println("get redis id Hex err:", err, tmp)
  197. // if err := rdb.Close(); err != nil {
  198. // log.Println(err)
  199. // }
  200. // continue
  201. //}
  202. if err := rdb.Close(); err != nil {
  203. log.Println(err)
  204. }
  205. //拿到合并后的qyk
  206. FClient.DbName = Config["mgodb_extract_kf"]
  207. oldTmp := FClient.FindById(Config["mgo_qyk_c"], reply)
  208. if oldTmp == nil{
  209. log.Println("redis id 不存在")
  210. continue
  211. }
  212. //err = FClient.Database(Config["mgodb_extract_kf"]).Collection(Config["mgo_qyk_c"]).
  213. // FindOne(context.TODO(), bson.M{"_id": id}).Decode(&oldTmp)
  214. //if err != nil {
  215. // log.Println("qyk id err:", err, id)
  216. // continue
  217. //}
  218. //比较合并
  219. //行业类型
  220. tmpTopscopeclass := []string{}
  221. tmpTopscopeclassMap := make(map[string]bool)
  222. if oldTmp["industry"] == nil {
  223. //log.Println(reflect.ValueOf(tmp["topscopeclass"]))
  224. if v, ok := tmp["topscopeclass"].(primitive.A); ok {
  225. for _, vv := range v {
  226. if vvv, ok := vv.(string); ok && len(vvv) > 1 {
  227. tmpTopscopeclassMap[vvv[:len(vvv)-1]] = true
  228. }
  229. }
  230. for k := range tmpTopscopeclassMap {
  231. tmpTopscopeclass = append(tmpTopscopeclass, k)
  232. }
  233. }
  234. } else {
  235. if v, ok := oldTmp["industry"].(primitive.A); ok {
  236. for _, vv := range v {
  237. if vvv, ok := vv.(string); ok {
  238. tmpTopscopeclassMap[vvv] = true
  239. }
  240. }
  241. }
  242. if v, ok := tmp["topscopeclass"].(primitive.A); ok {
  243. for _, vv := range v {
  244. if vvv, ok := vv.(string); ok && len(vvv) > 1 {
  245. tmpTopscopeclassMap[vvv[:len(vvv)-1]] = true
  246. }
  247. }
  248. for k := range tmpTopscopeclassMap {
  249. tmpTopscopeclass = append(tmpTopscopeclass, k)
  250. }
  251. }
  252. }
  253. sort.Strings(tmpTopscopeclass)
  254. oldTmp["industry"] = tmpTopscopeclass
  255. esId := oldTmp["_id"].(primitive.ObjectID).Hex()
  256. //更新行业类型
  257. if tmp["winnerperson"] == nil || tmp["winnerperson"] == "" || Reg_xing.MatchString(util.ObjToString(tmp["winnerperson"])) {
  258. oldTmp["updatatime"] = time.Now().Unix()
  259. //mongo更新
  260. FClient.DbName =Config["mgodb_extract_kf"]
  261. if !FClient.UpdateById(Config["mgo_qyk_c"],esId,bson.M{"$set": oldTmp}){
  262. log.Println("mongo更新err",esId)
  263. }
  264. //if _, err := FClient.Database(Config["mgodb_extract_kf"]).Collection(Config["mgo_qyk_c"]).
  265. // UpdateOne(context.TODO(), bson.M{"_id": oldTmp["_id"]}, bson.M{"$set": oldTmp}); err != nil {
  266. // log.Println("mongo更新err:", err)
  267. //}
  268. //es更新
  269. delete(oldTmp, "_id")
  270. //esConn := elastic.GetEsConn()
  271. //defer elastic.DestoryEsConn(esConn)
  272. if _, err := EsConn.Update().Index(Config["elasticsearch_index"]).Type(Config["elasticsearch_type"]).Id(esId).Doc(oldTmp).Refresh(true).Do(); err != nil {
  273. log.Println("update es err:", err)
  274. }
  275. //log.Println( err2,err3)
  276. continue
  277. }
  278. //联系方式合并
  279. var tmpperson, winnertel string
  280. tmpperson = tmp["winnerperson"].(string)
  281. if tmp["winnertel"] == nil || tmp["winnertel"] == "" {
  282. winnertel = ""
  283. } else {
  284. if Reg_xing.MatchString(util.ObjToString(tmp["winnertel"])) || !Reg_tel.MatchString(util.ObjToString(tmp["winnertel"])) {
  285. winnertel = ""
  286. } else {
  287. winnertel = util.ObjToString(tmp["winnertel"])
  288. }
  289. }
  290. contactMaps := make([]interface{}, 0)
  291. if oldTmp["contact"] == nil {
  292. tmpContact := make(map[string]interface{})
  293. tmpContact["contact_person"] = tmpperson
  294. tmpContact["contact_type"] = "项目联系人"
  295. tmpContact["phone"] = winnertel
  296. tmpContact["topscopeclass"] = strings.Join(tmpTopscopeclass, ";")
  297. tmpContact["updatetime"] = time.Now().Unix()
  298. contactMaps = append(contactMaps, tmpContact)
  299. } else {
  300. //对比前四项,相等丢弃
  301. if v, ok := oldTmp["contact"].(primitive.A); ok {
  302. var isNotUpdate bool
  303. for _, vv := range v {
  304. if vvv, ok := vv.(map[string]interface{}); ok {
  305. if vvv["contact_person"] == tmpperson && vvv["contact_type"] == "项目联系人" &&
  306. vvv["phone"] == winnertel && vvv["topscopeclass"] == strings.Join(tmpTopscopeclass, ";") {
  307. isNotUpdate = true
  308. vvv["updatetime"] = time.Now().Unix()
  309. }
  310. contactMaps = append(contactMaps, vvv)
  311. }
  312. }
  313. if !isNotUpdate {
  314. vvv := make(map[string]interface{})
  315. vvv["contact_person"] = tmp["winnerperson"]
  316. vvv["contact_type"] = "项目联系人"
  317. vvv["phone"] = winnertel
  318. vvv["topscopeclass"] = strings.Join(tmpTopscopeclass, ";")
  319. vvv["updatetime"] = time.Now().Unix()
  320. contactMaps = append(contactMaps, vvv)
  321. }
  322. }
  323. }
  324. oldTmp["contact"] = contactMaps
  325. //mongo更新
  326. oldTmp["updatatime"] = time.Now().Unix()
  327. FClient.DbName=Config["mgodb_extract_kf"]
  328. if !FClient.UpdateById(Config["mgo_qyk_c"],esId,bson.M{"$set": oldTmp}){
  329. log.Println("mongo更新 err",esId,oldTmp)
  330. }
  331. //if _, err := FClient.Database(Config["mgodb_extract_kf"]).Collection(Config["mgo_qyk_c"]).
  332. // UpdateOne(context.TODO(), bson.M{"_id": oldTmp["_id"]}, bson.M{"$set": oldTmp}); err != nil {
  333. // log.Println("mongo更新 err :", err)
  334. //}
  335. //es更新
  336. delete(oldTmp, "_id")
  337. //esConn := elastic.GetEsConn()
  338. //defer elastic.DestoryEsConn(esConn)
  339. if _, err := EsConn.Update().Index(Config["elasticsearch_index"]).Type(Config["elasticsearch_type"]).Id(esId).Doc(oldTmp).Refresh(true).Do(); err != nil {
  340. log.Println("EsConn err :", err)
  341. }
  342. //log.Println( err2,err3)
  343. }
  344. }
  345. //defer cursor.Close(context.Background())
  346. //log.Println("合并执行完成", gtid, lteid, overid)
  347. //if overid != lteid {
  348. // by, _ := json.Marshal(map[string]interface{}{
  349. // "gtid": overid,
  350. // "lteid": lteid,
  351. // "stype": "",
  352. // })
  353. // if e := udpclient.WriteUdp(by, mu.OP_TYPE_DATA, &net.UDPAddr{
  354. // IP: net.ParseIP("127.0.0.1"),
  355. // Port: Updport,
  356. // }); e != nil {
  357. // log.Println(e)
  358. // }
  359. // log.Println("重新发送udp:", string(by))
  360. // return
  361. //}
  362. log.Println("合并执行完成 ok", gtid, lteid, overid)
  363. }