main.go 5.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214
  1. package main
  2. import (
  3. "fmt"
  4. "github.com/cron"
  5. "mongodb"
  6. "os"
  7. "qfw/util"
  8. "strings"
  9. "time"
  10. )
  11. var (
  12. Mgo, MgoH *mongodb.MongodbSim
  13. Sysconfig, bidddingConf, biddingHConf map[string]interface{}
  14. noFields string
  15. )
  16. func Init() {
  17. util.ReadConfig(&Sysconfig)
  18. s := Sysconfig
  19. fmt.Println(s)
  20. bidddingConf = Sysconfig["bidding"].(map[string]interface{})
  21. Mgo = &mongodb.MongodbSim{
  22. MongodbAddr: bidddingConf["addr"].(string),
  23. Size: util.IntAllDef(bidddingConf["size"], 5),
  24. DbName: bidddingConf["db"].(string),
  25. UserName: bidddingConf["username"].(string),
  26. Password: bidddingConf["password"].(string),
  27. //Direct: true,
  28. }
  29. Mgo.InitPool()
  30. biddingHConf = Sysconfig["bidding_high"].(map[string]interface{})
  31. //高质量库
  32. MgoH = &mongodb.MongodbSim{
  33. MongodbAddr: biddingHConf["addr"].(string),
  34. Size: util.IntAllDef(biddingHConf["size"], 5),
  35. DbName: biddingHConf["db"].(string),
  36. UserName: biddingHConf["username"].(string),
  37. Password: biddingHConf["password"].(string),
  38. //Direct: true,
  39. }
  40. MgoH.InitPool()
  41. noFields = util.ObjToString(Sysconfig["no_fields"])
  42. }
  43. func main() {
  44. Init()
  45. c := cron.New()
  46. err := c.AddFunc(Sysconfig["spec"].(string), Mark)
  47. if err != nil {
  48. util.Debug("err", err)
  49. }
  50. c.Start()
  51. defer c.Stop()
  52. select {}
  53. }
  54. func Mark() {
  55. go highMark()
  56. }
  57. func highMark() {
  58. defer util.Catch()
  59. sess := Mgo.GetMgoConn()
  60. defer Mgo.DestoryMongoConn(sess)
  61. taskQuery := map[string]interface{}{
  62. "s_stype": "group",
  63. "s_status": "已完成",
  64. "is_return_highdata": map[string]interface{}{
  65. "$exists": 0,
  66. },
  67. }
  68. fields, _ := Mgo.Find("high_fields", nil, `{"sort":1}`, nil, false, -1, -1)
  69. if len(*fields) == 0 {
  70. util.Debug("字段顺序配置为空")
  71. os.Exit(1)
  72. }
  73. tasks, _ := Mgo.Find("f_task", taskQuery, nil, nil, false, -1, -1)
  74. util.Debug("本次处理任务总数:", len(*tasks))
  75. for _, task := range *tasks {
  76. util.Debug("开始处理任务数据:", task["s_groupname"], task["s_entname"])
  77. taskID := mongodb.BsonIdToSId(task["_id"])
  78. //任务对应的数据表
  79. s_sourceinfo := util.ObjToString(task["s_sourceinfo"])
  80. q := map[string]interface{}{
  81. "s_grouptaskid": map[string]interface{}{
  82. "$exists": 1,
  83. },
  84. }
  85. query := sess.DB(bidddingConf["db"].(string)).C(s_sourceinfo).Find(&q).Select(nil).Iter()
  86. count := 0
  87. for tmp := make(map[string]interface{}); query.Next(tmp); count++ {
  88. infoID := mongodb.BsonIdToSId(tmp["_id"])
  89. if count%1000 == 0 {
  90. util.Debug(fmt.Sprintf(" %v deal current --- %d", task["s_entname"], count))
  91. }
  92. //找到标注数据结果
  93. marked, _ := Mgo.FindById("marked", infoID, nil)
  94. markedData := *marked
  95. //计算标注 结果
  96. //标注结果,十进制数字
  97. if markedData["v_taginfo"] == nil {
  98. continue
  99. }
  100. taginfo := markedData["v_taginfo"].(map[string]interface{})
  101. res := calculateFlag(taginfo, *fields) //返回标注的十进制数字
  102. if data, ok := markedData["v_baseinfo"].(map[string]interface{}); ok {
  103. if _, ok := data["id"]; !ok {
  104. continue
  105. }
  106. data["field_bitvalue"] = res
  107. data["i_comeintime"] = time.Now().Unix()
  108. data["i_updatetime"] = time.Now().Unix()
  109. //删除多余无用字段
  110. noField := strings.Split(noFields, ",")
  111. if len(noField) > 0 {
  112. for _, field := range noField {
  113. delete(data, field)
  114. }
  115. }
  116. update := make(map[string]interface{})
  117. update["$set"] = data
  118. where := map[string]interface{}{
  119. "_id": mongodb.StringTOBsonId(util.ObjToString(data["id"])),
  120. }
  121. if !MgoH.Update(util.ObjToString(biddingHConf["coll"]), where, update, true, false) {
  122. util.Debug("任务 ", task["s_groupname"], infoID, "入库错误,请检查")
  123. } else {
  124. //1、更新数据源信息
  125. setResult := map[string]interface{}{ //更新字段集
  126. "is_return_highdata": 1,
  127. "return_highdatetime": time.Now().Unix(),
  128. }
  129. set := map[string]interface{}{
  130. "$set": setResult,
  131. }
  132. Mgo.UpdateById(s_sourceinfo, infoID, set)
  133. }
  134. }
  135. }
  136. util.Debug("任务: ", task["s_entname"], "数据表: ", s_sourceinfo, " 处理总数为: ", count, "分配的数据总量为: ", task["i_givenum"])
  137. if count > 0 {
  138. //当前任务结束
  139. //3.更新任务表,
  140. taskSetResult := map[string]interface{}{ //更新字段集
  141. "is_return_highdata": 1,
  142. }
  143. taskSet := map[string]interface{}{
  144. "$set": taskSetResult,
  145. }
  146. Mgo.UpdateById("f_task", taskID, taskSet)
  147. //4. 记录任务中入高质量库数据
  148. taskInsert := map[string]interface{}{
  149. "task_id": taskID, //任务ID
  150. "high_mark_count": count, // 标注入高质量数据
  151. "given_count": task["i_givenum"], //任务分配数量
  152. "createtime": time.Now().Unix(),
  153. "updatetime": time.Now().Unix(),
  154. }
  155. Mgo.Save("high_result", taskInsert)
  156. } else {
  157. util.Debug(task["s_entname"], "数据表:", s_sourceinfo, "获取的数据总数为:", count, "分配的数据总量为:", task["i_givenum"])
  158. }
  159. util.Debug(task["s_groupname"], "数据处理完毕")
  160. }
  161. util.Debug("所有任务处理完毕")
  162. }
  163. // calculateFlag 根据数据,返回被标注的字段数字
  164. func calculateFlag(marked map[string]interface{}, data []map[string]interface{}) uint64 {
  165. var result uint64
  166. for _, item := range data {
  167. name, ok := item["name"].(string)
  168. if !ok {
  169. continue
  170. }
  171. sort, ok := item["sort"].(int32)
  172. if !ok {
  173. continue
  174. }
  175. // 根据字段名称查找对应的标记值
  176. _, ok = marked[name]
  177. if !ok {
  178. continue
  179. }
  180. // 通过位运算将标记值放置到正确的位置
  181. result |= 1 << (sort - 1)
  182. }
  183. return result
  184. }