main.go 6.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234
  1. package main
  2. import (
  3. "fmt"
  4. "github.com/cron"
  5. "mongodb"
  6. "os"
  7. "qfw/util"
  8. "strings"
  9. "time"
  10. )
  11. var (
  12. Mgo, MgoH, MgoB *mongodb.MongodbSim
  13. Sysconfig, bidddingConf, biddingHConf map[string]interface{}
  14. noFields string
  15. )
  16. func Init() {
  17. util.ReadConfig(&Sysconfig)
  18. s := Sysconfig
  19. fmt.Println(s)
  20. bidddingConf = Sysconfig["bidding"].(map[string]interface{})
  21. Mgo = &mongodb.MongodbSim{
  22. MongodbAddr: bidddingConf["addr"].(string),
  23. Size: util.IntAllDef(bidddingConf["size"], 5),
  24. DbName: bidddingConf["db"].(string),
  25. UserName: bidddingConf["username"].(string),
  26. Password: bidddingConf["password"].(string),
  27. //Direct: true,
  28. }
  29. Mgo.InitPool()
  30. biddingHConf = Sysconfig["bidding_high"].(map[string]interface{})
  31. //高质量库
  32. MgoH = &mongodb.MongodbSim{
  33. MongodbAddr: biddingHConf["addr"].(string),
  34. Size: util.IntAllDef(biddingHConf["size"], 5),
  35. DbName: biddingHConf["db"].(string),
  36. UserName: biddingHConf["username"].(string),
  37. Password: biddingHConf["password"].(string),
  38. //Direct: true,
  39. }
  40. MgoH.InitPool()
  41. //bidding
  42. MgoB = &mongodb.MongodbSim{
  43. MongodbAddr: biddingHConf["addr"].(string),
  44. Size: util.IntAllDef(biddingHConf["size"], 5),
  45. DbName: "qfw",
  46. UserName: biddingHConf["username"].(string),
  47. Password: biddingHConf["password"].(string),
  48. //Direct: true,
  49. }
  50. MgoB.InitPool()
  51. noFields = util.ObjToString(Sysconfig["no_fields"])
  52. }
  53. func main() {
  54. Init()
  55. c := cron.New()
  56. err := c.AddFunc(Sysconfig["spec"].(string), Mark)
  57. if err != nil {
  58. util.Debug("err", err)
  59. }
  60. c.Start()
  61. defer c.Stop()
  62. select {}
  63. }
  64. func Mark() {
  65. go highMark()
  66. }
  67. func highMark() {
  68. defer util.Catch()
  69. sess := Mgo.GetMgoConn()
  70. defer Mgo.DestoryMongoConn(sess)
  71. taskQuery := map[string]interface{}{
  72. "s_stype": "group",
  73. "s_status": "已完成",
  74. "is_return_highdata": map[string]interface{}{
  75. "$exists": 0,
  76. },
  77. }
  78. fields, _ := Mgo.Find("high_fields", nil, `{"sort":1}`, nil, false, -1, -1)
  79. if len(*fields) == 0 {
  80. util.Debug("字段顺序配置为空")
  81. os.Exit(1)
  82. }
  83. tasks, _ := Mgo.Find("f_task", taskQuery, nil, nil, false, -1, -1)
  84. util.Debug("本次处理任务总数:", len(*tasks))
  85. for _, task := range *tasks {
  86. util.Debug("开始处理任务数据:", task["s_groupname"], task["s_entname"])
  87. taskID := mongodb.BsonIdToSId(task["_id"])
  88. //任务对应的数据表
  89. s_sourceinfo := util.ObjToString(task["s_sourceinfo"])
  90. q := map[string]interface{}{
  91. "s_grouptaskid": map[string]interface{}{
  92. "$exists": 1,
  93. },
  94. }
  95. query := sess.DB(bidddingConf["db"].(string)).C(s_sourceinfo).Find(&q).Select(nil).Iter()
  96. count := 0
  97. for tmp := make(map[string]interface{}); query.Next(tmp); count++ {
  98. infoID := mongodb.BsonIdToSId(tmp["_id"])
  99. if count%1000 == 0 {
  100. util.Debug(fmt.Sprintf(" %v deal current --- %d", task["s_entname"], count))
  101. }
  102. //找到标注数据结果
  103. marked, _ := Mgo.FindById("marked", infoID, nil)
  104. markedData := *marked
  105. //计算标注 结果
  106. //标注结果,十进制数字
  107. if markedData["v_taginfo"] == nil {
  108. continue
  109. }
  110. taginfo := markedData["v_taginfo"].(map[string]interface{})
  111. res := calculateFlag(taginfo, *fields) //返回标注的十进制数字
  112. if data, ok := markedData["v_baseinfo"].(map[string]interface{}); ok {
  113. where := make(map[string]interface{})
  114. if _, ok := data["id"]; ok {
  115. bidd, _ := MgoB.FindById("bidding", util.ObjToString(data["id"]), nil)
  116. if len(*bidd) > 0 {
  117. where["_id"] = mongodb.StringTOBsonId(util.ObjToString(data["id"]))
  118. }
  119. } else {
  120. bidd, _ := MgoB.FindById("bidding", mongodb.BsonIdToSId(markedData["_id"]), nil)
  121. if len(*bidd) > 0 {
  122. where["_id"] = mongodb.StringTOBsonId(util.ObjToString(data["id"]))
  123. } else {
  124. continue
  125. }
  126. }
  127. data["field_bitvalue"] = res
  128. data["i_comeintime"] = time.Now().Unix()
  129. data["i_updatetime"] = time.Now().Unix()
  130. //删除多余无用字段
  131. noField := strings.Split(noFields, ",")
  132. if len(noField) > 0 {
  133. for _, field := range noField {
  134. delete(data, field)
  135. }
  136. }
  137. update := make(map[string]interface{})
  138. update["$set"] = data
  139. if !MgoH.Update(util.ObjToString(biddingHConf["coll"]), where, update, true, false) {
  140. util.Debug("任务 ", task["s_groupname"], infoID, "入库错误,请检查")
  141. } else {
  142. //1、更新数据源信息
  143. setResult := map[string]interface{}{ //更新字段集
  144. "is_return_highdata": 1,
  145. "return_highdatetime": time.Now().Unix(),
  146. }
  147. set := map[string]interface{}{
  148. "$set": setResult,
  149. }
  150. Mgo.UpdateById(s_sourceinfo, infoID, set)
  151. }
  152. }
  153. }
  154. util.Debug("任务: ", task["s_entname"], "数据表: ", s_sourceinfo, " 处理总数为: ", count, "分配的数据总量为: ", task["i_givenum"])
  155. if count > 0 {
  156. //当前任务结束
  157. //3.更新任务表,
  158. taskSetResult := map[string]interface{}{ //更新字段集
  159. "is_return_highdata": 1,
  160. }
  161. taskSet := map[string]interface{}{
  162. "$set": taskSetResult,
  163. }
  164. Mgo.UpdateById("f_task", taskID, taskSet)
  165. //4. 记录任务中入高质量库数据
  166. taskInsert := map[string]interface{}{
  167. "task_id": taskID, //任务ID
  168. "high_mark_count": count, // 标注入高质量数据
  169. "given_count": task["i_givenum"], //任务分配数量
  170. "createtime": time.Now().Unix(),
  171. "updatetime": time.Now().Unix(),
  172. }
  173. Mgo.Save("high_result", taskInsert)
  174. } else {
  175. util.Debug(task["s_entname"], "数据表:", s_sourceinfo, "获取的数据总数为:", count, "分配的数据总量为:", task["i_givenum"])
  176. }
  177. util.Debug(task["s_groupname"], "数据处理完毕")
  178. }
  179. util.Debug("所有任务处理完毕")
  180. }
  181. // calculateFlag 根据数据,返回被标注的字段数字
  182. func calculateFlag(marked map[string]interface{}, data []map[string]interface{}) uint64 {
  183. var result uint64
  184. for _, item := range data {
  185. name, ok := item["name"].(string)
  186. if !ok {
  187. continue
  188. }
  189. sort, ok := item["sort"].(int32)
  190. if !ok {
  191. continue
  192. }
  193. // 根据字段名称查找对应的标记值
  194. _, ok = marked[name]
  195. if !ok {
  196. continue
  197. }
  198. // 通过位运算将标记值放置到正确的位置
  199. result |= 1 << (sort - 1)
  200. }
  201. return result
  202. }