qyxy.go 7.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253
  1. package main
  2. import (
  3. "context"
  4. "encoding/json"
  5. "fmt"
  6. "github.com/olivere/elastic/v7"
  7. "github.com/xuri/excelize/v2"
  8. "gorm.io/driver/mysql"
  9. "gorm.io/gorm"
  10. util "jygit.jydev.jianyu360.cn/data_processing/common_utils"
  11. "jygit.jydev.jianyu360.cn/data_processing/common_utils/mongodb"
  12. "log"
  13. "strings"
  14. )
  15. // exportQy 导出企业相关信息,匹配表格中的,企业所在地、企业联系人、职位、联系方式、2023年的中标项目数以及总金额
  16. func exportQy() {
  17. Mgo := &mongodb.MongodbSim{
  18. //MongodbAddr: "172.17.189.140:27080",
  19. MongodbAddr: "127.0.0.1:27083",
  20. Size: 10,
  21. DbName: "mixdata",
  22. UserName: "SJZY_RWbid_ES",
  23. Password: "SJZY@B4i4D5e6S",
  24. Direct: true,
  25. }
  26. Mgo.InitPool()
  27. username := "datascbi"
  28. password := "Da#Bi20221111SC"
  29. host := "127.0.0.1:4001"
  30. //host := "172.17.162.25:4000"
  31. database := "global_common_data"
  32. dsn := fmt.Sprintf("%s:%s@tcp(%s)/%s?charset=utf8mb4&parseTime=True&loc=Local", username, password, host, database)
  33. // 连接到数据库
  34. db, err := gorm.Open(mysql.Open(dsn), &gorm.Config{})
  35. if err != nil {
  36. log.Println("Failed to connect to database:", err)
  37. return
  38. }
  39. f, err := excelize.OpenFile("./2023年数字中国参展商名录.xlsx")
  40. if err != nil {
  41. fmt.Println(err)
  42. return
  43. }
  44. defer func() {
  45. if err := f.Close(); err != nil {
  46. fmt.Println(err)
  47. }
  48. }()
  49. rows, err := f.GetRows("Sheet1")
  50. if err != nil {
  51. fmt.Println(err)
  52. return
  53. }
  54. type BaseInfo struct {
  55. Name string `json:"name"`
  56. NameId string `json:"name_id"`
  57. }
  58. type Contact struct {
  59. ContactName string `json:"contact_name"`
  60. ContactTel string `json:"contact_tel"`
  61. }
  62. //
  63. url2 := "http://127.0.0.1:19905"
  64. username2 := "jybid"
  65. password2 := "Top2023_JEB01i@31"
  66. // 创建 Elasticsearch 客户端
  67. client2, err := elastic.NewClient(
  68. elastic.SetURL(url2),
  69. elastic.SetBasicAuth(username2, password2),
  70. elastic.SetSniff(false),
  71. )
  72. if err != nil {
  73. log.Fatalf("创建 Elasticsearch 客户端失败:%s", err)
  74. }
  75. subtitles := []string{"企业名称", "企业省份", "企业城市", "标讯-联系方式", "凭安-联系方式", "2023中标项目数", "2023中标总金额"}
  76. results := make([][]interface{}, 0)
  77. for i := 1; i < len(rows); i++ {
  78. name := rows[i][0]
  79. //1.标讯抽取的联系方式
  80. contactsMap := make([]string, 0) //联系人信息
  81. baseinfo := BaseInfo{}
  82. log.Println(name)
  83. db.Table("dws_f_ent_baseinfo").Select("name", "name_id").Where("name = ? ", name).Order("publishtime desc").Limit(10).Scan(&baseinfo)
  84. if baseinfo.NameId != "" {
  85. contacts := []Contact{}
  86. db.Table("dws_f_ent_contact").Select("contact_name", "contact_tel").Where("name_id = ? ", baseinfo.NameId).Scan(&contacts)
  87. if len(contacts) > 0 {
  88. for _, v := range contacts {
  89. if strings.Contains(v.ContactTel, ">") {
  90. continue
  91. }
  92. if v.ContactName != "" && v.ContactTel != "" {
  93. s := v.ContactName + "_" + v.ContactTel
  94. if !IsInStringArray(s, contactsMap) {
  95. contactsMap = append(contactsMap, s)
  96. }
  97. } else {
  98. if !IsInStringArray(v.ContactTel, contactsMap) {
  99. contactsMap = append(contactsMap, v.ContactTel)
  100. }
  101. }
  102. }
  103. }
  104. }
  105. //2.凭安联系方式
  106. stds, _ := Mgo.FindOne("qyxy_std", map[string]interface{}{"company_name": name})
  107. var reportsMap = make([]string, 0)
  108. if reports, ok := (*stds)["annual_reports"]; ok {
  109. if rs, ok := reports.([]interface{}); ok {
  110. for _, v := range rs {
  111. if da, ok := v.(map[string]interface{}); ok {
  112. if util.ObjToString(da["operator_name"]) != "" && util.ObjToString(da["company_phone"]) != "" {
  113. tm := util.ObjToString(da["operator_name"]) + "_" + util.ObjToString(da["company_phone"])
  114. if !IsInStringArray(tm, reportsMap) {
  115. reportsMap = append(reportsMap, tm)
  116. }
  117. } else if util.ObjToString(da["company_phone"]) != "" {
  118. if !IsInStringArray(util.ObjToString(da["company_phone"]), reportsMap) {
  119. reportsMap = append(reportsMap, util.ObjToString(da["company_phone"]))
  120. }
  121. }
  122. }
  123. }
  124. }
  125. }
  126. //查询企业中标数据
  127. count, amount := getAmountData(client2, "bidding", name)
  128. results = append(results, []interface{}{name, (*stds)["company_area"], (*stds)["company_city"], strings.Join(contactsMap, ","), strings.Join(reportsMap, ","), count, amount})
  129. }
  130. sheet := "联系方式"
  131. f.NewSheet(sheet)
  132. line := 0
  133. line++
  134. //设置第一行title
  135. _ = f.SetSheetRow(sheet, fmt.Sprintf("%s%d", "A", line), &subtitles)
  136. for k, _ := range results {
  137. line++
  138. err = f.SetSheetRow(sheet, fmt.Sprintf("%s%d", "A", line), &results[k])
  139. if err != nil {
  140. log.Println(err)
  141. }
  142. }
  143. f.Save()
  144. }
  145. // getAmountData 根据企业名称,获取2023年中标数量,以及中标总金额
  146. func getAmountData(client *elastic.Client, index string, companyName string) (int64, float32) {
  147. query := elastic.NewBoolQuery().
  148. Must(elastic.NewTermQuery("s_winner", companyName)).
  149. Must(elastic.NewRangeQuery("publishtime").Gte(1672502400).Lt(1704038400)) //2023-01-01 -- 2024-01-01
  150. //ctx := context.Background()
  151. //
  152. searchResult, err := client.Search().Size(10000).
  153. Index(index).
  154. Query(query).
  155. Do(context.Background())
  156. if err != nil {
  157. log.Fatalf("Error executing search: %s", err)
  158. }
  159. totalAmount := float32(0)
  160. if len(searchResult.Hits.Hits) > 0 {
  161. for _, hit := range searchResult.Hits.Hits {
  162. var doc map[string]interface{}
  163. err := json.Unmarshal(hit.Source, &doc)
  164. if err != nil {
  165. log.Printf("解析文档失败:%s", err)
  166. continue
  167. }
  168. bidamount := float32(util.Float64All(doc["bidamount"]))
  169. totalAmount += bidamount
  170. }
  171. }
  172. return searchResult.TotalHits(), totalAmount
  173. //////////
  174. //开始滚动搜索
  175. //scrollID := ""
  176. //scroll := "10m"
  177. //searchSource := elastic.NewSearchSource().
  178. // Query(query).
  179. // Size(10000).
  180. // Sort("_doc", true) //升序排序
  181. ////Sort("_doc", false) //降序排序
  182. //
  183. //searchService := client.Scroll(index).
  184. // Size(10000).
  185. // Scroll(scroll).
  186. // SearchSource(searchSource)
  187. //
  188. //res, err := searchService.Do(ctx)
  189. //if err != nil {
  190. // if err == io.EOF {
  191. // fmt.Println("没有数据")
  192. // } else {
  193. // panic(err)
  194. // }
  195. //
  196. //}
  197. ////defer client.ClearScroll().ScrollId(scrollID).Do(ctx) // 在退出时清理资源
  198. //fmt.Println(companyName, "总数是:", res.TotalHits())
  199. //total := 0
  200. //totalAmount = float32(0)
  201. //for len(res.Hits.Hits) > 0 {
  202. // for _, hit := range res.Hits.Hits {
  203. // var doc map[string]interface{}
  204. // err := json.Unmarshal(hit.Source, &doc)
  205. // if err != nil {
  206. // log.Printf("解析文档失败:%s", err)
  207. // continue
  208. // }
  209. //
  210. // bidamount := float32(util.Float64All(doc["bidamount"]))
  211. // totalAmount += bidamount
  212. // }
  213. //
  214. // total = total + len(res.Hits.Hits)
  215. // scrollID = res.ScrollId
  216. // res, err = client.Scroll().ScrollId(scrollID).Scroll(scroll).Do(ctx)
  217. // log.Println("current count:", total)
  218. // if err != nil {
  219. // if err == io.EOF {
  220. // // 滚动到最后一批数据,退出循环
  221. // break
  222. // }
  223. // log.Println("滚动搜索失败:", err, res)
  224. // break // 处理错误时退出循环
  225. // }
  226. //}
  227. //// 在循环外调用 ClearScroll
  228. //_, err = client.ClearScroll().ScrollId(scrollID).Do(ctx)
  229. //if err != nil {
  230. // log.Printf("清理滚动搜索失败:%s", err)
  231. //}
  232. //
  233. //fmt.Println(companyName, "结束~~~~~~~~~~~~~~~")
  234. //
  235. //return res.TotalHits(), totalAmount
  236. }