main.go 34 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250
  1. package main
  2. import (
  3. "context"
  4. "encoding/json"
  5. "fmt"
  6. "github.com/olivere/elastic/v7"
  7. "gorm.io/driver/mysql"
  8. "gorm.io/gorm"
  9. "io"
  10. util "jygit.jydev.jianyu360.cn/data_processing/common_utils"
  11. "jygit.jydev.jianyu360.cn/data_processing/common_utils/mongodb"
  12. "log"
  13. "strings"
  14. "sync"
  15. "unicode/utf8"
  16. )
  17. var (
  18. MgoB *mongodb.MongodbSim
  19. )
  20. func InitMgo() {
  21. MgoB = &mongodb.MongodbSim{
  22. //MongodbAddr: "172.31.31.202:27081,172.20.45.128:27080",
  23. MongodbAddr: "127.0.0.1:27083",
  24. Size: 10,
  25. DbName: "qfw",
  26. UserName: "SJZY_RWbid_ES",
  27. Password: "SJZY@B4i4D5e6S",
  28. Direct: true,
  29. }
  30. MgoB.InitPool()
  31. }
  32. func main() {
  33. getBiddingDiff()
  34. return
  35. InitMgo()
  36. getBidding2()
  37. //InitMgo()
  38. //getCountProjectWinner3()
  39. //CountProjectWinner()
  40. //getBiddingLimitData()
  41. //getQyxyNationToFiles()
  42. //exportQyxy() //导出企业数据
  43. //dealXlsx()
  44. //getQyxyNation() //导出 国标行业分类,注册资金靠前的企业
  45. //getQyxyNation()
  46. //InitMgo()
  47. //getDataFromFile()
  48. //updateXlsxDa()
  49. return
  50. /**
  51. getProjectData click 是一起使用的,统计获取中标企业信息
  52. */
  53. //getProjectDataFromEs() //1.拉取项目中标成交数据
  54. //click() //2.处理项目数据,写入clickhouse
  55. //click2()
  56. //dealData()
  57. //getProject()
  58. //getQyLimitData()
  59. //getBiddingData()
  60. //getQyxytData()
  61. //getTidb()
  62. //getEntInfo() //法人库数据
  63. //getBuyerData()
  64. //mgoBidding()
  65. //log.Println("开启第二轮")
  66. //mgoBidding()
  67. //updateMgoEntInfoBuyer()
  68. //getZhiMa()
  69. //log.Println("over ------------------ over")
  70. //fixProjectPortrait()
  71. //
  72. //ClickhouseData() //gorm 操作Clickhouse;gorm 对Clickhouse的bitmap兼容性不行,放弃
  73. //dealClickhouse() //clickhouse-go 操作
  74. //testUpdateBitmap() //测试环境测试更新Clickhouse bitmap字段
  75. ///-------//
  76. //updateHrefByEs()
  77. //getGD() // 获取广东企业数据
  78. //
  79. //getBidding2()
  80. //--------------//
  81. //dealYJG() // 处理姚静歌需求,处理项目数据到Clickhouse
  82. log.Println("over ------------------ over")
  83. }
  84. // dealYJG 处理姚静歌 、韩鸿飞 之前的需要,处理企业数据到Clickhouse
  85. func dealYJG() {
  86. getProjectDataFromEs()
  87. }
  88. // getBiddingData 获取标讯数据
  89. func getBiddingData() {
  90. url := "http://172.17.4.184:19908"
  91. //url := "http://127.0.0.1:19908"
  92. username := "jybid"
  93. password := "Top2023_JEB01i@31"
  94. index := "bidding" //索引名称
  95. //index := "projectset" //索引名称
  96. // 创建 Elasticsearch 客户端
  97. client, err := elastic.NewClient(
  98. elastic.SetURL(url),
  99. elastic.SetBasicAuth(username, password),
  100. elastic.SetSniff(false),
  101. )
  102. if err != nil {
  103. log.Fatalf("创建 Elasticsearch 客户端失败:%s", err)
  104. }
  105. //85 抽取库
  106. //Mgo := &mongodb.MongodbSim{
  107. // //MongodbAddr: "127.0.0.1:27080",
  108. // MongodbAddr: "172.17.4.85:27080",
  109. // DbName: "top",
  110. // Size: 10,
  111. // //Direct: true,
  112. //}
  113. //Mgo.InitPool()
  114. MgoB := &mongodb.MongodbSim{
  115. //MongodbAddr: "172.31.31.202:27081,172.20.45.128:27080",
  116. MongodbAddr: "127.0.0.1:27083",
  117. Size: 10,
  118. DbName: "qfw",
  119. UserName: "SJZY_RWbid_ES",
  120. Password: "SJZY@B4i4D5e6S",
  121. //Direct: true,
  122. }
  123. MgoB.InitPool()
  124. //2023年01-01 2023-10-01,,1-3季度
  125. //2024-1 - 2024-4;1704038400-1711900800
  126. //2023-10-1 2024-1-1;1696089600-1704038400
  127. //areaTermsQuery := elastic.NewTermsQuery("area", "江苏", "安徽", "上海", "天津", "河北", "浙江", "天津市", "上海市", "河北省", "安徽省", "江苏省", "浙江省", "北京", "北京市")
  128. //rangeQuery := elastic.NewRangeQuery("firsttime").Gte(1696089600).Lt(1704038400)
  129. //rangeQuery := elastic.NewRangeQuery("publishtime").Gte("1640966400")
  130. //query := elastic.NewBoolQuery().
  131. // Must(rangeQuery).
  132. // Must(elastic.NewTermsQuery("subtype", "中标", "单一", "成交", "合同"))
  133. //Must(elastic.NewTermQuery("site", "中国招标与采购网")).Must(rangeQuery)
  134. //query := elastic.NewBoolQuery().
  135. // //北京,天津,河北,上海,江苏,浙江,安徽
  136. // //Must(elastic.NewTermQuery("area", "北京市")).sassss
  137. // Must(elastic.NewTermsQuery("subtype", "中标", "单一", "成交", "合同")).
  138. // Must(elastic.NewTermsQuery("area", "北京", "上海", "江苏", "浙江", "广东")).
  139. // Must(rangeQuery)
  140. //
  141. rangeQuery := elastic.NewRangeQuery("publishtime").Gte("1640966400")
  142. termsQuery := elastic.NewTermsQuery("subtype", "中标", "单一", "成交", "合同")
  143. // 综合所有条件
  144. query := elastic.NewBoolQuery().
  145. Must(rangeQuery).
  146. Must(termsQuery)
  147. ctx := context.Background()
  148. //开始滚动搜索
  149. scrollID := ""
  150. scroll := "10m"
  151. searchSource := elastic.NewSearchSource().
  152. Query(query).
  153. Size(10000).
  154. Sort("_doc", true) //升序排序
  155. //Sort("_doc", false) //降序排序
  156. searchService := client.Scroll(index).
  157. Size(10000).
  158. Scroll(scroll).
  159. SearchSource(searchSource)
  160. res, err := searchService.Do(ctx)
  161. if err != nil {
  162. if err == io.EOF {
  163. fmt.Println("没有数据")
  164. } else {
  165. panic(err)
  166. }
  167. }
  168. //defer client.ClearScroll().ScrollId(scrollID).Do(ctx) // 在退出时清理资源
  169. fmt.Println("总数是:", res.TotalHits())
  170. total := 0
  171. for len(res.Hits.Hits) > 0 {
  172. for _, hit := range res.Hits.Hits {
  173. var doc map[string]interface{}
  174. err := json.Unmarshal(hit.Source, &doc)
  175. if err != nil {
  176. log.Printf("解析文档失败:%s", err)
  177. continue
  178. }
  179. delete(doc, "filetext")
  180. delete(doc, "detail")
  181. purchasing := util.ObjToString(doc["purchasing"])
  182. if strings.Contains(purchasing, "新华三") || strings.Contains(purchasing, "华三") || strings.Contains(purchasing, "H3C") || strings.Contains(purchasing, "h3c") {
  183. //存入新表
  184. err = MgoB.InsertOrUpdate("qfw", "wcc_bidding_test_250219", doc)
  185. if err != nil {
  186. log.Println("error", doc["id"])
  187. }
  188. }
  189. // 处理查询结果
  190. //area := util.ObjToString(doc["area"])
  191. //areas := []string{"北京", "上海", "广东", "江苏", "浙江"}
  192. //if !IsInStringArray(area, areas) {
  193. // continue
  194. //}
  195. //projectName := util.ObjToString(doc["projectname"])
  196. //if strings.Contains(projectName, "非政府") {
  197. // continue
  198. //}
  199. //buyerclass := util.ObjToString(doc["buyerclass"])
  200. //if buyerclass == "批发零售" || buyerclass == "住宿餐饮" || buyerclass == "信息技术" {
  201. // continue
  202. //}
  203. ////存入新表
  204. //err = Mgo.InsertOrUpdate("qfw", "wcc_bank_poc", doc)
  205. //if err != nil {
  206. // log.Println("error", doc["id"])
  207. //}
  208. }
  209. total = total + len(res.Hits.Hits)
  210. scrollID = res.ScrollId
  211. res, err = client.Scroll().ScrollId(scrollID).Scroll(scroll).Do(ctx)
  212. log.Println("current count:", total)
  213. if err != nil {
  214. if err == io.EOF {
  215. // 滚动到最后一批数据,退出循环
  216. break
  217. }
  218. log.Println("滚动搜索失败:", err, res)
  219. break // 处理错误时退出循环
  220. }
  221. }
  222. // 在循环外调用 ClearScroll
  223. _, err = client.ClearScroll().ScrollId(scrollID).Do(ctx)
  224. if err != nil {
  225. log.Printf("清理滚动搜索失败:%s", err)
  226. }
  227. fmt.Println("结束~~~~~~~~~~~~~~~")
  228. }
  229. // getProjectDataFromEs 获取项目 中标成交数据
  230. func getProjectDataFromEs() {
  231. //url := "http://172.17.4.184:19908"
  232. url := "http://127.0.0.1:19908"
  233. username := "jybid"
  234. password := "Top2023_JEB01i@31"
  235. index := "projectset" //索引名称
  236. // 创建 Elasticsearch 客户端
  237. client, err := elastic.NewClient(
  238. elastic.SetURL(url),
  239. elastic.SetBasicAuth(username, password),
  240. elastic.SetSniff(false),
  241. )
  242. if err != nil {
  243. log.Fatalf("创建 Elasticsearch 客户端失败:%s", err)
  244. }
  245. //85 抽取库
  246. Mgo := &mongodb.MongodbSim{
  247. MongodbAddr: "127.0.0.1:27080",
  248. //MongodbAddr: "172.17.4.85:27080",
  249. DbName: "top",
  250. Size: 10,
  251. Direct: true,
  252. }
  253. Mgo.InitPool()
  254. //MgoB := &mongodb.MongodbSim{
  255. // MongodbAddr: "172.17.189.140:27080",
  256. // //MongodbAddr: "127.0.0.1:27083",
  257. // Size: 10,
  258. // DbName: "qfw",
  259. // UserName: "SJZY_RWbid_ES",
  260. // Password: "SJZY@B4i4D5e6S",
  261. // //Direct: true,
  262. //}
  263. //MgoB.InitPool()
  264. //2023年01-01 2023-10-01,,1-3季度
  265. //2024-1 - 2024-4;1704038400-1711900800
  266. //2023-10-1 2024-1-1;1696089600-1704038400
  267. //areaTermsQuery := elastic.NewTermsQuery("area", "江苏", "安徽", "上海", "天津", "河北", "浙江", "天津市", "上海市", "河北省", "安徽省", "江苏省", "浙江省", "北京", "北京市")
  268. //rangeQuery := elastic.NewRangeQuery("firsttime").Gte(1711900800).Lt(1719763200) //2024年4-7月
  269. //rangeQuery := elastic.NewRangeQuery("firsttime").Gte(1735660800).Lt(1743436800) //2025年1-3月;25年第一季度数据
  270. rangeQuery := elastic.NewRangeQuery("firsttime").Gte(1743436800).Lt(1751299200) //2025年4.1-7.1 ;25年第二季度数据
  271. query := elastic.NewBoolQuery().
  272. //Must(areaTermsQuery).
  273. Must(elastic.NewTermsQuery("bidstatus", "中标", "单一", "成交", "合同")).
  274. Must(rangeQuery)
  275. //rangeQuery := elastic.NewRangeQuery("comeintime").Gte("1640966400").Lt("1703952000")
  276. //query := elastic.NewBoolQuery().
  277. // //北京,天津,河北,上海,江苏,浙江,安徽
  278. // //Must(elastic.NewTermQuery("area", "北京市")).
  279. // Must(elastic.NewTermsQuery("subtype", "中标", "单一", "成交", "合同")).
  280. // Must(elastic.NewTermsQuery("area", "北京", "上海", "江苏", "浙江", "广东")).
  281. // Must(rangeQuery)
  282. ctx := context.Background()
  283. //开始滚动搜索
  284. scrollID := ""
  285. scroll := "10m"
  286. searchSource := elastic.NewSearchSource().
  287. Query(query).
  288. Size(10000).
  289. Sort("_doc", true) //升序排序
  290. //Sort("_doc", false) //降序排序
  291. searchService := client.Scroll(index).
  292. Size(10000).
  293. Scroll(scroll).
  294. SearchSource(searchSource)
  295. res, err := searchService.Do(ctx)
  296. if err != nil {
  297. if err == io.EOF {
  298. fmt.Println("没有数据")
  299. } else {
  300. panic(err)
  301. }
  302. }
  303. //defer client.ClearScroll().ScrollId(scrollID).Do(ctx) // 在退出时清理资源
  304. fmt.Println("总数是:", res.TotalHits())
  305. total := 0
  306. for len(res.Hits.Hits) > 0 {
  307. for _, hit := range res.Hits.Hits {
  308. var doc map[string]interface{}
  309. err := json.Unmarshal(hit.Source, &doc)
  310. if err != nil {
  311. log.Printf("解析文档失败:%s", err)
  312. continue
  313. }
  314. delete(doc, "filetext")
  315. delete(doc, "detail")
  316. sWinner := util.ObjToString(doc["s_winner"])
  317. winners := strings.Split(sWinner, ",")
  318. for _, v := range winners {
  319. insert := doc
  320. insert["s_winner"] = v
  321. //存入新表
  322. err = Mgo.InsertOrUpdate("top", "wcc_allcity_2025Q2", insert)
  323. if err != nil {
  324. log.Println("error", doc["id"])
  325. }
  326. }
  327. // 处理查询结果
  328. //area := util.ObjToString(doc["area"])
  329. //areas := []string{"北京", "上海", "广东", "江苏", "浙江"}
  330. //if !IsInStringArray(area, areas) {
  331. // continue
  332. //}
  333. //projectName := util.ObjToString(doc["projectname"])
  334. //if strings.Contains(projectName, "非政府") {
  335. // continue
  336. //}
  337. //buyerclass := util.ObjToString(doc["buyerclass"])
  338. //if buyerclass == "批发零售" || buyerclass == "住宿餐饮" || buyerclass == "信息技术" {
  339. // continue
  340. //}
  341. ////存入新表
  342. //err = Mgo.InsertOrUpdate("qfw", "wcc_bank_poc", doc)
  343. //if err != nil {
  344. // log.Println("error", doc["id"])
  345. //}
  346. }
  347. total = total + len(res.Hits.Hits)
  348. scrollID = res.ScrollId
  349. res, err = client.Scroll().ScrollId(scrollID).Scroll(scroll).Do(ctx)
  350. log.Println("current count:", total)
  351. if err != nil {
  352. if err == io.EOF {
  353. // 滚动到最后一批数据,退出循环
  354. break
  355. }
  356. log.Println("滚动搜索失败:", err, res)
  357. break // 处理错误时退出循环
  358. }
  359. }
  360. // 在循环外调用 ClearScroll
  361. _, err = client.ClearScroll().ScrollId(scrollID).Do(ctx)
  362. if err != nil {
  363. log.Printf("清理滚动搜索失败:%s", err)
  364. }
  365. fmt.Println("结束~~~~~~~~~~~~~~~")
  366. }
  367. // getQyxytData 获取企业数据
  368. func getQyxytData() {
  369. //url := "http://172.17.4.184:19908"
  370. url := "http://127.0.0.1:19908"
  371. username := "jybid"
  372. password := "Top2023_JEB01i@31"
  373. index := "qyxy" //索引名称
  374. // 创建 Elasticsearch 客户端
  375. client, err := elastic.NewClient(
  376. elastic.SetURL(url),
  377. elastic.SetBasicAuth(username, password),
  378. elastic.SetSniff(false),
  379. )
  380. if err != nil {
  381. log.Fatalf("创建 Elasticsearch 客户端失败:%s", err)
  382. }
  383. //85 抽取库
  384. //Mgo := &mongodb.MongodbSim{
  385. // //MongodbAddr: "127.0.0.1:27080",
  386. // MongodbAddr: "172.17.4.85:27080",
  387. // DbName: "top",
  388. // Size: 10,
  389. // //Direct: true,
  390. //}
  391. //Mgo.InitPool()
  392. //MgoB := &mongodb.MongodbSim{
  393. // MongodbAddr: "172.17.189.140:27080",
  394. // //MongodbAddr: "127.0.0.1:27083",
  395. // Size: 10,
  396. // DbName: "qfw",
  397. // UserName: "SJZY_RWbid_ES",
  398. // Password: "SJZY@B4i4D5e6S",
  399. // //Direct: true,
  400. //}
  401. //MgoB.InitPool()
  402. //2023年01-01 2023-10-01,,1-3季度
  403. //2024-1 - 2024-4;1704038400-1711900800
  404. //2023-10-1 2024-1-1;1696089600-1704038400
  405. //城市范围
  406. //areaTermsQuery := elastic.NewTermsQuery("company_city", "北京市")
  407. //rangeQuery := elastic.NewRangeQuery("establish_date").Gte(1704038400)
  408. //query := elastic.NewBoolQuery().
  409. // Must(areaTermsQuery).
  410. // Must(rangeQuery)
  411. //---------------------------//
  412. query := elastic.NewBoolQuery()
  413. query.Must(elastic.NewMatchQuery("business_scope", "招投标代理"))
  414. query.Must(elastic.NewTermQuery("company_city", "北京市"))
  415. //rangeQuery := elastic.NewRangeQuery("comeintime").Gte("1640966400").Lt("1703952000")
  416. //query := elastic.NewBoolQuery().
  417. // //北京,天津,河北,上海,江苏,浙江,安徽
  418. // //Must(elastic.NewTermQuery("area", "北京市")).
  419. // Must(elastic.NewTermsQuery("subtype", "中标", "单一", "成交", "合同")).
  420. // Must(elastic.NewTermsQuery("area", "北京", "上海", "江苏", "浙江", "广东")).
  421. // Must(rangeQuery)
  422. ctx := context.Background()
  423. //开始滚动搜索
  424. scrollID := ""
  425. scroll := "10m"
  426. searchSource := elastic.NewSearchSource().
  427. Query(query).
  428. Size(10000).
  429. Sort("_doc", true) //升序排序
  430. //Sort("_doc", false) //降序排序
  431. searchService := client.Scroll(index).
  432. Size(10000).
  433. Scroll(scroll).
  434. SearchSource(searchSource)
  435. res, err := searchService.Do(ctx)
  436. if err != nil {
  437. if err == io.EOF {
  438. fmt.Println("没有数据")
  439. } else {
  440. panic(err)
  441. }
  442. }
  443. //defer client.ClearScroll().ScrollId(scrollID).Do(ctx) // 在退出时清理资源
  444. fmt.Println("总数是:", res.TotalHits())
  445. total := 0
  446. for len(res.Hits.Hits) > 0 {
  447. for _, hit := range res.Hits.Hits {
  448. var doc map[string]interface{}
  449. err := json.Unmarshal(hit.Source, &doc)
  450. if err != nil {
  451. log.Printf("解析文档失败:%s", err)
  452. continue
  453. }
  454. if strings.Contains(util.ObjToString(doc["business_scope"]), "招投标代理") {
  455. //存入新表
  456. insert := map[string]interface{}{
  457. "company_name": doc["company_name"],
  458. "business_scope": doc["business_scope"],
  459. "employee_name": doc["employee_name"],
  460. "company_phone": doc["company_phone"],
  461. }
  462. err = MgoB.InsertOrUpdate("qfw", "wcc_2024_beijing_dailijigou", insert)
  463. if err != nil {
  464. log.Println("error", doc["id"])
  465. }
  466. }
  467. //sWinner := util.ObjToString(doc["s_winner"])
  468. //winners := strings.Split(sWinner, ",")
  469. //for _, v := range winners {
  470. // insert := doc
  471. // insert["s_winner"] = v
  472. // //存入新表
  473. // err = MgoB.InsertOrUpdate("qfw", "wcc_2024_pingdingshan", insert)
  474. // if err != nil {
  475. // log.Println("error", doc["id"])
  476. // }
  477. //}
  478. // 处理查询结果
  479. //area := util.ObjToString(doc["area"])
  480. //areas := []string{"北京", "上海", "广东", "江苏", "浙江"}
  481. //if !IsInStringArray(area, areas) {
  482. // continue
  483. //}
  484. //projectName := util.ObjToString(doc["projectname"])
  485. //if strings.Contains(projectName, "非政府") {
  486. // continue
  487. //}
  488. //buyerclass := util.ObjToString(doc["buyerclass"])
  489. //if buyerclass == "批发零售" || buyerclass == "住宿餐饮" || buyerclass == "信息技术" {
  490. // continue
  491. //}
  492. ////存入新表
  493. //err = Mgo.InsertOrUpdate("qfw", "wcc_bank_poc", doc)
  494. //if err != nil {
  495. // log.Println("error", doc["id"])
  496. //}
  497. }
  498. total = total + len(res.Hits.Hits)
  499. scrollID = res.ScrollId
  500. res, err = client.Scroll().ScrollId(scrollID).Scroll(scroll).Do(ctx)
  501. log.Println("current count:", total)
  502. if err != nil {
  503. if err == io.EOF {
  504. // 滚动到最后一批数据,退出循环
  505. break
  506. }
  507. log.Println("滚动搜索失败:", err, res)
  508. break // 处理错误时退出循环
  509. }
  510. }
  511. // 在循环外调用 ClearScroll
  512. _, err = client.ClearScroll().ScrollId(scrollID).Do(ctx)
  513. if err != nil {
  514. log.Printf("清理滚动搜索失败:%s", err)
  515. }
  516. fmt.Println("结束~~~~~~~~~~~~~~~")
  517. }
  518. // getQyLimitData 获取qyxy 条件数据
  519. func getQyLimitData() {
  520. //url := "http://172.17.4.184:19908"
  521. url := "http://127.0.0.1:19908"
  522. username := "jybid"
  523. password := "Top2023_JEB01i@31"
  524. index := "qyxy" //索引名称
  525. // 创建 Elasticsearch 客户端
  526. client, err := elastic.NewClient(
  527. elastic.SetURL(url),
  528. elastic.SetBasicAuth(username, password),
  529. elastic.SetSniff(false),
  530. )
  531. if err != nil {
  532. log.Fatalf("创建 Elasticsearch 客户端失败:%s", err)
  533. }
  534. // 构建查询
  535. query := elastic.NewBoolQuery().
  536. Must(elastic.NewMatchQuery("company_area", "河南")).
  537. Must(elastic.NewMatchQuery("company_status", "存续")).
  538. MustNot(elastic.NewMatchQuery("company_type", "个体工商户"))
  539. // 执行查询
  540. searchResult, err := client.Search().Size(50).
  541. Index(index).
  542. Query(query).
  543. Do(context.Background())
  544. if err != nil {
  545. log.Fatalf("Error executing search: %s", err)
  546. }
  547. // 本地数据库
  548. MgoB := &mongodb.MongodbSim{
  549. MongodbAddr: "127.0.0.1:27017",
  550. Size: 10,
  551. DbName: "wcc",
  552. }
  553. MgoB.InitPool()
  554. for _, hit := range searchResult.Hits.Hits {
  555. var doc map[string]interface{}
  556. err := json.Unmarshal(hit.Source, &doc)
  557. if err != nil {
  558. log.Printf("解析文档失败:%s", err)
  559. continue
  560. }
  561. MgoB.SaveByOriID("wcc_henan_0428", doc)
  562. }
  563. }
  564. // getTidb 获取tidb 数据
  565. func getTidb() {
  566. MgoB := &mongodb.MongodbSim{
  567. MongodbAddr: "172.17.189.140:27080",
  568. //MongodbAddr: "127.0.0.1:27083",
  569. Size: 10,
  570. DbName: "qfw",
  571. UserName: "SJZY_RWbid_ES",
  572. Password: "SJZY@B4i4D5e6S",
  573. //Direct: true,
  574. }
  575. MgoB.InitPool()
  576. //tidb
  577. username := "datascbi"
  578. password := "Da#Bi20221111SC"
  579. //host := "127.0.0.1:4001"
  580. host := "172.17.162.25:4000"
  581. database := "global_common_data"
  582. dsn := fmt.Sprintf("%s:%s@tcp(%s)/%s?charset=utf8mb4&parseTime=True&loc=Local", username, password, host, database)
  583. // 连接到数据库
  584. db, err := gorm.Open(mysql.Open(dsn), &gorm.Config{})
  585. if err != nil {
  586. log.Println("Failed to connect to database:", err)
  587. return
  588. }
  589. fmt.Println("Connected to the database!")
  590. defer util.Catch()
  591. sess := MgoB.GetMgoConn()
  592. defer MgoB.DestoryMongoConn(sess)
  593. it := sess.DB("qfw").C("wcc_2024_beijing_dailijigou").Find(nil).Select(nil).Iter()
  594. fmt.Println("taskRun 开始")
  595. count := 0
  596. for tmp := make(map[string]interface{}); it.Next(&tmp); count++ {
  597. if count%10000 == 0 {
  598. log.Println("current:", count)
  599. }
  600. companyName := util.ObjToString(tmp["company_name"])
  601. var baseInfo EnterpriseBaseInfo
  602. db.Where(&EnterpriseBaseInfo{Name: companyName}).First(&baseInfo)
  603. if baseInfo.ID > 0 {
  604. insert := map[string]interface{}{
  605. "company_name": companyName,
  606. "name_id": baseInfo.NameID,
  607. "business_scope": tmp["business_scope"],
  608. }
  609. MgoB.InsertOrUpdate("qfw", "wcc_beijing_daili_bidding", insert)
  610. }
  611. }
  612. log.Println("over")
  613. }
  614. // getEntInfo 获取法人库数据
  615. func getEntInfo() {
  616. url := "http://172.17.4.184:19908"
  617. //url := "http://127.0.0.1:19908"
  618. username := "jybid"
  619. password := "Top2023_JEB01i@31"
  620. index := "ent_info" //索引名称
  621. // 创建 Elasticsearch 客户端
  622. client, err := elastic.NewClient(
  623. elastic.SetURL(url),
  624. elastic.SetBasicAuth(username, password),
  625. elastic.SetSniff(false),
  626. )
  627. if err != nil {
  628. log.Fatalf("创建 Elasticsearch 客户端失败:%s", err)
  629. }
  630. query := elastic.NewBoolQuery().
  631. //北京,天津,河北,上海,江苏,浙江,安徽
  632. //Must(elastic.NewMatchQuery("company_name", "医院")).
  633. //Must(elastic.NewTermsQuery("subtype", "中标", "单一", "成交", "合同")).
  634. Must(elastic.NewExistsQuery("tag_labels"))
  635. //Must(rangeQuery)
  636. ctx := context.Background()
  637. //开始滚动搜索
  638. scrollID := ""
  639. scroll := "10m"
  640. searchSource := elastic.NewSearchSource().
  641. Query(query).
  642. Size(10000).
  643. Sort("_doc", true) //升序排序
  644. //Sort("_doc", false) //降序排序
  645. searchService := client.Scroll(index).
  646. Size(10000).
  647. Scroll(scroll).
  648. SearchSource(searchSource)
  649. res, err := searchService.Do(ctx)
  650. if err != nil {
  651. if err == io.EOF {
  652. fmt.Println("没有数据")
  653. } else {
  654. panic(err)
  655. }
  656. }
  657. //defer client.ClearScroll().ScrollId(scrollID).Do(ctx) // 在退出时清理资源
  658. fmt.Println("总数是:", res.TotalHits())
  659. total := 0
  660. for len(res.Hits.Hits) > 0 {
  661. for _, hit := range res.Hits.Hits {
  662. var doc map[string]interface{}
  663. err = json.Unmarshal(hit.Source, &doc)
  664. if err != nil {
  665. log.Printf("解析文档失败:%s", err)
  666. continue
  667. }
  668. name := util.ObjToString(doc["company_name"])
  669. updateData := make(map[string]interface{})
  670. if tag_labels, ok := doc["tag_labels"].([]interface{}); ok {
  671. updateData["main_label"] = tag_labels[0]
  672. _, err = client.Update().
  673. Index(index).
  674. Id(util.ObjToString(doc["id"])).
  675. Doc(updateData).
  676. Do(context.Background())
  677. if err != nil {
  678. log.Println("更新失败", name, tag_labels, err)
  679. }
  680. }
  681. }
  682. total = total + len(res.Hits.Hits)
  683. scrollID = res.ScrollId
  684. res, err = client.Scroll().ScrollId(scrollID).Scroll(scroll).Do(ctx)
  685. log.Println("current count:", total)
  686. if err != nil {
  687. if err == io.EOF {
  688. // 滚动到最后一批数据,退出循环
  689. break
  690. }
  691. log.Println("滚动搜索失败:", err, res)
  692. break // 处理错误时退出循环
  693. }
  694. }
  695. // 在循环外调用 ClearScroll
  696. _, err = client.ClearScroll().ScrollId(scrollID).Do(ctx)
  697. if err != nil {
  698. log.Printf("清理滚动搜索失败:%s", err)
  699. }
  700. fmt.Println("结束~~~~~~~~~~~~~~~")
  701. }
  702. // getBuyerData 获取采购单位数据
  703. func getBuyerData() {
  704. //key := "4d5206b1b297c1e7b77f9578edcb2cf7.TNU2i8G1oUNdR02i"
  705. //model := "glm-4-air"
  706. url := "http://172.17.4.184:19908"
  707. //url := "http://127.0.0.1:19908"
  708. username := "jybid"
  709. password := "Top2023_JEB01i@31"
  710. index := "buyer" //索引名称
  711. // 创建 Elasticsearch 客户端
  712. client, err := elastic.NewClient(
  713. elastic.SetURL(url),
  714. elastic.SetBasicAuth(username, password),
  715. elastic.SetSniff(false),
  716. )
  717. if err != nil {
  718. log.Fatalf("创建 Elasticsearch 客户端失败:%s", err)
  719. }
  720. MgoB := &mongodb.MongodbSim{
  721. MongodbAddr: "172.17.189.140:27080",
  722. //MongodbAddr: "127.0.0.1:27083",
  723. Size: 10,
  724. DbName: "qfw",
  725. UserName: "SJZY_RWbid_ES",
  726. Password: "SJZY@B4i4D5e6S",
  727. //Direct: true,
  728. }
  729. MgoB.InitPool()
  730. //query := elastic.NewBoolQuery().
  731. // //北京,天津,河北,上海,江苏,浙江,安徽
  732. // Must(elastic.NewMatchQuery("company_name", "医院")).
  733. // //Must(elastic.NewTermsQuery("subtype", "中标", "单一", "成交", "合同")).
  734. // Must(elastic.NewTermsQuery("tag_labels", "学校", "教育"))
  735. //Must(rangeQuery)
  736. ctx := context.Background()
  737. //开始滚动搜索
  738. scrollID := ""
  739. scroll := "10m"
  740. searchSource := elastic.NewSearchSource().
  741. //Query(query).
  742. Size(10000).
  743. Sort("_doc", true) //升序排序
  744. //Sort("_doc", false) //降序排序
  745. searchService := client.Scroll(index).
  746. Size(10000).
  747. Scroll(scroll).
  748. SearchSource(searchSource)
  749. res, err := searchService.Do(ctx)
  750. if err != nil {
  751. if err == io.EOF {
  752. fmt.Println("没有数据")
  753. } else {
  754. panic(err)
  755. }
  756. }
  757. //defer client.ClearScroll().ScrollId(scrollID).Do(ctx) // 在退出时清理资源
  758. fmt.Println("总数是:", res.TotalHits())
  759. total := 0
  760. for len(res.Hits.Hits) > 0 {
  761. for _, hit := range res.Hits.Hits {
  762. var doc map[string]interface{}
  763. err = json.Unmarshal(hit.Source, &doc)
  764. if err != nil {
  765. log.Printf("解析文档失败:%s", err)
  766. continue
  767. }
  768. //name := util.ObjToString(doc["buyer_name"])
  769. //ra := ZpAI(key, model, name)
  770. //if util.ObjToString(ra["label1"]) != "" && !checkString(util.ObjToString(ra["label1"])) {
  771. // doc["national_top"] = ra["label1"]
  772. // doc["main_label"] = ra["label1"]
  773. //}
  774. //if util.ObjToString(ra["label2"]) != "" && !checkString(util.ObjToString(ra["label2"])) {
  775. // doc["national_sub"] = ra["label2"]
  776. //}
  777. //if util.ObjToString(ra["label3"]) != "" && !checkString(util.ObjToString(ra["label3"])) {
  778. // doc["national_subsub"] = ra["label3"]
  779. //}
  780. MgoB.Save("ent_info_buyer", doc)
  781. //time.Sleep(time.Microsecond)
  782. }
  783. total = total + len(res.Hits.Hits)
  784. scrollID = res.ScrollId
  785. res, err = client.Scroll().ScrollId(scrollID).Scroll(scroll).Do(ctx)
  786. log.Println("current count:", total)
  787. if err != nil {
  788. if err == io.EOF {
  789. // 滚动到最后一批数据,退出循环
  790. break
  791. }
  792. log.Println("滚动搜索失败:", err, res)
  793. break // 处理错误时退出循环
  794. }
  795. }
  796. // 在循环外调用 ClearScroll
  797. _, err = client.ClearScroll().ScrollId(scrollID).Do(ctx)
  798. if err != nil {
  799. log.Printf("清理滚动搜索失败:%s", err)
  800. }
  801. fmt.Println("结束~~~~~~~~~~~~~~~")
  802. }
  803. // mgoBidding mgoBidding 数据
  804. func mgoBidding() {
  805. MgoB := &mongodb.MongodbSim{
  806. MongodbAddr: "172.17.189.140:27080",
  807. //MongodbAddr: "127.0.0.1:27083",
  808. Size: 10,
  809. DbName: "qfw",
  810. UserName: "SJZY_RWbid_ES",
  811. Password: "SJZY@B4i4D5e6S",
  812. //Direct: true,
  813. }
  814. MgoB.InitPool()
  815. sess := MgoB.GetMgoConn()
  816. defer MgoB.DestoryMongoConn(sess)
  817. //181 凭安库
  818. MgoQY := &mongodb.MongodbSim{
  819. MongodbAddr: "172.17.4.181:27001",
  820. //MongodbAddr: "127.0.0.1:27001",
  821. DbName: "mixdata",
  822. Size: 10,
  823. UserName: "",
  824. Password: "",
  825. //Direct: true,
  826. }
  827. MgoQY.InitPool()
  828. where := map[string]interface{}{
  829. "qy_flag": 1,
  830. }
  831. query := sess.DB("qfw").C("ent_info_buyer").Find(where).Select(map[string]interface{}{
  832. "contenthtml": 0}).Iter()
  833. count := 0
  834. key := "4d5206b1b297c1e7b77f9578edcb2cf7.TNU2i8G1oUNdR02i"
  835. model := "glm-4-air"
  836. ch := make(chan bool, 10)
  837. wg := &sync.WaitGroup{}
  838. for tmp := make(map[string]interface{}); query.Next(tmp); count++ {
  839. if count%100 == 0 {
  840. log.Println("current:", count, tmp["name"])
  841. }
  842. //存在就不再调用大模型
  843. //if _, ok := tmp["national_top"]; ok {
  844. // continue
  845. //}
  846. if utf8.RuneCountInString(util.ObjToString(tmp["name"])) < 4 {
  847. continue
  848. }
  849. ch <- true
  850. wg.Add(1)
  851. go func(tmp map[string]interface{}) {
  852. defer func() {
  853. <-ch
  854. wg.Done()
  855. }()
  856. //
  857. biddingID := mongodb.BsonIdToSId(tmp["_id"])
  858. update := make(map[string]interface{})
  859. name := util.ObjToString(tmp["name"])
  860. where2 := map[string]interface{}{
  861. "company_name": name,
  862. }
  863. data, _ := MgoQY.FindOne("company_base", where2)
  864. businessScope := util.ObjToString((*data)["business_scope"])
  865. ra := ZpAI1(key, model, name, businessScope)
  866. if util.ObjToString(ra["label1"]) != "" && !checkString(util.ObjToString(ra["label1"])) {
  867. //update["national_top"] = ra["label1"]
  868. //update["main_label"] = ra["label1"]
  869. update["label1"] = ra["label1"]
  870. }
  871. if util.ObjToString(ra["label2"]) != "" && !checkString(util.ObjToString(ra["label2"])) {
  872. //update["national_sub"] = ra["label2"]
  873. update["label2"] = ra["label2"]
  874. }
  875. if util.ObjToString(ra["label3"]) != "" && !checkString(util.ObjToString(ra["label3"])) {
  876. //update["national_subsub"] = ra["label3"]
  877. update["label3"] = ra["label3"]
  878. }
  879. if len(update) > 0 {
  880. MgoB.UpdateById("ent_info_buyer", biddingID, map[string]interface{}{"$set": update})
  881. }
  882. }(tmp)
  883. tmp = map[string]interface{}{}
  884. }
  885. wg.Wait()
  886. log.Println("over 22222222222")
  887. //log.Println("开始第二轮迭代")
  888. //for tmp := make(map[string]interface{}); query.Next(tmp); count++ {
  889. // if _, ok := tmp["national_top"]; ok {
  890. // continue
  891. // }
  892. // biddingID := mongodb.BsonIdToSId(tmp["_id"])
  893. // name := util.ObjToString(tmp["name"])
  894. // update := make(map[string]interface{})
  895. // ra := ZpAI(key, model, name)
  896. // if util.ObjToString(ra["label1"]) != "" && !checkString(util.ObjToString(ra["label1"])) {
  897. // update["national_top"] = ra["label1"]
  898. // update["main_label"] = ra["label1"]
  899. // }
  900. // if util.ObjToString(ra["label2"]) != "" && !checkString(util.ObjToString(ra["label2"])) {
  901. // update["national_sub"] = ra["label2"]
  902. // }
  903. // if util.ObjToString(ra["label3"]) != "" && !checkString(util.ObjToString(ra["label3"])) {
  904. // update["national_subsub"] = ra["label3"]
  905. // }
  906. // if count%1000 == 0 {
  907. // log.Println("current", count, name, ra["label1"], ra["label2"])
  908. // }
  909. //
  910. // if len(update) > 0 {
  911. // MgoB.UpdateById("ent_info_buyer", biddingID, map[string]interface{}{"$set": update})
  912. // }
  913. // //time.Sleep(time.Microsecond)
  914. //}
  915. //
  916. //log.Println("开始第3轮迭代")
  917. //for tmp := make(map[string]interface{}); query.Next(tmp); count++ {
  918. // if _, ok := tmp["national_top"]; ok {
  919. // continue
  920. // }
  921. // biddingID := mongodb.BsonIdToSId(tmp["_id"])
  922. // name := util.ObjToString(tmp["name"])
  923. // update := make(map[string]interface{})
  924. // ra := ZpAI(key, model, name)
  925. // if util.ObjToString(ra["label1"]) != "" && !checkString(util.ObjToString(ra["label1"])) {
  926. // update["national_top"] = ra["label1"]
  927. // update["main_label"] = ra["label1"]
  928. // }
  929. // if util.ObjToString(ra["label2"]) != "" && !checkString(util.ObjToString(ra["label2"])) {
  930. // update["national_sub"] = ra["label2"]
  931. // }
  932. // if util.ObjToString(ra["label3"]) != "" && !checkString(util.ObjToString(ra["label3"])) {
  933. // update["national_subsub"] = ra["label3"]
  934. // }
  935. // if count%1000 == 0 {
  936. // log.Println("current", count, name, ra["label1"], ra["label2"])
  937. // }
  938. //
  939. // if len(update) > 0 {
  940. // MgoB.UpdateById("ent_info_buyer", biddingID, map[string]interface{}{"$set": update})
  941. // }
  942. // //time.Sleep(time.Microsecond)
  943. //}
  944. }
  945. // fixProjectPortrait 修复画像数据重复
  946. func fixProjectPortrait() {
  947. url := "http://172.17.4.184:19908"
  948. //url := "http://127.0.0.1:19908"
  949. username := "jybid"
  950. password := "Top2023_JEB01i@31"
  951. index := "project_portrait" //索引名称
  952. buyerMap := make(map[string]int)
  953. buyerDatas := make(map[string][]map[string]interface{})
  954. // 创建 Elasticsearch 客户端
  955. client, err := elastic.NewClient(
  956. elastic.SetURL(url),
  957. elastic.SetBasicAuth(username, password),
  958. elastic.SetSniff(false),
  959. )
  960. if err != nil {
  961. log.Fatalf("创建 Elasticsearch 客户端失败:%s", err)
  962. }
  963. query := elastic.NewBoolQuery()
  964. //query.Must(elastic.NewMatchQuery("business_scope", "招投标代理"))
  965. query.Must(elastic.NewTermQuery("class", "情报_安防"))
  966. ctx := context.Background()
  967. //开始滚动搜索
  968. scrollID := ""
  969. scroll := "10m"
  970. searchSource := elastic.NewSearchSource().
  971. Query(query).
  972. Size(10000).
  973. //Sort("_doc", true) //升序排序
  974. Sort("_doc", false) //降序排序
  975. searchService := client.Scroll(index).
  976. Size(10000).
  977. Scroll(scroll).
  978. SearchSource(searchSource)
  979. res, err := searchService.Do(ctx)
  980. if err != nil {
  981. if err == io.EOF {
  982. fmt.Println("没有数据")
  983. } else {
  984. panic(err)
  985. }
  986. }
  987. //defer client.ClearScroll().ScrollId(scrollID).Do(ctx) // 在退出时清理资源
  988. fmt.Println("project_portrait 总数是:", res.TotalHits())
  989. MgoB := &mongodb.MongodbSim{
  990. MongodbAddr: "172.17.189.140:27080",
  991. //MongodbAddr: "127.0.0.1:27083",
  992. Size: 10,
  993. DbName: "qfw",
  994. UserName: "SJZY_RWbid_ES",
  995. Password: "SJZY@B4i4D5e6S",
  996. //Direct: true,
  997. }
  998. MgoB.InitPool()
  999. //wher := map[string]interface{}{
  1000. // "_id": mongodb.StringTOBsonId("66faf189bf905908d4a252d6"),
  1001. //}
  1002. //MgoB.Delete("project_portrait", wher)
  1003. //
  1004. //return
  1005. total := 0
  1006. for len(res.Hits.Hits) > 0 {
  1007. for _, hit := range res.Hits.Hits {
  1008. var doc map[string]interface{}
  1009. err := json.Unmarshal(hit.Source, &doc)
  1010. if err != nil {
  1011. log.Printf("解析文档失败:%s", err)
  1012. continue
  1013. }
  1014. buyerName := util.ObjToString(doc["buyer"])
  1015. buyerMap[buyerName]++
  1016. buyerArr := buyerDatas[buyerName]
  1017. buyerArr = append(buyerArr, doc)
  1018. buyerDatas[buyerName] = buyerArr
  1019. }
  1020. total = total + len(res.Hits.Hits)
  1021. scrollID = res.ScrollId
  1022. res, err = client.Scroll().ScrollId(scrollID).Scroll(scroll).Do(ctx)
  1023. log.Println("current count:", total)
  1024. if err != nil {
  1025. if err == io.EOF {
  1026. // 滚动到最后一批数据,退出循环
  1027. break
  1028. }
  1029. log.Println("滚动搜索失败:", err, res)
  1030. break // 处理错误时退出循环
  1031. }
  1032. }
  1033. // 在循环外调用 ClearScroll
  1034. _, err = client.ClearScroll().ScrollId(scrollID).Do(ctx)
  1035. if err != nil {
  1036. log.Printf("清理滚动搜索失败:%s", err)
  1037. }
  1038. fmt.Println("迭代结束~~~~~~~~~~~~~~~")
  1039. su := 0
  1040. for k, v := range buyerMap {
  1041. su++
  1042. if su%1000 == 0 {
  1043. log.Println("su", su)
  1044. }
  1045. if v > 1 {
  1046. buyerName := k
  1047. buyerArr := buyerDatas[buyerName]
  1048. doc := buyerArr[0]
  1049. doc["_id"] = mongodb.StringTOBsonId(util.ObjToString(doc["id"]))
  1050. MgoB.SaveByOriID("project_portrait_1030_test", doc)
  1051. for kk, vv := range buyerArr {
  1052. id := util.ObjToString(vv["id"])
  1053. where := map[string]interface{}{
  1054. "_id": mongodb.StringTOBsonId(util.ObjToString(doc["id"])),
  1055. }
  1056. MgoB.Delete("project_portrait", where)
  1057. if kk > 0 {
  1058. client.Delete().Index(index).Id(id).Do(context.Background())
  1059. }
  1060. }
  1061. }
  1062. }
  1063. }
  1064. // updateMgoEntInfoBuyer updateMgoEntInfoBuyer
  1065. func updateMgoEntInfoBuyer() {
  1066. MgoB := &mongodb.MongodbSim{
  1067. MongodbAddr: "172.17.189.140:27080",
  1068. //MongodbAddr: "127.0.0.1:27083",
  1069. Size: 10,
  1070. DbName: "qfw",
  1071. UserName: "SJZY_RWbid_ES",
  1072. Password: "SJZY@B4i4D5e6S",
  1073. //Direct: true,
  1074. }
  1075. MgoB.InitPool()
  1076. //181 凭安库
  1077. MgoQY := &mongodb.MongodbSim{
  1078. MongodbAddr: "172.17.4.181:27001",
  1079. //MongodbAddr: "127.0.0.1:27001",
  1080. DbName: "mixdata",
  1081. Size: 10,
  1082. UserName: "",
  1083. Password: "",
  1084. //Direct: true,
  1085. }
  1086. MgoQY.InitPool()
  1087. sess := MgoB.GetMgoConn()
  1088. defer MgoB.DestoryMongoConn(sess)
  1089. query := sess.DB("qfw").C("ent_info_buyer").Find(nil).Select(map[string]interface{}{
  1090. "contenthtml": 0}).Iter()
  1091. count := 0
  1092. for tmp := make(map[string]interface{}); query.Next(tmp); count++ {
  1093. if count%1000 == 0 {
  1094. log.Println("current:", count, tmp["name"])
  1095. }
  1096. name := util.ObjToString(tmp["name"])
  1097. where := map[string]interface{}{
  1098. "company_name": name,
  1099. }
  1100. id := mongodb.BsonIdToSId(tmp["_id"])
  1101. data, _ := MgoQY.FindOne("company_base", where)
  1102. if data != nil && len(*data) > 0 {
  1103. update := map[string]interface{}{
  1104. "qy_flag": 1,
  1105. "use_flag": (*data)["use_flag"],
  1106. "company_type": (*data)["company_type"],
  1107. "company_status": (*data)["company_status"],
  1108. "credit_no": (*data)["credit_no"],
  1109. "business_scope": (*data)["business_scope"],
  1110. }
  1111. MgoB.UpdateById("ent_info_buyer", id, map[string]interface{}{"$set": update})
  1112. }
  1113. }
  1114. }