es.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491
  1. package main
  2. import (
  3. "bytes"
  4. "context"
  5. "encoding/base64"
  6. "errors"
  7. "fmt"
  8. "github.com/olivere/elastic/v7"
  9. "go.uber.org/zap"
  10. "net/http"
  11. "strconv"
  12. "jygit.jydev.jianyu360.cn/data_processing/common_utils/log"
  13. "time"
  14. )
// mapping is the "mappings" fragment of the index-creation request body.
// It is not a complete JSON document on its own: createIndex joins it with a
// "settings" fragment as `{<settings>,<mappings>}` before sending it.
// Dynamic mapping is disabled ("dynamic": false), so only the fields listed
// here are mapped. The analyzers referenced below (my_ngram_title, my_ngram,
// douhao) are the ones declared in the settings fragment built by createIndex.
var mapping = ` "mappings": {
"dynamic": false,
"properties": {
"dataweight": {
"type": "long"
},
"projectcode": {
"type": "keyword"
},
"object_type": {
"type": "keyword"
},
"bidopentime": {
"type": "long"
},
"bidamount": {
"type": "double"
},
"winner": {
"type": "keyword"
},
"buyer": {
"type": "keyword",
"fields": {
"mbuyer": {
"analyzer": "my_ngram_title",
"type": "text"
}
}
},
"budget": {
"type": "double"
},
"projectname": {
"type": "keyword",
"fields": {
"pname": {
"analyzer": "my_ngram_title",
"type": "text"
}
}
},
"area": {
"type": "keyword"
},
"city": {
"type": "keyword"
},
"district": {
"type": "keyword"
},
"s_winner": {
"analyzer": "douhao",
"type": "text",
"fields": {
"mwinner": {
"analyzer": "my_ngram_title",
"type": "text"
}
}
},
"pici": {
"type": "long"
},
"id": {
"type": "keyword"
},
"title": {
"analyzer": "my_ngram_title",
"type": "text",
"fields": {
"mtitle": {
"type": "keyword"
}
}
},
"detail": {
"analyzer": "my_ngram",
"type": "text"
},
"site": {
"type": "keyword"
},
"comeintime": {
"type": "long"
},
"href": {
"type": "keyword"
},
"infoformat": {
"type": "long"
},
"publishtime": {
"type": "long"
},
"toptype": {
"type": "keyword"
},
"subtype": {
"type": "keyword"
},
"createtime": {
"type": "long"
}
}
}`
  121. //createIndex 创建索引
  122. func createIndex(clients map[string]*elastic.Client, PreBiddingIndex string) error {
  123. //createJson := fmt.Sprintf(`{%s,%s}`, setting, mapping)
  124. for k, client := range clients {
  125. url := GF.ES[k].URL
  126. username := GF.ES[k].Username
  127. password := GF.ES[k].Password
  128. exist, err := client.IndexExists(PreBiddingIndex).Do(context.Background())
  129. if exist {
  130. log.Info("CreateIndex", zap.String(PreBiddingIndex, "已经存在了"))
  131. }
  132. setting := fmt.Sprintf(` "settings": {
  133. "index": {
  134. "analysis": {
  135. "analyzer": {
  136. "my_ngram_title": {
  137. "filter": [
  138. "lowercase"
  139. ],
  140. "tokenizer": "my_ngram_title"
  141. },
  142. "douhao": {
  143. "type": "pattern",
  144. "pattern": ","
  145. },
  146. "my_ngram": {
  147. "filter": [
  148. "lowercase"
  149. ],
  150. "tokenizer": "my_ngram"
  151. }
  152. },
  153. "tokenizer": {
  154. "my_ngram_title": {
  155. "token_chars": [
  156. "letter",
  157. "digit",
  158. "punctuation",
  159. "symbol"
  160. ],
  161. "min_gram": "1",
  162. "type": "nGram",
  163. "max_gram": "1"
  164. },
  165. "my_ngram": {
  166. "token_chars": [
  167. "letter",
  168. "digit",
  169. "punctuation",
  170. "symbol"
  171. ],
  172. "min_gram": "2",
  173. "type": "nGram",
  174. "max_gram": "2"
  175. }
  176. }
  177. },
  178. "number_of_shards": "%s",
  179. "number_of_replicas": "0",
  180. "max_result_window": "20000"
  181. }
  182. }`, GF.ES[k].Shares)
  183. createJson := fmt.Sprintf(`{%s,%s}`, setting, mapping)
  184. //1. 开启节点平衡
  185. // 设置临时的节点平衡设置
  186. balanceSettings := `{
  187. "transient" : {
  188. "cluster.routing.allocation.enable" : "all"
  189. }
  190. }`
  191. requestURL := fmt.Sprintf("%s/_cluster/settings", url)
  192. req, err := http.NewRequest("PUT", requestURL, bytes.NewBuffer([]byte(balanceSettings)))
  193. if err != nil {
  194. log.Error("开启节点平衡", zap.Error(err))
  195. }
  196. req.Header.Set("Content-Type", "application/json")
  197. // 添加身份验证头部
  198. auth := username + ":" + password
  199. basicAuth := "Basic " + base64.StdEncoding.EncodeToString([]byte(auth))
  200. req.Header.Set("Authorization", basicAuth)
  201. clientQ := &http.Client{}
  202. resp, err := clientQ.Do(req)
  203. if err != nil {
  204. log.Error("开启节点平衡", zap.Error(err))
  205. return err
  206. }
  207. defer resp.Body.Close()
  208. if resp.StatusCode != http.StatusOK {
  209. log.Fatal("设置节点平衡失败")
  210. return err
  211. }
  212. fmt.Println(url, "节点平衡已开启")
  213. //2. 创建索引
  214. createIndexR, err := client.CreateIndex(PreBiddingIndex).BodyString(createJson).Do(context.Background())
  215. if err != nil {
  216. log.Error(PreBiddingIndex, zap.Error(err))
  217. return err
  218. }
  219. if !createIndexR.Acknowledged {
  220. log.Error("CreateIndex", zap.String(PreBiddingIndex, "创建索引失败"))
  221. return err
  222. }
  223. //3. 关闭节点平衡
  224. //设置临时的节点平衡设置
  225. disableSettings := `{
  226. "transient" : {
  227. "cluster.routing.allocation.enable" : "none"
  228. }
  229. }`
  230. req2, err2 := http.NewRequest("PUT", requestURL, bytes.NewBuffer([]byte(disableSettings)))
  231. if err2 != nil {
  232. log.Error("开启节点平衡", zap.Error(err))
  233. }
  234. req2.Header.Set("Content-Type", "application/json")
  235. // 添加身份验证头部
  236. req2.Header.Set("Authorization", basicAuth)
  237. //clientQ := &http.Client{}
  238. resp2, err2 := clientQ.Do(req)
  239. if err2 != nil {
  240. log.Error("关闭节点平衡", zap.Error(err))
  241. }
  242. defer resp2.Body.Close()
  243. fmt.Println(url, "节点平衡已关闭")
  244. //4. 新索引 添加别名
  245. for _, alias := range GF.Env.Alias {
  246. _, err = client.Alias().Add(PreBiddingIndex, alias).Do(context.Background())
  247. if err != nil {
  248. log.Error("添加别名失败:", zap.Error(err))
  249. }
  250. }
  251. log.Info("CreateIndex", zap.String(url, "索引别名 添加完毕"))
  252. }
  253. return nil
  254. }
  255. //deleteIndex 删除索引
  256. func deleteIndex(clients map[string]*elastic.Client, index string) error {
  257. if len(clients) == 0 {
  258. return errors.New("没有 配置 ES集群信息")
  259. }
  260. for k, client := range clients {
  261. exist, err := client.IndexExists(index).Do(context.Background())
  262. if !exist {
  263. log.Info("deleteIndex", zap.String(k, index+" 索引文件不存在"))
  264. }
  265. if err != nil {
  266. return err
  267. }
  268. num, err := client.Count(index).Do(context.Background())
  269. if err != nil {
  270. return err
  271. }
  272. if num > 0 {
  273. log.Info("deleteIndex", zap.String(k, "索引"+index+"还存在有效数据"))
  274. }
  275. _, err = client.DeleteIndex(index).Do(context.Background())
  276. if err != nil {
  277. return err
  278. }
  279. }
  280. return nil
  281. }
  282. //dealIndexByDay 处理预处理索引,根据天;
  283. func dealIndexByDay() {
  284. now := time.Now()
  285. PreBiddingIndex := ""
  286. //hour := now.Hour()
  287. // 判断当前时间是否时最后一个小时
  288. //if hour == 23 {
  289. //当天最后一小时
  290. var clients = make(map[string]*elastic.Client, 0)
  291. for k, v := range GF.ES {
  292. url := v.URL
  293. username := v.Username
  294. password := v.Password
  295. // 创建 Elasticsearch 客户端
  296. client, err := elastic.NewClient(
  297. elastic.SetURL(url),
  298. elastic.SetBasicAuth(username, password),
  299. elastic.SetSniff(false),
  300. )
  301. if err != nil {
  302. log.Error("创建 Elasticsearch 客户端失败:", zap.Error(err))
  303. }
  304. clients[k] = client
  305. }
  306. next := now.AddDate(0, 0, 1)
  307. month := int(next.Month())
  308. monthStr := strconv.Itoa(month)
  309. year := next.Year()
  310. yearStr := strconv.Itoa(year)
  311. dayStr := strconv.Itoa(next.Day())
  312. //下一天的索引名称
  313. PreBiddingIndex = "bidding_" + yearStr + monthStr + dayStr
  314. err := createIndex(clients, PreBiddingIndex)
  315. if err != nil {
  316. log.Info("dealIndexByDay", zap.Error(err))
  317. SendMail("预处理索引", "预处理索引创建失败,请检查")
  318. }
  319. log.Info("dealIndexByDay", zap.String(PreBiddingIndex, "创建成功"))
  320. //3. 删除昨天的索引
  321. last := now.AddDate(0, 0, -1)
  322. month2 := int(last.Month())
  323. monthStr2 := strconv.Itoa(month2)
  324. year2 := last.Year()
  325. yearStr2 := strconv.Itoa(year2)
  326. dayStr2 := strconv.Itoa(last.Day())
  327. //索引名称
  328. lastIndex := "bidding_" + yearStr2 + monthStr2 + dayStr2
  329. err = deleteIndex(clients, lastIndex)
  330. if err != nil {
  331. log.Info("dealIndexByDay", zap.Error(err))
  332. }
  333. //}
  334. }
  335. //dealIndexByMonth 处理预处理索引,根据月份;提前一天创建好 下个月的索引
  336. func dealIndexByMonth() {
  337. now := time.Now()
  338. PreBiddingIndex := ""
  339. // 获取当前月份的最后一天
  340. lastDayOfMonth := time.Date(now.Year(), now.Month()+1, 0, 0, 0, 0, 0, time.UTC)
  341. // 判断当前时间是否为当前月份的最后一天
  342. if now.Day() == lastDayOfMonth.Day() {
  343. //当月最后一天,需要提前创建好索引
  344. fmt.Println("当前时间是当前月份的最后一天")
  345. var clients = make(map[string]*elastic.Client, 0)
  346. for k, v := range GF.ES {
  347. url := v.URL
  348. username := v.Username
  349. password := v.Password
  350. // 创建 Elasticsearch 客户端
  351. client, err := elastic.NewClient(
  352. elastic.SetURL(url),
  353. elastic.SetBasicAuth(username, password),
  354. elastic.SetSniff(false),
  355. )
  356. if err != nil {
  357. log.Error("创建 Elasticsearch 客户端失败:", zap.Error(err))
  358. }
  359. clients[k] = client
  360. }
  361. next := now.AddDate(0, 0, 1)
  362. month := int(next.Month())
  363. monthStr := strconv.Itoa(month)
  364. year := next.Year()
  365. yearStr := strconv.Itoa(year)
  366. //下一个月的索引名称
  367. PreBiddingIndex = "bidding_" + yearStr + monthStr
  368. //2 创建下个月索引结构
  369. err := createIndex(clients, PreBiddingIndex)
  370. if err != nil {
  371. log.Info("dealIndexByMonth", zap.Error(err))
  372. SendMail("预处理索引", "预处理索引创建失败,请检查")
  373. }
  374. log.Info("dealIndexByMonth", zap.String(PreBiddingIndex, "创建成功"))
  375. //3. 删除上个月的索引
  376. last := now.AddDate(0, -1, 1)
  377. month2 := int(last.Month())
  378. monthStr2 := strconv.Itoa(month2)
  379. year2 := last.Year()
  380. yearStr2 := strconv.Itoa(year2)
  381. //上个月的索引名称
  382. lastIndex := "bidding_" + yearStr2 + monthStr2
  383. err = deleteIndex(clients, lastIndex)
  384. if err != nil {
  385. log.Info("dealIndexByMonth", zap.Error(err))
  386. }
  387. }
  388. }
  389. ////SwitchAlias 切换别名
  390. //func SwitchAlias() {
  391. // now := time.Now()
  392. // // 判断当前时间是否为当前月份的最后一天
  393. // //按日创建索引
  394. // if GF.Env.SpecType == "day" {
  395. // dealAlias()
  396. // } else if GF.Env.SpecType == "month" {
  397. // // 获取当前月份的最后一天
  398. // lastDayOfMonth := time.Date(now.Year(), now.Month()+1, 0, 0, 0, 0, 0, time.UTC)
  399. // //按月创建索引
  400. // if now.Day() == lastDayOfMonth.Day() {
  401. // dealAlias()
  402. // }
  403. // }
  404. //}
  405. //
  406. ////dealAlias 处理 索引别名
  407. //func dealAlias() {
  408. // now := time.Now()
  409. //
  410. // for _, v := range GF.ES {
  411. // url := v.URL
  412. // username := v.Username
  413. // password := v.Password
  414. // // 创建 Elasticsearch 客户端
  415. // client, err := elastic.NewClient(
  416. // elastic.SetURL(url),
  417. // elastic.SetBasicAuth(username, password),
  418. // elastic.SetSniff(false),
  419. // )
  420. // if err != nil {
  421. // log.Error("创建 Elasticsearch 客户端失败:", zap.Error(err))
  422. // }
  423. //
  424. // preBiddingIndex := "" //下一个索引名称
  425. // next := now.AddDate(0, 0, 1)
  426. // month := int(next.Month())
  427. // monthStr := strconv.Itoa(month)
  428. // year := next.Year()
  429. // yearStr := strconv.Itoa(year)
  430. // dayStr := strconv.Itoa(next.Day())
  431. // if GF.Env.SpecType == "month" {
  432. // //下一个月的索引名称
  433. // preBiddingIndex = "bidding_" + yearStr + monthStr
  434. // } else if GF.Env.SpecType == "day" {
  435. // //下一天的索引名称
  436. // preBiddingIndex = "bidding_" + yearStr + monthStr + dayStr
  437. // }
  438. //
  439. // for _, alias := range GF.Env.Alias {
  440. // _, err = client.Alias().Add(preBiddingIndex, alias).Do(context.Background())
  441. // if err != nil {
  442. // log.Error("添加别名失败:", zap.Error(err))
  443. // }
  444. // }
  445. // log.Info("dealAlias", zap.String(url, "索引别名处理完毕"))
  446. // }
  447. //}
  448. //SendMail 发送邮件
  449. func SendMail(title, content string) {
  450. url := fmt.Sprintf("%s?to=%s&title=%s&body=%s", GF.Email.Api, GF.Email.To, title, content)
  451. fmt.Println("url=>", url)
  452. res, err := http.Get(url)
  453. if err != nil {
  454. log.Info("SendMail", zap.Any("err", err))
  455. } else {
  456. log.Info("SendMail", zap.Any("res", res))
  457. }
  458. }