suggester_phrase.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538
  1. // Copyright 2012-2015 Oliver Eilhard. All rights reserved.
  2. // Use of this source code is governed by a MIT-license.
  3. // See http://olivere.mit-license.org/license.txt for details.
  4. package elastic
  5. // For more details, see
  6. // http://www.elasticsearch.org/guide/reference/api/search/phrase-suggest/
  7. type PhraseSuggester struct {
  8. Suggester
  9. name string
  10. text string
  11. field string
  12. analyzer string
  13. size *int
  14. shardSize *int
  15. contextQueries []SuggesterContextQuery
  16. // fields specific to a phrase suggester
  17. maxErrors *float32
  18. separator *string
  19. realWordErrorLikelihood *float32
  20. confidence *float32
  21. generators map[string][]CandidateGenerator
  22. gramSize *int
  23. smoothingModel SmoothingModel
  24. forceUnigrams *bool
  25. tokenLimit *int
  26. preTag, postTag *string
  27. collateQuery *string
  28. collateFilter *string
  29. collatePreference *string
  30. collateParams map[string]interface{}
  31. collatePrune *bool
  32. }
  33. // Creates a new phrase suggester.
  34. func NewPhraseSuggester(name string) PhraseSuggester {
  35. return PhraseSuggester{
  36. name: name,
  37. contextQueries: make([]SuggesterContextQuery, 0),
  38. collateParams: make(map[string]interface{}),
  39. }
  40. }
  41. func (q PhraseSuggester) Name() string {
  42. return q.name
  43. }
  44. func (q PhraseSuggester) Text(text string) PhraseSuggester {
  45. q.text = text
  46. return q
  47. }
  48. func (q PhraseSuggester) Field(field string) PhraseSuggester {
  49. q.field = field
  50. return q
  51. }
  52. func (q PhraseSuggester) Analyzer(analyzer string) PhraseSuggester {
  53. q.analyzer = analyzer
  54. return q
  55. }
  56. func (q PhraseSuggester) Size(size int) PhraseSuggester {
  57. q.size = &size
  58. return q
  59. }
  60. func (q PhraseSuggester) ShardSize(shardSize int) PhraseSuggester {
  61. q.shardSize = &shardSize
  62. return q
  63. }
  64. func (q PhraseSuggester) ContextQuery(query SuggesterContextQuery) PhraseSuggester {
  65. q.contextQueries = append(q.contextQueries, query)
  66. return q
  67. }
  68. func (q PhraseSuggester) ContextQueries(queries ...SuggesterContextQuery) PhraseSuggester {
  69. q.contextQueries = append(q.contextQueries, queries...)
  70. return q
  71. }
  72. func (q PhraseSuggester) GramSize(gramSize int) PhraseSuggester {
  73. if gramSize >= 1 {
  74. q.gramSize = &gramSize
  75. }
  76. return q
  77. }
  78. func (q PhraseSuggester) MaxErrors(maxErrors float32) PhraseSuggester {
  79. q.maxErrors = &maxErrors
  80. return q
  81. }
  82. func (q PhraseSuggester) Separator(separator string) PhraseSuggester {
  83. q.separator = &separator
  84. return q
  85. }
  86. func (q PhraseSuggester) RealWordErrorLikelihood(realWordErrorLikelihood float32) PhraseSuggester {
  87. q.realWordErrorLikelihood = &realWordErrorLikelihood
  88. return q
  89. }
  90. func (q PhraseSuggester) Confidence(confidence float32) PhraseSuggester {
  91. q.confidence = &confidence
  92. return q
  93. }
  94. func (q PhraseSuggester) CandidateGenerator(generator CandidateGenerator) PhraseSuggester {
  95. if q.generators == nil {
  96. q.generators = make(map[string][]CandidateGenerator)
  97. }
  98. typ := generator.Type()
  99. if _, found := q.generators[typ]; !found {
  100. q.generators[typ] = make([]CandidateGenerator, 0)
  101. }
  102. q.generators[typ] = append(q.generators[typ], generator)
  103. return q
  104. }
  105. func (q PhraseSuggester) CandidateGenerators(generators ...CandidateGenerator) PhraseSuggester {
  106. for _, g := range generators {
  107. q = q.CandidateGenerator(g)
  108. }
  109. return q
  110. }
  111. func (q PhraseSuggester) ClearCandidateGenerator() PhraseSuggester {
  112. q.generators = nil
  113. return q
  114. }
  115. func (q PhraseSuggester) ForceUnigrams(forceUnigrams bool) PhraseSuggester {
  116. q.forceUnigrams = &forceUnigrams
  117. return q
  118. }
  119. func (q PhraseSuggester) SmoothingModel(smoothingModel SmoothingModel) PhraseSuggester {
  120. q.smoothingModel = smoothingModel
  121. return q
  122. }
  123. func (q PhraseSuggester) TokenLimit(tokenLimit int) PhraseSuggester {
  124. q.tokenLimit = &tokenLimit
  125. return q
  126. }
  127. func (q PhraseSuggester) Highlight(preTag, postTag string) PhraseSuggester {
  128. q.preTag = &preTag
  129. q.postTag = &postTag
  130. return q
  131. }
  132. func (q PhraseSuggester) CollateQuery(collateQuery string) PhraseSuggester {
  133. q.collateQuery = &collateQuery
  134. return q
  135. }
  136. func (q PhraseSuggester) CollateFilter(collateFilter string) PhraseSuggester {
  137. q.collateFilter = &collateFilter
  138. return q
  139. }
  140. func (q PhraseSuggester) CollatePreference(collatePreference string) PhraseSuggester {
  141. q.collatePreference = &collatePreference
  142. return q
  143. }
  144. func (q PhraseSuggester) CollateParams(collateParams map[string]interface{}) PhraseSuggester {
  145. q.collateParams = collateParams
  146. return q
  147. }
  148. func (q PhraseSuggester) CollatePrune(collatePrune bool) PhraseSuggester {
  149. q.collatePrune = &collatePrune
  150. return q
  151. }
  152. // simplePhraseSuggesterRequest is necessary because the order in which
  153. // the JSON elements are routed to Elasticsearch is relevant.
  154. // We got into trouble when using plain maps because the text element
  155. // needs to go before the simple_phrase element.
  156. type phraseSuggesterRequest struct {
  157. Text string `json:"text"`
  158. Phrase interface{} `json:"phrase"`
  159. }
  160. // Creates the source for the phrase suggester.
  161. func (q PhraseSuggester) Source(includeName bool) interface{} {
  162. ps := &phraseSuggesterRequest{}
  163. if q.text != "" {
  164. ps.Text = q.text
  165. }
  166. suggester := make(map[string]interface{})
  167. ps.Phrase = suggester
  168. if q.analyzer != "" {
  169. suggester["analyzer"] = q.analyzer
  170. }
  171. if q.field != "" {
  172. suggester["field"] = q.field
  173. }
  174. if q.size != nil {
  175. suggester["size"] = *q.size
  176. }
  177. if q.shardSize != nil {
  178. suggester["shard_size"] = *q.shardSize
  179. }
  180. switch len(q.contextQueries) {
  181. case 0:
  182. case 1:
  183. suggester["context"] = q.contextQueries[0].Source()
  184. default:
  185. ctxq := make([]interface{}, 0)
  186. for _, query := range q.contextQueries {
  187. ctxq = append(ctxq, query.Source())
  188. }
  189. suggester["context"] = ctxq
  190. }
  191. // Phase-specified parameters
  192. if q.realWordErrorLikelihood != nil {
  193. suggester["real_word_error_likelihood"] = *q.realWordErrorLikelihood
  194. }
  195. if q.confidence != nil {
  196. suggester["confidence"] = *q.confidence
  197. }
  198. if q.separator != nil {
  199. suggester["separator"] = *q.separator
  200. }
  201. if q.maxErrors != nil {
  202. suggester["max_errors"] = *q.maxErrors
  203. }
  204. if q.gramSize != nil {
  205. suggester["gram_size"] = *q.gramSize
  206. }
  207. if q.forceUnigrams != nil {
  208. suggester["force_unigrams"] = *q.forceUnigrams
  209. }
  210. if q.tokenLimit != nil {
  211. suggester["token_limit"] = *q.tokenLimit
  212. }
  213. if q.generators != nil && len(q.generators) > 0 {
  214. for typ, generators := range q.generators {
  215. arr := make([]interface{}, 0)
  216. for _, g := range generators {
  217. arr = append(arr, g.Source())
  218. }
  219. suggester[typ] = arr
  220. }
  221. }
  222. if q.smoothingModel != nil {
  223. x := make(map[string]interface{})
  224. x[q.smoothingModel.Type()] = q.smoothingModel.Source()
  225. suggester["smoothing"] = x
  226. }
  227. if q.preTag != nil {
  228. hl := make(map[string]string)
  229. hl["pre_tag"] = *q.preTag
  230. if q.postTag != nil {
  231. hl["post_tag"] = *q.postTag
  232. }
  233. suggester["highlight"] = hl
  234. }
  235. if q.collateQuery != nil || q.collateFilter != nil {
  236. collate := make(map[string]interface{})
  237. suggester["collate"] = collate
  238. if q.collateQuery != nil {
  239. collate["query"] = *q.collateQuery
  240. }
  241. if q.collateFilter != nil {
  242. collate["filter"] = *q.collateFilter
  243. }
  244. if q.collatePreference != nil {
  245. collate["preference"] = *q.collatePreference
  246. }
  247. if len(q.collateParams) > 0 {
  248. collate["params"] = q.collateParams
  249. }
  250. if q.collatePrune != nil {
  251. collate["prune"] = *q.collatePrune
  252. }
  253. }
  254. if !includeName {
  255. return ps
  256. }
  257. source := make(map[string]interface{})
  258. source[q.name] = ps
  259. return source
  260. }
  261. // -- Smoothing models --
  262. type SmoothingModel interface {
  263. Type() string
  264. Source() interface{}
  265. }
  266. // StupidBackoffSmoothingModel implements a stupid backoff smoothing model.
  267. // See http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-suggesters-phrase.html#_smoothing_models
  268. // for details about smoothing models.
  269. type StupidBackoffSmoothingModel struct {
  270. discount float64
  271. }
  272. func NewStupidBackoffSmoothingModel(discount float64) *StupidBackoffSmoothingModel {
  273. return &StupidBackoffSmoothingModel{
  274. discount: discount,
  275. }
  276. }
  277. func (sm *StupidBackoffSmoothingModel) Type() string {
  278. return "stupid_backoff"
  279. }
  280. func (sm *StupidBackoffSmoothingModel) Source() interface{} {
  281. source := make(map[string]interface{})
  282. source["discount"] = sm.discount
  283. return source
  284. }
  285. // --
  286. // LaplaceSmoothingModel implements a laplace smoothing model.
  287. // See http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-suggesters-phrase.html#_smoothing_models
  288. // for details about smoothing models.
  289. type LaplaceSmoothingModel struct {
  290. alpha float64
  291. }
  292. func NewLaplaceSmoothingModel(alpha float64) *LaplaceSmoothingModel {
  293. return &LaplaceSmoothingModel{
  294. alpha: alpha,
  295. }
  296. }
  297. func (sm *LaplaceSmoothingModel) Type() string {
  298. return "laplace"
  299. }
  300. func (sm *LaplaceSmoothingModel) Source() interface{} {
  301. source := make(map[string]interface{})
  302. source["alpha"] = sm.alpha
  303. return source
  304. }
  305. // --
  306. // LinearInterpolationSmoothingModel implements a linear interpolation
  307. // smoothing model.
  308. // See http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-suggesters-phrase.html#_smoothing_models
  309. // for details about smoothing models.
  310. type LinearInterpolationSmoothingModel struct {
  311. trigramLamda float64
  312. bigramLambda float64
  313. unigramLambda float64
  314. }
  315. func NewLinearInterpolationSmoothingModel(trigramLamda, bigramLambda, unigramLambda float64) *LinearInterpolationSmoothingModel {
  316. return &LinearInterpolationSmoothingModel{
  317. trigramLamda: trigramLamda,
  318. bigramLambda: bigramLambda,
  319. unigramLambda: unigramLambda,
  320. }
  321. }
  322. func (sm *LinearInterpolationSmoothingModel) Type() string {
  323. return "linear_interpolation"
  324. }
  325. func (sm *LinearInterpolationSmoothingModel) Source() interface{} {
  326. source := make(map[string]interface{})
  327. source["trigram_lambda"] = sm.trigramLamda
  328. source["bigram_lambda"] = sm.bigramLambda
  329. source["unigram_lambda"] = sm.unigramLambda
  330. return source
  331. }
  332. // -- CandidateGenerator --
  333. type CandidateGenerator interface {
  334. Type() string
  335. Source() interface{}
  336. }
  337. // DirectCandidateGenerator implements a direct candidate generator.
  338. // See http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-suggesters-phrase.html#_smoothing_models
  339. // for details about smoothing models.
  340. type DirectCandidateGenerator struct {
  341. field string
  342. preFilter *string
  343. postFilter *string
  344. suggestMode *string
  345. accuracy *float64
  346. size *int
  347. sort *string
  348. stringDistance *string
  349. maxEdits *int
  350. maxInspections *int
  351. maxTermFreq *float64
  352. prefixLength *int
  353. minWordLength *int
  354. minDocFreq *float64
  355. }
  356. func NewDirectCandidateGenerator(field string) *DirectCandidateGenerator {
  357. return &DirectCandidateGenerator{
  358. field: field,
  359. }
  360. }
  361. func (g *DirectCandidateGenerator) Type() string {
  362. return "direct_generator"
  363. }
  364. func (g *DirectCandidateGenerator) Field(field string) *DirectCandidateGenerator {
  365. g.field = field
  366. return g
  367. }
  368. func (g *DirectCandidateGenerator) PreFilter(preFilter string) *DirectCandidateGenerator {
  369. g.preFilter = &preFilter
  370. return g
  371. }
  372. func (g *DirectCandidateGenerator) PostFilter(postFilter string) *DirectCandidateGenerator {
  373. g.postFilter = &postFilter
  374. return g
  375. }
  376. func (g *DirectCandidateGenerator) SuggestMode(suggestMode string) *DirectCandidateGenerator {
  377. g.suggestMode = &suggestMode
  378. return g
  379. }
  380. func (g *DirectCandidateGenerator) Accuracy(accuracy float64) *DirectCandidateGenerator {
  381. g.accuracy = &accuracy
  382. return g
  383. }
  384. func (g *DirectCandidateGenerator) Size(size int) *DirectCandidateGenerator {
  385. g.size = &size
  386. return g
  387. }
  388. func (g *DirectCandidateGenerator) Sort(sort string) *DirectCandidateGenerator {
  389. g.sort = &sort
  390. return g
  391. }
  392. func (g *DirectCandidateGenerator) StringDistance(stringDistance string) *DirectCandidateGenerator {
  393. g.stringDistance = &stringDistance
  394. return g
  395. }
  396. func (g *DirectCandidateGenerator) MaxEdits(maxEdits int) *DirectCandidateGenerator {
  397. g.maxEdits = &maxEdits
  398. return g
  399. }
  400. func (g *DirectCandidateGenerator) MaxInspections(maxInspections int) *DirectCandidateGenerator {
  401. g.maxInspections = &maxInspections
  402. return g
  403. }
  404. func (g *DirectCandidateGenerator) MaxTermFreq(maxTermFreq float64) *DirectCandidateGenerator {
  405. g.maxTermFreq = &maxTermFreq
  406. return g
  407. }
  408. func (g *DirectCandidateGenerator) PrefixLength(prefixLength int) *DirectCandidateGenerator {
  409. g.prefixLength = &prefixLength
  410. return g
  411. }
  412. func (g *DirectCandidateGenerator) MinWordLength(minWordLength int) *DirectCandidateGenerator {
  413. g.minWordLength = &minWordLength
  414. return g
  415. }
  416. func (g *DirectCandidateGenerator) MinDocFreq(minDocFreq float64) *DirectCandidateGenerator {
  417. g.minDocFreq = &minDocFreq
  418. return g
  419. }
  420. func (g *DirectCandidateGenerator) Source() interface{} {
  421. source := make(map[string]interface{})
  422. if g.field != "" {
  423. source["field"] = g.field
  424. }
  425. if g.suggestMode != nil {
  426. source["suggest_mode"] = *g.suggestMode
  427. }
  428. if g.accuracy != nil {
  429. source["accuracy"] = *g.accuracy
  430. }
  431. if g.size != nil {
  432. source["size"] = *g.size
  433. }
  434. if g.sort != nil {
  435. source["sort"] = *g.sort
  436. }
  437. if g.stringDistance != nil {
  438. source["string_distance"] = *g.stringDistance
  439. }
  440. if g.maxEdits != nil {
  441. source["max_edits"] = *g.maxEdits
  442. }
  443. if g.maxInspections != nil {
  444. source["max_inspections"] = *g.maxInspections
  445. }
  446. if g.maxTermFreq != nil {
  447. source["max_term_freq"] = *g.maxTermFreq
  448. }
  449. if g.prefixLength != nil {
  450. source["prefix_length"] = *g.prefixLength
  451. }
  452. if g.minWordLength != nil {
  453. source["min_word_length"] = *g.minWordLength
  454. }
  455. if g.minDocFreq != nil {
  456. source["min_doc_freq"] = *g.minDocFreq
  457. }
  458. if g.preFilter != nil {
  459. source["pre_filter"] = *g.preFilter
  460. }
  461. if g.postFilter != nil {
  462. source["post_filter"] = *g.postFilter
  463. }
  464. return source
  465. }