Prechádzať zdrojové kódy

添加 数据预处理 索引

wcc 1 rok pred
rodič
commit
600f2c6efd
1 zmenený súbor, 162 pridaní a 0 odobraní
  1. 162 0
      mapping/bidding_preprocess.txt

+ 162 - 0
mapping/bidding_preprocess.txt

@@ -0,0 +1,162 @@
+curl -H 'Content-Type: application/json' -u es_all:TopJkO2E_d1x -XPUT http://127.0.0.1:19805/bidding_20231120 -d '{
+    "settings": {
+        "index": {
+            "analysis": {
+                "analyzer": {
+                    "my_ngram_title": {
+                        "filter": [
+                            "lowercase"
+                        ],
+                        "tokenizer": "my_ngram_title"
+                    },
+                    "douhao": {
+                        "type": "pattern",
+                        "pattern": ","
+                    },
+                    "my_ngram": {
+                        "filter": [
+                            "lowercase"
+                        ],
+                        "tokenizer": "my_ngram"
+                    }
+                },
+                "tokenizer": {
+                    "my_ngram_title": {
+                        "token_chars": [
+                            "letter",
+                            "digit",
+                            "punctuation",
+                            "symbol"
+                        ],
+                        "min_gram": "1",
+                        "type": "ngram",
+                        "max_gram": "1"
+                    },
+                    "my_ngram": {
+                        "token_chars": [
+                            "letter",
+                            "digit",
+                            "punctuation",
+                            "symbol"
+                        ],
+                        "min_gram": "2",
+                        "type": "ngram",
+                        "max_gram": "2"
+                    }
+                }
+            },
+            "number_of_shards": "12",
+            "number_of_replicas": "0",
+            "max_result_window": "20000"
+        }
+    },
+    "mappings": {
+        "dynamic": false,
+        "properties": {
+            "dataweight": {
+                "type": "long"
+            },
+            "projectcode": {
+                "type": "keyword"
+            },
+            "object_type": {
+                "type": "keyword"
+            },
+            "fromtable": {
+                "type": "keyword"
+            },
+            "bidopentime": {
+                "type": "long"
+            },
+            "bidamount": {
+                "type": "double"
+            },
+            "winner": {
+                "type": "keyword"
+            },
+            "buyer": {
+                "type": "keyword",
+                "fields": {
+                    "mbuyer": {
+                        "analyzer": "my_ngram_title",
+                        "type": "text"
+                    }
+                }
+            },
+            "budget": {
+                "type": "double"
+            },
+            "projectname": {
+                "type": "keyword",
+                "fields": {
+                    "pname": {
+                        "analyzer": "my_ngram_title",
+                        "type": "text"
+                    }
+                }
+            },
+            "area": {
+                "type": "keyword"
+            },
+            "city": {
+                "type": "keyword"
+            },
+            "district": {
+                "type": "keyword"
+            },
+            "s_winner": {
+                "analyzer": "douhao",
+                "type": "text",
+                "fields": {
+                    "mwinner": {
+                        "analyzer": "my_ngram_title",
+                        "type": "text"
+                    }
+                }
+            },
+            "pici": {
+                "type": "long"
+            },
+            "id": {
+                "type": "keyword"
+            },
+            "title": {
+                "analyzer": "my_ngram_title",
+                "type": "text",
+                "fields": {
+                    "mtitle": {
+                        "type": "keyword"
+                    }
+                }
+            },
+            "detail": {
+                "analyzer": "my_ngram",
+                "type": "text"
+            },
+            "site": {
+                "type": "keyword"
+            },
+            "comeintime": {
+                "type": "long"
+            },
+            "href": {
+                "type": "keyword"
+            },
+            "infoformat": {
+                "type": "long"
+            },
+            "publishtime": {
+                "type": "long"
+            },
+            "toptype": {
+                "type": "keyword"
+            },
+            "subtype": {
+                "type": "keyword"
+            },
+            "createtime": {
+                "type": "long"
+            }
+        }
+    }
+}'