ES基础知识总结含SQL、DSL、GOLANG

本文介绍: Elasticsearch 生态简介 + es 与 kibana 的紧密结合使用方法 + es 多种混合查询使用 + golang 框架调用以及源码解析

在这里插入图片描述

Elasticsearch 是一个基于 Lucene 的全文搜索和分析引擎，Lucene Core 是一个完全用 Java 编写的高性能、全功能搜索引擎库。

它可以扩展到上百台服务器，处理PB级数据。1 PB = 2^50 Byte，在数值上约等于1000个TB。人类功能记忆容量约1.25TB，也意味着800个人类记忆相当于1PB。

Lucene 封装好了建立倒排索引、匹配索引进行搜索的各种算法。我们可以引入 Lucene，基于它的 API 进行开发。

Elasticsearch 就是在 Lucene 的基础上实现的，对 Lucene 进行了良好的封装，简化开发，并提供了很多高级功能。

term	Doc 1	Doc 2	Doc 3
no	✅
po	✅
work	✅	✅
enjoy		✅	✅
your	✅	✅	✅
team		✅	✅
With			✅
challenge			✅

Elasticsearch 名称	Elasticsearch 概念	数据库
Index	索引	库
Type	类型	表
Document	文档	行
field	字段	列


# docker-compose file that starts a single-node Elasticsearch 7.13.3 together
# with a Kibana 7.13.3 instance pointed at it.
version: '3.1'
services:
  elasticsearch:
    image: elasticsearch:7.13.3
    container_name: elasticsearch
    privileged: true
    environment:
      - "cluster.name=elasticsearch" # cluster name is set to "elasticsearch"
      - "discovery.type=single-node" # start in single-node mode
      # JVM heap size. NOTE(review): -Xmx1096m is larger than the 1000M memory
      # limit declared under deploy.resources below — confirm this is intended.
      - "ES_JAVA_OPTS=-Xms512m -Xmx1096m"
      - bootstrap.memory_lock=true
    volumes:
      # NOTE(review): the official image is documented to keep plugins/data/logs
      # under /usr/share/elasticsearch/...; the container-side paths below look
      # like they are not read by Elasticsearch — confirm before relying on
      # these mounts for persistence.
      - ./es/plugins:/usr/local/dockercompose/elasticsearch/plugins # plugin directory mount
      - ./es/data:/usr/local/dockercompose/elasticsearch/data:rw # data directory mount
      - ./es/logs:/usr/local/dockercompose/elasticsearch/logs:rw
    ports:
      - 9200:9200
      - 9300:9300
    deploy:
     resources:
        limits:
           cpus: "2"
           memory: 1000M
        reservations:
           memory: 200M
  kibana:
    image: kibana:7.13.3
    container_name: kibana
    depends_on:
      - elasticsearch # start kibana after the elasticsearch service has been started
    environment:
      ELASTICSEARCH_HOSTS: http://elasticsearch:9200 # address Kibana uses to reach Elasticsearch
      I18N_LOCALE: zh-CN
    ports:
      - 5601:5601

将上述代码写入docker-compose.yml ，后运行即可拉起es、kibana 服务：

docker-compose up -d

method 方法	url地址	描述
PUT	/索引名称/类型名称/文档id	创建文档（指定id）
POST	/索引名称/类型名称	创建文档（随机id）
POST	/索引名称/类型名称/文档id/_update	修改文档
DELETE	/索引名称/类型名称/文档id	删除文档
GET	/索引名称/类型名称/文档id	通过id查询文档
POST	/索引名称/类型名称/_search	查询所有数据


PUT /tool_index/
{
  "settings": {
    "index": {
      "number_of_shards":10,  
      "number_of_replicas":0
    }
  }
}

GET /tool_index/_settings

PUT /tool_index/tools/20230326214500
{
  "name": "ijie",
  "age": 22,
  "grade": 1,
  "hobby": "coding"
}

POST /tool_index/_doc
{
  "name": "erran_new",
  "age": 24,
  "grade": 2,
  "hobby": "code"
}

GET /tool_index/tools/_search

GET /tool_index/tools/_search?q=name:erran

GET /tool_index/tools/_search 
{
  "query": {
    "match": {
      "name.keyword": "erran"
    }
  },
  "_source": ["name", "grade"]
}

POST /tool_index/tools/20230326213100/_update
{
  "doc": {
    "grade": 3
  }
}

PUT /tool_index/tools/20230326214500
{
  "people": "ijie"
}

DELETE /tool_index/tools/20230326214500

DELETE tool_index

name	age	sex	grade	hobby	Weight
John	24	男	2	code
Alis	24	女	1	movie
Jack	22	男	1	code
Rookie	23	男	4	read	sixty kilo grams
Jam	25	女	3	eat	fifty-kilo-grams

select * from person where name = 'Rookie';

GET /person/_search
{
  "query": {
    "term": {
      "name": "Rookie"
    }
  }
}

      {
        "_index" : "person",
        "_type" : "_doc",
        "_id" : "rIpjQYcBtP47ROwdblh9",
        "_score" : 0.2876821,
        "_source" : {
          "name" : "Rookie",
          "age" : 23,
          "sex" : "男",
          "grade" : 4,
          "hobby" : "read"
        }
      }

	// Build the client. Sniffing and health checks are switched off through the
	// options below; the URL and basic-auth credentials are placeholders.
	client, err := elastic.NewClient(elastic.SetURL("http://xxxx:9200"),
		elastic.SetSniff(false),
		elastic.SetHealthcheck(false),
		elastic.SetBasicAuth("username", "password"))
	if err != nil {
		fmt.Println(err)
		return
	}
	// Term query on the name field for the value "Rookie".
	q := elastic.NewTermQuery("name", "Rookie")
	req, err := client.Search().
		Index("person").
		Query(q).
		Do(context.Background())
	if err != nil {
		fmt.Println(err)
		return
	}
	for _, v := range req.Hits.Hits {
		var tmp interface{}
		// Decode the raw _source of each hit. A document that fails to decode
		// is reported and skipped instead of being printed as a nil value.
		if err := json.Unmarshal(v.Source, &tmp); err != nil {
			fmt.Println(err)
			continue
		}
		fmt.Println(tmp)
	}

select * from persons where age in(23, 24);

GET /person/_search
{
  "query": {
    "terms": {
      "age": [23,24]
    }
  }
}

      {
        "_index" : "person",
        "_type" : "_doc",
        "_id" : "rIpjQYcBtP47ROwdblh9",
        "_score" : 1.0,
        "_source" : {
          "name" : "Rookie",
          "age" : 23,
          "sex" : "男",
          "grade" : 4,
          "hobby" : "read"
        }
      },
      {
        "_index" : "person",
        "_type" : "_doc",
        "_id" : "n4phQYcBtP47ROwd1Vha",
        "_score" : 1.0,
        "_source" : {
          "name" : "Alis",
          "age" : 24,
          "sex" : "女",
          "grade" : 1,
          "hobby" : "movie"
        }
      },
      {
        "_index" : "person",
        "_type" : "_doc",
        "_id" : "vIlfQYcBzqYw9eGTVRry",
        "_score" : 1.0,
        "_source" : {
          "name" : "John",
          "age" : 24,
          "sex" : "男",
          "grade" : 2,
          "hobby" : "code"
        }
      }

	q := elastic.NewTermsQuery("age", 23, 24)
	req, err := client.Search().
		Index("person").
		Query(q).
		Do(context.Background())

select * from person where age between 21 and 23;

GET /person/_search
{
  "query": {
    "range": {
      "age": {
        "gte": 21,
        "lte": 23
      }
    }
  }
}

      {
        "_index" : "person",
        "_type" : "_doc",
        "_id" : "rIpjQYcBtP47ROwdblh9",
        "_score" : 1.0,
        "_source" : {
          "name" : "Rookie",
          "age" : 23,
          "sex" : "男",
          "grade" : 4,
          "hobby" : "read"
        }
      },
      {
        "_index" : "person",
        "_type" : "_doc",
        "_id" : "DYliQYcBzqYw9eGTqht2",
        "_score" : 1.0,
        "_source" : {
          "name" : "Jack",
          "age" : 22,
          "sex" : "男",
          "grade" : 1,
          "hobby" : "code"
        }
      }

	q := elastic.NewRangeQuery("age").Gte(21).Lte(23)
	req, err := client.Search().
		Index("person").
		Query(q).
		Do(context.Background())

select * from persons where hobby like '%o%';

GET /person/_search
{
  "query": {
    "wildcard": {
      "hobby": "*o*"
    }
  }
}

      {
        "_index" : "person",
        "_type" : "_doc",
        "_id" : "n4phQYcBtP47ROwd1Vha",
        "_score" : 1.0,
        "_source" : {
          "name" : "Alis",
          "age" : 24,
          "sex" : "女",
          "grade" : 1,
          "hobby" : "movie"
        }
      },
      {
        "_index" : "person",
        "_type" : "_doc",
        "_id" : "vIlfQYcBzqYw9eGTVRry",
        "_score" : 1.0,
        "_source" : {
          "name" : "John",
          "age" : 24,
          "sex" : "男",
          "grade" : 2,
          "hobby" : "code"
        }
      },
      {
        "_index" : "person",
        "_type" : "_doc",
        "_id" : "DYliQYcBzqYw9eGTqht2",
        "_score" : 1.0,
        "_source" : {
          "name" : "Jack",
          "age" : 22,
          "sex" : "男",
          "grade" : 1,
          "hobby" : "code"
        }
      }

q := elastic.NewWildcardQuery("hobby", "*o*")
	req, err := client.Search().
		Index("person").
		Query(q).
		Do(context.Background())

match 查询是执行全文搜索的标准查询，包括模糊匹配的选项。

GET /person/_search
{
  "query": {
    "match": {
      "weight": {
        "query": "fifty-kilo-grams"
      }
    }
  }
}

match 用到的参数

GET /person/_search
{
  "query": {
    "match": {
      "weight": "fifty-kilo-grams"
    }
  }
}

可以使用fuzziness来模糊匹配字段，“AUTO”会根据词项的长度来确定允许的编辑距离；不指定阈值时，AUTO 等价于 AUTO:3,6

可以使用prefix_length、max_expansions来控制模糊过程

可以使用fuzzy_rewrite来允许控制查询将如何被重写

可以使用fuzzy_transpositions来控制是否允许模糊换位(ab->ba)

GET /person/_search
{
  "query": {
    "match": {
      "weight": {
        "query": "2fifty-kilo-grams1",
        "fuzziness": "AUTO"
      }
    }
  }
}

GET /person/_mapping

"properties" : {
  "age" : {
    "type" : "long"
  },
  "grade" : {
    "type" : "long"
  },
  "hobby" : {
    "type" : "keyword"
  },
  "name" : {
    "type" : "keyword"
  },
  "sex" : {
    "type" : "keyword"
  },
  "weight" : {
    "type" : "keyword"
  }
}

新建一个text类型的new_field，并设置new_field.keyword为keyword类型

PUT /person/_mapping
{
  "properties": {
    "new_field": {
      "type": "text",
      "fields": {
        "keyword": {
          "type": "keyword",
          "ignore_above": 256
        }
      }
    }
  }
}

POST /person/_doc/rIpjQYcBtP47ROwdblh9
{
  "name": "Rookie",
  "age": 23,
  "sex": "男",
  "grade": 4,
  "hobby": "read",
  "weight": "sixty kilogram",
  "new_field": "sixty kilo grams, sixty kilogram, 60 千克"
}
POST /person/_doc/vYplQYcBtP47ROwdc1gz
{
  "name": "Jam",
  "age": 25,
  "sex": "女",
  "grade": 3,
  "hobby": "eat",
  "weight": "fifty-kilo-grams",
  "new_field": "60"
}

match_all(固定用法： "match_all": {}) 查询所有

GET /person/_analyze
{
  "text":"sixty kilo grams, sixty kilogram, 60 千克"
}

text	term	match	match_phrase
分词器分词	✅	✅	✅
分词器多个分词	❌	✅	✅
完整内容	❌	✅	✅
中文短语	❌	✅	✅

{ "id" : 1,"content":"关注我,系统学编程" }
{ "id" : 2,"content":"系统学编程,关注我" }
{ "id" : 3,"content":"系统编程,关注我" }
{ "id" : 4,"content":"关注我,间隔系统学编程" }

查询 关注我，系统学

// Match query for "60" on new_field with operator "and".
q := elastic.NewMatchQuery("new_field", "60").Operator("and")
	// Sample output (both documents carry the term 60 in new_field):
	//map[age:25 grade:3 hobby:eat name:Jam new_field:60 sex:女 weight:fifty-kilo-grams]
	//map[age:23 grade:4 hobby:read name:Rookie new_field:sixty kilo grams, sixty kilogram, 60 千克 sex:男 weight:sixty kilogram, 60kg,千克]
// Phrase query for "千克" on new_field.
q2 := elastic.NewMatchPhraseQuery("new_field", "千克")
	// Sample output (only this document contains the phrase 千克):
	//map[age:23 grade:4 hobby:read name:Rookie new_field:sixty kilo grams, sixty kilogram, 60 千克 sex:男 weight:sixty kilogram, 60kg,千克]

// MatchQuery lists the options a match query can carry: the target field, the
// query text, and the tuning parameters below.
type MatchQuery struct {
	name                string    		// field name (key)
	text                interface{}		// query text (value)
  operator            string 				// "or" (default) or "and"; with "and" the field must contain every analyzed term of the query
	analyzer            string
	boost               *float64			// weight
  fuzziness           string				// maximum edit distance, e.g. "AUTO" (NOTE(review): the original note calls AUTO the default — confirm against the Elasticsearch docs)
	prefixLength        *int					// number of leading characters left untouched by fuzzy matching
	maxExpansions       *int					// limit on the number of terms the query may expand to
	minimumShouldMatch  string
	fuzzyRewrite        string
	lenient             *bool					// ignore data-type mismatches
	fuzzyTranspositions *bool
  zeroTermsQuery      string				// "none" (default) or "all"; per the original note, "all" ignores the analyzer restriction and behaves much like match_all
  cutoffFrequency     *float64			// a fraction (e.g. 0.02) is a relative frequency; a positive integer (e.g. 3) is an absolute occurrence count
	queryName           string
}

// MatchPhraseQuery lists the options a match_phrase query can carry.
type MatchPhraseQuery struct {
	name           string							// field name (key)
	value          interface{}				// phrase to search for (value)
	analyzer       string
	slop           *int								// maximum number of position moves allowed for the analyzed terms
	boost          *float64
	queryName      string
	zeroTermsQuery string
}


GET /person/_search
{
  "query": {
    "multi_match": {
      "query": "sixty 60",
      "fields": ["weight", "new_field"]
    }
  }
}

GET /person/_search
{
  "query": {
    "dis_max": {
      "queries": [
        { "match": { "weight": "sixty 60" }},
        { "match": { "new_field": "sixty 60" }}
      ]
    }
  }
}

The multi_match query builds on the match query to allow multi-field queries.

// Variant 1: multi_match over weight and new_field with operator "and".
// (The two variants are alternatives; each declares its own q.)
q := elastic.NewMultiMatchQuery("sixty 60", "weight", "new_field").Operator("and")
// Sample output:
// map[age:23 grade:4 hobby:read name:Rookie new_field:sixty kilo grams, sixty kilogram, 60 千克 sex:男 weight:sixty kilogram, 60kg,千克]
// Variant 2: the same query without an explicit operator.
q := elastic.NewMultiMatchQuery("sixty 60", "weight", "new_field")
// Sample output:
// map[age:23 grade:4 hobby:read name:Rookie new_field:sixty kilo grams, sixty kilogram, 60 千克 sex:男 weight:sixty kilogram, 60kg,千克]
// map[age:25 grade:3 hobby:eat name:Jam new_field:60 sex:女 weight:fifty-kilo-grams]

SELECT * FROM person WHERE sex='女' AND age>=23;

GET /person/_search
{
  "query": {
    "bool": {
      "must": [
        {
          "term": {
            "sex": {
              "value": "女"
            }
          }
        },
        {
          "range": {
            "age": {
              "gte": 23
            }
          }
        }
      ]
    }
  }
}

query1 := elastic.NewTermQuery("sex", "女")
	query2 := elastic.NewRangeQuery("age").Gte(23)
	q := elastic.NewBoolQuery().Must(query1, query2)
// map[age:25 grade:3 hobby:eat name:Jam new_field:60 sex:女 weight:fifty-kilo-grams]
// map[age:24 grade:1 hobby:movie name:Alis sex:女]

// NewBoolQuery creates a new bool query whose must, must_not, filter and
// should clause lists start out empty (non-nil, length zero).
func NewBoolQuery() *BoolQuery {
	return &BoolQuery{
		mustClauses:    make([]Query, 0),
		mustNotClauses: make([]Query, 0),
		filterClauses:  make([]Query, 0),
		shouldClauses:  make([]Query, 0),
	}
}

select *from persons
where 
	sex = '男'
and
	age between 22 and 25
and 
	grade != 1
and 
	(hobby = 'code' OR weight = 'sixty kilogram, 60kg,千克')

GET /person/_search
{
  "query": {
    "bool": {
      "must": [
        {
          "term": {
            "sex": {
              "value": "男"
            }
          }
        },
        {
          "range": {
            "age": {
              "gte": 22,
              "lte": 25
            }
          }
        }
      ],
      "must_not": [
        {
          "match": {
            "grade": 1
          }
        }
      ],
      "should": [
        {
          "match": {
            "hobby": "code"
          }
        },
        {
          "match_phrase": {
            "weight": "sixty kilogram"
          }
        },
        {
          "match_phrase": {
            "weight": "60kg"
          }
        },
        {
          "match_phrase": {
            "weight": "千克"
          }
        }
      ],
      "minimum_should_match": 1
    }
  }
}

	// Implements the SQL condition:
	//   sex = '男' AND age BETWEEN 22 AND 25 AND grade != 1
	//   AND (hobby = 'code' OR weight matches one of the phrases)
	query1 := elastic.NewTermQuery("sex", "男")
	// Lower bound is 22, matching the SQL statement and the DSL request.
	query2 := elastic.NewRangeQuery("age").Gte(22).Lte(25)
	query3 := elastic.NewMatchQuery("grade", 1)
	query4 := elastic.NewMatchQuery("hobby", "code")
	query5 := elastic.NewMatchPhraseQuery("weight", "sixty kilogram")
	query6 := elastic.NewMatchPhraseQuery("weight", "60kg")
	query7 := elastic.NewMatchPhraseQuery("weight", "千克")
	// When a bool query has must clauses, its should clauses are optional by
	// default. Requiring at least one of them makes the OR group a real
	// condition instead of a scoring hint.
	query := elastic.NewBoolQuery().
		Must(query1, query2).
		MustNot(query3).
		Should(query4, query5, query6, query7).
		MinimumNumberShouldMatch(1)
	// Wrap the whole condition in a filter clause.
	q := elastic.NewBoolQuery().Filter(query)

GET /person/_search
{
  "aggs": {
    "max_age": {
      "max": {
        "field": "age"
      }
    },
    "min_age": {
      "min": {
        "field": "age"
      }
    },
    "avg_age": {
      "avg": {
        "field": "age"
      }
    }
  }
}

  // Max aggregation over the age field, registered under the name "max_age".
	aggs := elastic.NewMaxAggregation().Field("age")
	q := elastic.NewMatchAllQuery()
	req, err := client.Search().
		Index("person").
		Query(q).
		Aggregation("max_age", aggs).
		Do(context.Background())
	if err != nil {
		fmt.Println(err)
		return
	}
	// The results live in req.Aggregations; look the aggregation up by the
	// name it was registered under.
	aggResult, found := req.Aggregations.Max("max_age")
	// Value is a pointer, so guard against a missing aggregation or an empty
	// result before dereferencing it.
	if !found || aggResult.Value == nil {
		fmt.Println("max_age aggregation returned no value")
		return
	}
	maxAge := *aggResult.Value
	fmt.Printf("Max age: %d\n", int(maxAge))
	// Max age: 25

GET /person/_search
{
  "aggs": {
    "hobby_count": {
      "cardinality": {
        "field": "hobby"
      }
    }
  }
}

	aggs := elastic.NewCardinalityAggregation().Field("hobby")
	q := elastic.NewMatchAllQuery()
	req, err := client.Search().
		Index("person").
		Query(q).
		Aggregation("hobby_count", aggs).
		Do(context.Background())
//hobby count : 4

GET /person/_search
{
  "aggs": {
    "count": {
      "terms": {
        "field": "sex",
        "size": 10
      }
    }
  }
}
//   "aggregations" : {
//    "count" : {
//      "doc_count_error_upper_bound" : 0,
//      "sum_other_doc_count" : 0,
//      "buckets" : [
//        {
//          "key" : "男",
//         "doc_count" : 3
//        },
//        {
//          "key" : "女",
//         "doc_count" : 2
//        }
//      ]
//    }
//  }

  // Terms aggregation on the sex field, registered under the name "count".
	aggs := elastic.NewTermsAggregation().Field("sex")
	q := elastic.NewMatchAllQuery()
	req, err := client.Search().
		Index("person").
		Query(q).
		Aggregation("count", aggs).
		Do(context.Background())
	if err != nil {
		fmt.Println(err)
		return
	}
	// Look the buckets up by aggregation name; stop if the response does not
	// contain it rather than dereferencing a nil result.
	aggResult, found := req.Aggregations.Terms("count")
	if !found {
		fmt.Println("count aggregation missing from response")
		return
	}
	for _, v := range aggResult.Buckets {
		fmt.Printf("%v--%d\n", v.Key, v.DocCount)
	}
	// 男--3
	// 女--2

Warning⚠️：Elasticsearch 默认不支持对 text 类型的字段进行聚合操作（除非为该字段开启 fielddata）；需要聚合时请使用 keyword 类型的字段或 keyword 子字段。

显示所有内容

声明：本站所有文章，如无特殊说明或标注，均为本站原创发布。任何个人或组织，在未征得本站同意时，禁止复制、盗用、采集、发布本站内容到任何网站、书籍等各类媒体平台。如若本站内容侵犯了原著者的合法权益，可联系我们进行处理。

es golang lucene

一、简介

二、认知

1、Lucene

2、倒排索引

3、基本概念

Document文档

数据类型

三、es与kibana 安装

四、kibana对elasticsearch 管理

五、查询场景

语句查询

词条查询

单值查询-term

多值查询-terms

范围查询-range

通配符查询-wildcard

匹配查询

复合查询

聚合查询

统计

去重查询

分组

发表回复取消回复