Elasticsearch 核心概念、Kibana 测试与 C++ 客户端封装实战

核心概念

Elasticsearch（简称 ES）是一个开源的分布式搜索引擎，具备零配置、自动发现、索引分片及副本机制等特点。相比传统数据库，它在文本搜索场景下更为高效实用。

传统数据库通常采用 B+ 树索引，在模糊匹配（如 `LIKE '%关键字%'`）时难以利用索引，效率较低；而 ES 基于倒排索引，擅长分词搜索，例如'你好，世界'会被拆解为多个词条进行检索。

ES 核心概念

索引（Index）：拥有相似特征的文档集合，类似 MySQL 中的库。
类型（Type）：索引的逻辑分类，类似表结构（注：新版 ES 中已弃用，建议一个索引管理一种数据）。
字段（Field）：文档数据的属性标识，类似列。

字段类型说明

分类	类型	备注
字符串	`text`, `keyword`	text 会分词生成索引；keyword 不分词，仅精确匹配
整型	`integer`, `long`, `short`, `byte`	-
浮点	`double`, `float`	-
逻辑	`boolean`	true 或 false
日期	`date`, `date_nanos`	支持时间戳或标准格式
二进制	`binary`	通常只存储不索引

映射（Mapping）

映射定义了文档中每个字段的类型及处理方式。通过 enabled 可控制是否参与搜索分析，通过 boost 可设置字段权重。例如在音乐软件搜索中，可将歌名设为最高权重。

常见映射参数如下：

名称	默认值	备注
`enabled`	true	false 时仅作存储
`index`	true	false 时不构建倒排索引
`dynamic`	true	控制是否自动为未定义的新字段添加映射
`doc_values`	true	用于聚合和排序，text（分词）字段不支持
`analyzer`	standard	指定分词器，如 ik
`boost`	1.0	字段级别分数加权

安装与配置

使用 apt 安装 Elasticsearch 7.x 版本。


curl -s https://artifacts.elastic.co/GPG-KEY-elasticsearch | sudo gpg --no-default-keyring --keyring gnupg-ring:/etc/apt/trusted.gpg.d/elasticsearch.gpg --import


echo "deb https://artifacts.elastic.co/packages/7.x/apt stable main" | sudo tee /etc/apt/sources.list.d/elasticsearch.list


sudo apt update
sudo apt-get install elasticsearch=7.17.21


sudo systemctl start elasticsearch


sudo /usr/share/elasticsearch/bin/elasticsearch-plugin install https://get.infini.cloud/elasticsearch/analysis-ik/7.17.21

#include <elasticlient/client.h>
#include <json/json.h>
#include <cpr/cpr.h>
#include <exception>
#include <iostream>
#include <memory>
#include <sstream>
#include <string>
#include <utility>
#include <vector>
#include "../spdlog/logger.hpp"

/// Serializes a JSON value into `out`.
///
/// @param val JSON value to write.
/// @param out Receives the serialized text; left untouched on failure.
/// @return true on success, false if the writer reports an error.
inline bool Serialize(const Json::Value &val, std::string &out) {
    // newStreamWriter() hands back a raw owning pointer; hold it in a
    // unique_ptr so it is released on every return path.
    const std::unique_ptr<Json::StreamWriter> writer(Json::StreamWriterBuilder().newStreamWriter());
    std::stringstream ss;
    if (writer->write(val, &ss) != 0) {
        std::cout << "序列化失败";
        return false;
    }
    out = ss.str();
    return true;
}

/// Parses JSON text into `val`.
///
/// @param str JSON text to parse.
/// @param val Receives the parsed document.
/// @return true on success, false if parsing fails.
inline bool UnSerialize(const std::string &str, Json::Value &val) {
    // newCharReader() also returns a raw owning pointer.
    const std::unique_ptr<Json::CharReader> reader(Json::CharReaderBuilder().newCharReader());
    std::string errs;
    if (!reader->parse(str.c_str(), str.c_str() + str.size(), &val, &errs)) {
        std::cout << "反序列化失败" << std::endl;
        return false;
    }
    return true;
}

/// Builds an index definition (settings + mappings) and submits it.
class ESIndex {
public:
    /// @param client Shared Elasticsearch client used for the request.
    /// @param name   Index name.
    /// @param type   Document type, "_doc" by default.
    ESIndex(std::shared_ptr<elasticlient::Client> client, std::string name, std::string type = "_doc")
        : _name(std::move(name)), _type(std::move(type)), _client(std::move(client)) {
        // settings.analysis.analyzer.ik.tokenizer = "ik_max_word"
        Json::Value ik;
        ik["tokenizer"] = "ik_max_word";
        Json::Value analyzer;
        analyzer["ik"] = ik;
        Json::Value analysis;
        analysis["analyzer"] = analyzer;
        Json::Value settings;
        settings["analysis"] = analysis;
        _index["settings"] = settings;
    }

    /// Adds (or overwrites) a field in the mapping's "properties".
    ///
    /// Returns a reference so that chained calls keep modifying this object
    /// instead of a temporary copy.
    ///
    /// @param key      Field name.
    /// @param type     Field type, "text" by default.
    /// @param analyzer Analyzer name; pass "" to omit the setting
    ///                 (e.g. for non-text fields).
    /// @param enabled  Written to the mapping only when false; true is
    ///                 omitted (assumed to be the server default — see the ES
    ///                 `enabled` mapping-parameter docs).
    ESIndex &append(const std::string &key, const std::string &type = "text",
                    const std::string &analyzer = "ik_max_word", bool enabled = true) {
        Json::Value field;
        field["type"] = type;
        if (!analyzer.empty()) {
            field["analyzer"] = analyzer;
        }
        if (!enabled) {
            field["enabled"] = enabled;
        }
        _properties[key] = field;
        return *this;
    }

    /// Assembles the mappings, serializes the definition and sends it.
    ///
    /// NOTE(review): the request goes through Client::index with an empty id;
    /// confirm against the elasticlient API that this creates the index with
    /// these settings rather than indexing the body as a document.
    ///
    /// @return true when the server answers with a 2xx status.
    bool create() {
        Json::Value mappings;
        mappings["dynamic"] = true;
        mappings["properties"] = _properties;
        _index["mappings"] = mappings;

        std::string body;
        if (!Serialize(_index, body)) {
            LOG_ERR("序列化失败");
            return false;
        }
        try {
            auto ret = _client->index(_name, _type, "", body);
            if (ret.status_code < 200 || ret.status_code >= 300) {
                LOG_ERR("创建索引 {} 失败", _name);
                return false;
            }
        } catch (const std::exception &e) {
            LOG_ERR("创建索引 {} 失败:{}", _name, e.what());
            return false;
        }
        return true;
    }

private:
    std::string _name;
    std::string _type;
    Json::Value _properties;
    Json::Value _index;
    std::shared_ptr<elasticlient::Client> _client;
};

/// Collects key/value pairs into one document and indexes it.
class ESInsert {
public:
    /// @param client Shared Elasticsearch client used for the request.
    /// @param name   Index name.
    /// @param type   Document type, "_doc" by default.
    ESInsert(std::shared_ptr<elasticlient::Client> client, std::string name, std::string type = "_doc")
        : _name(std::move(name)), _type(std::move(type)), _client(std::move(client)) {}

    /// Sets document field `key` to `val` (any type assignable to Json::Value).
    template <typename T>
    ESInsert &append(const std::string &key, const T &val) {
        _item[key] = val;
        return *this;
    }

    /// Serializes the collected document and sends it.
    ///
    /// @param id Document id passed to the client; empty by default.
    /// @return true when the server answers with a 2xx status.
    bool insert(const std::string &id = "") {
        std::string data;
        if (!Serialize(_item, data)) {
            return false;
        }
        try {
            auto rsp = _client->index(_name, _type, id, data);
            if (rsp.status_code < 200 || rsp.status_code >= 300) {
                LOG_ERR("数据插入失败:{}", rsp.status_code);
                return false;
            }
        } catch (const std::exception &e) {
            LOG_ERR("数据插入失败:{}", e.what());
            return false;
        }
        return true;
    }

private:
    std::string _name;
    std::string _type;
    Json::Value _item;
    std::shared_ptr<elasticlient::Client> _client;
};

/// Removes a single document by id.
class ESRemove {
public:
    /// @param client Shared Elasticsearch client used for the request.
    /// @param name   Index name.
    /// @param type   Document type, "_doc" by default.
    ESRemove(std::shared_ptr<elasticlient::Client> client, std::string name, std::string type = "_doc")
        : _name(std::move(name)), _type(std::move(type)), _client(std::move(client)) {}

    /// @param id Id of the document to delete.
    /// @return true when the server answers with a 2xx status.
    bool remove(const std::string &id) {
        try {
            auto rsp = _client->remove(_name, _type, id);
            if (rsp.status_code < 200 || rsp.status_code >= 300) {
                LOG_ERR("数据删除失败:{}", rsp.status_code);
                return false;
            }
        } catch (const std::exception &e) {
            LOG_ERR("数据删除失败:{}", e.what());
            return false;
        }
        return true;
    }

private:
    std::string _name;
    std::string _type;
    std::shared_ptr<elasticlient::Client> _client;
};

/// Builds a bool query from must / must_not / should clauses and runs it.
class ESSearch {
public:
    /// @param client Shared Elasticsearch client used for the request.
    /// @param name   Index name.
    /// @param type   Document type, "_doc" by default.
    ESSearch(std::shared_ptr<elasticlient::Client> client, std::string name, std::string type = "_doc")
        : _name(std::move(name)), _type(std::move(type)), _client(std::move(client)) {}

    /// Adds a must_not `terms` clause: `key` must not equal any value in `data`.
    ESSearch &append_must_not_terms(const std::string &key, const std::vector<std::string> &data) {
        Json::Value values;
        for (const auto &item : data) {
            values[key].append(item);
        }
        Json::Value terms;
        terms["terms"] = values;
        _must_not.append(terms);
        return *this;
    }

    /// Adds a must `terms` clause requiring `key` to equal `val`.
    ESSearch &append_must_terms(const std::string &key, const std::string &val) {
        Json::Value values;
        // A terms query takes an array of values, so wrap the single value.
        values[key].append(val);
        Json::Value terms;
        terms["terms"] = values;
        _must.append(terms);
        return *this;
    }

    /// Adds a must `match` clause on `key` with text `val`.
    ESSearch &append_must_match(const std::string &key, const std::string &val) {
        Json::Value field;
        field[key] = val;
        Json::Value match;
        match["match"] = field;
        _must.append(match);
        return *this;
    }

    /// Adds a should `match` clause on `key` with text `val`.
    ESSearch &append_should_match(const std::string &key, const std::string &val) {
        Json::Value field;
        field[key] = val;
        Json::Value match;
        match["match"] = field;
        _should.append(match);
        return *this;
    }

    /// Runs the accumulated query.
    ///
    /// @return The response's ["hits"]["hits"] value, or a null Json::Value
    ///         if serialization, the request, or response parsing fails.
    Json::Value search() {
        // Only non-empty clause lists are written into the bool query.
        Json::Value clauses;
        if (!_must_not.empty()) clauses["must_not"] = _must_not;
        if (!_must.empty()) clauses["must"] = _must;
        if (!_should.empty()) clauses["should"] = _should;

        Json::Value bl;
        bl["bool"] = clauses;
        Json::Value query;
        query["query"] = bl;

        std::string body;
        if (!Serialize(query, body)) {
            LOG_ERR("序列化失败");
            return Json::Value();
        }

        cpr::Response rsp;
        try {
            rsp = _client->search(_name, _type, body);
            if (rsp.status_code < 200 || rsp.status_code >= 300) {
                LOG_ERR("搜索失败:{}", rsp.status_code);
                return Json::Value();
            }
        } catch (const std::exception &e) {
            LOG_ERR("搜索失败:{}", e.what());
            return Json::Value();
        }

        Json::Value val;
        if (!UnSerialize(rsp.text, val)) {
            LOG_ERR("反序列化失败");
            return Json::Value();
        }
        return val["hits"]["hits"];
    }

private:
    std::string _name;
    std::string _type;
    Json::Value _must_not;
    Json::Value _must;
    Json::Value _should;
    std::shared_ptr<elasticlient::Client> _client;
};

Elasticsearch 核心概念、Kibana 测试与 C++ 客户端封装实战

核心概念

安装与配置

更多推荐文章

相关免费在线工具

测试示例

客户端 API 使用

二次封装源码

更多推荐文章

相关免费在线工具

Elasticsearch 核心概念、Kibana 测试与 C++ 客户端封装实战

核心概念

安装与配置

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

测试示例

客户端 API 使用

二次封装源码

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具