C++算法

哈希表进阶：用哈希桶封装 unordered_set 和 unordered_map 及迭代器实现

本文基于哈希桶结构，模拟实现并封装 C++ 标准库中的 unordered_set 和 unordered_map。重点阐述模板参数设计、用仿函数获取键值、单向迭代器的运算符重载与实现逻辑，以及扩容机制。文中还通过对比 set 与 unordered_set 的性能展示哈希表的优势，并提供完整代码示例。

二进制 · 发布于 2026/3/23 · 更新于 2026/5/4 · 5 浏览

哈希表进阶：用哈希桶封装 unordered_set 和 unordered_map 及迭代器实现

一、常见接口详解（C++标准库）

文档：《unordered_set》，《unordered_map》

这个我们已经是老生常谈了。

1.1、unordered_set / unordered_map

unordered_set 和 unordered_map 的接口几乎完全相同，所以我们以 unordered_set 为例讲解：

// 头文件： #include<unordered_set> #include<unordered_map>

构造相关接口（常用）
unordered_set ( const unordered_set& ust );	拷贝构造
unordered_set ( InputIterator first, InputIterator last )	迭代器区间构造
unordered_set ( initializer_list<value_type> il)	初始化列表构造
其他接口（常用）
size_type size()	计算哈希表中的数据个数
size_type count ( const key_type& k )	统计值为 k 的数据个数
pair<iterator,bool> insert ( const value_type& val )	插入（注意返回值类型）
iterator erase ( const_iterator position )	删除
迭代器
iterator begin() const_iterator begin() const	返回哈希表第一个存储有效数据位置的迭代器。
iterator end() const_iterator end() const	返回哈希表最后一个位置之后位置的迭代器

1.2、接口测试

// Prints the same eight integers from an unordered_set and from a set.
// The unordered_set line comes out in whatever order the container iterates;
// the set line comes out in ascending order.
// The statements are laid out one per line: when the whole function sits on a
// single line, the first `//` comment swallows the rest of the body.
void test01() {
    // unordered_set (unordered), built with the initializer-list constructor.
    unordered_set<int> ust({ 4,2,6,7,9,1,8,0 });
    // Traverse with an explicit iterator.
    unordered_set<int>::iterator it = ust.begin();
    while (it != ust.end()) {
        cout << *it << " ";
        ++it;
    }
    cout << endl;

    // set (ordered).
    set<int> st({ 4,2,6,7,9,1,8,0 });
    set<int>::iterator begin = st.begin();
    while (begin != st.end()) {
        cout << *begin << " ";
        ++begin;
    }
    cout << endl;
}

void test02() { size_t N = 10000000; unordered_set<int> us; set<int> st; vector<int> v; v.reserve(N); srand(time(0)); for (size_t i = 0; i < N; i++) { v.push_back(rand() + i); } // 插入数据性能比较 int begin1 = clock(); for (auto e1 : v) { us.insert(e1); } int end1 = clock(); cout << "unordered_set insert: " << end1 - begin1 << endl; int begin2 = clock(); for (auto e2 : v) { st.insert(e2); } int end2 = clock(); cout << "set insert: " << end2 - begin2 << endl; // 插入数据个数 cout << "unordered_set size: " << us.size() << endl; cout << "set size: " << st.size() << endl; // 查找性能 int begin3 = clock(); for (auto e3 : v) { us.find(e3); } int end3 = clock(); cout << "unordered_set find: " << end3 - begin3 << endl; int begin4 = clock(); for (auto e4 : v) { st.find(e4); } int end4 = clock(); cout << "set find: " << end4 - begin4 << endl; // 删除性能 int begin5 = clock(); for (auto e5 : v) { us.erase(e5); } int end5 = clock(); cout << "unordered_set erase: " << end5 - begin5 << endl; int begin6 = clock(); for (auto e6 : v) { st.erase(e6); } int end6 = clock(); cout << "set erase: " << end6 - beg

// Template parameters:
//   K      - key type
//   T      - type of the data actually stored in the table
//   keyOfT - functor that extracts the key from a stored value
//   Hash   - functor that converts a key of any type into an unsigned integer
template<class K, class T, class keyOfT, class Hash>
class Hash_Bucket {
    using Node = HashNode<T>;

public:
    // Default constructor: the bucket array is sized with __stl_next_prime(0);
    // the element counter starts at zero through its in-class initializer.
    Hash_Bucket()
        : _tables(__stl_next_prime(0))
    {}

private:
    vector<Node*> _tables;  // array of Node* (one slot per bucket)
    size_t _size = 0;       // number of stored elements
};

// --------------- key-extraction functor for unordered_set ---------------
// The stored value is the key itself, so the argument is handed back as-is.
struct keyOfSet
{
    const K& operator()(const K& key)
    {
        return key;
    }
};
// --------------- key-extraction functor for unordered_map ---------------
struct keyOfMap {
    // The parameter is pair<const K, V>, i.e. the element type an
    // unordered_map stores. Declaring it as pair<K, V> would make every call
    // build a converted temporary pair (copying key and value) and return a
    // reference into that temporary.
    // The result is a const reference because the key must not be modified.
    const K& operator()(const pair<const K, V>& kv)
    { return kv.first; }
};

// Ref--------------指代 T& 还是 const T&
// Ptr--------------指代 T* 还是 const T*
template<class K, class T, class Ref, class Ptr, class keyOfT, class Hash> struct HTIterator {
 typedef HashNode<T> Node;
 typedef Hash_Bucket<K, T, keyOfT, Hash> Hash_Bucket;
 typedef HTIterator<K, T, Ref, Ptr, keyOfT, Hash> Self;
 Node* _node; // 当前位置的节点
 const Hash_Bucket* _ht; // 用来找_tables，_tables.size()来确定哈希表的大小，方便取模
 HTIterator(Node* node,const Hash_Bucket* ht) :_node(node) ,_ht(ht) { }
 // ...
};

// Pre-increment: moves the iterator to the next element and returns *this.
// The current bucket's chain is followed first; once it is exhausted the
// following buckets are scanned for the first non-empty one. If none is
// found, _node is set to nullptr.
// Every path returns *this; previously the "next node in the same bucket"
// path fell off the end of the function without returning a value.
Self& operator++() {
    if (_node->_next) {
        // The current bucket still has a node after this one.
        _node = _node->_next;
        return *this;
    }

    // The current node is the last one in its bucket: work out which bucket
    // that is, then search the buckets after it.
    keyOfT kot;  // functor: extracts the key from the stored data
    Hash hash;   // functor: converts the key to an unsigned integer
    const size_t bucketCount = _ht->_tables.size();
    size_t hashi = hash(kot(_node->_data)) % bucketCount;

    _node = nullptr;  // stays null when no later bucket holds a node
    for (++hashi; hashi < bucketCount; ++hashi) {
        if (_ht->_tables[hashi]) {
            _node = _ht->_tables[hashi];
            break;
        }
    }
    return *this;
}

// Friend declaration: gives every HTIterator specialization access to the
// private members of the class that contains this line.
template<class K, class T, class Ref, class Ptr, class keyOfT, class Hash> friend struct HTIterator;
// -------- note the `friend` keyword placed in front of `struct`

// Dereference: yields the data held by the current node.
// const-qualified so it can also be called on a const iterator object; the
// iterator itself is not modified.
Ref operator*() const { return _node->_data; }
// Member access: yields the address of the data held by the current node.
// const-qualified so it can also be called on a const iterator object; the
// iterator itself is not modified.
Ptr operator->() const { return &_node->_data; }
// Equality: two iterators compare equal when they point at the same node.
bool operator==(const Self& s) const
{
    return s._node == _node;
}
// Inequality: true when the two iterators point at different nodes.
bool operator!=(const Self& s) const
{
    return !(_node == s._node);
}

#include"Hash_Bucket.h"
template<class K,class Hash=HashFun<K>> class UnorderedSet {
 // --------------------仿函数--------------------------------
 struct keyOfSet {
 const K& operator()(const K& key) { return key; }
 };
 //----------------------------------------------------------
public:
 typedef typename Hash_Bucket<K, const K, keyOfSet, Hash>::Iterator iterator;
 typedef typename Hash_Bucket<K, const K, keyOfSet, Hash>::ConstIterator const_iterator;
 // ----------------------------普通迭代器-------------------------
 iterator begin() { return _ht.Begin(); }
 iterator end() { return _ht.End(); }
 // ----------------------------const 迭代器------------------------
 const_iterator begin() const { return _ht.Begin(); }
 const_iterator end() const { return _ht.End(); }
 pair<iterator, bool> insert(const K& key) // -----------插入
 { return _ht.Insert(key); }
 iterator find(const K& key) // -------------查找
 { return _ht.Find(key); }
 bool erase(const K& key) //--------------删除
 { return _ht.Erase(key); }
private:
 Hash_Bucket<K, const K, keyOfSet, Hash> _ht; // 成员变量（哈希表类对象）
};

#include"Hash_Bucket.h"
template<class K,class V,class Hash=HashFun<K>> class UnorderedMap {
 // ---------------------------仿函数--------------------------------
 struct keyOfMap {
 const K& operator()(const pair<K, V>& kv) // const 修饰键值，键值不能修改
 { return kv.first; }
 };
 // ---------------------------------------------------------------------
public:
 typedef typename Hash_Bucket<K, pair<const K, V>, keyOfMap, Hash>::Iterator iterator;
 typedef typename Hash_Bucket<K, pair<const K, V>, keyOfMap, Hash>::ConstIterator const_iterator;
 // --------------------------普通迭代器----------------------------
 iterator begin() { return _ht.Begin(); }
 iterator end() { return _ht.End(); }
 // -------------------------const 迭代器—-----------------------------
 const_iterator begin()const { return _ht.Begin(); }
 const_iterator end()const { return _ht.End(); }
 V& operator[](const K& key) // --------------------重载 operator[]
 { pair<iterator, bool> ret = insert({ key,V() }); return ret.first->second; }
 pair<iterator,bool> insert(const pair<K, V>& kv) //--------------插入
 { return _ht.Insert(kv); }
 iterator find(const K& key) //-------------------------查找
 { return _ht.Find(key); }
 bool erase(const K& key) // ----------------------删除
 { return _ht.Erase(key); }
private:
 Hash_Bucket<K, pair<const K, V>, keyOfMap, Hash> _ht; // 成员变量
};

// Prints bucket_count() of an unordered_map before and after nine
// insertions.
void test01() {
    unordered_map<string, string> table;
    // Nine keys; each is inserted as both key and mapped value.
    const vector<string> words({ "sort","left","insert","hdszm","a","b","c","d","e"});

    // Bucket count of the empty map.
    cout << "bucket_count: " << table.bucket_count() << endl;

    for (const string& word : words) {
        table.insert({ word,word });  // the braces build the pair to insert
    }

    // Bucket count once all elements are in.
    cout << "bucket_count: " << table.bucket_count() << endl;
}

// Prints the number of elements in bucket #2 of an unordered_map before and
// after eight insertions.
void test02() {
    unordered_map<string, string> str;
    vector<string> v({ "sort","left","insert","hdszm","a","b","c","d"});

    const size_t bucket = 2;
    // bucket_size(n) is only defined for n < bucket_count(). An empty map may
    // have fewer than three buckets, so an out-of-range index is reported as
    // holding 0 elements instead of being passed to bucket_size().
    auto sizeOfBucket = [&str, bucket]() -> size_t {
        return bucket < str.bucket_count() ? str.bucket_size(bucket) : 0;
    };

    size_t size = sizeOfBucket();
    cout << "bucket_size: " << size << endl;

    // Insert the data into str.
    for (const auto& e : v) {
        str.insert({ e,e });  // the braces build the pair to insert
    }

    // Refresh size; the label now names the value actually printed
    // (it previously read "bucket_count").
    size = sizeOfBucket();
    cout << "bucket_size: " << size << endl;
}

// Prints, for every element of a four-entry map, the bucket index reported
// by bucket(), then prints (sum of the key's two characters) % 8 for each
// key so the two sets of numbers can be compared.
void test03() {
    // Built with the initializer-list constructor.
    unordered_map<string, string> mymap = {
        {"us","United States"},
        {"uk","United Kingdom"},
        {"fr","France"},
        {"de","Germany"}
    };

    typedef unordered_map<string, string>::iterator Iter;
    for (Iter it = mymap.begin(); it != mymap.end(); ++it) {
        cout << "Element [" << it->first << ":" << it->second << "]";
        cout << " is in bucket #" << mymap.bucket(it->first) << std::endl;
    }

    const int modulus = 8;
    cout << "us: " << ('u' + 's') % modulus << endl;
    cout << "uk: " << ('u' + 'k') % modulus << endl;
    cout << "fr: " << ('f' + 'r') % modulus << endl;
    cout << "de: " << ('d' + 'e') % modulus << endl;
}

// Prints load_factor() of a map holding four elements.
void test04() {
    unordered_map<string, string> mymap{
        {"us","United States"},
        {"uk","United Kingdom"},
        {"fr","France"},
        {"de","Germany"}
    };
    const float factor = mymap.load_factor();
    cout << "load_factor = " << factor << std::endl;
}

// Calls rehash(20) on one empty map and reserve(20) on another, then prints
// the bucket_count() of each.
void test05() {
    typedef unordered_map<std::string, std::string> StringMap;
    StringMap rehashed;
    StringMap reserved;

    rehashed.rehash(20);
    reserved.reserve(20);

    cout << "mymap1_rehash: " << rehashed.bucket_count() << endl;
    cout << "mymap2_reserve: " << reserved.bucket_count() << endl;
}

哈希表进阶：用哈希桶封装 unordered_set 和 unordered_map 及迭代器实现

一、常见接口详解（C++标准库）

1.1、unordered_set / unordered_map

1.2、接口测试

哈希表进阶：用哈希桶封装 unordered_set 和 unordered_map 及迭代器实现

一、常见接口详解（C++标准库）

1.1、unordered_set / unordered_map

1.2、接口测试

更多推荐文章

相关免费在线工具

💦插入 / 遍历比较：

💦性能测试

二、哈希桶实现（进阶）

2.1、模板参数说明

2.2、获取键值---仿函数

2.3、迭代器

2.3.1、重载 operator++

2.3.2、重载其他

三、封装

3.1、unordered_set 封装

3.2、unordered_map 封装

四、拓展接口说明（C++标准库）

4.1、哈希表大小——bucket_count

4.2、对应位置处的数据个数——bucket_size

4.3、找数据所在位置——bucket

4.4、负载因子——load_factor

4.5、扩容——rehash/reserve

五、完整代码

<<

更多推荐文章

相关免费在线工具

哈希表进阶：用哈希桶封装 unordered_set 和 unordered_map 及迭代器实现

一、常见接口详解（C++标准库）

1.1、unordered_set / unordered_map

1.2、接口测试

哈希表进阶：用哈希桶封装 unordered_set 和 unordered_map 及迭代器实现

一、常见接口详解（C++标准库）

1.1、unordered_set / unordered_map

1.2、接口测试

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

💦插入 / 遍历比较：

💦性能测试

二、哈希桶实现（进阶）

2.1、模板参数说明

2.2、获取键值---仿函数

2.3、迭代器

2.3.1、重载 operator++

2.3.2、重载其他

三、封装

3.1、unordered_set 封装

3.2、unordered_map 封装

四、拓展接口说明（C++标准库）

4.1、哈希表大小——bucket_count

4.2、对应位置处的数据个数——bucket_size

4.3、找数据所在位置——bucket

4.4、负载因子——load_factor

4.5、扩容——rehash/reserve

五、完整代码

<<

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具