C++ 哈希表原理与 unordered 容器实战 | 极客日志

C++算法

C++ 哈希表原理与 unordered 容器实战

综述（由 AI 生成）：哈希表通过哈希函数将 Key 映射到存储位置，实现平均 O(1) 的查找效率。本文对比了基于红黑树的有序容器与基于哈希表的无序容器的差异，解析了哈希冲突产生的原因及负载因子的影响；重点讲解了线性探测、二次探测等开放定址法，以及链地址法（哈希桶）的实现细节；并结合 C++ 标准库中的 unordered_set 和 unordered_map，展示了仿函数特化、扩容机制及迭代器封装的实战代码，帮助读者深入理解底层数据结构设计。

蜜桃汽水发布于 2026/3/16更新于 2026/6/1220 浏览

哈希

unordered_set 和 unordered_map

unordered_set

unordered_set 底层结构示意

set 和 unordered_set 功能高度相似，核心差异在于底层数据结构。

unordered_set 与 set 的差异：

Key 要求不同：set 要求 Key 支持小于比较（operator<），而 unordered_set 要求 Key 能转换为整型且支持等于比较（operator==）。
迭代器差异：set 的 iterator 是双向迭代器，底层红黑树中序遍历有序，所以遍历时有序 + 去重。unordered_set 底层是哈希表，iterator 是单向迭代器，遍历时无序 + 去重。
性能差异：大多数场景下，unordered_set 的增删查改更快。红黑树操作效率是 O(logN)，而哈希表平均效率是 O(1)。

unordered_map

unordered_map 底层结构示意

map 和 unordered_map 也是高度相似，仅有细微差异：

map 要求 Key 支持小于比较，unordered_map 要求 Key 支持转成整型且支持等于比较。
map 的 iterator 是双向迭代器，unordered_map 的 iterator 是单向迭代器。map 底层是红黑树，遍历时 Key 有序 + 去重；unordered_map 底层是哈希表，遍历时 Key 无序 + 去重。
多数场景下，unordered_map 的增删查改更快，因为哈希表平均效率为 O(1)，优于红黑树的 O(logN)。

代码示例

#include <iostream>
#include <unordered_set>
using namespace std;

// Demo: std::unordered_set removes duplicates and iterates in an unspecified order.
int main() {
    // NOTE(review): the published snippet lost several trailing initializer values;
    // only the values that survived are kept. The duplicate 1 is dropped by the set.
    unordered_set<int> s = {3, 1, 6, 7, 8, 2, 1};

    // Forward iteration from begin() to end(); the visiting order is not sorted.
    unordered_set<int>::iterator it = s.begin();
    while (it != s.end()) {
        cout << *it << " ";
        ++it;
    }
    cout << endl;
    return 0;
}

相关免费在线工具

加密/解密文本
使用加密算法（如AES、TripleDES、Rabbit或RC4）加密和解密文本明文。在线工具，加密/解密文本在线工具，online
Gemini 图片去水印
基于开源反向 Alpha 混合算法去除 Gemini/Nano Banana 图片水印，支持批量处理与下载。在线工具，Gemini 图片去水印在线工具，online
Base64 字符串编码/解码
将字符串编码和解码为其 Base64 格式表示形式即可。在线工具，Base64 字符串编码/解码在线工具，online
Base64 文件转换器
将字符串、文件或图像转换为其 Base64 表示形式。在线工具，Base64 文件转换器在线工具，online
Markdown转HTML
将 Markdown（GFM）转为 HTML 片段，浏览器内 marked 解析；与 HTML转Markdown 互为补充。在线工具，Markdown转HTML在线工具，online
HTML转Markdown
将 HTML 片段转为 GitHub Flavored Markdown，支持标题、列表、链接、代码块与表格等；浏览器内处理，可链接预填。在线工具，HTML转Markdown在线工具，online

// Default hash functor: turns a key into size_t by direct conversion.
// Suitable for any K that a C-style cast can convert to size_t; other key
// types need a specialization or a custom functor passed as the Hash argument.
template<class K>
struct HashFunc {
    // const-qualified so the functor can also be invoked through const
    // objects and const references.
    size_t operator()(const K& key) const {
        // C-style cast kept on purpose: unlike static_cast it also accepts pointer keys.
        return (size_t)key;
    }
};

// Specialization for string keys: an order-sensitive multiplicative hash.
template<>
struct HashFunc<string> {
    // const-qualified so the functor can also be invoked through const objects.
    size_t operator()(const string& s) const {
        size_t hash = 0;
        for (char ch : s) {
            // Multiplying by 131 after adding each character makes the result
            // depend on character order, so permutations such as "abcd" and
            // "bcad" do not trivially collide (a plain sum would).
            hash += ch;
            hash *= 131;
        }
        return hash;
    }
};

// Returns the smallest prime in the built-in table that is >= n.
// If n is larger than every entry, the largest entry (4294967291) is returned.
// The table holds 28 ascending primes used as bucket counts when a table grows.
// NOTE(review): identifiers containing a double underscore are reserved for the
// implementation; the name is kept only because callers depend on it.
inline unsigned long __stl_next_prime(unsigned long n) {
    static constexpr int kNumPrimes = 28;
    static constexpr unsigned long kPrimes[kNumPrimes] = {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    const unsigned long* const first = kPrimes;
    const unsigned long* const last = kPrimes + kNumPrimes;
    // Binary search over the sorted table; qualified so it does not rely on a
    // using-directive being in effect.
    const unsigned long* const pos = std::lower_bound(first, last, n);
    // Saturate at the last prime instead of dereferencing the end pointer.
    return pos == last ? *(last - 1) : *pos;
}

#include <algorithm>
#include <string>
#include <utility>
#include <vector>
using namespace std;

// Status of one slot in the open-addressing table.
enum State {
    EXIST,   // slot holds a live element
    EMPTY,   // slot is unused; a probe sequence stops here
    DELETE   // element was erased; probing continues past this slot
};

// One slot of the open-addressing table: the stored key/value pair together
// with the slot status. A default-constructed slot is EMPTY.
template<typename K, typename V>
struct HashData {
    pair<K, V> _kv;          // stored key/value
    State _state{EMPTY};     // EXIST / EMPTY / DELETE
};

// Default hash functor: turns a key into size_t by direct conversion.
// Suitable for any K that a C-style cast can convert to size_t; other key
// types need a specialization or a custom functor passed as the Hash argument.
template<class K>
struct HashFunc {
    // const-qualified so the functor can also be invoked through const
    // objects and const references.
    size_t operator()(const K& key) const {
        // C-style cast kept on purpose: unlike static_cast it also accepts pointer keys.
        return (size_t)key;
    }
};

// Specialization for string keys: an order-sensitive multiplicative hash.
template<>
struct HashFunc<string> {
    // const-qualified so the functor can also be invoked through const objects.
    size_t operator()(const string& s) const {
        size_t hash = 0;
        for (char ch : s) {
            // Add the character, then multiply by 131, so the result depends
            // on character order and not just on the set of characters.
            hash += ch;
            hash *= 131;
        }
        return hash;
    }
};

namespace open_address {
template<class K, class V, class Hash = HashFunc<K>>
class HashTable {
public:
    HashTable() : _tables(__stl_next_prime(0)), _n(0) {}

    bool Insert(const pair<K, V>& kv) {
        if (Find(kv.first)) return false;
        if (_n * 10 / _tables.size() >= 7) { // 扩容
            HashTable<K, V, Hash> newht;
            newht._tables.resize(__stl_next_prime(_tables.size() + 1));
            for (auto& e : _tables) {
                if (e._state == EXIST) newht.Insert(e._kv);
            }
            _tables.swap(newht._tables);
        }
        Hash hash;
        size_t hash0 = hash(kv.first) % _tables.size();
        size_t hashi = hash0;
        size_t i = 1;
        while (_tables[hashi]._state == EXIST) {
            hashi = (hash0 + i) % _tables.size();
            i++;
        }
        _tables[hashi]._kv = kv;
        _tables[hashi]._state = EXIST;
        ++_n;
        return true;
    }

    HashData<K, V>* Find(const K& key) {
        Hash hash;
        size_t hash0 = hash(key) % _tables.size();
        size_t hashi = hash0;
        size_t i = 1;
        while (_tables[hashi]._state != EMPTY) {
            if (_tables[hashi]._state == EXIST && _tables[hashi]._kv.first == key)
                return &_tables[hashi];
            hashi = (hash0 + i) % _tables.size();
            i++;
        }
        return nullptr;
    }

    bool Erase(const K& key) {
        HashData<K, V>* ret = Find(key);
        if (ret) {
            ret->_state = DELETE;
            return true;
        }
        return false;
    }

private:
    vector<HashData<K, V>> _tables;
    size_t _n; // 记录数据个数
};
}

#include "HashTable.h"
// Smoke test for the open-addressing table: insert a few keys, then erase one.
int main() {
    open_address::HashTable<int, int> ht;
    const int keys[] = {19, 30, 5, 36, 13, 20, 21, 12};
    for (int key : keys) {
        ht.Insert({key, key});
    }

    // Erase 13 when it is present, otherwise report that it was not found.
    if (ht.Find(13) != nullptr) {
        ht.Erase(13);
    } else {
        cout << "没找到" << endl;
    }
    return 0;
}

// Simple calendar date used as an example of a user-defined hash-table key.
struct Date {
    int _year;
    int _month;
    int _day;

    // Defaults to 1/1/1. Left non-explicit so brace-initialized keys such as
    // {2026, 1, 2} keep converting to Date.
    Date(int year = 1, int month = 1, int day = 1)
        : _year(year), _month(month), _day(day) {}

    // Field-wise equality. const-qualified so const Date objects (for example
    // keys reached through a const reference) can be compared.
    bool operator==(const Date& d) const {
        return _year == d._year && _month == d._month && _day == d._day;
    }
};

// Hash functor for Date keys: folds year, month and day into one size_t,
// multiplying by 131 after each field so the field order matters
// (2026-01-02 and 2026-02-01 hash differently).
struct DateHashFunc {
    // const-qualified so the functor can also be invoked through const objects.
    size_t operator()(const Date& d) const {
        size_t hash = 0;
        hash += d._year;
        hash *= 131;
        hash += d._month;
        hash *= 131;
        hash += d._day;
        hash *= 131;
        return hash;
    }
};

int main() {
    open_address::HashTable<Date, int, DateHashFunc> ht2;
    ht2.Insert({{2026, 1, 2}, 1});
    ht2.Insert({{2026, 2, 1}, 2});
    return 0;
}

// Separate chaining (hash buckets): every slot heads a singly linked list.
namespace hash_bucket {
// List node holding one key/value pair.
template<class K, class V>
struct HashNode {
    pair<K, V> _kv;
    HashNode<K, V>* _next;
    HashNode(const pair<K, V>& kv) : _kv(kv), _next(nullptr) {}
};

// Hash table that owns its nodes and resolves collisions by chaining.
//   K    - key type, compared with operator==
//   V    - mapped type
//   Hash - functor converting a key to size_t
template<class K, class V, class Hash = HashFunc<K>>
class HashTable {
    typedef HashNode<K, V> Node;
public:
    // Starts with the smallest bucket count from the prime table.
    HashTable() : _tables(__stl_next_prime(0)), _n(0) {}

    // Copy constructor: deep-copies every chain, preserving node order
    // within each bucket.
    HashTable(const HashTable<K, V, Hash>& ht)
        : _tables(ht._tables.size()), _n(ht._n) {
        for (size_t i = 0; i < ht._tables.size(); ++i) {
            // Track the tail so each append is O(1) instead of re-walking the chain.
            Node* tail = nullptr;
            for (Node* src = ht._tables[i]; src != nullptr; src = src->_next) {
                Node* copy = new Node(src->_kv);
                if (tail == nullptr)
                    _tables[i] = copy;
                else
                    tail->_next = copy;
                tail = copy;
            }
        }
    }

    // Copy assignment via copy-and-swap. ht is a private deep copy (taken by
    // value); after the swap its destructor releases this table's old nodes.
    // Without this operator the implicit member-wise assignment would share
    // node pointers between two tables and free them twice.
    HashTable<K, V, Hash>& operator=(HashTable<K, V, Hash> ht) {
        _tables.swap(ht._tables);
        const size_t count = _n;
        _n = ht._n;
        ht._n = count;
        return *this;
    }

    // Frees every node in every bucket.
    ~HashTable() {
        for (size_t i = 0; i < _tables.size(); ++i) {
            Node* cur = _tables[i];
            while (cur) {
                Node* next = cur->_next;
                delete cur;
                cur = next;
            }
            _tables[i] = nullptr;
        }
    }

    // Inserts kv unless its key is already present.
    // Returns true when the pair was inserted, false on a duplicate key.
    bool Insert(const pair<K, V>& kv) {
        if (Find(kv.first)) return false;
        Hash hash;
        // Grow when the load factor reaches 1 (one element per bucket on average).
        if (_n == _tables.size()) {
            vector<Node*> newTable(__stl_next_prime(_tables.size() + 1));
            for (size_t i = 0; i < _tables.size(); ++i) {
                Node* cur = _tables[i];
                while (cur) {
                    Node* next = cur->_next;
                    const size_t hashi = hash(cur->_kv.first) % newTable.size();
                    // Relink the existing node at the head of its new bucket;
                    // nothing is reallocated.
                    cur->_next = newTable[hashi];
                    newTable[hashi] = cur;
                    cur = next;
                }
                _tables[i] = nullptr;
            }
            _tables.swap(newTable);
        }
        // Push the new node at the front of its bucket.
        const size_t hashi = hash(kv.first) % _tables.size();
        Node* newnode = new Node(kv);
        newnode->_next = _tables[hashi];
        _tables[hashi] = newnode;
        ++_n;
        return true;
    }

    // Returns the node holding key, or nullptr when absent.
    Node* Find(const K& key) {
        Hash hash;
        const size_t hashi = hash(key) % _tables.size();
        for (Node* cur = _tables[hashi]; cur != nullptr; cur = cur->_next) {
            if (cur->_kv.first == key) return cur;
        }
        return nullptr;
    }

    // Unlinks and deletes the node holding key.
    // Returns true when an element was removed.
    bool Erase(const K& key) {
        Hash hash;
        const size_t hashi = hash(key) % _tables.size();
        Node* prev = nullptr;
        Node* cur = _tables[hashi];
        while (cur) {
            if (cur->_kv.first == key) {
                // The head of the bucket has no predecessor to patch.
                if (prev == nullptr)
                    _tables[hashi] = cur->_next;
                else
                    prev->_next = cur->_next;
                delete cur;
                --_n;
                return true;
            }
            prev = cur;
            cur = cur->_next;
        }
        return false;
    }

private:
    vector<Node*> _tables; // bucket heads; nullptr marks an empty bucket
    size_t _n = 0;         // number of stored elements
};
}

// Exercises the chained table: insert enough keys to use the table, print the
// node addresses of four keys, erase them, and print the lookups again.
int main() {
    int keys[] = {19, 30, 5, 36, 13, 20, 21, 12, 24, 96};
    hash_bucket::HashTable<int, int> ht;
    for (auto& key : keys) {
        ht.Insert({key, key});
    }
    ht.Insert({100, 100});
    ht.Insert({101, 101});

    const int probes[] = {19, 36, 96, 101};

    // Before erasing: each lookup prints a node address.
    for (int key : probes) {
        cout << ht.Find(key) << endl;
    }
    cout << endl;

    for (int key : probes) {
        ht.Erase(key);
    }

    // After erasing: each lookup prints a null pointer.
    for (int key : probes) {
        cout << ht.Find(key) << endl;
    }
    cout << endl;
    return 0;
}

// UnorderedSet.h
#include "HashTable.h"
namespace mine {
template<class K, class Hash = HashFunc<K>>
class unordered_set {
    struct SetKeyOfT {
        const K& operator()(const K& key) { return key; }
    };
public:
    typedef typename hash_bucket::HashTable<K, const K, SetKeyOfT, Hash>::Iterator iterator;
    typedef typename hash_bucket::HashTable<K, const K, SetKeyOfT, Hash>::ConstIterator const_iterator;

    iterator begin() { return _ht.Begin(); }
    iterator end() { return _ht.End(); }
    const_iterator begin() const { return _ht.Begin(); }
    const_iterator end() const { return _ht.End(); }

    pair<iterator, bool> insert(const K& key) { return _ht.Insert(key); }
    iterator find(const K& key) { return _ht.Find(key); }
    bool erase(const K& key) { return _ht.Erase(key); }

private:
    hash_bucket::HashTable<K, const K, SetKeyOfT, Hash> _ht;
};

void print(const unordered_set<int>& us) {
    unordered_set<int>::const_iterator cit = us.begin();
    while (cit != us.end()) {
        cout << *cit << " ";
        ++cit;
    }
    cout << endl;
}
}

#define _CRT_SECURE_NO_WARNINGS
#include <iostream>
using namespace std;
#include "UnorderedSet.h"

// Fills mine::unordered_set with values that include duplicates, then prints
// the contents twice: once through iterator and once through mine::print.
int main() {
    const int values[] = {3, 11, 86, 7, 88, 82, 1, 881, 5, 6, 7, 6};
    mine::unordered_set<int> us;
    for (int value : values) {
        us.insert(value);
    }

    for (auto it = us.begin(); it != us.end(); ++it) {
        cout << *it << " ";
    }
    cout << endl;

    mine::print(us);
    return 0;
}

// UnorderedMap.h
#include "HashTable.h"
namespace mine {
template<class K, class V, class Hash = HashFunc<K>>
class unordered_map {
    struct MapKeyOfT {
        const K& operator()(const pair<K, V>& kv) { return kv.first; }
    };
public:
    typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::Iterator iterator;
    typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::ConstIterator const_iterator;

    iterator begin() { return _ht.Begin(); }
    iterator end() { return _ht.End(); }
    const_iterator begin() const { return _ht.Begin(); }
    const_iterator end() const { return _ht.End(); }

    V& operator[](const K& key) {
        auto ret = insert({key, V()});
        return ret.first->second;
    }
    pair<iterator, bool> insert(const pair<K, V>& kv) { return _ht.Insert(kv); }
    iterator find(const K& key) { return _ht.Find(key); }
    bool erase(const K& key) { return _ht.Erase(key); }

private:
    hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash> _ht;
};

void print(const unordered_map<string, string>& um) {
    unordered_map<string, string>::const_iterator cit = um.begin();
    while (cit != um.end()) {
        cout << cit->first << ":" << cit->second << endl;
        ++cit;
    }
    cout << endl;
}
}

// Walks through mine::unordered_map: insert(), range-for traversal,
// operator[] (update, insert, default-insert), iterator traversal and print().
int main() {
    mine::unordered_map<string, string> dict;
    dict.insert({"sort", "排序"});
    dict.insert({"字符串", "string"});
    dict.insert({"left", "左"});
    dict.insert({"right", "右"});

    // Range-for works because the map exposes begin()/end().
    for (auto& entry : dict) {
        cout << entry.first << ":" << entry.second << endl;
    }
    cout << endl;

    dict["left"] = "左，剩余";   // key exists: overwrite the mapped value
    dict["insert"] = "插入";     // key absent: insert, then assign
    dict["string"];              // key absent: insert with an empty value

    for (auto it = dict.begin(); it != dict.end(); ++it) {
        cout << it->first << ":" << it->second << endl;
    }
    cout << endl;

    mine::print(dict);
    return 0;
}

C++ 哈希表原理与 unordered 容器实战

哈希

unordered_set 和 unordered_map

unordered_set

unordered_map

代码示例

更多推荐文章

相关免费在线工具

unordered_multiset / unordered_multimap

哈希概念

直接定址法

哈希冲突

负载因子

将关键字转为 size_t

哈希函数

除法散列法（除留余数法）

处理哈希冲突：开放定址法

线性探测

二次探测

开放定址法线性探测代码实现

处理哈希冲突：链地址法

代码实现

哈希表封装 unordered_set 和 unordered_map

代码实现

unordered_map 封装

更多推荐文章

相关免费在线工具

C++ 哈希表原理与 unordered 容器实战

哈希

unordered_set 和 unordered_map

unordered_set

unordered_map

代码示例

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

unordered_multiset / unordered_multimap

哈希概念

直接定址法

哈希冲突

负载因子

将关键字转为 size_t

哈希函数

除法散列法（除留余数法）

处理哈希冲突：开放定址法

线性探测

二次探测

开放定址法线性探测代码实现

处理哈希冲突：链地址法

代码实现

哈希表封装 unordered_set 和 unordered_map

代码实现

unordered_map 封装

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具