C++ 哈希表：概念、冲突解决与代码实现 | 极客日志

C++算法

C++ 哈希表：概念、冲突解决与代码实现

本文介绍 C++ 中基于哈希表的无序容器 unordered_set 和 unordered_map，阐述了哈希概念、哈希函数设计（除法散列、乘法散列）、负载因子及哈希冲突处理，重点讲解了两种冲突解决策略：开放定址法（线性探测）和链地址法（哈希桶），并提供了相应的 C++ 类实现框架及插入、查找、删除操作的代码示例。

不知所云发布于 2026/3/28更新于 2026/7/2453 浏览

unordered_set 和 unordered_map

在 C++ 中，unordered_set 和 unordered_map 是两种基于哈希表（Hash Table）的容器，它们是 C++11 标准模板库的一部分，提供了高效的元素存储和访问。

unordered_set(map) 的介绍

unordered_set 是一个无序集合，它存储唯一的元素，并且不允许重复。unordered_set 提供了平均常数时间复杂度为 O(1) 的插入、删除和查找操作。unordered_set 维护元素的唯一性，如果尝试插入一个已存在的元素，它不会被添加到集合中。

unordered_set 的声明如下：

template < class Key, // unordered_set::key_type/value_type 
            class Hash = hash<Key>, // unordered_set::hasher 
            class Pred = equal_to<Key>, // unordered_set::key_equal 
            class Alloc = allocator<Key> // unordered_set::allocator_type 
           > 
class unordered_set;

第一个模板参数 Key：Key 是 unordered_set 底层关键字类型。
第二个模板参数 Hash（仿函数）：unordered_set 默认要求 Key 支持转换成整型，如果 Key 不支持或者想按自己的需求将 Key 转换成整数，可以自己实现并传入。
第三个模板参数 Pred（仿函数）：unordered_set 默认要求 Key 支持比较相等，不需要支持比较大小，这是因为 unordered_set 的底层是哈希表（哈希桶），其实现不需要比较 Key 的大小，但其 Find 函数和 Erase 函数需要比较 Key 是否相等。如果 Key 不支持或者想按自己的需求来，可以自己实现并传入。
第四个模板参数 Alloc：空间配置器，unordered_set 底层存储数据的内存是从空间配置器申请的，如果需要可以自己实现内存池并传入。

unordered_map 的声明如下：

template < class Key, // unordered_map::key_type 
            class T, // unordered_map::mapped_type 
            class Hash = hash<Key>, // unordered_map::hasher 
            class Pred = equal_to<Key>, // unordered_map::key_equal 
            class Alloc = allocator< pair<const Key,T> > // unordered_map::allocator_type 
           > 
class unordered_map;

相关免费在线工具

加密/解密文本
使用加密算法（如AES、TripleDES、Rabbit或RC4）加密和解密文本明文。在线工具，加密/解密文本在线工具，online
Gemini 图片去水印
基于开源反向 Alpha 混合算法去除 Gemini/Nano Banana 图片水印，支持批量处理与下载。在线工具，Gemini 图片去水印在线工具，online
Base64 字符串编码/解码
将字符串编码和解码为其 Base64 格式表示形式即可。在线工具，Base64 字符串编码/解码在线工具，online
Base64 文件转换器
将字符串、文件或图像转换为其 Base64 表示形式。在线工具，Base64 文件转换器在线工具，online
Markdown转HTML
将 Markdown（GFM）转为 HTML 片段，浏览器内 marked 解析；与 HTML转Markdown 互为补充。在线工具，Markdown转HTML在线工具，online
HTML转Markdown
将 HTML 片段转为 GitHub Flavored Markdown，支持标题、列表、链接、代码块与表格等；浏览器内处理，可链接预填。在线工具，HTML转Markdown在线工具，online

// Per-slot state marker for the open-addressing table.
// DELETE marks a removed element so that a lookup keeps probing past the slot
// and can still reach colliding entries stored after it.
enum State {
    EXIST = 0,  // slot holds an element
    EMPTY = 1,  // slot has never been used
    DELETE = 2  // slot held an element that was removed
};

// One slot of the open-addressing table: the stored key/value pair plus the
// slot's state marker.
template<class K, class V>
struct HashData {
    // Key/value payload.
    std::pair<K, V> _kv;
    // Every slot starts out empty, hence the default member initializer.
    State _state{EMPTY};
};

// Default hash functor: converts the key itself to size_t.
// K must therefore be convertible to size_t. operator() is const so the
// functor can also be invoked through a const object or a const reference.
template<class K>
struct HashFunc {
    size_t operator()(const K& key) const {
        return size_t(key);
    }
};

// std::string is a very common key type, so the hash functor is specialized
// for it.
template<>
struct HashFunc<std::string> {
    // Folds the string into a size_t one byte at a time.
    // Simply summing the bytes would give "abcd" and "bcad" the same value,
    // so the running result is multiplied by a prime after every byte
    // (31 or 131 are the usual choices).
    // Each byte is read as unsigned char: plain char may be signed, which
    // would make the hash of non-ASCII text differ between platforms.
    size_t operator()(const std::string& s) const {
        size_t hash = 0;
        for (unsigned char ch : s) {
            hash += ch;
            hash *= 131;
        }
        return hash;
    }
};

// Returns the first entry of the fixed prime table that is not less than n.
// When n is larger than every entry, the largest entry is returned.
inline unsigned long __stl_next_prime(unsigned long n) {
    // Ascending table of primes used as table sizes.
    static const int __stl_num_primes = 28;
    static const unsigned long __stl_prime_list[__stl_num_primes] = {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    // The table is sorted, so the first entry >= n is the answer.
    for (int idx = 0; idx < __stl_num_primes; ++idx) {
        if (__stl_prime_list[idx] >= n) {
            return __stl_prime_list[idx];
        }
    }
    // n exceeds every entry: fall back to the largest prime in the table.
    return __stl_prime_list[__stl_num_primes - 1];
}

// Open-addressing hash table storing pair<K, V> elements.
// Hash is the functor that turns a key into a size_t before it is reduced
// modulo the table size.
template<class K, class V, class Hash = HashFunc<K>>
class HashTable {
public:
    // Starts with __stl_next_prime(0) slots and an element count of zero.
    HashTable()
        : _tables(__stl_next_prime(0))
    {}
    // ... remaining members are elided in this excerpt
private:
    // Slot array; every slot carries its own state marker.
    std::vector<HashData<K, V>> _tables;
    // Element counter used for the load-factor check.
    size_t _n = 0;
};

void CheckCapacity() {
    //当负载因子>=0.7 时，扩容
    if (_n * 10 / _tables.size() >= 7) {
        //方法一：旧表映射到新表
        /*vector<HashData<K, V>> newtables(_tables.size() * 2);
        for (auto& data : _tables) {
            if (data._state == EXIST) {
                size_t newhashi = HashFunc(data._kv.first) % newtables.size();
                newtables[newhashi]._kv = data._kv;
                newtables[newhashi]._state = EXIST;
            }
        }
        _tables.swap(newtables);*/
        //方法二：利用新哈希表
        HashTable<K, V> newht;
        //newht._tables.resize(_tables.size() * 2);
        newht._tables.resize(__stl_next_prime(_tables.size() + 1));
        for (auto& data : _tables) {
            if (data._state == EXIST) {
                newht.Insert(data._kv);
            }
        }
        _tables.swap(newht._tables);
    }
}

bool Insert(const pair<K, V>& kv) {
    //如果找到了重复元素，直接返回 false
    if (Find(kv.first)) return false;
    //检查负载因子是否需要扩容
    CheckCapacity();
    //哈希函数
    Hash hashfunc;
    size_t hashi = hashfunc(kv.first) % _tables.size();
    //线性探测
    while (_tables[hashi]._state == EXIST) {
        ++hashi;
        hashi %= _tables.size();
    }
    _tables[hashi]._kv = kv;
    _tables[hashi]._state = EXIST;
    ++_n;
    return true;
}

// Looks up key with linear probing.
// Returns a pointer to the slot holding the key, or nullptr when the key is
// not in the table.
HashData<K, V>* Find(const K& key) {
    const size_t slots = _tables.size();
    // Nothing to search, and the modulo below must not divide by zero.
    if (slots == 0) {
        return nullptr;
    }

    Hash hashfunc;
    size_t hashi = hashfunc(key) % slots;

    // Probe until an EMPTY slot ends the chain. The probe count is capped at
    // the table size: if no slot is EMPTY (only EXIST/DELETE left), an
    // uncapped loop would spin forever on a missing key.
    for (size_t probes = 0; probes < slots && _tables[hashi]._state != EMPTY; ++probes) {
        // DELETE slots are stepped over; only live slots are compared.
        if (_tables[hashi]._state == EXIST && _tables[hashi]._kv.first == key) {
            return &_tables[hashi];
        }
        hashi = (hashi + 1) % slots;
    }
    return nullptr;
}

bool Erase(const K& key) {
    HashData<K, V>* ret = Find(key);
    if (ret) {
        ret->_state = DELETE;
        return true;
    } else {
        return false;
    }
}

// Bulk-insert test for the open-addressing table: inserts N pseudo-random
// keys and then reports whether key 19 is present.
void test_open_hashtable2() {
    srand((unsigned int)time(0));
    const int N = 100000;
    std::vector<int> v(N);
    for (int i = 0; i < N; ++i) {
        // The index is added to spread the keys further than rand() alone.
        // The sum is formed in unsigned arithmetic: where RAND_MAX equals
        // INT_MAX, the signed expression rand() + i can overflow, which is
        // undefined behaviour.
        v[i] = static_cast<int>(static_cast<unsigned int>(rand()) + static_cast<unsigned int>(i));
    }
    open_address::HashTable<int, int> ht;
    for (auto e : v) {
        ht.Insert({ e, e });
    }
    auto ret = ht.Find(19);
    if (ret) std::cout << "找到了" << std::endl;
    else std::cout << "没找到" << std::endl;
}

// Default hash functor: converts the key itself to size_t.
// K must therefore be convertible to size_t. operator() is const so the
// functor can also be invoked through a const object or a const reference.
template<class K>
struct HashFunc {
    size_t operator()(const K& key) const {
        return size_t(key);
    }
};

// std::string is a very common key type, so the hash functor is specialized
// for it.
template<>
struct HashFunc<std::string> {
    // Folds the string into a size_t one byte at a time.
    // Simply summing the bytes would give "abcd" and "bcad" the same value,
    // so the running result is multiplied by a prime after every byte
    // (31 or 131 are the usual choices).
    // Each byte is read as unsigned char: plain char may be signed, which
    // would make the hash of non-ASCII text differ between platforms.
    size_t operator()(const std::string& s) const {
        size_t hash = 0;
        for (unsigned char ch : s) {
            hash += ch;
            hash *= 131;
        }
        return hash;
    }
};

// Returns the first entry of the fixed prime table that is not less than n.
// When n is larger than every entry, the largest entry is returned.
inline unsigned long __stl_next_prime(unsigned long n) {
    // Note: assumes long is at least 32 bits.
    static const int __stl_num_primes = 28;
    static const unsigned long __stl_prime_list[__stl_num_primes] = {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    const unsigned long* const table_end = __stl_prime_list + __stl_num_primes;
    // Binary search over the ascending table for the first entry >= n.
    const unsigned long* hit = std::lower_bound(__stl_prime_list, table_end, n);
    if (hit == table_end) {
        // n exceeds every entry: step back to the largest prime.
        --hit;
    }
    return *hit;
}

// Singly linked list node; the chaining table stores pointers to these nodes
// in its buckets.
template<class K, class V>
struct HashNode {
    // Key/value payload.
    std::pair<K, V> _kv;
    // Next node in the same bucket, or nullptr at the end of the chain.
    HashNode<K, V>* _next = nullptr;

    // Copies kv into the node; the node starts out unlinked.
    HashNode(const std::pair<K, V>& kv)
        : _kv(kv)
    {}
};

// Separate-chaining hash table: each bucket is the head pointer of a singly
// linked list of HashNode<K, V>.
// hash is the functor that turns a key into a size_t before it is reduced
// modulo the bucket count.
template<class K, class V, class hash = HashFunc<K>>
class HashTable {
    using Node = HashNode<K, V>;
public:
    // Starts with __stl_next_prime(0) null buckets and an element count of zero.
    HashTable()
        : _tables(__stl_next_prime(0))
    {}
    // ... remaining members are elided in this excerpt
private:
    // Bucket array of list heads.
    std::vector<Node*> _tables;
    // Number of nodes currently stored.
    size_t _n = 0;
};

void CheckCapacity() {
    //当哈希表里节点的数量与哈希表大小相等时扩容
    if (_n == _tables.size()) {
        //把哈希桶里的链表每个节点拆下来插入 newht 效率太低了
        /*HashTable<K, V> newht;
        newht._tables.resize(__stl_next_prime(_tables.size() + 1));
        for (size_t i = 0; i < _tables.size(); ++i) {
            Node* cur = _tables[i];
            while (cur) {
                newht.Insert(cur->_kv);
                cur = cur->_next;
            }
        }
        _tables.swap(newht._tables);*/
        hash hashfunc;
        vector<Node*> newtables(__stl_next_prime(_tables.size() + 1));
        for (size_t i = 0; i < _tables.size(); ++i) {
            Node* cur = _tables[i];
            while (cur) {
                Node* next = cur->_next;
                size_t hashi = hashfunc(cur->_kv.first) % newtables.size();
                //头插
                cur->_next = newtables[hashi];
                newtables[hashi] = cur;
                cur = next;
            }
            _tables[i] = nullptr;
        }
        _tables.swap(newtables);
    }
}

bool Insert(const pair<K, V>& kv) {
    //不允许重复插入
    if (Find(kv.first)) return false;
    //检查扩容
    CheckCapacity();
    hash hashfunc;
    size_t hashi = hashfunc(kv.first) % _tables.size();
    //头插
    Node* newnode = new Node(kv);
    newnode->_next = _tables[hashi];
    _tables[hashi] = newnode;
    ++_n;
    return true;
}

// Looks up key in its bucket's chain.
// Returns the node holding the key, or nullptr when the key is not stored.
Node* Find(const K& key) {
    hash hasher;
    const size_t bucket = hasher(key) % _tables.size();
    for (Node* node = _tables[bucket]; node != nullptr; node = node->_next) {
        if (node->_kv.first == key) {
            return node;
        }
    }
    return nullptr;
}

bool Erase(const K& key) {
    hash hashfunc;
    size_t hashi = hashfunc(key) % _tables.size();
    Node* prev = nullptr;
    Node* cur = _tables[hashi];
    while (cur) {
        if (cur->_kv.first == key) {
            //头节点的情况特殊处理
            if (prev == nullptr) {
                _tables[hashi] = cur->_next;
            } else {
                prev->_next = cur->_next;
            }
            delete cur;
            --_n;
            return true;
        } else {
            prev = cur;
            cur = cur->_next;
        }
    }
    return false;
}

void test_bucket_hashtable1() {
    int a[] = { 19,30,5,36,13,20,21,12,24,96, 19};
    hash_bucket::HashTable<int, int> ht;
    for (auto e : a) {
        ht.Insert({ e, e });
    }
    auto ret = ht.Find(12);
    if (ret) cout << "找到了" << endl;
    else cout << "没找到" << endl;
    ht.Erase(12);
    ret = ht.Find(12);
    if (ret) cout << "找到了" << endl;
    else cout << "没找到" << endl;
}

// Bulk-insert test for the chaining table: inserts N pseudo-random keys and
// then performs one lookup.
void test_bucket_hashtable2() {
    srand((unsigned int)time(0));
    const int N = 100000;
    std::vector<int> v(N);
    for (int i = 0; i < N; ++i) {
        // The index is added to spread the keys further than rand() alone.
        // The sum is formed in unsigned arithmetic: where RAND_MAX equals
        // INT_MAX, the signed expression rand() + i can overflow, which is
        // undefined behaviour.
        v[i] = static_cast<int>(static_cast<unsigned int>(rand()) + static_cast<unsigned int>(i));
    }
    hash_bucket::HashTable<int, int> ht;
    for (const auto& e : v) {
        ht.Insert({ e, e });
    }
    // The lookup is only exercised; its result is deliberately discarded.
    static_cast<void>(ht.Find(12));
}

C++ 哈希表：概念、冲突解决与代码实现

unordered_set 和 unordered_map

unordered_set(map) 的介绍

更多推荐文章

相关免费在线工具

unordered_set(map) 和 set(map) 的差异

unordered_multiset / unordered_multimap

介绍哈希表

哈希概念

直接定址法

哈希冲突

负载因子

常见哈希函数

除法散列法（重点）

乘法散列法

哈希表的实现

开放定址法（闭散列）

整体框架

哈希表的插入

哈希表的查找

哈希表的删除

测试开放定址法实现的哈希表

链地址法（开散列）（重点）

整体框架

哈希表的插入

哈希表的查找

哈希表的删除

测试链地址法实现的哈希表

更多推荐文章

相关免费在线工具

C++ 哈希表：概念、冲突解决与代码实现

unordered_set 和 unordered_map

unordered_set(map) 的介绍

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

unordered_set(map) 和 set(map) 的差异

unordered_multiset / unordered_multimap

介绍哈希表

哈希概念

直接定址法

哈希冲突

负载因子

常见哈希函数

除法散列法（重点）

乘法散列法

哈希表的实现

开放定址法（闭散列）

整体框架

哈希表的插入

哈希表的查找

哈希表的删除

测试开放定址法实现的哈希表

链地址法（开散列）（重点）

整体框架

哈希表的插入

哈希表的查找

哈希表的删除

测试链地址法实现的哈希表

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具