C++ 哈希表原理与 unordered 容器详解 | 极客日志

C++算法

C++ 哈希表原理与 unordered 容器详解

介绍 C++ 中 unordered_set 和 unordered_map 的特性，对比其与 set/map 的差异。详细讲解哈希概念、哈希函数设计、负载因子及哈希冲突处理方法（开放定址法、链地址法），并提供了基于链地址法的哈希表封装实现代码。

链路追踪发布于 2026/3/30更新于 2026/7/2243 浏览

哈希

unordered_set 和 unordered_map

unordered_set

在这里插入图片描述

set 和 unordered_set 的功能高度相似，只是底层结构不同。

unordered_set 与 set 的差异

unordered_set 和 set 的第一个差异是对 key 的要求不同，set 要求 Key 支持小于比较，而 unordered_set 要求 Key 支持转成整型且支持等于比较。
unordered_set 和 set 的第二个差异是迭代器的差异，set 的 iterator 是双向迭代器，unordered_set 是单向迭代器。其次 set 底层是红黑树，红黑树是二叉搜索树，走中序遍历是有序的，所以 set 迭代器遍历是有序 + 去重。而 unordered_set 底层是哈希表，迭代器遍历是无序 + 去重。
unordered_set 和 set 的第三个差异是性能的差异，整体而言大多数场景下，unordered_set 的增删查改更快一些，因为红黑树增删查改效率是 O(logN)，而哈希表增删查改平均效率是 O(1)。

unordered_map

在这里插入图片描述

map 和 unordered_map 也是高度相似，只有些许差异。

map 要求 Key 支持小于比较，而 unordered_map 要求 Key 支持转成整型且支持等于比较。
map 的 iterator 是双向迭代器，unordered_map 是单向迭代器，map 底层是红黑树，unordered_map 底层是哈希表，迭代器遍历是 Key 无序 + 去重。
大多数场景下，unordered_map 的增删查改更快一些，因为红黑树增删查改效率是 O(logN)，而哈希表增删查改平均效率是 O(1)。

代码使用

#define _CRT_SECURE_NO_WARNINGS
#include <iostream>
#include <unordered_set>
#include <unordered_map>
using namespace std;

  int main() {
    // Demo of std::unordered_set: duplicates are dropped and the iteration
    // order is unspecified.
    // NOTE(review): the identifiers and literals of this snippet were lost when
    // the page was extracted. The element type and the twelve values below are
    // a reconstruction (they mirror the array used by the custom-container
    // demo later in the article) - confirm against the original article.
    unordered_set<int> s = {3, 11, 86, 7, 88, 82, 1, 881, 5, 6, 7, 6};
    unordered_set<int>::iterator it = s.begin();
    while (it != s.end()) {
        cout << *it << " ";
        ++it;
    }
    cout << endl;
    return 0;
}

相关免费在线工具

加密/解密文本
使用加密算法（如AES、TripleDES、Rabbit或RC4）加密和解密文本明文。在线工具，加密/解密文本在线工具，online
Gemini 图片去水印
基于开源反向 Alpha 混合算法去除 Gemini/Nano Banana 图片水印，支持批量处理与下载。在线工具，Gemini 图片去水印在线工具，online
Base64 字符串编码/解码
将字符串编码和解码为其 Base64 格式表示形式即可。在线工具，Base64 字符串编码/解码在线工具，online
Base64 文件转换器
将字符串、文件或图像转换为其 Base64 表示形式。在线工具，Base64 文件转换器在线工具，online
Markdown转HTML
将 Markdown（GFM）转为 HTML 片段，浏览器内 marked 解析；与 HTML转Markdown 互为补充。在线工具，Markdown转HTML在线工具，online
HTML转Markdown
将 HTML 片段转为 GitHub Flavored Markdown，支持标题、列表、链接、代码块与表格等；浏览器内处理，可链接预填。在线工具，HTML转Markdown在线工具，online

// Default hasher: turns the key into a size_t with a plain cast, so K must be
// a type that a C-style cast can convert to size_t.
template<class K>
struct HashFunc {
    // const-qualified so the functor can also be called through a const object.
    size_t operator()(const K& key) const {
        // The C-style cast is kept deliberately: it accepts every key type the
        // original accepted.
        return (size_t)key;
    }
};

// Hasher for string keys: every character is added and the running value is
// multiplied by 131 before the next character is processed.
template<>
struct HashFunc<string> {
    size_t operator()(const string& s) const {
        size_t hash = 0;
        // The multiplication must happen inside the loop. When it ran only once
        // after the loop, the result was (sum of characters) * 131, so strings
        // made of the same characters in a different order ("abcd" / "bcad")
        // always collided.
        for(auto& e : s) {
            hash += e;
            hash *= 131;
        }
        return hash;
    }
};

// Returns the first entry of the built-in prime table that is >= n. When n is
// larger than every entry, the last (largest) entry is returned instead.
// The original author marked it inline because it is called frequently.
inline unsigned long __stl_next_prime(unsigned long n)
{
    // Note: assumes long is at least 32 bits.
    static const int kPrimeCount = 28;
    // Ascending table of candidate bucket counts.
    static const unsigned long kPrimes[kPrimeCount] = {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    const unsigned long* const tableEnd = kPrimes + kPrimeCount;
    // Search [kPrimes, tableEnd) for the first value that is not less than n.
    const unsigned long* const hit = lower_bound(kPrimes, tableEnd, n);
    if (hit == tableEnd)
        return kPrimes[kPrimeCount - 1];
    return *hit;
}

#include <vector>
// Status tag stored in every slot of the open-addressing table.
enum State {
    EXIST,  // the slot currently holds an entry
    EMPTY,  // default state of a freshly constructed slot
    DELETE  // marker for a slot whose entry was removed
};

// One slot of the table: the stored key/value pair plus its status tag.
template<class K, class V>
struct HashData {
    pair<K, V> _kv;
    State _state{EMPTY};
};

// Generic hasher: the key itself, cast to size_t, is the hash value.
template<class K>
struct HashFunc {
    // Marked const: hashing does not modify the functor, and a non-const
    // operator() could not be invoked on a const HashFunc object.
    size_t operator()(const K& key) const {
        return (size_t)key;
    }
};

// String hasher: for each character, add it to the accumulator and then
// multiply the accumulator by 131, so the result depends on character order.
template<>
struct HashFunc<string> {
    size_t operator()(const string& s) const {
        size_t hash = 0;
        for(auto& e : s) {
            hash += e;
            hash *= 131;
        }
        return hash;
    }
};

// Looks up the smallest table prime that is not less than n; falls back to the
// largest table entry when n exceeds all of them.
inline unsigned long __stl_next_prime(unsigned long n) {
    // Note: assumes long is at least 32 bits.
    static const int count = 28;
    static const unsigned long primes[count] = {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    // Index of the first entry >= n, or `count` when there is none.
    const int idx = static_cast<int>(lower_bound(primes, primes + count, n) - primes);
    return primes[idx < count ? idx : count - 1];
}

namespace open_address {
// Hash table that resolves collisions by open addressing with linear probing.
//
// Every slot is a HashData<K, V> tagged EXIST / EMPTY / DELETE. Erase only
// marks a slot DELETE (a tombstone) so that probe sequences passing through
// it still reach the entries stored behind it.
template<class K, class V, class Hash = HashFunc<K>>
class HashTable {
public:
    HashTable() : _tables(__stl_next_prime(0)), _n(0) {}

    // Inserts kv. Returns false (and changes nothing) when the key is already
    // present, true otherwise.
    bool Insert(const pair<K, V>& kv) {
        if(Find(kv.first)) return false;

        // The load factor counts tombstones as well as live entries: both
        // lengthen probe sequences, and Find() relies on EMPTY slots existing
        // to terminate. Rehash once 70% of the slots are not EMPTY.
        if((_n + _tombstones) * 10 / _tables.size() >= 7) Rehash();

        Hash hash;
        const size_t hash0 = hash(kv.first) % _tables.size();
        size_t hashi = hash0;
        // Linear probing: step forward (with wrap-around) to the first slot
        // that does not hold a live entry.
        for(size_t i = 1; _tables[hashi]._state == EXIST; ++i)
            hashi = (hash0 + i) % _tables.size();

        // Reusing a tombstone turns it back into a live slot.
        if(_tables[hashi]._state == DELETE) --_tombstones;
        _tables[hashi]._kv = kv;
        _tables[hashi]._state = EXIST;
        ++_n;
        return true;
    }

    // Returns a pointer to the slot holding key, or nullptr when it is absent.
    HashData<K, V>* Find(const K& key) {
        Hash hash;
        size_t hash0 = hash(key) % _tables.size();
        size_t hashi = hash0;
        size_t i = 1;
        // Walk the probe sequence until an EMPTY slot ends it; DELETE slots
        // are skipped but do not stop the search.
        while(_tables[hashi]._state != EMPTY) {
            if(_tables[hashi]._state == EXIST && _tables[hashi]._kv.first == key)
                return &_tables[hashi];
            hashi = (hash0 + i) % _tables.size();
            i++;
        }
        return nullptr;
    }

    // Removes key if present; returns whether an entry was removed.
    bool Erase(const K& key) {
        HashData<K, V>* ret = Find(key);
        if(ret == nullptr) return false;
        ret->_state = DELETE;
        // Keep the bookkeeping honest: one live entry fewer, one tombstone
        // more. Previously _n was never decremented here nor reset by a
        // rehash, so repeated insert/erase cycles grew the table without
        // bound even when it held almost no entries.
        --_n;
        ++_tombstones;
        return true;
    }

private:
    // Rebuilds the table without tombstones. The table moves to the next
    // prime size only when live entries fill at least half of the 70% limit;
    // otherwise it is rebuilt at the same size, which just purges tombstones.
    void Rehash() {
        const size_t oldSize = _tables.size();
        const bool grow = _n * 20 / oldSize >= 7;
        HashTable<K, V, Hash> fresh;
        fresh._tables.resize(grow ? __stl_next_prime(oldSize + 1) : oldSize);
        for(auto& slot : _tables) {
            if(slot._state == EXIST) fresh.Insert(slot._kv);
        }
        _tables.swap(fresh._tables);
        _n = fresh._n;
        _tombstones = 0;
    }

    vector<HashData<K, V>> _tables;
    size_t _n;               // number of live (EXIST) entries
    size_t _tombstones = 0;  // number of DELETE slots since the last rehash
};
}

#include "HashTable.h"

int main() {
    open_address::HashTable<int, int> ht;
    int a[] = {19, 30, 5, 36, 13, 20, 21, 12};
    for(auto e : a) {
        ht.Insert({e, e});
    }
    if(ht.Find(13)) ht.Erase(13);
    else cout << "没找到" << endl;
    return 0;
}

// Simple calendar date used as a custom hash-table key.
struct Date {
    int _year;
    int _month;
    int _day;

    // All three fields default to 1.
    Date(int year=1, int month=1, int day=1) : _year(year), _month(month), _day(day) {}

    // Field-wise equality. Declared const so that const Date objects (for
    // example keys reached through a const reference) can be compared too;
    // the previous non-const version rejected a const left-hand operand.
    bool operator==(const Date& d) const {
        return _year == d._year && _month == d._month && _day == d._day;
    }
};

// Hasher for Date keys: folds year, month and day into one value by adding
// each field and multiplying the running value by 131, so the position of a
// field matters (2026-01-02 and 2026-02-01 hash differently).
struct DateHashFunc {
    // const-qualified: hashing does not modify the functor, and this lets it
    // be called through a const object as well.
    size_t operator()(const Date& d) const {
        size_t hash = 0;
        hash += d._year;
        hash *= 131;
        hash += d._month;
        hash *= 131;
        hash += d._day;
        hash *= 131;
        return hash;
    }
};

int main() {
    string a1[] = {"sort", "insert", "abcd", "bcad", "aadd"};
    open_address::HashTable<string, string> ht;
    for(auto& e : a1) ht.Insert({e, e});

    int a2[] = {-19, -30, 5, 36, 13, 20, 21, 12};
    open_address::HashTable<int, int> ht1;
    for(auto& e : a2) ht1.Insert({e, e});

    open_address::HashTable<Date, int, DateHashFunc> ht2;
    ht2.Insert({{2026, 1, 2}, 1});
    ht2.Insert({{2026, 2, 1}, 2});
    return 0;
}

namespace hash_bucket {
// Node of a bucket's singly linked chain; stores one key/value pair.
template<class K, class V>
struct HashNode {
    pair<K, V> _kv;
    HashNode<K, V>* _next;
    HashNode(const pair<K,V>& kv) : _kv(kv), _next(nullptr) {}
};

// Hash table using separate chaining: _tables[i] is the head of the chain of
// all nodes whose hash maps to bucket i. The table owns its nodes.
template<class K, class V, class Hash = HashFunc<K>>
class HashTable {
    typedef HashNode<K, V> Node;
public:
    HashTable() : _tables(__stl_next_prime(0)), _n(0) {}

    // Copy constructor: deep-copies every chain, keeping the node order.
    HashTable(const HashTable<K, V, Hash>& ht) : _tables(ht._tables.size()), _n(0) {
        for(size_t i = 0; i < ht._tables.size(); i++) {
            // `link` always points at the pointer the next copy must be stored
            // in (bucket head first, then the previous copy's _next), so the
            // append is O(1) instead of re-walking the chain for every node.
            Node** link = &_tables[i];
            for(Node* src = ht._tables[i]; src; src = src->_next) {
                *link = new Node(src->_kv);
                link = &(*link)->_next;
                ++_n;
            }
        }
    }

    // Copy assignment (copy-and-swap). Without it the implicitly generated
    // operator would copy the raw node pointers, and both tables would later
    // delete the same nodes.
    HashTable<K, V, Hash>& operator=(HashTable<K, V, Hash> ht) {
        _tables.swap(ht._tables);
        const size_t count = _n;
        _n = ht._n;
        ht._n = count;
        return *this;  // ht's destructor releases the nodes previously owned
    }

    ~HashTable() {
        for(size_t i = 0; i < _tables.size(); i++) {
            Node* cur = _tables[i];
            while(cur) {
                Node* next = cur->_next;
                delete cur;
                cur = next;
            }
            _tables[i] = nullptr;
        }
    }

    // Inserts kv. Returns false when the key already exists, true otherwise.
    bool Insert(const pair<K, V>& kv) {
        if(Find(kv.first)) return false;
        Hash hash;
        if(_n == _tables.size()) // load factor reached 1: grow
        {
            vector<Node*> newTable(__stl_next_prime(_tables.size() + 1));
            for(size_t i = 0; i < _tables.size(); i++) {
                Node* cur = _tables[i];
                while(cur) {
                    Node* next = cur->_next;
                    // Re-bucket by the key of the node being moved. Hashing
                    // kv.first here (the key about to be inserted) put every
                    // existing node into that one bucket, after which Find
                    // and Erase could no longer locate them.
                    size_t hashi = hash(cur->_kv.first) % newTable.size();
                    // Push the existing node onto the front of its new chain;
                    // nodes are relinked, not reallocated.
                    cur->_next = newTable[hashi];
                    newTable[hashi] = cur;
                    cur = next;
                }
                _tables[i] = nullptr;
            }
            _tables.swap(newTable);
        }
        size_t hashi = hash(kv.first) % _tables.size();
        Node* newnode = new Node(kv); // pushed onto the front of the chain
        newnode->_next = _tables[hashi];
        _tables[hashi] = newnode;
        ++_n;
        return true;
    }

    // Returns the node holding key, or nullptr when the key is absent.
    Node* Find(const K& key) {
        Hash hash;
        size_t hashi = hash(key) % _tables.size();
        Node* cur = _tables[hashi];
        while(cur) {
            if(cur->_kv.first == key) return cur;
            cur = cur->_next;
        }
        return nullptr;
    }

    // Unlinks and deletes the node holding key; returns whether one was found.
    bool Erase(const K& key) {
        Hash hash;
        size_t hashi = hash(key) % _tables.size();
        Node* prev = nullptr;
        Node* cur = _tables[hashi];
        while(cur) {
            if(cur->_kv.first == key) // found
            {
                if(prev == nullptr) // the node is the head of its chain
                    _tables[hashi] = cur->_next;
                else // the node has a predecessor
                    prev->_next = cur->_next;
                delete cur;
                --_n;
                return true;
            } else {
                prev = cur;
                cur = cur->_next;
            }
        }
        return false;
    }

private:
    vector<Node*> _tables;  // bucket heads
    size_t _n = 0;          // number of stored nodes
};
}

int main() {
    int a[] = {19, 30, 5, 36, 13, 20, 21, 12, 24, 96};
    hash_bucket::HashTable<int, int> ht;
    for(auto& e : a) {
        ht.Insert({e, e});
    }
    ht.Insert({100, 100});
    ht.Insert({101, 101});
    cout << ht.Find(19) << endl;
    cout << ht.Find(36) << endl;
    cout << ht.Find(96) << endl;
    cout << ht.Find(101) << endl << endl;
    ht.Erase(19);
    ht.Erase(36);
    ht.Erase(96);
    ht.Erase(101);
    cout << ht.Find(19) << endl;
    cout << ht.Find(36) << endl;
    cout << ht.Find(96) << endl;
    cout << ht.Find(101) << endl << endl;
    return 0;
}

//HashTable.h
#include <vector>
#include <string>
using namespace std;

// Primary hasher used by the containers: the hash is the key cast to size_t.
template<class K>
struct HashFunc {
    // operator() is const because it has no state to modify; a non-const
    // call operator cannot be used through a const functor object.
    size_t operator()(const K& key) const {
        return (size_t)key;
    }
};

// Specialization for string keys: accumulate "add the character, then
// multiply by 131" over the whole string.
template<>
struct HashFunc<string> {
    size_t operator()(const string& s) const {
        size_t hash = 0;
        for(auto& e : s) {
            hash += e;
            hash *= 131;
        }
        return hash;
    }
};

// Picks a bucket count from a fixed ascending list of primes: the first one
// that is >= n, or the largest one when n is bigger than all of them.
inline unsigned long __stl_next_prime(unsigned long n) {
    // Note: assumes long is at least 32 bits.
    static const int kCount = 28;
    static const unsigned long kPrimes[kCount] = {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    // The list is sorted, so the first entry that is not less than n is the
    // answer.
    for(const unsigned long prime : kPrimes) {
        if(prime >= n) return prime;
    }
    return kPrimes[kCount - 1];
}

namespace hash_bucket {
// Node of a bucket chain. T is the stored element: the key itself for a set,
// a key/value pair for a map.
template<class T>
struct HashNode {
    T _data;
    HashNode<T>* _next;
    HashNode(const T& data) : _data(data), _next(nullptr) {}
};

// Forward declaration: the iterator needs to name the table type.
template<class K, class T, class KeyOfT, class Hash>
class HashTable;

// Forward iterator over all elements of a HashTable. Ref / Ptr select between
// the mutable (T&, T*) and read-only (const T&, const T*) flavours.
template<class K, class T, class Ref, class Ptr, class KeyOfT, class Hash>
struct HTIterator {
    typedef HashNode<T> Node;
    typedef HashTable<K, T, KeyOfT, Hash> HT;
    typedef HTIterator<K, T, Ref, Ptr, KeyOfT, Hash> Self;
    Node* _node;     // current node; nullptr represents end()
    const HT* _ht;   // owning table, needed by operator++ to find the next bucket

    HTIterator(Node* node, const HT* ht) : _node(node), _ht(ht) {}

    Ref operator*() const
    {
        return _node->_data;
    }

    Ptr operator->() const
    {
        return &_node->_data;
    }

    bool operator!=(const Self& s) const {
        return _node != s._node;
    }

    bool operator==(const Self& s) const {
        return _node == s._node;
    }

    // Pre-increment: advances to the next element and returns this iterator.
    // Must not be called on end() (it dereferences _node).
    Self& operator++()
    {
        if(_node->_next) {
            _node = _node->_next;
            return *this;
        }
        // The current chain is exhausted: continue with the first non-empty
        // bucket after the one the current element hashes to.
        KeyOfT kot;
        Hash hash;
        size_t hashi = hash(kot(_node->_data)) % _ht->_tables.size();
        _node = nullptr;  // stays nullptr (== end()) if no later bucket has nodes
        for(++hashi; hashi < _ht->_tables.size(); ++hashi) {
            if(_ht->_tables[hashi]) {
                _node = _ht->_tables[hashi];
                break;
            }
        }
        return *this;
    }
};

// Separate-chaining hash table shared by unordered_set and unordered_map.
//   K      - key type used for lookup
//   T      - stored element type (K itself, or something containing K)
//   KeyOfT - functor extracting the key from a T
//   Hash   - functor mapping a key to size_t
// The default hasher is HashFunc<K>: the table always hashes keys
// (kot(data) or the lookup key), never whole elements.
template<class K, class T, class KeyOfT, class Hash = HashFunc<K>>
class HashTable {
    // The iterator reads _tables. The friend template uses its own parameter
    // names: re-using K / T / KeyOfT / Hash here would re-declare the
    // enclosing template's parameters, which standard C++ rejects.
    template<class K2, class T2, class Ref2, class Ptr2, class KeyOfT2, class Hash2>
    friend struct HTIterator;

    typedef HashNode<T> Node;
public:
    typedef HTIterator<K, T, T&, T*, KeyOfT, Hash> Iterator;
    typedef HTIterator<K, T, const T&, const T*, KeyOfT, Hash> ConstIterator;

    Iterator Begin() {
        if(_n == 0) return End();
        for(size_t i = 0; i < _tables.size(); i++) // first non-empty bucket
        {
            Node* cur = _tables[i];
            if(cur) return Iterator(cur, this);
        }
        return End();
    }

    Iterator End() {
        return Iterator(nullptr, this);
    }

    ConstIterator Begin() const {
        if(_n == 0) return End();
        for(size_t i = 0; i < _tables.size(); i++) {
            Node* cur = _tables[i];
            if(cur) return ConstIterator(cur, this);
        }
        return End();
    }

    ConstIterator End() const {
        // Must build a ConstIterator: Iterator is a different, unrelated
        // instantiation of HTIterator and does not convert to it.
        return ConstIterator(nullptr, this);
    }

    HashTable() : _tables(__stl_next_prime(0)), _n(0) {}

    // Deep copy. The table owns raw nodes, so the implicitly generated copy
    // would share them and both destructors would delete the same nodes.
    HashTable(const HashTable& ht) : _tables(ht._tables.size()), _n(0) {
        for(size_t i = 0; i < ht._tables.size(); i++) {
            Node** link = &_tables[i];  // where the next copied node is attached
            for(Node* src = ht._tables[i]; src; src = src->_next) {
                *link = new Node(src->_data);
                link = &(*link)->_next;
                ++_n;
            }
        }
    }

    // Copy assignment via copy-and-swap; the by-value parameter's destructor
    // releases the nodes this table owned before.
    HashTable& operator=(HashTable ht) {
        _tables.swap(ht._tables);
        const size_t count = _n;
        _n = ht._n;
        ht._n = count;
        return *this;
    }

    ~HashTable() {
        for(size_t i = 0; i < _tables.size(); i++) {
            Node* cur = _tables[i];
            while(cur) {
                Node* next = cur->_next;
                delete cur;
                cur = next;
            }
            _tables[i] = nullptr;
        }
    }

    // Inserts data unless an element with the same key exists. Returns an
    // iterator to the element with that key and whether an insertion happened.
    pair<Iterator, bool> Insert(const T& data) {
        KeyOfT kot;
        auto it = Find(kot(data));
        if(it != End()) return {it, false};
        Hash hash;
        if(_n == _tables.size()) // load factor reached 1: grow
        {
            vector<Node*> _newTable;
            _newTable.resize(__stl_next_prime(_tables.size() + 1));
            for(size_t i = 0; i < _tables.size(); i++) {
                Node* cur = _tables[i];
                while(cur) {
                    Node* next = cur->_next;
                    // bucket of this node in the new table
                    size_t hashi = hash(kot(cur->_data)) % _newTable.size();
                    // relink the existing node at the front of its new chain
                    cur->_next = _newTable[hashi];
                    _newTable[hashi] = cur;
                    cur = next;
                }
            }
            _tables.swap(_newTable);
        }
        size_t hashi = hash(kot(data)) % _tables.size();
        Node* newnode = new Node(data); // pushed onto the front of the chain
        newnode->_next = _tables[hashi];
        _tables[hashi] = newnode;
        _n++;
        return {Iterator(newnode, this), true};
    }

    // Returns an iterator to the element with the given key, or End().
    Iterator Find(const K& key) {
        KeyOfT kot;
        Hash hash;
        size_t hashi = hash(key) % _tables.size();
        Node* cur = _tables[hashi];
        while(cur) {
            if(kot(cur->_data) == key) return {cur, this};
            cur = cur->_next;
        }
        return End();
    }

    // Removes the element with the given key; returns whether one was removed.
    bool Erase(const K& key) {
        Hash hash;
        KeyOfT kot;
        size_t hashi = hash(key) % _tables.size();
        Node* cur = _tables[hashi];
        Node* prev = nullptr;
        while(cur) {
            if(kot(cur->_data) == key) // found
            {
                if(prev == nullptr) // the node is the head of its chain
                    _tables[hashi] = cur->_next;
                else // the node has a predecessor
                    prev->_next = cur->_next;
                delete cur;
                --_n;
                return true;
            } else {
                prev = cur;
                cur = cur->_next;
            }
        }
        return false;
    }

private:
    vector<Node*> _tables;  // bucket heads
    size_t _n = 0;          // number of stored elements
};
}

//UnorderedSet.h
#include "HashTable.h"

namespace mine {
// Minimal unordered_set built on hash_bucket::HashTable. Elements are stored
// as `const K`, so they cannot be modified through either iterator type.
template<class K, class Hash = HashFunc<K>>
class unordered_set {
    // Key extractor for the table: in a set the element is its own key.
    struct SetKeyOfT {
        const K& operator()(const K& key) const {
            return key;
        }
    };
public:
    typedef typename hash_bucket::HashTable<K, const K, SetKeyOfT, Hash>::Iterator iterator;
    typedef typename hash_bucket::HashTable<K, const K, SetKeyOfT, Hash>::ConstIterator const_iterator;

    iterator begin() {
        return _ht.Begin();
    }
    iterator end() {
        return _ht.End();
    }
    const_iterator begin() const {
        return _ht.Begin();
    }
    const_iterator end() const {
        return _ht.End();
    }

    // Returns {iterator to the element, true if it was newly inserted}.
    pair<iterator, bool> insert(const K& key) {
        return _ht.Insert(key);
    }

    // Returns an iterator to key, or end() when it is absent.
    iterator find(const K& key) {
        // The key has to be forwarded: HashTable::Find takes exactly one
        // argument, so the former `_ht.Find()` could not compile once find()
        // was instantiated.
        return _ht.Find(key);
    }

    // Returns whether an element was removed.
    bool erase(const K& key) {
        return _ht.Erase(key);
    }

private:
    hash_bucket::HashTable<K, const K, SetKeyOfT, Hash> _ht;
};

// Exercises the const iterators: prints the set's type name, then its
// elements twice (explicit iterator loop, then range-for).
// `inline` because this non-template function is defined in a header; without
// it, including the header from two translation units is a multiple-definition
// error. NOTE: uses typeid and cout, so <typeinfo> and <iostream> must be
// included before this point.
inline void print(const unordered_set<int>& us)
{
    unordered_set<int>::const_iterator cit = us.begin();
    cout << typeid(us).name() << endl;
    while(cit != us.end()) {
        cout << *cit << " ";
        ++cit;
    }
    cout << endl;
    for(auto e : us) {
        cout << e << " ";
    }
    cout << endl << endl;
}
}

//UnorderedMap.h
#include "HashTable.h"

namespace mine {
// Minimal unordered_map built on hash_bucket::HashTable. Elements are stored
// as pair<const K, V>: the mapped value is mutable, the key is not.
template<class K, class V, class Hash = HashFunc<K>>
class unordered_map {
    // Key extractor for the table. The parameter type must match the stored
    // element type exactly (pair<const K, V>): taking `const pair<K, V>&`
    // made every call build a temporary pair - copying key and value - and
    // hand back a reference into that temporary.
    struct MapKeyOfT {
        const K& operator()(const pair<const K, V>& kv) const {
            return kv.first;
        }
    };
public:
    typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::Iterator iterator;
    typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::ConstIterator const_iterator;

    iterator begin() {
        return _ht.Begin();
    }
    iterator end() {
        return _ht.End();
    }
    const_iterator begin() const {
        return _ht.Begin();
    }
    const_iterator end() const {
        return _ht.End();
    }

    // Returns the value mapped to key, inserting a value-initialized V first
    // when the key is not present yet.
    V& operator[](const K& key) {
        auto ret = insert({key, V()});
        return ret.first->second;
    }

    // Returns {iterator to the element with kv's key, true if newly inserted}.
    pair<iterator, bool> insert(const pair<K, V>& kv) {
        return _ht.Insert(kv);
    }

    // Returns an iterator to key, or end() when it is absent.
    iterator find(const K& key) {
        return _ht.Find(key);
    }

    // Returns whether an element was removed.
    bool erase(const K& key) {
        return _ht.Erase(key);
    }

private:
    hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash> _ht;
};

// Exercises the const iterators: prints every entry twice (explicit iterator
// loop, then range-for).
// `inline` because this non-template function is defined in a header; without
// it, including the header from two translation units is a multiple-definition
// error.
inline void print(const unordered_map<string, string>& um)
{
    unordered_map<string, string>::const_iterator cit = um.begin();
    while(cit != um.end()) {
        cout << cit->first << "：" << cit->second << endl;
        ++cit;
    }
    cout << endl;
    for(auto& e : um) {
        cout << e.first << "：" << e.second << endl;
    }
}
}

#define _CRT_SECURE_NO_WARNINGS
#include <iostream>
using namespace std;
#include "UnorderedSet.h"
#include "UnorderedMap.h"

int main() {
    // Fill the custom set (the input contains duplicates), then print it
    // three ways: explicit iterators, range-for, and the const-iterator helper.
    const int values[] = {3, 11, 86, 7, 88, 82, 1, 881, 5, 6, 7, 6};
    const int valueCount = sizeof(values) / sizeof(values[0]);

    mine::unordered_set<int> us;
    for(int idx = 0; idx < valueCount; ++idx) {
        us.insert(values[idx]);
    }

    for(auto pos = us.begin(); pos != us.end(); ++pos) {
        cout << *pos << " ";
    }
    cout << endl;

    for(auto& element : us) {
        cout << element << " ";
    }
    cout << endl << endl;

    mine::print(us);
    return 0;
}

int main() {
    // Seed the custom map, dump it, update it through operator[], dump it
    // again with explicit iterators, then run the const-iterator helper.
    const pair<string, string> seed[] = {
        {"sort", "排序"},
        {"字符串", "string"},
        {"left", "左"},
        {"right", "右"},
    };

    mine::unordered_map<string, string> dict;
    for(const pair<string, string>& entry : seed) {
        dict.insert(entry);
    }

    for(auto& entry : dict) {
        cout << entry.first << "：" << entry.second << endl;
    }
    cout << endl;

    dict["left"] = "左，剩余";  // overwrite an existing mapping
    dict["insert"] = "插入";    // insert a new mapping
    dict["string"];             // insert a key with a default-constructed value

    for(auto pos = dict.begin(); pos != dict.end(); ++pos) {
        // pos->second is writable here, e.g. pos->second += "x";
        cout << pos->first << "：" << pos->second << endl;
    }
    cout << endl;

    print(dict);
    return 0;
}

C++ 哈希表原理与 unordered 容器详解

哈希

unordered_set 和 unordered_map

unordered_set

unordered_map

代码使用

更多推荐文章

相关免费在线工具

unordered_multiset/unordered_multimap

哈希概念

直接定址法

哈希冲突

负载因子

将关键字转为 size_t

哈希函数

除法散列法/除留余数法

处理哈希冲突：开放定址法

线性探测

二次探测

开放定址法线性探测代码实现

处理哈希冲突：链地址法

代码实现

哈希表封装 unordered_set 和 unordered_map

代码实现

更多推荐文章

相关免费在线工具

C++ 哈希表原理与 unordered 容器详解

哈希

unordered_set 和 unordered_map

unordered_set

unordered_map

代码使用

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

unordered_multiset/unordered_multimap

哈希概念

直接定址法

哈希冲突

负载因子

将关键字转为 size_t

哈希函数

除法散列法/除留余数法

处理哈希冲突：开放定址法

线性探测

二次探测

开放定址法线性探测代码实现

处理哈希冲突：链地址法

代码实现

哈希表封装 unordered_set 和 unordered_map

代码实现

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具