C++ 哈希表原理与 STL 容器实现详解 | 极客日志

C++算法

C++ 哈希表原理与 STL 容器实现详解

综述（由 AI 生成）：哈希表通过哈希函数将关键字映射到存储位置，实现平均 O(1) 的查找效率。本文对比了 C++ 中基于红黑树的 set/map 与基于哈希表的 unordered_set/unordered_map，重点讲解了哈希冲突的处理方案，包括开放定址法（线性探测、二次探测）和链地址法；同时提供了完整的哈希表封装代码示例，涵盖扩容机制、迭代器实现及自定义 Key 类型支持，帮助读者深入理解 STL 容器的底层原理。

古灵精怪发布于 2026/3/15更新于 2026/5/2318 浏览

哈希表核心概念

unordered_set 和 unordered_map

unordered_set 和 set 虽然接口相似，但底层结构决定了它们的适用场景完全不同。

unordered_set 与 set 的差异

Key 的要求不同：set 要求 Key 支持小于比较（用于红黑树排序），而 unordered_set 要求 Key 能转换为整数且支持等于比较（用于哈希映射）。
迭代器差异：set 的 iterator 是双向迭代器，底层是红黑树，中序遍历有序；unordered_set 是单向迭代器，底层是哈希表，遍历时无序。
性能差异：大多数场景下，unordered_set 的增删查改更快。红黑树操作复杂度是 O(logN)，而哈希表平均效率是 O(1)。

unordered_set 示意图

unordered_map 同理

map 和 unordered_map 也是高度相似，只有些许差异：

map 要求 Key 支持小于比较，unordered_map 要求 Key 支持转成整型且支持等于比较。
map 的 iterator 是双向迭代器，unordered_map 是单向迭代器，遍历 Key 无序。
大多数场景下，unordered_map 的增删查改更快，因为哈希表平均效率是 O(1)。

unordered_map 示意图

代码使用示例

#define _CRT_SECURE_NO_WARNINGS
#include <iostream>
#include <unordered_set>
#include <unordered_map>
using namespace std;

// Walks a std::unordered_set with an explicit iterator and prints every
// element; the visiting order is whatever the hash table yields, not sorted.
int main()
{
    unordered_set<int> s = {3, 1, 6, 7};
    unordered_set<int>::iterator it = s.begin();
    while (it != s.end())
    {
        cout << *it << " ";
        ++it;
    }
    cout << endl;
    return 0;
}

相关免费在线工具

加密/解密文本
使用加密算法（如AES、TripleDES、Rabbit或RC4）加密和解密文本明文。在线工具，加密/解密文本在线工具，online
Gemini 图片去水印
基于开源反向 Alpha 混合算法去除 Gemini/Nano Banana 图片水印，支持批量处理与下载。在线工具，Gemini 图片去水印在线工具，online
Base64 字符串编码/解码
将字符串编码和解码为其 Base64 格式表示形式即可。在线工具，Base64 字符串编码/解码在线工具，online
Base64 文件转换器
将字符串、文件或图像转换为其 Base64 表示形式。在线工具，Base64 文件转换器在线工具，online
Markdown转HTML
将 Markdown（GFM）转为 HTML 片段，浏览器内 marked 解析；与 HTML转Markdown 互为补充。在线工具，Markdown转HTML在线工具，online
HTML转Markdown
将 HTML 片段转为 GitHub Flavored Markdown，支持标题、列表、链接、代码块与表格等；浏览器内处理，可链接预填。在线工具，HTML转Markdown在线工具，online

// Default hash functor: turns a key into size_t with a plain cast, so it is
// only usable for key types that can be cast to an integer.
template<class K>
struct HashFunc
{
    // const-qualified so the functor can also be invoked through const objects.
    size_t operator()(const K& key) const
    {
        return (size_t)key;
    }
};

// Specialization for string keys: folds every character into the running
// value and multiplies by 131 after each one.
template<>
struct HashFunc<std::string>
{
    size_t operator()(const std::string& s) const
    {
        size_t hash = 0;
        // Multiplying after every character makes the result depend on the
        // character order, so permutations such as "abcd" and "bcad" differ.
        for (auto& e : s)
        {
            hash += e;
            hash *= 131;
        }
        return hash;
    }
};

// Returns the smallest prime in the built-in table that is >= n. When n is
// larger than every table entry, the largest table prime is returned instead.
inline unsigned long __stl_next_prime(unsigned long n)
{
    // Ascending table of 28 primes; assumes unsigned long has at least 32 bits.
    static const int kPrimeCount = 28;
    static const unsigned long kPrimes[kPrimeCount] =
    {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    const unsigned long* const tableEnd = kPrimes + kPrimeCount;

    // Binary search over [kPrimes, tableEnd) for the first entry not less than n.
    const unsigned long* const hit = std::lower_bound(kPrimes, tableEnd, n);
    if (hit == tableEnd)
    {
        return tableEnd[-1];
    }
    return *hit;
}

#include <vector>
// Status of one slot in the open-addressing table.
enum State
{
    EXIST,   // slot currently holds a live key/value pair
    EMPTY,   // slot has not been marked EXIST or DELETE (the default state)
    DELETE   // slot held an entry that was erased
};

// One slot of the open-addressing table: the stored pair plus its status.
template<class K, class V>
struct HashData
{
    std::pair<K, V> _kv;
    State _state = EMPTY;   // a freshly constructed slot starts out EMPTY
};

// Default hash functor: turns a key into size_t with a plain cast, so it is
// only usable for key types that can be cast to an integer.
template<class K>
struct HashFunc
{
    // const-qualified so the functor can also be invoked through const objects.
    size_t operator()(const K& key) const
    {
        return (size_t)key;
    }
};

// Specialization for string keys: folds every character into the running
// value and multiplies by 131 after each one, which makes the result depend
// on the character order.
template<>
struct HashFunc<std::string>
{
    size_t operator()(const std::string& s) const
    {
        size_t hash = 0;
        for (auto& e : s)
        {
            hash += e;
            hash *= 131;
        }
        return hash;
    }
};

// Returns the smallest prime in the built-in table that is >= n. When n is
// larger than every table entry, the largest table prime is returned instead.
inline unsigned long __stl_next_prime(unsigned long n)
{
    // Ascending table of 28 primes used as bucket counts.
    static const int kPrimeCount = 28;
    static const unsigned long kPrimes[kPrimeCount] =
    {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    const unsigned long* const tableEnd = kPrimes + kPrimeCount;

    // Binary search over [kPrimes, tableEnd) for the first entry not less than n.
    const unsigned long* const hit = std::lower_bound(kPrimes, tableEnd, n);
    if (hit == tableEnd)
    {
        return tableEnd[-1];
    }
    return *hit;
}

namespace open_address
{
    template<class K, class V, class Hash = HashFunc<K>>
    class HashTable
    {
    public:
        HashTable() :_tables(__stl_next_prime(0)),_n(0){}

        bool Insert(const pair<K, V>& kv)
        {
            if (Find(kv.first)) return false;
            if (_n * 10 / _tables.size() >= 7)//扩容
            {
                HashTable<K, V, Hash> newht;
                newht._tables.resize(__stl_next_prime(_tables.size() + 1));
                for (auto& e : _tables)
                {
                    if (e._state == EXIST) newht.Insert(e._kv);
                }
                _tables.swap(newht._tables);
            }
            Hash hash;
            size_t hash0 = hash(kv.first) % _tables.size();
            size_t hashi = hash0;
            size_t i = 1;
            while (_tables[hashi]._state == EXIST)
            {
                hashi = (hash0 + i) % _tables.size();
                i++;
            }
            _tables[hashi]._kv = kv;
            _tables[hashi]._state = EXIST;
            ++_n;
            return true;
        }

        HashData<K, V>* Find(const K& key)
        {
            Hash hash;
            size_t hash0 = hash(key) % _tables.size();
            size_t hashi = hash0;
            size_t i = 1;
            while (_tables[hashi]._state != EMPTY)
            {
                if (_tables[hashi]._state == EXIST && _tables[hashi]._kv.first == key)
                    return &_tables[hashi];
                hashi = (hash0 + i) % _tables.size();
                i++;
            }
            return nullptr;
        }

        bool Erase(const K& key)
        {
            HashData<K, V>* ret = Find(key);
            if (ret)
            {
                ret->_state = DELETE;
                return true;
            }
            else return false;
        }

    private:
        vector<HashData<K, V>> _tables;
        size_t _n;//记录数据个数
    };
}

#include "HashTable.h"
// Smoke test for open_address::HashTable: inserts a few ints, then erases 13
// if it can be found and prints a message otherwise.
int main()
{
    const int keys[] = {19, 30, 5, 36, 13, 20, 21, 12};
    open_address::HashTable<int, int> ht;
    for (int key : keys)
        ht.Insert({ key, key });

    if (ht.Find(13) == nullptr)
        cout << "没找到" << endl;
    else
        ht.Erase(13);
    return 0;
}

// Simple calendar date used as a custom hash-table key.
struct Date
{
    int _year;
    int _month;
    int _day;

    // Every field defaults to 1.
    Date(int year = 1, int month = 1, int day = 1) :_year(year),_month(month),_day(day){}

    // Field-wise equality; const-qualified so const Date objects (for example
    // keys reached through a const reference) can be compared as well.
    bool operator==(const Date& d) const
    {
        return _year == d._year && _month == d._month && _day == d._day;
    }
};

// Hash functor for Date keys: folds year, month and day into one value,
// multiplying by 131 after each field so that dates with swapped fields
// (e.g. 2026-1-2 and 2026-2-1) produce different results.
struct DateHashFunc
{
    // const-qualified so the functor can also be invoked through const objects.
    size_t operator()(const Date& d) const
    {
        size_t hash = 0;
        hash += d._year; hash *= 131;
        hash += d._month; hash *= 131;
        hash += d._day; hash *= 131;
        return hash;
    }
};

// Exercises open_address::HashTable with string keys, negative int keys and a
// user-defined key type that supplies its own hash functor.
int main()
{
    const string words[] = {"sort", "insert", "abcd", "bcad", "aadd"};
    open_address::HashTable<string, string> ht;
    for (const string& word : words)
        ht.Insert({ word, word });

    const int numbers[] = {-19, -30, 5, 36, 13, 20, 21, 12};
    open_address::HashTable<int, int> ht1;
    for (const int& number : numbers)
        ht1.Insert({ number, number });

    open_address::HashTable<Date, int, DateHashFunc> ht2;
    ht2.Insert({{2026,1,2},1});
    ht2.Insert({{2026,2,1},2});
    return 0;
}

namespace hash_bucket
{
    // Node of a singly linked bucket chain holding one key/value pair.
    template<class K, class V>
    struct HashNode
    {
        pair<K, V> _kv;
        HashNode<K, V>* _next;
        HashNode(const pair<K,V>& kv):_kv(kv),_next(nullptr){}
    };

    // Hash table that resolves collisions by separate chaining: every bucket
    // is the head of a singly linked list of nodes owned by the table.
    template<class K, class V, class Hash = HashFunc<K>>
    class HashTable
    {
        typedef HashNode<K, V> Node;
    public:
        // Starts with the smallest prime bucket count; all buckets are empty.
        HashTable() :_tables(__stl_next_prime(0)),_n(0){}

        // Deep copy: duplicates every chain, keeping the node order of ht.
        HashTable(const HashTable<K, V, Hash>& ht)
            :_tables(ht._tables.size(), nullptr), _n(ht._n)
        {
            for (size_t i = 0; i < ht._tables.size(); i++)
            {
                // link always points at the pointer that must receive the next
                // copied node, which gives an O(1) tail append.
                Node** link = &_tables[i];
                for (Node* src = ht._tables[i]; src; src = src->_next)
                {
                    *link = new Node(src->_kv);
                    link = &(*link)->_next;
                }
            }
        }

        // Copy assignment through copy-and-swap. The by-value parameter is a
        // deep copy whose destructor releases the nodes this table held
        // before. Without it the implicit assignment would share nodes
        // between two tables and free them twice.
        HashTable<K, V, Hash>& operator=(HashTable<K, V, Hash> ht)
        {
            _tables.swap(ht._tables);
            size_t count = _n;
            _n = ht._n;
            ht._n = count;
            return *this;
        }

        // Frees every node of every bucket.
        ~HashTable()
        {
            for (size_t i = 0; i < _tables.size(); i++)
            {
                Node* cur = _tables[i];
                while (cur)
                {
                    Node* next = cur->_next;
                    delete cur;
                    cur = next;
                }
                _tables[i] = nullptr;
            }
        }

        // Inserts kv. Returns false and leaves the table untouched when the
        // key is already present, true otherwise.
        bool Insert(const pair<K, V>& kv)
        {
            if (Find(kv.first)) return false;
            Hash hash;
            if (_n == _tables.size())// load factor reached 1: grow
            {
                vector<Node*> newTable(__stl_next_prime(_tables.size() + 1));
                for (size_t i = 0; i < _tables.size(); i++)
                {
                    Node* cur = _tables[i];
                    while (cur)
                    {
                        Node* next = cur->_next;
                        // Rehash by the key of the node being moved (not by the
                        // key being inserted), otherwise every existing node
                        // would end up in the same, wrong bucket.
                        size_t hashi = hash(cur->_kv.first) % newTable.size();
                        // Relink the existing node at the head of its new bucket.
                        cur->_next = newTable[hashi];
                        newTable[hashi] = cur;
                        cur = next;
                    }
                    _tables[i] = nullptr;
                }
                _tables.swap(newTable);
            }
            size_t hashi = hash(kv.first) % _tables.size();
            Node* newnode = new Node(kv);// pushed at the head of the bucket
            newnode->_next = _tables[hashi];
            _tables[hashi] = newnode;
            ++_n;
            return true;
        }

        // Returns the node holding key, or nullptr when the key is absent.
        Node* Find(const K& key)
        {
            Hash hash;
            size_t hashi = hash(key) % _tables.size();
            Node* cur = _tables[hashi];
            while (cur)
            {
                if (cur->_kv.first == key) return cur;
                cur = cur->_next;
            }
            return nullptr;
        }

        // Unlinks and deletes the node holding key. Returns true if it existed.
        bool Erase(const K& key)
        {
            Hash hash;
            size_t hashi = hash(key) % _tables.size();
            Node* prev = nullptr;
            Node* cur = _tables[hashi];
            while (cur)
            {
                if (cur->_kv.first == key)
                {
                    if (prev == nullptr)// node is the head of the bucket
                        _tables[hashi] = cur->_next;
                    else// node is in the middle or at the tail
                        prev->_next = cur->_next;
                    delete cur;
                    --_n;
                    return true;
                }
                else
                {
                    prev = cur;
                    cur = cur->_next;
                }
            }
            return false;
        }

    private:
        vector<Node*> _tables;// bucket heads
        size_t _n = 0;// number of stored elements
    };
}

// Smoke test for hash_bucket::HashTable: inserts a batch of ints, prints the
// lookup results for four keys, erases those keys and prints the lookups again.
int main()
{
    const int initial[] = {19, 30, 5, 36, 13, 20, 21, 12, 24, 96};
    const int probes[] = {19, 36, 96, 101};

    hash_bucket::HashTable<int, int> ht;
    for (const int& value : initial)
        ht.Insert({ value, value });
    ht.Insert({100,100});
    ht.Insert({101,101});

    // Lookups before erasing.
    for (int key : probes)
        cout << ht.Find(key) << endl;
    cout << endl;

    for (int key : probes)
        ht.Erase(key);

    // The same lookups after erasing.
    for (int key : probes)
        cout << ht.Find(key) << endl;
    cout << endl;
    return 0;
}

//HashTable.h
#include <vector>
#include <string>
using namespace std;

// Default hash functor: turns a key into size_t with a plain cast, so it is
// only usable for key types that can be cast to an integer.
template<class K>
struct HashFunc
{
    // const-qualified so the functor can also be invoked through const objects.
    size_t operator()(const K& key) const
    {
        return (size_t)key;
    }
};

// Specialization for string keys: folds every character into the running
// value and multiplies by 131 after each one, which makes the result depend
// on the character order.
template<>
struct HashFunc<std::string>
{
    size_t operator()(const std::string& s) const
    {
        size_t hash = 0;
        for (auto& e : s)
        {
            hash += e;
            hash *= 131;
        }
        return hash;
    }
};

// Returns the smallest prime in the built-in table that is >= n. When n is
// larger than every table entry, the largest table prime is returned instead.
inline unsigned long __stl_next_prime(unsigned long n)
{
    // Ascending table of 28 primes used as bucket counts.
    static const int kPrimeCount = 28;
    static const unsigned long kPrimes[kPrimeCount] =
    {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    const unsigned long* const tableEnd = kPrimes + kPrimeCount;

    // Binary search over [kPrimes, tableEnd) for the first entry not less than n.
    const unsigned long* const hit = std::lower_bound(kPrimes, tableEnd, n);
    if (hit == tableEnd)
    {
        return tableEnd[-1];
    }
    return *hit;
}

namespace hash_bucket
{
    // Node of a singly linked bucket chain storing one element of type T.
    template<class T>
    struct HashNode
    {
        T _data;
        HashNode<T>* _next;
        HashNode(const T& data):_data(data),_next(nullptr){}
    };

    // Forward declaration: the iterator keeps a pointer to its owning table.
    template<class K, class T, class KeyOfT, class Hash>
    class HashTable;

    // Forward iterator over all elements of a HashTable. Ref and Ptr select
    // between the mutable (T&, T*) and the read-only (const T&, const T*) view.
    template<class K, class T, class Ref, class Ptr, class KeyOfT, class Hash>
    struct HTIterator
    {
        typedef HashNode<T> Node;
        typedef HashTable<K, T, KeyOfT, Hash> HT;
        typedef HTIterator<K, T, Ref, Ptr, KeyOfT, Hash> Self;

        Node* _node;    // current node; nullptr represents the end position
        const HT* _ht;  // owning table, needed by operator++ to find the next bucket

        HTIterator(Node* node, const HT* ht) :_node(node),_ht(ht){}

        // Access to the element stored in the current node.
        Ref operator*() const
        {
            return _node->_data;
        }

        // Member access on the element stored in the current node.
        Ptr operator->() const
        {
            return &_node->_data;
        }

        // Two iterators compare by the node they refer to.
        bool operator!=(const Self& s) const
        {
            return _node != s._node;
        }

        bool operator==(const Self& s) const
        {
            return _node == s._node;
        }

        // Pre-increment: moves to the next node of the current chain or, when
        // the chain is exhausted, to the head of the next non-empty bucket.
        // Becomes the end position (nullptr) if no further element exists.
        // Must not be called on the end position.
        Self& operator++()
        {
            if (_node->_next)
            {
                _node = _node->_next;
                return *this;
            }

            // The current bucket is exhausted: recompute its index from the
            // element's key and scan the buckets that follow it.
            KeyOfT kot;
            Hash hash;
            size_t hashi = hash(kot(_node->_data)) % _ht->_tables.size();
            _node = nullptr;
            for (++hashi; hashi < _ht->_tables.size(); ++hashi)
            {
                if (_ht->_tables[hashi])
                {
                    _node = _ht->_tables[hashi];
                    break;
                }
            }
            return *this;
        }
    };

    // Separate-chaining hash table shared by unordered_set and unordered_map.
    // K is the key type, T the stored element type (the key itself or
    // something containing it), KeyOfT extracts the key from a T, and Hash
    // converts a key to size_t, which is why it defaults to HashFunc<K>.
    template<class K, class T, class KeyOfT, class Hash = HashFunc<K>>
    class HashTable
    {
        // The iterator reads _tables directly. The parameter names differ from
        // the enclosing template's because a nested template declaration may
        // not reuse them.
        template<class K2, class T2, class Ref2, class Ptr2, class KeyOfT2, class Hash2>
        friend struct HTIterator;

        typedef HashNode<T> Node;
    public:
        typedef HTIterator<K, T, T&, T*, KeyOfT, Hash> Iterator;
        typedef HTIterator<K, T, const T&, const T*, KeyOfT, Hash> ConstIterator;

        // Iterator to the head of the first non-empty bucket, or End().
        Iterator Begin()
        {
            if (_n == 0) return End();
            for (size_t i = 0; i < _tables.size(); i++)
            {
                Node* cur = _tables[i];
                if (cur) return Iterator(cur, this);
            }
            return End();
        }

        // End position: an iterator whose node pointer is nullptr.
        Iterator End()
        {
            return Iterator(nullptr, this);
        }

        ConstIterator Begin() const
        {
            if (_n == 0) return End();
            for (size_t i = 0; i < _tables.size(); i++)
            {
                Node* cur = _tables[i];
                if (cur) return ConstIterator(cur, this);
            }
            return End();
        }

        ConstIterator End() const
        {
            return ConstIterator(nullptr, this);
        }

        // Starts with the smallest prime bucket count; all buckets are empty.
        HashTable() :_tables(__stl_next_prime(0)),_n(0){}

        // Deep copy: duplicates every chain, keeping the node order of ht.
        // Required because the table owns its nodes through raw pointers; a
        // member-wise copy would make two tables delete the same nodes.
        HashTable(const HashTable& ht)
            :_tables(ht._tables.size(), nullptr), _n(ht._n)
        {
            for (size_t i = 0; i < ht._tables.size(); i++)
            {
                // link always points at the pointer that must receive the next
                // copied node, which gives an O(1) tail append.
                Node** link = &_tables[i];
                for (Node* src = ht._tables[i]; src; src = src->_next)
                {
                    *link = new Node(src->_data);
                    link = &(*link)->_next;
                }
            }
        }

        // Copy assignment through copy-and-swap: the by-value parameter is a
        // deep copy whose destructor releases the nodes this table held before.
        HashTable& operator=(HashTable ht)
        {
            _tables.swap(ht._tables);
            size_t count = _n;
            _n = ht._n;
            ht._n = count;
            return *this;
        }

        // Frees every node of every bucket.
        ~HashTable()
        {
            for (size_t i = 0; i < _tables.size(); i++)
            {
                Node* cur = _tables[i];
                while (cur)
                {
                    Node* next = cur->_next;
                    delete cur;
                    cur = next;
                }
                _tables[i] = nullptr;
            }
        }

        // Inserts data. Returns {iterator to the new element, true}, or
        // {iterator to the already stored element, false} when an element
        // with the same key exists.
        pair<Iterator, bool> Insert(const T& data)
        {
            KeyOfT kot;
            auto it = Find(kot(data));
            if (it != End()) return { it,false };
            Hash hash;
            if (_n == _tables.size())// load factor reached 1: grow
            {
                vector<Node*> newTable;
                newTable.resize(__stl_next_prime(_tables.size() + 1));
                for (size_t i = 0; i < _tables.size(); i++)
                {
                    Node* cur = _tables[i];
                    while (cur)
                    {
                        Node* next = cur->_next;
                        // Bucket of this node in the larger table.
                        size_t hashi = hash(kot(cur->_data)) % newTable.size();
                        // Relink the existing node at the head of that bucket.
                        cur->_next = newTable[hashi];
                        newTable[hashi] = cur;
                        cur = next;
                    }
                }
                _tables.swap(newTable);
            }
            size_t hashi = hash(kot(data)) % _tables.size();
            Node* newnode = new Node(data);// pushed at the head of the bucket
            newnode->_next = _tables[hashi];
            _tables[hashi] = newnode;
            _n++;
            return { Iterator(newnode,this),true };
        }

        // Returns an iterator to the element whose key equals key, or End().
        Iterator Find(const K& key)
        {
            KeyOfT kot;
            Hash hash;
            size_t hashi = hash(key) % _tables.size();
            Node* cur = _tables[hashi];
            while (cur)
            {
                if (kot(cur->_data) == key) return Iterator(cur, this);
                cur = cur->_next;
            }
            return End();
        }

        // Unlinks and deletes the element with the given key.
        // Returns true if such an element existed.
        bool Erase(const K& key)
        {
            Hash hash;
            KeyOfT kot;
            size_t hashi = hash(key) % _tables.size();
            Node* cur = _tables[hashi];
            Node* prev = nullptr;
            while (cur)
            {
                if (kot(cur->_data) == key)
                {
                    if (prev == nullptr)// node is the head of the bucket
                    {
                        _tables[hashi] = cur->_next;
                    }
                    else// node is in the middle or at the tail
                    {
                        prev->_next = cur->_next;
                    }
                    delete cur;
                    --_n;
                    return true;
                }
                else
                {
                    prev = cur;
                    cur = cur->_next;
                }
            }
            return false;
        }

    private:
        vector<Node*> _tables;// bucket heads
        size_t _n = 0;// number of stored elements
    };
}

//UnorderedSet.h
#include "HashTable.h"
namespace mine
{
    // Minimal unordered_set built on hash_bucket::HashTable. Elements are
    // stored as const K so they cannot be modified through an iterator.
    template<class K, class Hash = HashFunc<K>>
    class unordered_set
    {
        // Key extractor for the table: in a set the element is its own key.
        struct SetKeyOfT
        {
            const K& operator()(const K& key) const
            {
                return key;
            }
        };
    public:
        typedef typename hash_bucket::HashTable<K, const K, SetKeyOfT, Hash>::Iterator iterator;
        typedef typename hash_bucket::HashTable<K, const K, SetKeyOfT, Hash>::ConstIterator const_iterator;

        iterator begin()
        {
            return _ht.Begin();
        }
        iterator end()
        {
            return _ht.End();
        }
        const_iterator begin() const
        {
            return _ht.Begin();
        }
        const_iterator end() const
        {
            return _ht.End();
        }

        // Returns {iterator to the element, true} when key was inserted and
        // {iterator to the existing element, false} when it was already there.
        pair<iterator, bool> insert(const K& key)
        {
            return _ht.Insert(key);
        }

        // Returns an iterator to key, or end() when it is not stored.
        iterator find(const K& key)
        {
            // The key has to be forwarded; calling Find() without an argument
            // does not compile once this member is instantiated.
            return _ht.Find(key);
        }

        // Removes key. Returns true if it was present.
        bool erase(const K& key)
        {
            return _ht.Erase(key);
        }

    private:
        hash_bucket::HashTable<K, const K, SetKeyOfT, Hash> _ht;
    };

    // Exercises the const iterators: prints the parameter's type name, then
    // the elements twice (explicit const_iterator loop, then range-for).
    // Declared inline because it is a non-template function defined in a
    // header and would otherwise be defined once per including source file.
    inline void print(const unordered_set<int>& us)
    {
        unordered_set<int>::const_iterator cit = us.begin();
        cout << typeid(us).name() << endl;
        while (cit != us.end())
        {
            cout << *cit << " ";
            ++cit;
        }
        cout << endl;
        for (auto e : us)
        {
            cout << e << " ";
        }
        cout << endl << endl;
    }
}

//UnorderedMap.h
#include "HashTable.h"
namespace mine
{
    // Minimal unordered_map built on hash_bucket::HashTable. Elements are
    // stored as pair<const K, V>: the key is immutable, the value is not.
    template<class K, class V, class Hash = HashFunc<K>>
    class unordered_map
    {
        // Key extractor for the table. It takes exactly the stored element
        // type; a pair<K, V> parameter would force a converting copy of the
        // whole pair on every call and return a reference into that temporary.
        struct MapKeyOfT
        {
            const K& operator()(const pair<const K, V>& kv) const
            {
                return kv.first;
            }
        };
    public:
        typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::Iterator iterator;
        typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::ConstIterator const_iterator;

        iterator begin()
        {
            return _ht.Begin();
        }
        iterator end()
        {
            return _ht.End();
        }
        const_iterator begin() const
        {
            return _ht.Begin();
        }
        const_iterator end() const
        {
            return _ht.End();
        }

        // Returns a reference to the value mapped to key, inserting a
        // value-initialized V first when the key is not present yet.
        V& operator[](const K& key)
        {
            auto ret = insert({ key,V() });
            return ret.first->second;
        }

        // Returns {iterator to the element, true} when kv was inserted and
        // {iterator to the existing element, false} when the key was present.
        pair<iterator, bool> insert(const pair<K, V>& kv)
        {
            return _ht.Insert(kv);
        }

        // Returns an iterator to the element with the given key, or end().
        iterator find(const K& key)
        {
            return _ht.Find(key);
        }

        // Removes the element with the given key. Returns true if it existed.
        bool erase(const K& key)
        {
            return _ht.Erase(key);
        }

    private:
        hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash> _ht;
    };

    // Exercises the const iterators: prints all entries twice (explicit
    // const_iterator loop, then range-for). Declared inline because it is a
    // non-template function defined in a header and would otherwise be
    // defined once per including source file.
    inline void print(const unordered_map<string, string>& um)
    {
        unordered_map<string, string>::const_iterator cit = um.begin();
        while (cit != um.end())
        {
            cout << cit->first << "：" << cit->second << endl;
            ++cit;
        }
        cout << endl;
        for (auto& e : um)
        {
            cout << e.first << "：" << e.second << endl;
        }
    }
}

#define _CRT_SECURE_NO_WARNINGS
#include <iostream>
using namespace std;
#include "UnorderedSet.h"
#include "UnorderedMap.h"

// Smoke test for mine::unordered_set: inserts ints (including duplicates),
// prints the contents through an explicit iterator loop and a range-for, then
// prints them again through the const-iterator helper.
int main()
{
    const int values[] = {3, 11, 86, 7, 88, 82, 1, 881, 5, 6, 7, 6};
    mine::unordered_set<int> us;
    for (int value : values)
        us.insert(value);

    // Explicit iterator traversal.
    for (auto it = us.begin(); it != us.end(); ++it)
        cout << *it << " ";
    cout << endl;

    // Range-for traversal.
    for (auto& element : us)
        cout << element << " ";
    cout << endl << endl;

    mine::print(us);
    return 0;
}

// Smoke test for mine::unordered_map: inserts entries, updates and creates
// entries through operator[], and prints the contents after each phase.
int main()
{
    mine::unordered_map<string, string> dict;
    dict.insert({"sort","排序"});
    dict.insert({"字符串","string"});
    dict.insert({"left","左"});
    dict.insert({"right","右"});

    for (auto& entry : dict)
        cout << entry.first << "：" << entry.second << endl;
    cout << endl;

    dict["left"]="左，剩余";   // overwrites the value of an existing key
    dict["insert"]="插入";     // inserts a new key together with its value
    dict["string"];            // inserts a new key with a default-constructed value

    // The mapped value could also be modified in this loop,
    // e.g. it->second += "x";
    for (auto it = dict.begin(); it != dict.end(); ++it)
        cout << it->first << "：" << it->second << endl;
    cout << endl;

    print(dict);
    return 0;
}

C++ 哈希表原理与 STL 容器实现详解

哈希表核心概念

unordered_set 和 unordered_map

更多推荐文章

相关免费在线工具

unordered_multiset / unordered_multimap

哈希基础

直接定址法

哈希冲突

负载因子

将关键字转为 size_t

哈希函数设计

除法散列法 / 除留余数法

处理哈希冲突：开放定址法

线性探测

二次探测

开放定址法线性探测代码实现

处理哈希冲突：链地址法

代码实现

哈希表封装 unordered_set 和 unordered_map

代码实现

更多推荐文章

相关免费在线工具

C++ 哈希表原理与 STL 容器实现详解

哈希表核心概念

unordered_set 和 unordered_map

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

unordered_multiset / unordered_multimap

哈希基础

直接定址法

哈希冲突

负载因子

将关键字转为 size_t

哈希函数设计

除法散列法 / 除留余数法

处理哈希冲突：开放定址法

线性探测

二次探测

开放定址法线性探测代码实现

处理哈希冲突：链地址法

代码实现

哈希表封装 unordered_set 和 unordered_map

代码实现

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具