手写 C++ 哈希表：unordered_set/unordered_map 用法、模拟实现与性能对比 | 极客日志

C++

手写 C++ 哈希表：unordered_set/unordered_map 用法、模拟实现与性能对比

从标准库用法切入，逐步实现一套基于哈希桶的 unordered_set 和 unordered_map，涵盖节点设计、迭代器构造、桶扩容、key 提取仿函数以及 const 正确性处理。性能测试显示，按桶顺序遍历的迭代器比作者所用标准库实现（其遍历结果呈插入顺序）的方式更快；需要注意，C++ 标准并未规定 unordered 容器的遍历顺序，该顺序取决于具体实现。测试中最大桶长度仅 2，平均桶长约 1.28，查找接近 O(1)。

ByteFlow发布于 2026/6/29更新于 2026/7/11 浏览

手写 C++ 哈希表：unordered_set/unordered_map 用法、模拟实现与性能对比

标准库的 unordered_set 和 unordered_map 用起来顺手，但真自己写一个才知道哈希表里藏了多少细节。下面从用法切入，然后一步步模拟实现，顺便看看不同实现策略对性能的影响。

标准库用法

先快速过一下基本操作，顺便留意那些平时不太关注的桶状态。

unordered_set

#include <iostream>
#include <unordered_set>
using namespace std;

// Demonstrates the basic std::unordered_set operations:
// insert, iteration, find, erase-by-key and count.
void test1() {
    unordered_set<int> st;
    const int seed[] = { 1, 3, 2, 4 };
    for (int value : seed) {
        st.insert(value);
    }

    // Print every element followed by a space; the order is whatever the container yields.
    for (unordered_set<int>::iterator cur = st.begin(); cur != st.end(); ++cur) {
        cout << *cur << " ";
    }
    cout << endl;

    // find() returns end() when the key is absent.
    unordered_set<int>::iterator hit = st.find(3);
    if (hit != st.end()) {
        cout << *hit << "存在" << endl;
    }

    // After erasing 1, count(1) is 0 and nothing is printed.
    st.erase(1);
    if (st.count(1) != 0) {
        cout << "1存在" << endl;
    }
}

// The maximum load factor of unordered_set is 1.
// NOTE(review): the member-function names and arguments of every call below were
// lost when this snippet was extracted (each call reads `st.()`), so the body does
// not compile as shown. Restore the calls from the original article before use.
void test2() {
    unordered_set<int> st;
    st.insert(1);
    st.();
    st.();
    st.();
    cout << st.() << endl; 
    cout << st.() << endl; 
    st.();
    st.();
    cout << st.() << endl; 
    cout << st.() << endl; 
    st.();
    st.();
    cout << st.() << endl; 
    cout << st.() << endl; 
}

{
    unordered_set<> st;
     ( i = ; i < ; i++) st.(() + i);
    cout <<  << st.() << endl;
    cout <<  << st.() << endl;
    
     ( < st.()) {
        cout <<  << st.() << endl;
    }
    
     it = st.();
     (it != st.()) {
        cout <<  << st.() <<  << endl;
    }  {
        cout <<  << endl;
    }
}

{
    ();
    ();
    ();
     ;
}

相关免费在线工具

Base64 字符串编码/解码
将字符串编码和解码为其 Base64 格式表示形式即可。在线工具，Base64 字符串编码/解码在线工具，online
Base64 文件转换器
将字符串、文件或图像转换为其 Base64 表示形式。在线工具，Base64 文件转换器在线工具，online
Markdown转HTML
将 Markdown（GFM）转为 HTML 片段，浏览器内 marked 解析；与 HTML转Markdown 互为补充。在线工具，Markdown转HTML在线工具，online
HTML转Markdown
将 HTML 片段转为 GitHub Flavored Markdown，支持标题、列表、链接、代码块与表格等；浏览器内处理，可链接预填。在线工具，HTML转Markdown在线工具，online
JSON 压缩
通过删除不必要的空白来缩小和压缩JSON。在线工具，JSON 压缩在线工具，online
JSON美化和格式化
将JSON字符串修饰为友好的可读格式。在线工具，JSON美化和格式化在线工具，online

#include <iostream>
#include <unordered_map>
using namespace std;

// Demonstrates the basic std::unordered_map operations:
// insert, iteration, find, erase-by-iterator, count and operator[].
void test1() {
    unordered_map<int, int> mp;
    mp.insert(make_pair(1, 1));
    mp.insert(make_pair(5, 5));
    mp.insert(make_pair(2, 2));
    mp.insert(make_pair(4, 4));
    mp.insert(make_pair(3, 3));

    // Print every key/value pair; the order is whatever the container yields.
    unordered_map<int, int>::iterator it = mp.begin();
    while (it != mp.end()) {
        cout << it->first << ":" << it->second << endl;
        ++it;
    }

    it = mp.find(3);
    if (it != mp.end()) {
        cout << "找到了 " << it->first << ":" << it->second << endl;
        // erase(iterator) requires a valid, dereferenceable iterator, so it must
        // stay inside the guard: erasing end() is undefined behaviour.
        mp.erase(it);
    }
    if (!mp.count(3)) {
        cout << "没有找到 3" << endl;
    }

    // operator[] inserts the key again (value-initialised) and then assigns to it.
    mp[3] = 5;
    cout << mp[3] << endl;
}

// Counts how often each fruit name occurs in a fixed array and prints
// "<name> <count>" per distinct name.
void test2() {
    string arr[] = { "香蕉", "甜瓜","苹果", "西瓜", "苹果", "西瓜", "苹果", "苹果", "西瓜", "苹果", "香蕉", "苹果", "香蕉" };
    unordered_map<string, int> mp;

    for (auto& fruit : arr) {
        unordered_map<string, int>::iterator hit = mp.find(fruit);
        if (hit == mp.end()) {
            // First occurrence: start the tally at 1.
            mp.insert(make_pair(fruit, 1));
            continue;
        }
        hit->second++;
    }

    for (unordered_map<string, int>::iterator cur = mp.begin(); cur != mp.end(); ++cur) {
        cout << cur->first << " " << cur->second << endl;
    }
}

// Entry point: runs the two unordered_map demos in order.
// Falling off the end of main is equivalent to returning 0.
int main() {
    test1();
    test2();
}

// One node of a bucket's singly linked chain: the stored element plus the
// link to the next node in the same bucket.
template<class T> struct HashNode {
    T _data;             // the stored element
    HashNode<T>* _next;  // next node in the chain; nullptr at the tail

    // Copies `data` into the node and leaves it unlinked.
    HashNode(const T& data)
        : _data(data)
        , _next(nullptr)
    {}
};

// State carried by a hash-table iterator: the current node, the table it
// belongs to, and the bucket index of that node.
template<class K, class T, class Ref, class Ptr, class KeyOfT, class Hash>
struct __HTIterator {
    using Node = HashNode<T>;

    Node* _node;                                // node the iterator currently refers to
    const HashTable<K, T, KeyOfT, Hash>* _pht;  // owning table, held as pointer-to-const
    size_t _hashi;                              // index of the bucket that holds the current node
};

template<class K, class T, class KeyOfT, class Hash> class HashTable;

// Skeleton of the hash table showing how the iterator is granted access to
// the table's private members.
template<class K, class T, class KeyOfT, class Hash> class HashTable {
    // The friend template must use its own parameter names: re-using K/T/KeyOfT/Hash
    // here would redeclare the enclosing template's parameters, which is ill-formed
    // and rejected by GCC and Clang.
    template<class K2, class T2, class Ref2, class Ptr2, class KeyOfT2, class Hash2>
    friend struct __HTIterator;
    // ...
};

typedef __HTIterator<K, T, Ref, Ptr, KeyOfT, Hash> self;

// Pre-increment: moves to the next node of the current chain, or, when the
// chain is exhausted, to the head of the next non-empty bucket. If no such
// bucket exists, _node becomes nullptr and _hashi ends at the bucket count.
self& operator++() {
    if (_node->_next) {
        _node = _node->_next;
        return *this;
    }

    // Current chain is finished: scan the following buckets for a non-empty one.
    const auto& buckets = _pht->_tables;
    _node = nullptr;
    for (++_hashi; _hashi < buckets.size(); ++_hashi) {
        if (buckets[_hashi]) {
            _node = buckets[_hashi];
            break;
        }
    }
    return *this;
}

// Hash table excerpt showing the iterator typedefs and the begin()/end() pairs.
template<class K, class T, class KeyOfT, class Hash> class HashTable {
    typedef HashNode<T> Node;
    // The friend template needs its own parameter names; re-using K/T/KeyOfT/Hash
    // would redeclare the enclosing template's parameters, which is ill-formed.
    template<class K2, class T2, class Ref2, class Ptr2, class KeyOfT2, class Hash2>
    friend struct __HTIterator;
public:
    typedef __HTIterator<K, T, T&, T*, KeyOfT, Hash> iterator;
    typedef __HTIterator<K, T, const T&, const T*, KeyOfT, Hash> const_iterator;
public:
    // Returns an iterator to the head of the first non-empty bucket, or end() if all are empty.
    iterator begin() {
        for (size_t i = 0; i < _tables.size(); i++) {
            if (_tables[i]) {
                return iterator(_tables[i], this, i);
            }
        }
        return end();
    }
    // Past-the-end iterator: null node; the bucket index is the all-ones sentinel.
    iterator end() {
        return iterator(nullptr, this, static_cast<size_t>(-1));
    }
    // Const overload of begin(); yields a read-only iterator.
    const_iterator begin() const {
        for (size_t i = 0; i < _tables.size(); i++) {
            if (_tables[i]) {
                return const_iterator(_tables[i], this, i);
            }
        }
        return end();
    }
    // Const overload of end().
    const_iterator end() const {
        return const_iterator(nullptr, this, static_cast<size_t>(-1));
    }
    // ...
};

namespace dck {
    template<class K, class Hash = HashFunc<K>> class unordered_set {
        struct SetKeyOfT {
            const K& operator()(const K& key) { return key; }
        };
    public:
        typedef typename hash_bucket::HashTable<K, K, SetKeyOfT, Hash>::const_iterator iterator;
        typedef typename hash_bucket::HashTable<K, K, SetKeyOfT, Hash>::const_iterator const_iterator;
        const_iterator begin() const { return _ht.begin(); }
        const_iterator end() const { return _ht.end(); }
    private:
        hash_bucket::HashTable<K, K, SetKeyOfT, Hash> _ht;
    };
}

namespace dck {
    // Map adapter over hash_bucket::HashTable; elements are pair<const K, V>
    // so the key cannot be changed through an iterator.
    template<class K, class V, class Hash = HashFunc<K>> class unordered_map {
        // Key extractor handed to the table. The parameter type matches the stored
        // element type exactly: taking pair<K, V> instead would convert every
        // element into a temporary copy each time a key is extracted.
        struct MapKeyOfT {
            const K& operator()(const pair<const K, V>& kv) const { return kv.first; }
        };
    public:
        typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::iterator iterator;
        typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::const_iterator const_iterator;
        iterator begin() { return _ht.begin(); }
        iterator end() { return _ht.end(); }
        const_iterator begin() const { return _ht.begin(); }
        const_iterator end() const { return _ht.end(); }
    private:
        hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash> _ht;
    };
}

// Looks `key` up in the bucket it hashes to. Returns an iterator to the
// matching node, or end() when no node in that bucket has the key.
iterator Find(const K& key) {
    Hash hasher;
    KeyOfT keyOf;
    const size_t bucket = hasher(key) % _tables.size();

    for (Node* node = _tables[bucket]; node != nullptr; node = node->_next) {
        if (keyOf(node->_data) == key) {
            return iterator(node, this, bucket);
        }
    }
    return end();
}

pair<iterator, bool> Insert(const T& data) {
    KeyOfT kot;
    iterator it = Find(kot(data));
    if (it != end()) return make_pair(it, false);
    Hash hf;
    if (_n == _tables.size()) {
        size_t newSize = _tables.size() * 2;
        vector<Node*> newTables;
        newTables.resize(newSize);
        for (size_t i = 0; i < _tables.size(); i++) {
            Node* cur = _tables[i];
            while (cur) {
                Node* next = cur->_next;
                size_t hashi = hf(kot(cur->_data)) % newSize;
                cur->_next = newTables[hashi];
                newTables[hashi] = cur;
                cur = next;
            }
            _tables[i] = nullptr;
        }
        _tables.swap(newTables);
    }
    size_t hashi = hf(kot(data)) % _tables.size();
    Node* newNode = new Node(data);
    newNode->_next = _tables[hashi];
    _tables[hashi] = newNode;
    ++_n;
    return make_pair(iterator(newNode, this, hashi), true);
}

pair<iterator, bool> insert(const K& key) {
    auto ret = _ht.Insert(key);
    return pair<const_iterator, bool>(const_iterator(ret.first._node, ret.first._pht, ret.first._hashi), ret.second);
}

bool Erase(const K& key) {
    Hash hf;
    size_t hashi = hf(key) % _tables.size();
    Node* prev = nullptr;
    Node* cur = _tables[hashi];
    while (cur) {
        if (cur->_kv.first == key) {
            if (prev == nullptr) {
                _tables[hashi] = cur->_next;
            } else {
                prev->_next = cur->_next;
            }
            delete cur;
            return true;
        }
        prev = cur;
        cur = cur->_next;
    }
    return false;
}

// Returns a reference to the value mapped to `key`. Insert() leaves an existing
// entry untouched and otherwise adds {key, V()}, so the key is present afterwards.
V& operator[](const K& key) {
    pair<iterator, bool> outcome = _ht.Insert(make_pair(key, V()));
    iterator& pos = outcome.first;
    return pos->second;
}

// Prints bucket statistics: total bucket count, number of non-empty buckets,
// longest chain, and the average chain length over the non-empty buckets.
void Some() {
    size_t bucketSize = 0;    // number of non-empty buckets
    size_t maxBucketLen = 0;  // longest chain seen
    size_t sum = 0;           // total number of nodes
    for (size_t i = 0; i < _tables.size(); i++) {
        Node* cur = _tables[i];
        if (cur) ++bucketSize;
        size_t bucketLen = 0;
        while (cur) {
            ++bucketLen;
            cur = cur->_next;
        }
        sum += bucketLen;
        if (bucketLen > maxBucketLen) maxBucketLen = bucketLen;
    }
    // An empty table has no non-empty bucket; report 0 instead of dividing by zero.
    const double averageBucketLen =
        bucketSize == 0 ? 0.0 : (double)sum / (double)bucketSize;
    // size_t must be printed with %zu; passing it to %d is undefined behaviour.
    printf("all bucketSize:%zu\n", _tables.size());
    printf("bucketSize:%zu\n", bucketSize);
    printf("maxBucketLen:%zu\n", maxBucketLen);
    printf("averageBucketLen:%lf\n\n", averageBucketLen);
}

#include <set>
#include <unordered_set>
#include "HashTable.h"

// Benchmark: times insert / find / erase of N integers on std::set,
// std::unordered_set and the hand-written hash table, printing clock() tick
// differences for each phase.
// NOTE(review): `hash_bucket::HashTable<int, int>` and `ht.Insert(make_pair(e, e))`
// do not match the four-parameter HashTable<K, T, KeyOfT, Hash> declared in
// HashTable.h as shown in this article; this presumably targets an earlier
// key/value version of the table — confirm before building.
void test() {
    const size_t N = 1000000;
    unordered_set<int> us;
    set<int> s;
    hash_bucket::HashTable<int, int> ht;
    vector<int> v;
    v.reserve(N);
    srand(time(0));
    for (size_t i = 0; i < N; ++i) {
        //v.push_back(rand()); // many duplicates
        v.push_back(rand() + i); // few duplicates
        //v.push_back(i); // no duplicates, sorted
    }

    // ---- insert ----
    size_t begin1 = clock();
    for (auto e : v) s.insert(e);
    size_t end1 = clock();
    cout << "set insert:" << end1 - begin1 << endl;
    size_t begin2 = clock();
    for (auto e : v) us.insert(e);
    size_t end2 = clock();
    cout << "unordered_set insert:" << end2 - begin2 << endl;
    size_t begin10 = clock();
    for (auto e : v) ht.Insert(make_pair(e, e));
    size_t end10 = clock();
    cout << "HashTable insert:" << end10 - begin10 << endl << endl;

    // ---- find ----
    size_t begin3 = clock();
    for (auto e : v) s.find(e);
    size_t end3 = clock();
    cout << "set find:" << end3 - begin3 << endl;
    size_t begin4 = clock();
    for (auto e : v) us.find(e);
    size_t end4 = clock();
    cout << "unordered_set find:" << end4 - begin4 << endl;
    size_t begin11 = clock();
    for (auto e : v) ht.Find(e);
    size_t end11 = clock();
    cout << "HashTable find:" << end11 - begin11 << endl << endl;

    cout << "插入数据个数：" << us.size() << endl << endl;
    ht.Some();

    // ---- erase ----
    size_t begin5 = clock();
    for (auto e : v) s.erase(e);
    size_t end5 = clock();
    cout << "set erase:" << end5 - begin5 << endl;
    size_t begin6 = clock();
    for (auto e : v) us.erase(e);
    size_t end6 = clock();
    cout << "unordered_set erase:" << end6 - begin6 << endl;
    size_t begin12 = clock();
    for (auto e : v) ht.Erase(e);
    size_t end12 = clock();
    // Measure against begin12; subtracting begin6 would add the unordered_set
    // erase time to the hash table's result.
    cout << "HashTable Erase:" << end12 - begin12 << endl << endl;
}

// Entry point: runs the benchmark once.
// Falling off the end of main is equivalent to returning 0.
int main() {
    test();
}

#pragma once
#include <iostream>
#include <vector>
using namespace std;

// Default hash functor: converts the key to size_t with a C-style cast.
// operator() is const so the functor can also be invoked through a const object.
template<class K> struct HashFunc {
    size_t operator()(const K& key) const {
        return (size_t)key;
    }
};

// Specialisation for strings: polynomial rolling hash with multiplier 31,
// starting from 0 (so the empty string hashes to 0). Overflow wraps, which is
// well defined for the unsigned size_t.
template<> struct HashFunc<string> {
    size_t operator()(const string& key) const {
        size_t hash = 0;
        for (auto& e : key) {
            hash *= 31;
            hash += e;
        }
        return hash;
    }
};

namespace hash_bucket {
    // One node of a bucket's singly linked chain.
    template<class T> class HashNode {
    public:
        T _data;             // the stored element
        HashNode<T>* _next;  // next node in the same bucket; nullptr at the tail
        HashNode(const T& data) :_data(data), _next(nullptr) {}
    };

    // Forward declaration: the iterator stores a pointer to its table.
    template<class K, class T, class KeyOfT, class Hash> class HashTable;

    // Forward iterator over all elements of a HashTable, bucket by bucket.
    //   Ref / Ptr select the mutable (T&, T*) or read-only (const T&, const T*) flavour.
    template<class K, class T, class Ref, class Ptr, class KeyOfT, class Hash> struct __HTIterator {
        typedef HashNode<T> Node;
        typedef __HTIterator<K, T, Ref, Ptr, KeyOfT, Hash> self;
        Node* _node;                                // current node; nullptr for end()
        const HashTable<K, T, KeyOfT, Hash>* _pht;  // table being iterated
        size_t _hashi;                              // index of the bucket holding _node
        __HTIterator(Node* node, const HashTable<K, T, KeyOfT, Hash>* pht, size_t hashi) :_node(node), _pht(pht), _hashi(hashi) { }
        // Pre-increment: next node in the chain, else head of the next non-empty
        // bucket, else nullptr. Must not be called on end() (it dereferences _node).
        self& operator++() {
            if (_node->_next) {
                _node = _node->_next;
            } else {
                _hashi++;
                while (_hashi < _pht->_tables.size()) {
                    if (_pht->_tables[_hashi]) {
                        _node = _pht->_tables[_hashi];
                        break;
                    }
                    _hashi++;
                }
                if (_hashi == _pht->_tables.size()) {
                    _node = nullptr;
                }
            }
            return *this;
        }
        // Observers do not modify the iterator, so they are const.
        Ref operator*() const { return _node->_data; }
        Ptr operator->() const { return &_node->_data; }
        // Iterators compare by node pointer only.
        bool operator!=(const self& s) const { return _node != s._node; }
        bool operator==(const self& s) const { return _node == s._node; }
    };

    // Separate-chaining hash table.
    //   K      : key type used for lookup
    //   T      : stored element type
    //   KeyOfT : functor extracting the key from a T
    //   Hash   : functor mapping a key to size_t
    template<class K, class T, class KeyOfT, class Hash> class HashTable {
        typedef HashNode<T> Node;
        // The friend template needs its own parameter names; re-using K/T/KeyOfT/Hash
        // would redeclare the enclosing template's parameters, which is ill-formed.
        template<class K2, class T2, class Ref2, class Ptr2, class KeyOfT2, class Hash2>
        friend struct __HTIterator;
    public:
        typedef __HTIterator<K, T, T&, T*, KeyOfT, Hash> iterator;
        typedef __HTIterator<K, T, const T&, const T*, KeyOfT, Hash> const_iterator;
    public:
        // Iterator to the head of the first non-empty bucket, or end() if all are empty.
        iterator begin() {
            for (size_t i = 0; i < _tables.size(); i++) {
                if (_tables[i]) {
                    return iterator(_tables[i], this, i);
                }
            }
            return end();
        }
        // Past-the-end iterator: null node; the bucket index is the all-ones sentinel.
        iterator end() {
            return iterator(nullptr, this, static_cast<size_t>(-1));
        }
        const_iterator begin() const {
            for (size_t i = 0; i < _tables.size(); i++) {
                if (_tables[i]) {
                    return const_iterator(_tables[i], this, i);
                }
            }
            return end();
        }
        const_iterator end() const {
            return const_iterator(nullptr, this, static_cast<size_t>(-1));
        }
    public:
        // Starts with 10 empty buckets.
        HashTable() { _tables.resize(10); }
        // The table owns its nodes through raw pointers; a member-wise copy would make
        // two tables delete the same nodes, so copying is disabled.
        HashTable(const HashTable&) = delete;
        HashTable& operator=(const HashTable&) = delete;
        // Deletes every node of every bucket.
        ~HashTable() {
            for (size_t i = 0; i < _tables.size(); i++) {
                Node* cur = _tables[i];
                while (cur) {
                    Node* next = cur->_next;
                    delete cur;
                    cur = next;
                }
                _tables[i] = nullptr;
            }
        }
        // Returns an iterator to the element with key `key`, or end() if absent.
        iterator Find(const K& key) {
            Hash hf;
            KeyOfT kot;
            size_t hashi = hf(key) % _tables.size();
            Node* cur = _tables[hashi];
            while (cur) {
                if (kot(cur->_data) == key) return iterator(cur, this, hashi);
                cur = cur->_next;
            }
            return end();
        }
        // Inserts `data` unless its key is already present.
        // Returns {iterator to the element, true if it was inserted}.
        pair<iterator, bool> Insert(const T& data) {
            KeyOfT kot;
            iterator it = Find(kot(data));
            if (it != end()) return make_pair(it, false);
            Hash hf;
            // Load factor reached 1: double the bucket count and relink existing
            // nodes into the new buckets (no node is reallocated).
            if (_n == _tables.size()) {
                size_t newSize = _tables.size() * 2;
                vector<Node*> newTables;
                newTables.resize(newSize);
                for (size_t i = 0; i < _tables.size(); i++) {
                    Node* cur = _tables[i];
                    while (cur) {
                        Node* next = cur->_next;
                        size_t hashi = hf(kot(cur->_data)) % newSize;
                        cur->_next = newTables[hashi];
                        newTables[hashi] = cur;
                        cur = next;
                    }
                    _tables[i] = nullptr;
                }
                _tables.swap(newTables);
            }
            // Head-insert the new node into its bucket.
            size_t hashi = hf(kot(data)) % _tables.size();
            Node* newNode = new Node(data);
            newNode->_next = _tables[hashi];
            _tables[hashi] = newNode;
            ++_n;
            return make_pair(iterator(newNode, this, hashi), true);
        }
        // Removes the element with key `key`. Returns true if one was removed.
        bool Erase(const K& key) {
            Hash hf;
            KeyOfT kot;
            size_t hashi = hf(key) % _tables.size();
            Node* prev = nullptr;
            Node* cur = _tables[hashi];
            while (cur) {
                // The element lives in _data; its key is obtained through KeyOfT.
                if (kot(cur->_data) == key) {
                    if (prev == nullptr) {
                        _tables[hashi] = cur->_next;
                    } else {
                        prev->_next = cur->_next;
                    }
                    delete cur;
                    // Keep the count in sync with the rehash trigger in Insert.
                    --_n;
                    return true;
                }
                prev = cur;
                cur = cur->_next;
            }
            return false;
        }
    private:
        vector<Node*> _tables;  // bucket heads
        size_t _n = 0;          // number of stored elements (must start at 0)
    };
}

#pragma once
#include "HashTable.h"

namespace dck {
    template<class K, class Hash = HashFunc<K>> class unordered_set {
        struct SetKeyOfT {
            const K& operator()(const K& key) { return key; }
        };
    public:
        typedef typename hash_bucket::HashTable<K, K, SetKeyOfT, Hash>::const_iterator iterator;
        typedef typename hash_bucket::HashTable<K, K, SetKeyOfT, Hash>::const_iterator const_iterator;
        pair<iterator, bool> insert(const K& key) {
            auto ret = _ht.Insert(key);
            return pair<const_iterator, bool>(const_iterator(ret.first._node, ret.first._pht, ret.first._hashi), ret.second);
        }
        iterator find(const K& key) { return _ht.Find(key); }
        iterator erase(const K& key) { return _ht.Erase(key); }
        const_iterator begin() const { return _ht.begin(); }
        const_iterator end() const { return _ht.end(); }
    private:
        hash_bucket::HashTable<K, K, SetKeyOfT, Hash> _ht;
    };
}

#pragma once
#include "HashTable.h"

namespace dck {
    // Map adapter over hash_bucket::HashTable; elements are pair<const K, V>
    // so the key cannot be changed through an iterator.
    template<class K, class V, class Hash = HashFunc<K>> class unordered_map {
        // Key extractor handed to the table. The parameter type matches the stored
        // element type exactly: taking pair<K, V> instead would convert every
        // element into a temporary copy each time a key is extracted.
        struct MapKeyOfT {
            const K& operator()(const pair<const K, V>& kv) const { return kv.first; }
        };
    public:
        typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::iterator iterator;
        typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash>::const_iterator const_iterator;
        // Inserts `kv` unless the key exists; returns {iterator to the element, inserted?}.
        pair<iterator, bool> insert(const pair<K, V>& kv) { return _ht.Insert(kv); }
        // Returns the value mapped to `key`, inserting {key, V()} first if the key is absent.
        V& operator[](const K& key) {
            pair<iterator, bool> ret = _ht.Insert(make_pair(key, V()));
            return ret.first->second;
        }
        // Returns an iterator to the entry for `key`, or end() if it is absent.
        iterator find(const K& key) { return _ht.Find(key); }
        // Removes the entry for `key`; returns true if one was removed. The table's
        // Erase reports a bool, which cannot be converted to an iterator.
        bool erase(const K& key) { return _ht.Erase(key); }
        iterator begin() { return _ht.begin(); }
        iterator end() { return _ht.end(); }
        const_iterator begin() const { return _ht.begin(); }
        const_iterator end() const { return _ht.end(); }
    private:
        hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT, Hash> _ht;
    };
}

#include <unordered_set>
#include "MyUnorderedSet.h"
#include "MyUnorderedMap.h"

void test_unordered_set() {
    dck::unordered_set<int> st;
    st.insert(4);
    st.insert(1);
    st.insert(2);
    st.insert(3);
    dck::unordered_set<int>::iterator it = st.begin();
    while (it != st.end()) {
        cout << *it << " ";
        ++it;
    }
    cout << endl;  // 桶顺序：1 2 3 4
    unordered_set<int> st1;
    st1.insert(4);
    st1.insert(1);
    st1.insert(2);
    st1.insert(3);
    unordered_set<int>::iterator it1 = st1.begin();
    while (it1 != st1.end()) {
        cout << *it1 << " ";  // 插入顺序：4 1 2 3
        ++it1;
    }
    cout << endl;
}

// Prints every "key value" pair of a read-only map, one per line, followed by
// a blank line. Exercises the const begin()/end() overloads.
void print(const dck::unordered_map<int, int>& mp) {
    typedef dck::unordered_map<int, int>::const_iterator ConstIter;
    for (ConstIter cur = mp.begin(); cur != mp.end(); ++cur) {
        cout << cur->first << " " << cur->second << endl;
    }
    cout << endl;
}

// Exercises dck::unordered_map: insert, const iteration via print(), in-place
// modification of mapped values, and word counting through operator[].
void test_unordered_map() {
    dck::unordered_map<int, int> mp;
    mp.insert(make_pair(4, 4));
    mp.insert(make_pair(1, 1));
    mp.insert(make_pair(2, 2));
    mp.insert(make_pair(3, 3));
    print(mp);
    dck::unordered_map<int, int>::iterator it = mp.begin();
    while (it != mp.end()) {
        // it->first++; // compile error: the key is const
        it->second++;
        cout << it->first << " " << it->second << endl;
        ++it;
    }
    string arr[] = { "苹果", "西瓜", "苹果", "西瓜", "苹果", "苹果", "西瓜", "苹果", "香蕉", "苹果", "香蕉" };
    dck::unordered_map<string, int> countMap;
    // Iterate by const reference: iterating by value copies every std::string.
    for (const auto& x : arr) countMap[x]++;
    // Likewise avoid copying each pair<const string, int> while printing.
    for (const auto& t : countMap) {
        cout << t.first << " " << t.second << endl;
    }
    cout << endl;
}

// Entry point: runs the set demo, then the map demo.
// Falling off the end of main is equivalent to returning 0.
int main() {
    test_unordered_set();
    test_unordered_map();
}

手写 C++ 哈希表：unordered_set/unordered_map 用法、模拟实现与性能对比

标准库用法

unordered_set

更多推荐文章

相关免费在线工具

unordered_map

模拟实现

哈希节点

封装逻辑

迭代器

哈希表提供迭代器接口

unordered_set / unordered_map 的迭代器类型

插入、查找、删除

桶统计与效率测试

完整代码

更多推荐文章

相关免费在线工具

手写 C++ 哈希表：unordered_set/unordered_map 用法、模拟实现与性能对比

标准库用法

unordered_set

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

unordered_map

模拟实现

哈希节点

封装逻辑

迭代器

哈希表提供迭代器接口

unordered_set / unordered_map 的迭代器类型

插入、查找、删除

桶统计与效率测试

完整代码

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具