C++ 哈希表全家桶：unordered_map/set 底层实现与位图布隆过滤器

深入讲解 C++ 中基于哈希表的容器实现原理。涵盖哈希冲突解决方案（闭散列线性探测、开散列链地址法），详细模拟实现 unordered_map 和 unordered_set 底层结构。介绍位图（BitMap）在大数据统计中的应用及内存优化，阐述布隆过滤器（Bloom Filter）的存在性判断机制及其无法删除的特性。最后探讨哈希切割技术在海量数据交集查找中的精确与近似算法方案，并结合力扣例题巩固知识点。

活在当下 发布于 2026/2/8 · 更新于 2026/4/18 · 4.1K 浏览

unordered 系列关联式容器

有 unordered_map, unordered_set, unordered_multimap, unordered_multiset

这些是用哈希表实现的，用法跟 set 几乎相同，接口都差不多。

它们可以用范围 for 去遍历。

跟 set 那些的区别:

unordered 系列的容器的迭代器是单向迭代器。

unordered 系列遍历出来的结果不是有序的（而 set/map 按中序遍历得到的是有序序列）。

unordered 系列的容器的性能比 set 等稍微好些；但是升序或降序的数据插入的话，set 好些。

引申：比较性能要在 release 模式下比较。

哈希

哈希也叫做散列，是存储的值跟存储位置建立出的一个对应关系，跟计数排序很像。

自己模拟实现的哈希不要存同一个 key 进去！

哈希是以牺牲空间为代价，提高查询的效率。

建立对应关系的时候有两个常用的方法:

直接定址法 (值分布范围集中的时候用这个)

比如：统计字符串中字符出现的次数，可以把字符跟下标一一对应。

除留余数法 (适用于值分布范围分散的)

例如：值 % n，把这个东西放在对应下标下面。

哈希冲突

其实就是不同的值映射到了相同的位置上，这个位置存不下了。

解决哈希冲突的方案:

闭散列 – 也叫做开放定址法

做法：当前位置被占用了，按规则去找下一个位置存着。

其中又分为 1. 线性探测 2. 二次探测 …

开散列 – 也叫做链地址法 – 自己一般叫哈希桶

闭散列的模拟实现

这里的话个人搭配的是除留余数法加上线性探测。

二次探测的方法跟线性探测的区别就是:

线性探测是这个位置满了去下一个位置找 (也就是下标加 i 去找)。

二次探测是这个位置满了，下标加上 i^2 去找，比如：本来应该在 0 下标，但是满了，去 1, 4, 9 这样。

// Slot states for the open-addressing (closed hashing) table.
// DELETE is a tombstone: the slot may be reused by Insert, but lookups must
// keep probing past it so keys stored further along the probe sequence stay
// reachable.
enum State { EXIST, EMPTY, DELETE };

// One slot of the table: the stored key/value pair plus the slot's state.
template<class K, class V>
struct HashData {
    std::pair<K, V> _kv;
    State _state = EMPTY;
};

// Default hash functor: converts the key straight to size_t, so it only suits
// key types that are convertible to an integer.
template<class K>
struct DefaultHashFunc {
    std::size_t operator()(const K& key) const {
        return static_cast<std::size_t>(key);
    }
};

// Hash table using closed hashing: division hashing (hash % table size) plus
// linear probing to resolve collisions.
//   K        - key type
//   V        - mapped value type
//   HashFunc - functor mapping a key to size_t
template<class K, class V, class HashFunc = DefaultHashFunc<K>>
class HashTable {
public:
    // Starts with 10 EMPTY slots so the modulo in Insert/Find is never by zero.
    HashTable() {
        _table.resize(10);
    }

    // Inserts kv. Returns false (table unchanged) when the key is already
    // stored, true otherwise.
    bool Insert(const std::pair<K, V>& kv) {
        if (Find(kv.first)) {
            return false;
        }

        // Grow once the load factor reaches 0.7; integer arithmetic avoids
        // floating point. Rehashing into a fresh table also drops tombstones.
        if (_n * 10 / _table.size() >= 7) {
            std::size_t newSize = _table.size() * 2;
            HashTable<K, V, HashFunc> newHT;
            newHT._table.resize(newSize);

            for (std::size_t i = 0; i < _table.size(); i++) {
                if (_table[i]._state == EXIST) {
                    newHT.Insert(_table[i]._kv);
                }
            }
            // Only the storage is exchanged; the element count is the same.
            _table.swap(newHT._table);
        }

        // Linear probing: walk forward (wrapping around) to the first slot
        // that is not EXIST. The load-factor cap guarantees one exists.
        HashFunc hf;
        std::size_t hashi = hf(kv.first) % _table.size();
        while (_table[hashi]._state == EXIST) {
            ++hashi;
            hashi %= _table.size();
        }
        _table[hashi]._kv = kv;
        _table[hashi]._state = EXIST;
        ++_n;
        return true;
    }

    // Returns a pointer to the slot holding key, or nullptr when absent.
    // Callers must not change _kv.first through the returned pointer, since
    // the slot position depends on it.
    HashData<K, V>* Find(const K& key) {
        HashFunc hf;
        std::size_t hashi = hf(key) % _table.size();
        // The probe count is capped at the table size: when every slot is
        // EXIST or DELETE there is no EMPTY slot to stop on, and an unbounded
        // loop would never terminate for a missing key.
        for (std::size_t probes = 0; probes < _table.size(); ++probes) {
            HashData<K, V>& slot = _table[hashi];
            if (slot._state == EMPTY) {
                break;
            }
            if (slot._state == EXIST && slot._kv.first == key) {
                return &slot;
            }
            ++hashi;
            hashi %= _table.size();
        }
        return nullptr;
    }

    // Removes key by marking its slot as a tombstone. Returns true when the
    // key was present, false otherwise.
    bool Erase(const K& key) {
        HashData<K, V>* ret = Find(key);
        if (ret) {
            ret->_state = DELETE;
            --_n;
            return true;
        }
        return false;
    }

private:
    std::vector<HashData<K, V>> _table;
    std::size_t _n = 0;  // number of EXIST slots
};

相关免费在线工具

加密/解密文本

使用加密算法（如AES、TripleDES、Rabbit或RC4）加密和解密文本明文。在线工具，加密/解密文本在线工具，online

Base64 字符串编码/解码

将字符串编码和解码为其 Base64 格式表示形式即可。在线工具，Base64 字符串编码/解码在线工具，online

Base64 文件转换器

将字符串、文件或图像转换为其 Base64 表示形式。在线工具，Base64 文件转换器在线工具，online

Markdown转HTML

将 Markdown（GFM）转为 HTML 片段，浏览器内 marked 解析；与 HTML转Markdown 互为补充。在线工具，Markdown转HTML在线工具，online

HTML转Markdown

将 HTML 片段转为 GitHub Flavored Markdown，支持标题、列表、链接、代码块与表格等；浏览器内处理，可链接预填。在线工具，HTML转Markdown在线工具，online

JSON 压缩

通过删除不必要的空白来缩小和压缩JSON。在线工具，JSON 压缩在线工具，online

template<class K, class T, class KeyOfT, class HashFunc = DefaultHashFunc<K>> class HashTable { struct HashNode { T _data; HashNode* _next; HashNode(const T& data) : _data(data), _next(nullptr) {} }; typedef HashNode<T> Node; template<class K, class T, class Ptr, class Ref, class KeyOfT, class HashFunc> friend struct HTIterator; public: typedef HTIterator<K, T, T*, T&, KeyOfT, HashFunc> iterator; typedef HTIterator<K, T, const T*, const T&, KeyOfT, HashFunc> const_iterator; iterator begin() { for (size_t i = 0; i < _table.size(); i++) { Node* cur = _table[i]; if (cur) return iterator(cur, this); } return iterator(nullptr, this); } iterator end() { return iterator(nullptr, this); } const_iterator begin() const { for (size_t i = 0; i < _table.size(); i++) { Node* cur = _table[i]; if (cur) return const_iterator(cur, this); } return const_iterator(nullptr, this); } const_iterator end() const { return const_iterator(nullptr, this); } HashTable() { _table.resize(10, nullptr); } ~HashTable() { for (size_t i = 0; i < _table.size(); i++) { Node* cur = _table[i]; while (cur) { Node* next = cur->_next; delete cur; cur = next; } _table[i] = nullptr; } } bool Insert(const T& data) { KeyOfT kot; iterator it = Find(kot(data)); if (it != end()) { return make_pair(it, false); } HashFunc hf; // 负载因子到 1 就扩容 if (_n == _table.size()) { size_t newSize = _table.size() * 2; vector<Node*> newTable; newTable.resize(newSize, nullptr); // 遍历旧表，把节点牵下来挂到新表 for (size_t i = 0; i < _table.size(); i++) { Node* cur = _table[i]; while (cur) { Node* next = cur->_next; size_t hashi = hf(kot(cur->_data)) % newSize; cur->_next = newTable[hashi]; newTable[hashi] = cur; cur = next; } _table[i] = nullptr; } _table.swap(newTable); } size_t hashi = hf(kot(data)) % _table.size(); // 头插 Node* newnode = new Node(data); newnode->_next = _table[hashi]; _table[hashi] = newnode; ++_n; return make_pair(iterator(newnode, this), true); } Node* Find(const K& key) { HashFunc hf; KeyOfT kot; size_t hashi = hf(key) % 
_table.size(); Node* cur = _table[hashi]; while (cur) { if (kot(cur->_data) == key) { return cur; } cur = cur->_next; } return nullptr; } bool Erase(const K& key) { HashFunc hf; KeyOfT kot; size_t hashi = hf(key) % _table.size(); Node* prev = nullptr; Node* cur = _table[hashi]; while (cur) { if (kot(cur->_data) == key) { if (prev == nullptr) { _table[hashi] = cur->_next; } else { prev->_next = cur->_next; } --_n; delete cur; return true; } prev = cur; cur = cur->_next; } return false; } private: vector<Node*> _table; size_t _n = 0; };

C++ 哈希表全家桶：unordered_map/set 底层实现与位图布隆过滤器

unordered 系列关联式容器

哈希

哈希冲突

闭散列的模拟实现

更多推荐文章

相关免费在线工具

开散列的模拟实现

哈希桶里面迭代器的模拟实现

unordered_set 的封装

unordered_map 的封装

位图

应用

布隆过滤器

布隆过滤器的模拟实现

哈希切割

哈希切割的应用

练习题

C++ 哈希表全家桶：unordered_map/set 底层实现与位图布隆过滤器

unordered 系列关联式容器

哈希

哈希冲突

闭散列的模拟实现

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

开散列的模拟实现

哈希桶里面迭代器的模拟实现

unordered_set 的封装

unordered_map 的封装

位图

应用

布隆过滤器

布隆过滤器的模拟实现

哈希切割

哈希切割的应用

练习题