当前位置：首页 > news >正文

哈希表特性与unordered_map/unordered_set实现分析

news 2025/8/15 8:36:46

目录

一、哈希表核心特性总结

1.开放地址法

2.链地址法

二、unordered_map/unordered_set实现要点分析

1. 哈希表核心实现(HashTable2.h)

(1) 哈希函数处理

(2) 链地址法实现

(3) 迭代器设计

(4) hashtable设计

2. unordered_map实现要点

3. unordered_set实现要点

一、哈希表核心特性总结

哈希表解决哈希冲突有两种常见方式：一种是闭散列（开放地址法），另一种是开散列（链地址法，也叫哈希桶）。下面我用画图的方式带大家理解这两种方法的思路。

1.开放地址法

线性探测

v

2.链地址法

二、unordered_map/unordered_set实现要点分析

1. 哈希表核心实现(HashTable2.h)

(1) 哈希函数处理

如果字符串哈希只取首字符，所有首字母相同的字符串都会发生冲突。这里改用BKDR哈希：每处理一个字符，先把当前哈希值乘以质数131，再加上该字符的值，这样字符的内容和顺序都会影响结果，分布更均匀。

/// Default hash functor: turns a key into a size_t by direct conversion.
/// Suitable for key types that can be cast to size_t (integers, enums, pointers).
template<class K>
struct DefaultHashFunc {
    /// @param key  key to hash
    /// @return     the key converted to size_t
    size_t operator()(const K& key) const {
        // C-style cast kept on purpose: unlike static_cast it also accepts pointer keys.
        return (size_t)key;
    }
};

/// Specialization for std::string using the BKDR hash.
template<>
struct DefaultHashFunc<std::string> {
    /// @param str  string to hash
    /// @return     BKDR hash of str; 0 for the empty string
    size_t operator()(const std::string& str) const {
        size_t hash = 0;
        // Iterate as unsigned char so bytes >= 0x80 are not sign-extended.
        for (unsigned char ch : str) {
            // Multiply (not add) by the seed 131 so that character order
            // affects the result; adding would make all anagrams collide.
            hash *= 131;
            hash += ch;
        }
        return hash;
    }
};

(2) 链地址法实现

/// One element of a bucket's singly linked chain.
template<class T>
struct HashNode
{
    T _data;                      // stored element
    HashNode<T>* next = nullptr;  // following node in the same chain, or nullptr at the tail

    /// Copies `data` into the node; the node starts out unlinked.
    HashNode(const T& data)
        : _data(data)
    {
    }
};

(3) 迭代器设计

//前置申明，告诉Iterator,申明了哈希表
template<class K, class T, class KeyOfT, class HashFunc >
class HashTable;template<class K, class T,class Ptr,class Ref, class KeyOfT, class HashFunc>
struct HTIterator
{typedef HashNode<T> Node; typedef HTIterator<K, T,Ptr,Ref, KeyOfT, HashFunc>  Self;//这是什么鬼？？typedef HTIterator<K, T, T*, T&, KeyOfT, HashFunc>  Iterator;Node* _node;//就是不能改*phtconst HashTable<K, T, KeyOfT, HashFunc>* _pht;//为什么需要节点的指针和哈希的指针/*HTIterator(Node * node,HashTable<K, T, KeyOfT, HashFunc>* pht):_node(node),_pht(pht){}*///这个_pht加了const的重载HTIterator(Node* node,const  HashTable<K, T, KeyOfT, HashFunc>* pht):_node(node), _pht(pht){}//普通迭代器时，它是拷贝构造//const迭代器时，它是构造HTIterator(const Iterator & it):_node(it._node), _pht(it._pht){}Ref operator*(){return _node->_data;}Ptr operator->(){return &_node->_data;}Self& operator++(){if (_node->next){//当前桶还没完_node = _node->next;}else{KeyOfT kot;HashFunc hf;size_t hashi = hf(kot(_node->_data)) % _pht->_table.size();//从下一个位置，查找不为空的桶++hashi;while (hashi < _pht->_table.size()){if (_pht->_table[hashi]){//不为空就退出_node = _pht->_table[hashi];return (*this);}else{//为空继续加 ++hashi;}}_node = nullptr;}return *this;}bool operator!=(const Self& s){return  _node != s._node;}bool operator==(const Self& s){return  _node == s._node;}
};

(4) hashtable设计

	template<class K, class T,class KeyOfT, class HashFunc = DefaultHashFunc<K>>class HashTable{typedef HashNode<T> Node;////友元声明，类模版需要把模版参数带上template<class K, class T,class Ptr,class Ref ,class KeyOfT, class HashFunc >friend struct HTIterator;		public:typedef HTIterator<K, T,T*,T&, KeyOfT, HashFunc>  iterator;typedef HTIterator<K, T,const T*,const  T&, KeyOfT, HashFunc>  const_iterator;iterator begin(){//找第一个桶for (size_t i =0 ;i < _table.size();i++){Node* cur = _table[i];if (cur){//这里为什么传this ???  航哥说这里this是哈希表的指针return iterator(cur, this);}}//没有找到return iterator(nullptr, this);}iterator end(){return iterator(nullptr,this);}const_iterator begin()const{//找第一个桶for (size_t i = 0;i < _table.size();i++){Node* cur = _table[i];if (cur){return const_iterator(cur, this);}}//没有找到return const_iterator(nullptr, this);}const_iterator end()const{return const_iterator(nullptr, this);}HashTable(){//先把size开到10,然后把剩余的位置另存为空指针_table.resize(10, nullptr);}~HashTable(){for (size_t i = 0;i < _table.size();i++){Node* cur = _table[i];while (cur){Node* next = cur->next;delete cur;//	free cur;cur = next;}//因为cur是野指针，如果不置空，那么他有可能还会指向原来的节点cur = nullptr;}}pair<iterator,bool> insert(const T& data){KeyOfT kot;HashFunc hf;iterator it = Find(kot(data));//在这里是证明有相同的内容if (it!=end()){return make_pair(it,false);}//负载因子到一就扩容if (_n == _table.size()){size_t newSize = _table.size() * 2;//创建新表HashTable<K,T,KeyOfT,HashFunc> newht;//这个需要开新节点，而且销毁也麻烦//for (size_t i = 0;i < _table.size();i++)//{//	//.......//	ht.insert();//}vector<Node*> newTable;newTable.resize(newSize, nullptr);//便利旧表，顺手牵羊，把节点签下来挂到新表for (size_t i = 0;i < _table.size();i++){Node* cur = _table[i];while (cur){Node* next = cur->next;//头插新表size_t hashi = hf(kot(cur->_data)) % newSize;cur->next = newTable[hashi];newTable[hashi] = cur;cur = next;}_table[i] = nullptr;}_table.swap(newTable);}size_t hashi = hf(kot(data)) % _table.size();//头插,这个没看懂Node* newnode = new Node(data);newnode->next = _table[hashi];_table[hashi] = newnode;++_n;return 
make_pair(iterator(newnode,this), true);}iterator Find(const K& key){HashFunc hf;KeyOfT kot;size_t hashi = hf(key) % _table.size();Node* cur = _table[hashi];while (cur){if (kot(cur->_data) == key){return iterator(cur,this);}cur = cur->next;}return iterator(nullptr,this);}void Print(){for (size_t i = 0;i < _table.size();i++){printf("[%d]->", i);Node* cur = _table[i];while (cur){cout << cur->_kv.first << "->" << cur->_kv.second << "->";cur = cur->next;}printf("NULL\n");}}bool Erase(const K& key){HashFunc hf;KeyOfT kot;size_t hashi = hf(key) % _table.size();Node* cur = _table[hashi];Node* prev = nullptr;while (cur){if (kot(cur->_data) == key){if (prev == nullptr){_table[hashi] = cur->next;}else{prev->next = cur->next;}delete cur;return true;}prev = cur;cur = cur->next;}--_n;return false;}private:vector<Node*> _table;//指针数组size_t _n = 0;};

2. unordered_map实现要点

template<class K,class V>
class  unordered_map
{struct MapKeyOfT{const K& operator()(const pair<K,V>& kv){return kv.first;}};
public:typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT>::iterator  iterator;typedef typename hash_bucket::HashTable<K, pair<const K, V>, MapKeyOfT>::const_iterator  const_iterator;pair<iterator,bool> insert(const pair<K,V>& kv){return _ht.insert(kv);}iterator begin(){return _ht.begin();}iterator end(){return _ht.end();}const_iterator begin()const{return _ht.begin();}const_iterator end()const{return _ht.end();}V& operator[](const K& key){pair<iterator,bool> ret=_ht.insert(make_pair(key,V()));return ret.first->second;}
private://这种const的特殊属性，一般是自己设置hash_bucket::HashTable<K,pair<const K,V>,MapKeyOfT >  _ht;
};

3. unordered_set实现要点

template<class K>
class unordered_set
{struct SetKeyOfT{const K & operator()(const K & key){return key;}};public:typedef	typename hash_bucket::HashTable<K,K,SetKeyOfT>::const_iterator iterator;typedef	typename hash_bucket::HashTable<K, K, SetKeyOfT>::const_iterator const_iterator;iterator begin()const
{return _ht.begin();
}iterator end()const
{return _ht.end();
}
pair<iterator,bool> insert(const K& key)
{//这样写是错的，因为这里接受的是const_iterator,返回的是iteratorpair<hash_bucket::HashTable<K, K, SetKeyOfT>::iterator, bool> ret = _ht.insert(key);return make_pair(ret.first, ret.second);
}private:hash_bucket::HashTable<K, K,SetKeyOfT>  _ht;
};

http://www.dtcms.com/a/331331.html

相关文章：

风电功率预测实战：从数据清洗到时空建模

从单机到分布式：用飞算JavaAI构建可扩展的TCP多人聊天系统

大规模分布式光伏并网后对电力系统的影响

用SQL实现对DuckDB rusty_sheet插件批量测试

前端-vue全局路由守卫的详情

地测管理部绩效考核关键指标与地质数据分析

如果未来出现了意识移植技术，如何确保移植后的意识是原本的意识而不是复制了一份

C++-setmap详解

无人机图传模块——智能飞行的关键技术

解锁AI潜能：五步写出让大模型神级指令

Cloudflare Tunnels穿透ssh

51单片机-驱动LED模块教程

【C#】Region、Exclude的用法

无需公钥的无损加密解密

深入详解C语言数组：承上启下——从C语言数组基础到数据结构衔接

码上爬第八题【协程+ob混淆】

【Java虚拟机】JVM相关面试题

2025天府杯数学建模C题

2025天府杯数学建模A题分析

智能门锁：安全与便捷的现代家居入口

第1节从函数到神经网络：AI思路的逆袭之路

Mybatis学习笔记(八)

VS2022 C++生成和调用DLL动态链接库

小杰python高级（six day）——pandas库

自由学习记录（84）

nnDetection在windows系统下使用教程

4.Ansible部署文件到主机

Torch -- 卷积学习day2 -- 卷积扩展、数据集、模型

Linux软件编程(四)多任务与多进程管理

机械硬盘模块逻辑与工作原理