哈希表

最新推荐文章于 2023-06-04 19:55:34 发布

Y-ANG

最新推荐文章于 2023-06-04 19:55:34 发布

阅读量483

点赞数

分类专栏：数据结构 Linux & 计算机网络 c++ & 数据结构文章标签：哈希表散列表开放定址法哈希表实现

本文链接：https://blog.csdn.net/qq_33951180/article/details/53227978

版权

Linux & 计算机网络同时被 3 个专栏收录

54 篇文章 9 订阅

订阅专栏

c++ & 数据结构

48 篇文章 8 订阅

订阅专栏

数据结构

24 篇文章 3 订阅

订阅专栏

哈希表，又称为散列表，是一种根据关键码（key）直接访问内存中存储位置的数据结构。它通过某一函数把关键码转换后映射到表中的一个位置来访问记录，这个函数称为散列函数，存放记录的数组称为散列表。

一、哈希表的构造

如何构造一个散列表？！请看这篇博客^-^：散列表的构造和哈希冲突

值得一提的是，构造这个表时，我们需要考虑这个位置的状态，是EMPTY，EXIST 还是DELETE？！当表中还没有元素时，我们给的默认状态是EMPTY。

二、哈希表实现Insert、Remove、Find（这篇文章我是用开放定址法处理哈希冲突）

Insert：

每插入一个数，就将该位置的状态改为EXIST，当插入的下一个数如果也映射在该位置，看到这个标志"EXIST"就知道这个位置已经被占用，就继续去探测下一个状态为"EMPTY"或"DELETE"的位置；如果插入的过程中发现已经有相同的key值，那么就直接返回

[cpp]view plaincopy 
   
 //线性探测法  
 bool Insert(const K& key,const V& value)  
 {  
     //先检测容量  
     _CheckSize();  
     //找到这个key值所在的哈希地址  
   
     size_t index = _HashFunc(key);  
     while (_table[index]._status == EXIST)  
     {  
         //表中已经有关键码key  
         if (_table[index]._key == key)  
         {  
             return false;  
         }  
         //如果这个位置的状态为EMPTY或DELET，直接可以将数据放入  
         if (_table[index]._status == EMPTY || _table[index]._status == DELETE)  
         {  
             break;  
         }  
         ++index;  
   
         //如果已经到表尾也没有将数据插入，就从表头再寻找  
         if (index == _table.size())  
         {  
             index = 0;  
         }  
     }  
   
     //index位置状态为EMPTY、DELETE  
     _table[index]._key = key;  
     _table[index]._value = value;  
     _table[index]._status = EXIST;  
     _size++;  
     return true;  
 }  

Find：

查找数据时，也是根据关键码key来寻找的：只要当前位置的状态不为"EMPTY"，就继续向后寻找；当某一位置的key符合条件时，就返回该位置的地址；如果找到表尾仍没有找到，就回到表头继续寻找。

[cpp]view plaincopy 
   
 Node* Find(const K& key)  
 {  
     //表有可能为空  
     if (_table.size() == 0)  
     {  
         return false;  
     }  
     size_t index = _HashFunc(key);  
     while (_table[index]._status != EMPTY)  
     {  
         if (_table[index]._key == key)  //index的内容就是要找的  
         {  
             return &_table[index];  
         }  
         ++index;  
   
         if (index == _table.size()) //找到表尾没有找到，就从头重新找  
         {  
             index = 0;  
         }  
     }  
 }  

Delete:

这里删除数据时我们采用的是“懒删除法”，即不真正清除数据，只把该位置的状态改为"DELETE"。由于插入数据时只关心该位置的状态是否为"EXIST"，其他状态不会对插入造成影响；就算下一次插入的位置状态是"DELETE"，直接覆盖即可。

[cpp]view plaincopy 
   
 bool Remove(const K& key)  
 {  
     for (size_t index=0; index<_table.size(); ++index)  
     {  
         if (_table[index]._key == key)  
         {  
             _table[index]._status = DELETE;  
             return true;  
         }  
     }  
     return false;  
 }  

具体代码实现：

[cpp]view plaincopy 
   
 // State of one slot in the open-addressing table.
 enum STATUS
 {
     EMPTY,   // never held an entry; ends a probe chain
     EXIST,   // holds a live key/value pair
     DELETE,  // held an entry that was lazily removed
 };

 // One slot of the table: a key/value pair plus its occupancy state.
 template<class K,class V>
 struct KVNode
 {
     K _key;
     V _value;
     STATUS _status; // occupancy state of this slot

     // Default construction is needed so that a vector of slots can be resized.
     KVNode()
         :_key()
         ,_value()
         ,_status(EMPTY)
     {}

     KVNode(const K& key,const V& value)
         :_key(key)
         ,_value(value)
         ,_status(EMPTY)
     {}
 };

 // Hash table that resolves collisions by open addressing with linear
 // probing and removes entries lazily (slots are marked DELETE).
 //
 // K must support `key % size_t` (see _HashFunc) and operator==.
 template<class K,class V>
 class HashTable
 {
     typedef KVNode<K,V> Node;
 public:
     HashTable()
         :_size(0)
     {
         _table.resize(_GetPrimer(0));
     }
     // No user-defined destructor: the vector member releases the slots itself.

     // Looks up key by following its probe chain.
     // Returns a pointer to the slot holding the key, or a null pointer when
     // the key is not stored. DELETE slots are skipped, so a removed entry is
     // never reported as found.
     Node* Find(const K& key)
     {
         const size_t capacity = _table.size();
         if (capacity == 0)
         {
             return nullptr;   // also avoids a modulo by zero in _HashFunc
         }

         size_t index = _HashFunc(key);
         // An EMPTY slot ends the chain; the probe counter bounds the search
         // to one lap around the table.
         for (size_t probes = 0;
              probes < capacity && _table[index]._status != EMPTY;
              ++probes)
         {
             if (_table[index]._status == EXIST && _table[index]._key == key)
             {
                 return &_table[index];
             }
             if (++index == capacity)
             {
                 index = 0;   // wrap around to the head of the table
             }
         }
         return nullptr;
     }

     // Lazily removes key by marking its slot DELETE.
     // Returns true if a live entry was found and marked, false otherwise.
     // _size is left unchanged: the slot still lengthens probe chains, so it
     // keeps counting towards the load factor until the next rehash.
     bool Remove(const K& key)
     {
         Node* slot = Find(key);
         if (slot == nullptr)
         {
             return false;
         }
         slot->_status = DELETE;
         return true;
     }

     // Inserts (key, value) using linear probing.
     // Returns false if the key is already stored (table unchanged), true once
     // the pair has been written. The whole probe chain is examined before a
     // slot is chosen, so a key sitting behind a DELETE slot is still detected
     // as a duplicate.
     bool Insert(const K& key,const V& value)
     {
         // Grow first so the hash address is computed against the final table.
         _CheckSize();

         const size_t capacity = _table.size();
         size_t index = _HashFunc(key);
         size_t target = capacity;   // capacity means "no reusable slot seen yet"

         for (size_t probes = 0; probes < capacity; ++probes)
         {
             if (_table[index]._status == EMPTY)
             {
                 // End of the probe chain: the key is not in the table.
                 if (target == capacity)
                 {
                     target = index;
                 }
                 break;
             }

             if (_table[index]._status == EXIST)
             {
                 if (_table[index]._key == key)
                 {
                     return false;   // key already present
                 }
             }
             else if (target == capacity)
             {
                 target = index;     // first DELETE slot: remember it for reuse
             }

             if (++index == capacity)
             {
                 index = 0;          // wrap around to the head of the table
             }
         }

         if (target == capacity)
         {
             return false;   // every slot holds a live entry; nothing can be stored
         }

         // Only a newly claimed EMPTY slot raises the load; a reused DELETE
         // slot was already counted when it was first filled.
         const bool claimsEmptySlot = (_table[target]._status == EMPTY);
         _table[target]._key = key;
         _table[target]._value = value;
         _table[target]._status = EXIST;
         if (claimsEmptySlot)
         {
             _size++;
         }
         return true;
     }

     // Prints every live entry, in slot order, to standard output.
     void Display()
     {
         for (size_t i=0; i<_table.size(); ++i)
         {
             if (_table[i]._status == EXIST)
             {
                 std::cout<<"key->"<<_table[i]._key<<" "<<"value->"<<_table[i]._value<<std::endl;
             }
         }
     }
 protected:
     // Grows the table when it is empty or the load factor reaches 0.8.
     // load factor == used slots / table length; the comparison is done in
     // integers (_size*10/length >= 8) because size_t/size_t truncates.
     void _CheckSize()
     {
         if (_table.size() != 0 && _size*10/_table.size() < 8)
         {
             return;
         }

         const size_t newSize = _GetPrimer(_table.size());
         if (newSize <= _table.size())
         {
             return;   // already at the largest size in the prime list
         }

         HashTable<K,V> bigger;
         bigger._table.resize(newSize);
         // Re-insert every live entry so its address is recomputed for the new
         // length. DELETE slots are dropped here.
         for (size_t i=0; i<_table.size(); ++i)
         {
             if (_table[i]._status == EXIST)
             {
                 bigger.Insert(_table[i]._key,_table[i]._value);
             }
         }
         _table.swap(bigger._table);
         _size = bigger._size;
     }

     // Returns the smallest prime in the list that is greater than size, or
     // the largest listed prime when none is greater. Prime lengths are used
     // to reduce collisions.
     size_t _GetPrimer(size_t size)
     {
         const size_t _PrimeSize = 28;
         static const unsigned long _PrimeList[_PrimeSize] =
         {
             53ul, 97ul, 193ul, 389ul, 769ul,
             1543ul, 3079ul, 6151ul, 12289ul, 24593ul,
             49157ul, 98317ul, 196613ul, 393241ul,
             786433ul,
             1572869ul, 3145739ul, 6291469ul, 12582917ul,
             25165843ul,
             50331653ul, 100663319ul, 201326611ul, 402653189ul,
             805306457ul,
             1610612741ul, 3221225473ul, 4294967291ul
         };
         for (size_t i=0; i<_PrimeSize; ++i)
         {
             if (_PrimeList[i] > size)
             {
                 return _PrimeList[i];
             }
         }
         return _PrimeList[_PrimeSize-1];
     }

     // Hash function: key modulo the table length. The caller must make sure
     // the table is not empty.
     size_t _HashFunc(const K& key)
     {
         return key%_table.size();
     }
 protected:
     std::vector<Node> _table;
     size_t _size;       // slots in use (EXIST or DELETE); drives the load factor
 };