哈希表

最新推荐文章于 2024-08-06 21:51:46 发布

AgilePlus

最新推荐文章于 2024-08-06 21:51:46 发布

阅读量5

点赞数

文章标签：散列表哈希算法数据结构算法

1、哈希/散列：值与值间存在映射（一种算法）

2、哈希表/散列表：值与数据存储位置建立映射（一种数据结构）

3、确定数据位置的方法：

（1）直接定址

优点：快，无哈希冲突（不同的值计算后得到相同的位置数据）

缺点：需要数据范围集中

（2）除留余数法（哈希表主流算法）

hashi = key % N（N为哈希表的大小）

缺点：存在哈希冲突

解决办法：

a、闭散列：按规则去别的位置储存

规则：#线性探测

#二次探测

b、开散列：哈希桶/拉链法

4、代码实现：

闭/开散列共用代码：

//除留余数法：
//缺点：发生哈希冲突，不同值取模后映射到同一位置
//解决：
//（1）闭散列
//（2）开散列

//并不是所有的类型均可以取模，所以我们应该实现仿函数进行整型转换来进行取模运算
//将仿函数放在类外以便两种方法一起使用
template<class K>
struct HashFunc
{
	size_t operator()(const K& key)
	{
		return (size_t)key;
	}
};
//string类型我们需要进行特化来解决不同字符串取模后具有相同的映射的问题
//特化

template<>
struct HashFunc<string>
{
	size_t operator()(const string& key)
	{
		size_t hash = 0;
		for (auto e : key)
		{
			hash *= 31;//实验表明31可以更好的区分
			hash += e;
		}

		return hash;
	}
};

闭散列：

//闭散列（按规则去其他位置储存）（线性探测）（二次探测）
//利用该位置的状态确定该值的存在与否
namespace open_address
{
	//利用枚举确定状态
	enum State
	{
		EXIST,//存在
		EMPTY,//空
		DELETE//删除
	};

	//数据
	template<class K,class V>
	struct HashData
	{
		pair<K, V>_kv;
		State _state = EMPTY;
	};

	//哈希表
	template<class K,class V,class Hash = HashFunc<K>>
	class HashTable
	{
	public:
		//构造
		HashTable()
		{
			_tables.resize(10);
		}

		//插入
		bool Insert(const pair<K, V>& kv)
		{
			Hash hs;
			//存在则插入失败
			if (Find(kv.first))
			{
				return false;
			}

			//位置不够则扩容，利用载荷因子确定是否扩容，载荷因子大概在0.7
			//方法：重新建立一个表，复调用插入建立新表后进行交换
			if (_n*10 / _tables.size() >= 7)
			{
				HashTable<K, V,Hash> newHT;
				newHT._tables.resize(_tables.size() * 2);
				for (int i = 0;i < _tables.size();i++)
				{
					//存在即插入
					if (_tables[i]._state == EXIST)
					{
						newHT.Insert(_tables[i]._kv);
					}
				}
				_tables.swap(newHT._tables);
			}

			//插入（计算位置）
			size_t hashi = hs(kv.first) % _tables.size();
			//位置有值则重新计算
			while (_tables[hashi]._state == EXIST)
			{
				hashi++;
				hashi %= _tables.size();
			}
			_tables[hashi]._kv = kv;
			_tables[hashi]._state = EXIST;
			_n++;

			return true;
		}

		//寻找
		HashData<K, V>* Find(const K& key)
		{
			Hash hs;
			size_t hashi = hs(key) % _tables.size();

			for (int i = 0;i < _tables.size();i++)
			{
				if (_tables[hashi]._state == EXIST && _tables[hashi]._kv.first == key)
				{
					return &_tables[hashi];
				}
				hashi++;
				hashi %= _tables.size();
			}
			return nullptr;
		}

		//删除
		bool Erase(const K& key)
		{
			//利用find找到后删除
			HashData<K, V>* ret = Find(key);
			if (ret == nullptr)
			{
				return false;
			}
			else
			{
				ret->_state = DELETE;
				return true;
			}
		}

	private:
		vector<HashData<K, V>> _tables;//利用数组实现哈希表
		size_t _n = 0;//储存数据个数
	};
  //测试///
	void TestHT1()
	{
		HashTable<int, int> ht;
		int a[] = { 11,21,4,14,24,15,9 };
		for (auto e : a)
		{
			ht.Insert({ e,e });
		}

		ht.Insert({ 19,19 });
		ht.Insert({ 19,190 });
		ht.Insert({ 19,1900 });
		ht.Insert({ 39,1900 });

		cout << ht.Find(24) << endl;
		ht.Erase(4);
		cout << ht.Find(24) << endl;
		cout << ht.Find(4) << endl;
	}
	struct StringHashFunc
	{
		size_t operator()(const string& s)
		{
			size_t hash = 0;
			for (auto e : s)
			{
				hash *= 31;
				hash += e;
			}

			return hash;
		}
	};
	void TestHT2()
	{
		HashTable<string, string> ht;
		ht.Insert({ "sort", "排序" });
		ht.Insert({ "left", "左边" });

		//string s1("sort");
		//string s2("sort");

		cout << StringHashFunc()("bacd") << endl;
		cout << StringHashFunc()("abcd") << endl;
		cout << StringHashFunc()("aadd") << endl;
	}

}

1.
2.
3.
4.
5.
6.
7.
8.
9.
10.
11.
12.
13.
14.
15.
16.
17.
18.
19.
20.
21.
22.
23.
24.
25.
26.
27.
28.
29.
30.
31.
32.
33.
34.
35.
36.
37.
38.
39.
40.
41.
42.
43.
44.
45.
46.
47.
48.
49.
50.
51.
52.
53.
54.
55.
56.
57.
58.
59.
60.
61.
62.
63.
64.
65.
66.
67.
68.
69.
70.
71.
72.
73.
74.
75.
76.
77.
78.
79.
80.
81.
82.
83.
84.
85.
86.
87.
88.
89.
90.
91.
92.
93.
94.
95.
96.
97.
98.
99.
100.
101.
102.
103.
104.
105.
106.
107.
108.
109.
110.
111.
112.
113.
114.
115.
116.
117.
118.
119.
120.
121.
122.
123.
124.
125.
126.
127.
128.
129.
130.
131.
132.
133.
134.
135.
136.
137.
138.
139.
140.
141.
142.
143.
144.
145.
146.
147.
148.
149.
150.
151.
152.
153.
154.
155.
156.
157.
158.
159.
160.

开散列：

//开散列：哈希桶/拉链法
//利用指针数组进行链接

namespace hash_bucket
{
	template<class K,class V>
	struct HashNode
	{
		pair<K, V>_kv;
		HashNode<K, V>* _next;

		HashNode(const pair<K, V>& kv)
			:_kv(kv)
			, _next(nullptr)
		{}
	};

	template<class K, class V, class Hash = HashFunc<K>>
	class HashTable
	{
		typedef HashNode<K, V> Node;
	public:
		HashTable()
		{
			_tables.resize(10, nullptr);
		}

		~HashTable()
		{
			//依次释放每个桶
			for (int i = 0;i < _tables.size();i++)
			{
				Node* cur = _tables[i];
				while (cur)
				{
					Node* next = cur->_next;
					delete cur;
					cur = next;
				}
				//全部释放完后指针数组节点置为空
				_tables[i] = nullptr;
			}
		}

		bool Insert(const pair<K, V>& kv)
		{
			if (Find(kv.first))
			{
				return false;
			}
			Hash hs;
			size_t hashi = hs(kv.first) % _tables.size();
			//载荷因子为一时扩容
			if (_n == _tables.size())//(_n * 10 / _tables.size() >= 1)
			{
				/*HashTable<K, V> newHT;
				newHT._tables.resize(_tables.size() * 2);
				for (size_t i = 0; i < _tables.size(); i++)
				{
					Node* cur = _tables[i];
					while(cur)
					{
						newHT.Insert(cur->_kv);
						cur = cur->_next;
					}
				}

				_tables.swap(newHT._tables);*/
				//新开一个数组
				vector<Node*> newtables(_tables.size() * 2, nullptr);
				for (size_t i = 0; i < _tables.size(); i++)
				{
					//从i节点开始找链接
					Node* cur = _tables[i];
					//链接存在
					while (cur)
					{
						Node* next = cur->_next;
						size_t hashi = hs(cur->_kv.first) % newtables.size();
						
						cur->_next = newtables[hashi];
						newtables[hashi] = cur;
						cur = next;
						
					}
					_tables[i] = nullptr;
				}

				_tables.swap(newtables);
			}
			//头插
			Node* newnode = new Node(kv);
			newnode->_next = _tables[hashi];
			_tables[hashi] = newnode;
			++_n;
			return true;
		}

		Node* Find(const K& key)
		{
			Hash hs;
			size_t hashi = hs(key) % _tables.size();
			Node* cur = _tables[hashi];
			while (cur)
			{
				if (cur->_kv.first == key)
				{
					return cur;
				}

				cur = cur->_next;
			}

			return nullptr;
		}

		bool Erase(const K& key)
		{
			Hash hs;
			size_t hashi = hs(key) % _tables.size();
			Node* cur = _tables[hashi];
			Node* prev = nullptr;
			while (cur)
			{
				if (cur->_kv.first == key)
				{
					if (prev == nullptr)
					{
						_tables[hashi] = cur->_next;
					}
					else
					{
						prev->_next = cur->_next;
					}
					delete cur;
					--_n;
					return true;
				}
				prev = cur;
				cur = cur->_next;
			}
			return false;
		}

	private:
		vector<Node*>_tables;
		size_t _n = 0;
	};
  /测试//
	void TestHT1()
	{
		HashTable<int, int> ht;
		int a[] = { 11,21,4,14,24,15,9,19,29,39 };
		for (auto e : a)
		{
			ht.Insert({ e,e });
		}

		ht.Insert({ -6, 6 });

		for (auto e : a)
		{
			ht.Erase(e);
		}
	}

	void TestHT2()
	{
		HashTable<string, string> ht;
		ht.Insert({ "sort", "排序" });
		ht.Insert({ "left", "左边" });
	}
}

1.
2.
3.
4.
5.
6.
7.
8.
9.
10.
11.
12.
13.
14.
15.
16.
17.
18.
19.
20.
21.
22.
23.
24.
25.
26.
27.
28.
29.
30.
31.
32.
33.
34.
35.
36.
37.
38.
39.
40.
41.
42.
43.
44.
45.
46.
47.
48.
49.
50.
51.
52.
53.
54.
55.
56.
57.
58.
59.
60.
61.
62.
63.
64.
65.
66.
67.
68.
69.
70.
71.
72.
73.
74.
75.
76.
77.
78.
79.
80.
81.
82.
83.
84.
85.
86.
87.
88.
89.
90.
91.
92.
93.
94.
95.
96.
97.
98.
99.
100.
101.
102.
103.
104.
105.
106.
107.
108.
109.
110.
111.
112.
113.
114.
115.
116.
117.
118.
119.
120.
121.
122.
123.
124.
125.
126.
127.
128.
129.
130.
131.
132.
133.
134.
135.
136.
137.
138.
139.
140.
141.
142.
143.
144.
145.
146.
147.
148.
149.
150.
151.
152.
153.
154.
155.
156.
157.
158.
159.
160.
161.
162.
163.
164.
165.
166.
167.
168.
169.
170.
171.
172.
173.

原创作者: u_16298007 转载于: https://blog.51cto.com/u_16298007/11666880

AgilePlus

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
哈希表

1、哈希/散列：值与值间存在映射（一种算法）2、哈希表/散列表：值与数据存储位置建立映射（一种数据结构）3、确定数据位置的方法：（1）直接定址优点：快，无哈希冲突（不同的值计算后得到相同的位置数据）缺点：需要数据范围集中（2）除留余数法（哈希表主流算法）hashi = key % N（N为哈希表的大小）缺点：存在哈希冲突解...
复制链接

扫一扫