【C++】Unordered_map/Unordered_set使用哈希表封装

原创已于 2025-06-03 16:17:48 修改

· 705 阅读

20 ·

版权

文章标签：

#c++ #散列表 #开发语言 #哈希表

于 2024-12-08 20:05:41 首次发布

C++的学习历程专栏收录该内容

17 篇文章

订阅专栏

3.2 解决取key/pair.first问题

3.3 解决类型转换的问题

3.4 实现迭代器Iterator/const_Iterator

4.2 Myunordered_map.h

4.3 Myunordered_set.h

1. 整体学习的思维导图

2. 链地址法哈希表

本次的封装实现基于上次实现完成的链地址法的哈希表，以下是该哈希表实现的整体代码，具体分析参考哈希表那章。

namespace Hashbucket
{
    /// Node of the singly linked list that hangs off one bucket.
    template<class K, class V>
    struct HashNode
    {
        std::pair<K, V> _kv;     // stored key/value pair
        HashNode<K, V>* _next;   // next node in the same bucket, nullptr at the tail

        HashNode(const std::pair<K, V>& kv)
            : _kv(kv)
            , _next(nullptr)
        {}
    };

    /// Hash table that resolves collisions by chaining nodes per bucket.
    ///
    /// The bucket index is computed as `key % _tables.size()`, so K must
    /// support `%` against a size_t. The table owns every node it links
    /// and deletes them on destruction.
    template<class K, class V>
    class HashTable
    {
        typedef HashNode<K, V> Node;
    public:

        /// Creates an empty table with 11 buckets.
        HashTable()
            : _tables(11)
            , _n(0)
        {}

        /// Deletes every node owned by the table.
        ~HashTable()
        {
            Clear();
        }

        /// Deep copy: allocates the same number of buckets as HT and
        /// re-inserts a copy of every element.
        HashTable(const HashTable& HT)
            : _tables(HT._tables.size())
            , _n(0)
        {
            CopyFrom(HT);
        }

        /// Replaces the contents with a deep copy of HT.
        HashTable& operator=(const HashTable& HT)
        {
            if (this != &HT)
            {
                // Clear() also resets _n; leaving the old count in place
                // would make the size wrong after the re-insertion below.
                Clear();
                CopyFrom(HT);
            }
            return *this;
        }

        /// Inserts kv unless its key is already present.
        /// @return true if a node was added, false if the key already existed.
        bool Insert(const std::pair<K, V>& kv)
        {
            if (Find(kv.first))
                return false;

            // Grow once there is one element per bucket on average.
            if (_n == _tables.size())
            {
                // Relink the existing nodes into a table twice as large
                // instead of allocating new nodes (the alternative would be
                // to build a second HashTable and Insert every element).
                std::vector<Node*> newtables(_tables.size() * 2);
                for (size_t i = 0; i < _tables.size(); i++)
                {
                    Node* cur = _tables[i];
                    while (cur)
                    {
                        Node* next = cur->_next;
                        // The new bucket depends on the key of the node being
                        // moved, not on the key currently being inserted.
                        size_t hashi = cur->_kv.first % newtables.size();
                        cur->_next = newtables[hashi];
                        newtables[hashi] = cur;
                        cur = next;
                    }
                    _tables[i] = nullptr;
                }
                _tables.swap(newtables);
            }

            // Must be computed after a possible growth: the bucket count changed.
            size_t hashi = kv.first % _tables.size();
            Node* newnode = new Node(kv);
            // Push at the head of the bucket's list.
            newnode->_next = _tables[hashi];
            _tables[hashi] = newnode;
            ++_n;
            return true;
        }

        /// Looks up key.
        /// @return pointer to the matching node, or nullptr if absent.
        Node* Find(const K& key)
        {
            size_t hashi = key % _tables.size();
            Node* cur = _tables[hashi];
            while (cur)
            {
                if (cur->_kv.first == key)
                    return cur;
                cur = cur->_next;
            }
            return nullptr;
        }

        /// Removes the element with the given key.
        /// @return true if an element was removed, false if the key was absent.
        bool Erase(const K& key)
        {
            size_t hashi = key % _tables.size();
            Node* prev = nullptr;
            Node* cur = _tables[hashi];
            while (cur)
            {
                if (cur->_kv.first == key)
                {
                    if (prev == nullptr)
                    {
                        // Removing the head: the bucket now starts at the successor.
                        _tables[hashi] = cur->_next;
                    }
                    else
                    {
                        prev->_next = cur->_next;
                    }
                    delete cur;
                    --_n;
                    return true;
                }
                prev = cur;
                cur = cur->_next;
            }
            return false;
        }

    private:
        /// Deletes every node, empties every bucket and resets the count.
        /// The number of buckets is left unchanged.
        void Clear()
        {
            for (size_t i = 0; i < _tables.size(); i++)
            {
                Node* cur = _tables[i];
                while (cur)
                {
                    Node* next = cur->_next;
                    delete cur;
                    cur = next;
                }
                _tables[i] = nullptr;
            }
            _n = 0;
        }

        /// Inserts a copy of every element of HT into this table.
        void CopyFrom(const HashTable& HT)
        {
            for (size_t i = 0; i < HT._tables.size(); i++)
            {
                for (Node* cur = HT._tables[i]; cur; cur = cur->_next)
                {
                    Insert(cur->_kv);
                }
            }
        }

        std::vector<Node*> _tables;   // bucket heads
        size_t _n = 0;                // number of stored elements
    };

}

3. 封装实现

3.1 解决key/pair问题

由于unordered_set和unordered_map所需要的参数分别为key和pair，所以我们要让底层的哈希表同时支持两者，我们要将模版参数中的数据类型参数改为T。

// Bucket list node holding one element of type T (a bare key for the set
// wrapper, a key/value pair for the map wrapper).
template<class T>
struct HashNode
{
        T _data;                          // stored element
        HashNode<T>* _next = nullptr;     // successor in the same bucket

        // Copies `data` into the node; the node starts unlinked.
        HashNode(const T& data) : _data(data) {}
};

// Hash table skeleton after generalizing the stored element type.
// K is the key type used for lookup and removal; T is the element type held
// by each node (see the Insert/Find/Erase signatures below).
template<class K, class T>
class HashTable
{
        // ... (other members omitted in this excerpt)
        typedef HashNode<T> Node;
        // Inserts one element of the stored type T.
        bool Insert(const T& data);
        // Looks an element up by key; returns a node pointer.
        Node* Find(const K& key);
        // Removes an element by key.
        bool Erase(const K& key);
        // ... (other members omitted in this excerpt)
 };

3.2 解决取key/pair.first问题

由于我们需要使用key来计算哈希表的映射位置，但是unordered_set/unordered_map使用的数据类型不同，需要根据不同情况取出key，我们需要再传一个仿函数GetOfKey来解决这个问题。

// Map wrapper: stores pair<K, V> elements in the underlying HashTable and
// tells it how to reach the key through the `getofkey` functor.
template<class K, class V>
class Myunordered_map
{
public:
        // Key extractor handed to HashTable: the key of a map element is the
        // first member of the stored pair.
        struct getofkey
        {
                // const-qualified so the extractor can also be invoked through
                // a const functor object; it has no state to modify.
                const K& operator()(const std::pair<K, V>& kv) const
                {
                        return kv.first;
                }
        };

        // Forwards the insertion to the hash table and returns its result.
        bool Insert(const std::pair<K, V>& kv)
        {
                return _tb.Insert(kv);
        }

private:
        HashTable<K, std::pair<K, V>, getofkey> _tb;   // underlying storage
};

// Set wrapper: stores bare keys in the underlying HashTable and tells it how
// to reach the key through the `getofkey` functor.
template<class K>
class Myunordered_set
{
public:
        // Key extractor handed to HashTable: a set element is its own key.
        struct getofkey
        {
                // const-qualified so the extractor can also be invoked through
                // a const functor object; it has no state to modify.
                const K& operator()(const K& key) const
                {
                        return key;
                }
        };

        // Forwards the insertion to the hash table and returns its result.
        bool Insert(const K& key)
        {
                return _tb.Insert(key);
        }

private:
        HashTable<K, K, getofkey> _tb;   // underlying storage
};

3.3 解决类型转换的问题

以上的哈希表存储正整数没有问题，但是遇到负数、字符串等类型的key时，需要先做特殊处理才可以映射。因此我们需要再传入一个仿函数模板参数ChangeOfType，用于把key转换为无符号整数（size_t）；该模板参数在取模计算hashi时使用。

// Example: string keys cannot be fed to `%` directly, which is what motivates
// the key-conversion functor introduced next.
vector<string> words = { "Hello", "string", "left", "right" };
ouyang::Myunordered_set<string> wordSet;
for (const string& word : words)
{
        wordSet.Insert(word);
}

// Default key-to-integer functor: converts the key to size_t with an
// explicit cast. The result is what the table reduces modulo its bucket count.
template<class K>
struct changeoftype
{
        // const-qualified: the functor is stateless and must be usable
        // through a const object.
        size_t operator()(const K& key) const
        {
                // C-style cast kept on purpose so that any key type the
                // original accepted (anything explicitly convertible to
                // size_t) still compiles.
                return (size_t)key;
        }
};

// Specialization for std::string: folds every character into the result,
// multiplying by 131 after each addition so that character order matters.
template<>
struct changeoftype<std::string>
{
        size_t operator()(const std::string& s) const
        {
                size_t key = 0;
                for (auto ch : s)
                {
                        key += ch;
                        key *= 131;
                }
                return key;
        }
};

把该模版参数传参位置设定在外壳部分->unordered_set/unordered_map，方便后续自定义类型设计仿函数进行类型转换。

// Map wrapper with the key-conversion functor exposed as a template
// parameter. ChangeOfType defaults to changeoftype<K>; callers with a custom
// key type can supply their own functor type instead.
template<class K, class V, class ChangeOfType = changeoftype<K>>
class Myunordered_map
{
public:
// ... (members omitted in this excerpt)
};

// Set wrapper with the key-conversion functor exposed as a template
// parameter. ChangeOfType defaults to changeoftype<K>; callers with a custom
// key type can supply their own functor type instead.
template<class K, class ChangeOfType = changeoftype<K>>
class Myunordered_set
{
public:
// ... (members omitted in this excerpt)
};

// Hash table object.
// Template parameters: K is the key type, T the stored element type,
// GetOfKey the functor type that extracts the key from an element, and
// ChangeOfType the functor type that converts a key to an integer.
template<class K, class T, class GetOfKey, class ChangeOfType>
class HashTable
{
// ... (members omitted in this excerpt)
};

3.4 实现迭代器Iterator/const_Iterator

3.4.1 分析迭代器的++

情况一：当前链表没有走到空，继续往下走

情况二：当前链表走到了空，继续找寻下一个挂着链表的哈希映射位
- 【1】找到哈希映射位继续重复情况一
- 【2】一直找到末尾_tables.size()都没有挂着链表的哈希映射位，则遍历结束（迭代器置为end()）

这个过程中我们需要当前的节点_node和整个哈希表的大小。

// Forward iterator over all elements of a chained HashTable.
//
// Ref / Ptr select the reference and pointer types returned by operator* and
// operator->, so one template serves both the mutable and the const iterator.
// The iterator keeps the current node plus a pointer to the owning table,
// which it needs to find the next non-empty bucket. A null node represents
// end().
template<class K, class T, class Ref, class Ptr, class GetOfKey, class changeoftype>
struct HashIterator
{
        typedef HashNode<T> Node;
        typedef HashIterator<K, T, Ref, Ptr, GetOfKey, changeoftype> Self;

        Node* _node;                                           // current element, nullptr == end()
        const HashTable<K, T, GetOfKey, changeoftype>* _HT;    // table being traversed

        HashIterator(Node* node, const HashTable<K, T, GetOfKey, changeoftype>* HT)
                :_node(node)
                , _HT(HT)
        {}

        // Returns the element stored in the current node.
        Ref operator*() const
        {
                return _node->_data;
        }

        // Returns the address of the element stored in the current node.
        Ptr operator->() const
        {
                return &_node->_data;
        }

        // Two iterators are equal when they designate the same node.
        bool operator!=(const Self& s) const
        {
                return _node != s._node;
        }

        bool operator==(const Self& s) const
        {
                return _node == s._node;
        }

        // Advances to the next element and returns *this.
        // Precondition: the iterator is not end() (_node is dereferenced).
        Self& operator++()
        {
                if (_node->_next)
                {
                        // More nodes in the current bucket: step to the next one.
                        // (The assignment is essential; evaluating _node->_next
                        // alone would leave the iterator where it was.)
                        _node = _node->_next;
                }
                else
                {
                        // Current bucket exhausted: scan forward for the next
                        // bucket that holds at least one node.
                        GetOfKey gok;
                        changeoftype cot;
                        const size_t bucketCount = _HT->_tables.size();
                        size_t hashi = cot(gok(_node->_data)) % bucketCount;
                        ++hashi;

                        while (hashi < bucketCount && !_HT->_tables[hashi])
                        {
                                ++hashi;
                        }

                        // Ran past the last bucket -> end(); otherwise continue
                        // at the head of the bucket that was found.
                        _node = (hashi == bucketCount) ? nullptr : _HT->_tables[hashi];
                }
                return *this;
        }

};

并且我们需要在HashTable中声明友元，因为HashIterator在operator++中访问了HashTable的私有成员_tables。

// Friend declaration (placed inside HashTable): HashTable and HashIterator
// depend on each other, and the iterator reads the table's private _tables
// member when it advances, so the table must grant it access.
template<class K, class T, class Ref, class Ptr, class GetOfKey, class changeoftype>
friend struct HashIterator;