C++ 哈希表原理及开放寻址与链地址法实现

C++ 哈希表原理及开放寻址与链地址法实现 | 极客日志

// Occupancy marker for one slot of the open-addressing table.
// Enumerator order is unchanged: EXIST == 0, EMPTY == 1, DELETE == 2.
enum state {
    EXIST,   // slot holds a live key/value pair
    EMPTY,   // default state of a slot; a lookup stops probing here
    DELETE   // neither EXIST nor EMPTY: lookups probe past it (presumably left behind by an erase)
};

// One slot of the open-addressing table: the stored pair plus its occupancy marker.
template <typename K, typename V>
struct hashdata {
    std::pair<K, V> _kv;   // payload stored in this slot
    state _state{EMPTY};   // every slot starts out EMPTY
};

// Skeleton of the open-addressing hash table: a slot array plus an element counter.
template <typename K, typename V>
class hash {
public:
    // Starts with 23 default-constructed slots and a count of zero.
    hash()
        : _tables(23)
        , _n(0)
    {}

private:
    std::vector<hashdata<K, V>> _tables;  // slot storage, indexed by probe position
    size_t _n;                            // number of stored elements
};

// Stores kv in the first slot that is not EXIST, probing linearly from
// kv.first % table size and wrapping around the end of the table.
//
// Returns true once the pair has been stored. Returns false when the table has
// no slots or every slot is already EXIST; an unbounded probe loop would never
// terminate in that situation.
//
// Note: this routine does not check whether the key is already present.
bool insert(const std::pair<K,V>& kv) {
    const size_t capacity = _tables.size();
    if (capacity == 0) {
        return false;  // nothing to probe, and the modulo below would divide by zero
    }

    const size_t hash0 = kv.first % capacity;
    // At most `capacity` probes: after that every slot has been visited once.
    for (size_t i = 0; i < capacity; ++i) {
        const size_t hashi = (hash0 + i) % capacity;
        if (_tables[hashi]._state != EXIST) {
            _tables[hashi]._kv = kv;
            _tables[hashi]._state = EXIST;
            ++_n;
            return true;
        }
    }
    return false;
}

// Growth step: once the load factor (as an integer percentage) reaches 70,
// build a table with twice as many slots, re-insert every live entry into it,
// then adopt its slot array. Only the slot arrays are swapped, so this
// object's own _n is left untouched.
if (_n * 100 / _tables.size() >= 70) {
    hash<K, V> newhash;
    newhash._tables.resize(_tables.size() * 2);
    for (size_t idx = 0; idx < _tables.size(); ++idx) {
        if (_tables[idx]._state != EXIST) {
            continue;  // only live entries are carried over
        }
        newhash.insert(_tables[idx]._kv);
    }
    _tables.swap(newhash._tables);
}

// Size the new table with prim(): the first prime in its list that is >= the
// current size + 1 (prim falls back to the largest listed prime otherwise).
newhash._tables.resize(prim(_tables.size()+1));

// Returns the smallest prime in the built-in table that is >= s.
// When s is larger than every listed prime, the largest listed prime is returned.
inline size_t prim(size_t s) {
    static const size_t kPrimes[] = {
        53, 97, 193, 389, 769, 1543, 3079, 6151, 12289, 24593,
        49157, 98317, 196613, 393241, 786433, 1572869, 3145739,
        6291469, 12582917, 25165843, 50331653, 100663319, 201326611,
        402653189, 805306457, 1610612741, 3221225473, 4294967291
    };
    const size_t kCount = sizeof(kPrimes) / sizeof(kPrimes[0]);

    // Lower-bound search over the window [first, first + span).
    size_t first = 0;
    size_t span = kCount;
    while (span > 0) {
        const size_t half = span / 2;
        if (kPrimes[first + half] < s) {
            // Everything up to and including the probe is too small.
            first += half + 1;
            span -= half + 1;
        } else {
            span = half;
        }
    }

    return first == kCount ? kPrimes[kCount - 1] : kPrimes[first];
}

// Looks up `key` by linear probing from key % table size.
//
// Returns a pointer to the slot holding the key, or nullptr when the key is
// absent. Probing stops at the first EMPTY slot; DELETE slots are skipped so
// that entries stored beyond them stay reachable.
//
// The probe count is capped at the table size: if no slot is EMPTY (every slot
// is EXIST or DELETE), an uncapped loop would spin forever on a missing key.
hashdata<K, V>* Find(const K& key) {
    const size_t capacity = _tables.size();
    if (capacity == 0) {
        return nullptr;  // nothing stored, and the modulo below would divide by zero
    }

    const size_t hash0 = key % capacity;
    for (size_t i = 0; i < capacity; ++i) {
        hashdata<K, V>& slot = _tables[(hash0 + i) % capacity];
        if (slot._state == EMPTY) {
            break;  // the probe chain ends here
        }
        if (slot._state == EXIST && slot._kv.first == key) {
            return &slot;
        }
    }
    return nullptr;
}

// Default hash functor: converts the key itself to size_t.
// operator() is const so the functor can be invoked through const objects
// and const references.
template<class K> struct hashfunc {
    size_t operator()(const K& key) const {
        // C-style cast kept deliberately: unlike static_cast it also accepts
        // pointer keys, so no key type that worked before stops compiling.
        return (size_t)key;
    }
};

// Specialization for std::string: folds every character into the running
// value (add the character, then multiply by 131). An empty string hashes to 0.
template<> struct hashfunc<std::string> {
    size_t operator()(const std::string& str) const {
        size_t hash = 0;
        for (const char ch : str) {
            hash += ch;
            hash *= 131;
        }
        return hash;
    }
};

// Simple calendar date used as an example of a user-defined key type.
struct date {
    int _year;
    int _month;
    int _day;

    // Every component defaults to 1.
    date(int year = 1, int month = 1, int day = 1)
        : _year(year)
        , _month(month)
        , _day(day)
    {}

    // Field-wise equality. Const-qualified so that const dates (for example
    // keys reached through a const reference) can be compared.
    bool operator==(const date& d) const {
        return _year == d._year && _month == d._month && _day == d._day;
    }
};
// Hash functor for `date`: combines the three fields as
// (year * 10000 + month) * 100 + day, evaluated in size_t arithmetic.
struct cmp {
    size_t operator()(const date& d) const {
        const size_t year = d._year;
        const size_t month = d._month;
        const size_t day = d._day;
        return (year * 10000 + month) * 100 + day;
    }
};

// Node of a bucket's singly linked list in the separate-chaining table.
struct hashnode {
    std::pair<K, V> _kv;        // stored key/value pair
    hashnode* _next = nullptr;  // next node in the same bucket; a new node has none

    // Copies kv into the node.
    hashnode(const std::pair<K, V>& kv)
        : _kv(kv)
    {}
};

// Inserts kv at the head of its bucket, growing the bucket array first when
// the table is empty or the load factor (integer percentage) has reached 70.
//
// Growth relinks the existing nodes into a larger bucket array instead of
// allocating new ones. Always returns true; duplicate keys are not rejected.
bool insert(const std::pair<K, V>& kv) {
    hash ha;
    // `_tab.empty()` is checked first so the division never sees a zero size.
    if (_tab.empty() || _n * 100 / _tab.size() >= 70) {
        hashtab<K, V, hash> newhash;
        newhash._tab.resize(prim(_tab.size() + 1));
        for (size_t i = 0; i < _tab.size(); ++i) {
            node* cur = _tab[i];
            while (cur) {
                node* next = cur->_next;
                // The index is computed for the NEW bucket count, so the node
                // must be linked into the new array; writing it into the old
                // array would index out of range and lose the node.
                const size_t has = ha(cur->_kv.first) % newhash._tab.size();
                cur->_next = newhash._tab[has];
                newhash._tab[has] = cur;
                cur = next;
            }
            // The old array ends up inside newhash after the swap below;
            // clear the bucket so it keeps no pointer to a relinked node.
            _tab[i] = nullptr;
        }
        _tab.swap(newhash._tab);
    }

    const size_t has = ha(kv.first) % _tab.size();
    node* newnode = new node(kv);
    newnode->_next = _tab[has];  // head insertion
    _tab[has] = newnode;
    ++_n;
    return true;
}

// Searches the bucket selected by the hash of `key` for a node whose key
// compares equal. Returns an iterator to that node, or End() when none matches.
Iterator Find(const K& key) {
    KofT key_of;
    hash hasher;
    const size_t bucket = hasher(key) % _tab.size();
    for (node* it = _tab[bucket]; it != nullptr; it = it->_next) {
        if (key_of(it->_data) == key) {
            return Iterator(it, this);
        }
    }
    return End();
}

bool Erase(const K& key) { 
    KofT kot; 
    size_t hashi = key % _tab.size(); 
    node* prev = nullptr; 
    node* cur = _tab[hashi]; 
    while (cur) { 
        if (kot(cur->_data) == key) { 
            if (prev == nullptr) { // 头结点 
                _tab[hashi] = cur->_next; 
            } else { // 中间节点 
                prev->_next = cur->_next; 
            } 
            delete cur; 
            --_n; 
            return true; 
        } else { 
            prev = cur; 
            cur = cur->_next; 
        } 
    } 
    return false; 
}

// Forward-iterator state for the chained hash table.
// `ref` and `ptr` are the reference and pointer types the iterator hands out.
template<class K,class T,class ref,class ptr,class KofT,class hash> struct uniterator {
    typedef hashtab<K, T, KofT, hash> utb;
    typedef uniterator<K, T, ref, ptr, KofT, hash> self;
    typedef unordered_node<T> node;

    node* _node;      // current node
    const utb* _utb;  // table being iterated

    // Parameter names avoid double underscores: identifiers containing `__`
    // are reserved for the implementation.
    uniterator(node* cur, const utb* table)
        : _node(cur)
        , _utb(table)
    {}
};

// Signature only: the const-qualified Begin() overload, which returns a
// ConstIterator. Its body is not part of this excerpt.
ConstIterator Begin() const

ref operator*() { return _node->_data; } 
ptr operator->() { return &(_node->_data); } 
bool operator!=(const self& s) { return _node != s._node; }

// Pre-increment: move to the next node of the current bucket, or failing that
// to the head of the next non-empty bucket. When no later bucket has a node,
// _node becomes nullptr, the marker used for end().
self& operator++() {
    if (_node->_next) {
        _node = _node->_next;
        return *this;
    }

    // The current bucket is exhausted: locate it, then scan the ones after it.
    KofT key_of;
    hash hasher;
    const size_t bucket_count = _utb->_tab.size();
    size_t idx = hasher(key_of(_node->_data)) % bucket_count + 1;

    _node = nullptr;  // stays null if every remaining bucket is empty
    for (; idx < bucket_count; ++idx) {
        if (_utb->_tab[idx]) {
            _node = _utb->_tab[idx];
            break;
        }
    }
    return *this;
}

// Map adapter over hashtab: stores std::pair<const K, V> and hashes on the key.
template<class K,class V,class hash= hashfunc<K>> class unorderedmap {
    // Extracts the key from a stored element. The parameter type matches the
    // stored type exactly (pair<const K, V>), so the reference binds directly
    // and the returned reference points into the stored element; with
    // pair<K, V> each call would build a temporary pair and return a
    // reference into that temporary.
    struct KofT {
        const K& operator()(const std::pair<const K, V>& kv) const {
            return kv.first;
        }
    };
public:
    // Public so that callers can name unorderedmap<K, V>::iterator.
    typedef typename hashtab<K, std::pair<const K, V>, KofT, hash>::Iterator iterator;
    typedef typename hashtab<K, std::pair<const K, V>, KofT, hash>::ConstIterator const_iterator;

    iterator begin() { return _ht.Begin(); }
    iterator end() { return _ht.End(); }
    const_iterator begin() const { return _ht.Begin(); }
    const_iterator end() const { return _ht.End(); }

    // Forwards to the table's Insert and returns its result unchanged.
    std::pair<iterator, bool> insert(const std::pair<K, V>& kv) { return _ht.Insert(kv); }

    // Passes {k, V()} to insert() and returns a reference to the mapped value
    // of the element the returned iterator points at.
    V& operator[](const K& k) {
        std::pair<iterator, bool> ret = insert({ k,V() });
        return ret.first->second;
    }

    iterator Find(const K& key) { return _ht.Find(key); }
    bool Erase(const K& key) { return _ht.Erase(key); }
private:
    hashtab<K, std::pair<const K, V>, KofT, hash> _ht;
};

// Set adapter over hashtab: the stored element is the key itself.
template<class K, class hash = hashfunc<K>> class unorderedset {
    // Identity key extractor: the element is its own key.
    struct KofT {
        const K& operator()(const K& k) const {
            return k;
        }
    };
public:
    // Public so that callers can name unorderedset<K>::iterator.
    typedef typename hashtab<K, K, KofT, hash>::Iterator iterator;
    typedef typename hashtab<K, K, KofT, hash>::ConstIterator const_iterator;

    iterator begin() { return _ht.Begin(); }
    iterator end() { return _ht.End(); }
    const_iterator begin() const { return _ht.Begin(); }
    const_iterator end() const { return _ht.End(); }

    // Forwards to the table's Insert and returns its result unchanged.
    std::pair<iterator, bool> insert(const K& k) { return _ht.Insert(k); }

    // Passes k to insert() and returns a reference to the element the returned
    // iterator points at. The iterator has to be dereferenced: an iterator
    // object is not itself a K&.
    K& operator[](const K& k) {
        std::pair<iterator, bool> ret = insert(k);
        return *ret.first;
    }

    iterator Find(const K& key) { return _ht.Find(key); }
    bool Erase(const K& key) { return _ht.Erase(key); }
private:
    hashtab<K, K, KofT, hash> _ht;
};

C++ 哈希表原理及开放寻址与链地址法实现

一、哈希表的使用

二、基本概念

三、哈希函数

1. 除法散列法（除留余数法）

2. 乘法散列法

3. 全域散列法

四、开放寻址法哈希表

1. 枚举状态

2. 成员，初始化

3. 插入

4. 扩容

5. 质数处理

6. Find

7. 转无符号整型

8. 自定义类和哈希函数

五、链地址法实现

1. 节点定义

2. 插入加扩容

3. 查询和删除

六、哈希表其它接口

七、封装和模拟实现

1. 迭代器成员声明

2. 迭代器成员函数

3. 迭代器++

4. 封装

更多推荐文章

相关免费在线工具

C++ 哈希表原理及开放寻址与链地址法实现

一、哈希表的使用

二、基本概念

三、哈希函数

1. 除法散列法（除留余数法）

2. 乘法散列法

3. 全域散列法

四、开放寻址法哈希表

1. 枚举状态

2. 成员，初始化

3. 插入

4. 扩容

5. 质数处理

6. Find

7. 转无符号整型

8. 自定义类和哈希函数

五、链地址法实现

1. 节点定义

2. 插入加扩容

3. 查询和删除

六、哈希表其它接口

七、封装和模拟实现

1. 迭代器成员声明

2. 迭代器成员函数

3. 迭代器++

4. 封装

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具