快取淘汰演算法 LRU 和 LFU【轉】

阿新 • • 發佈：2021-10-13

轉自：https://www.jianshu.com/p/1f8e36285539

快取是一個計算機思維，對於重複的計算，快取其結果，下次再算這個任務的時候，不去真正的計算，而是直接返回結果，能加快處理速度。當然有些會隨時間改變的東西，快取會失效，得重新計算。

比如快取空間只有2個，要快取的資料有很多，1，2，3，4，5，那麼當快取空間滿了，需要淘汰一個快取出去，其中淘汰演算法有 LRU，LFU，FIFO，SC二次機會，老化演算法，時鐘工作集演算法等等。

演算法流程

LRU，最近最少使用，把資料加入一個連結串列中，按訪問時間排序，發生淘汰的時候，把訪問時間最舊的淘汰掉。
比如有資料 1，2，1，3，2
此時快取中已有（1，2）
當3加入的時候，得把後面的2淘汰，變成（3，1）

LFU（Least Frequently Used），最不經常使用，把資料加入到連結串列中，按訪問頻次排序，一個數據每被訪問一次，就把它的頻次+1，發生淘汰的時候，把頻次最低的淘汰掉。
比如有資料 1，1，1，2，2，3
快取中有（1(3次)，2(2次)）
當3加入的時候，得把後面的2淘汰，變成（1(3次)，3(1次)）
區別：LRU 是得把 1 淘汰。

顯然
LRU對於迴圈出現的資料，快取命中不高
比如，這樣的資料，1，1，1，2，2，2，3，4，1，1，1，2，2，2.....
當走到3，4的時候，1，2會被淘汰掉，但是後面還有很多1，2

LFU對於交替出現的資料，快取命中不高
比如，1，1，1，2，2，3，4，3，4，3，4，3，4，3，4，3，4......
由於快取先被（1(3次)，2(2次)）佔滿
3加入把2淘汰，4加入把3淘汰，3加入把4淘汰，然而3，4才是最需要快取的，1去到了3次，誰也淘汰不了它了。

實現

leetcode上有兩個題目
LRU：https://leetcode.com/problems/lru-cache/description/
LFU：https://leetcode.com/problems/lfu-cache/description/

要求是快取的加入put()，快取讀取get()，都要在O(1)內實現。

LRU的一個實現方法：
用一個雙向連結串列記錄訪問時間，因為連結串列插入刪除高效，時間新的在前面，舊的在後面。
用一個雜湊表記錄快取(key, value)，雜湊查詢近似O(1)，發生雜湊衝突時最壞O(n)，同時雜湊表中得記錄 (key, (value, key_ptr))，key_ptr 是key在連結串列中的地址，為了能在O(1)時間內找到該節點，並把節點提升到表頭。
連結串列中的key，能快速找到hash中的value，並刪除。

LFU的一個實現方法：
用一個主雙向連結串列記錄（訪問次數，從連結串列頭），從連結串列中按時間順序記錄著（key）
用一個雜湊表記錄（key，(value, 主連結串列ptr，從連結串列ptr)）ptr表示該key在連結串列中的地址
然後，get，put都在雜湊表中操作，近似O(1)；雜湊表中記錄了節點在連結串列中的地址，能O(1)找到該節點並提高它的訪問頻次，連結串列的插入刪除也都是O(1)。

-------------------- 最後貼個AC的程式碼：--------------------
程式碼效能：1000000次加入，讀取用時
LRU: 480ms
LFU: 510ms
NSCache: 2000ms
YYCache: 1400ms

LRU：

#include <list>
#include <unordered_map>

using namespace std;

/**
 * @brief Fixed-capacity LRU (least-recently-used) cache from int keys to int values.
 *
 * Entries are kept in a doubly linked list ordered from most- to
 * least-recently used. A hash map stores, for every key, the iterator of its
 * list node, so a hit can be promoted to the front and the oldest entry can be
 * evicted without traversing the list.
 */
class LRUCache {
public:
    /// @param capacity Maximum number of entries. A value <= 0 yields a cache that stores nothing.
    LRUCache(int capacity);

    /// Deep copy. The index is rebuilt so that its iterators refer to the
    /// copy's own list rather than to the source object's list.
    LRUCache(const LRUCache &other);
    LRUCache &operator=(const LRUCache &other);

    ~LRUCache() = default;

    /// @return The value stored under @p key (and marks it most recently used), or -1 if absent.
    int get(int key);

    /// Inserts or overwrites @p key and marks it most recently used.
    /// When the cache is full, the least recently used entry is evicted first.
    void put(int key, int value);

private:
    typedef std::list<std::pair<int, int> > EntryList;   // pair<key, value>, newest first

    /// Re-creates u_map from m_list.
    void rebuild_index();

    int max_capacity;
    EntryList m_list;
    std::unordered_map<int, EntryList::iterator> u_map;  // key -> node in m_list
};

LRUCache::LRUCache(int capacity) : max_capacity(capacity) {}

LRUCache::LRUCache(const LRUCache &other)
    : max_capacity(other.max_capacity), m_list(other.m_list) {
    rebuild_index();
}

LRUCache &LRUCache::operator=(const LRUCache &other) {
    if (this != &other) {
        max_capacity = other.max_capacity;
        m_list = other.m_list;
        rebuild_index();
    }
    return *this;
}

void LRUCache::rebuild_index() {
    u_map.clear();
    for (EntryList::iterator node = m_list.begin(); node != m_list.end(); ++node) {
        u_map[node->first] = node;
    }
}

int LRUCache::get(int key) {
    auto hit = u_map.find(key);
    if (hit == u_map.end()) {
        return -1;
    }
    // splice() relinks the node to the front of the same list; the iterator
    // stored in u_map stays valid.
    m_list.splice(m_list.begin(), m_list, hit->second);
    return hit->second->second;
}

void LRUCache::put(int key, int value) {
    // A non-positive capacity can hold nothing. Without this guard the
    // eviction below would call back() on an empty list.
    if (max_capacity <= 0) {
        return;
    }

    auto hit = u_map.find(key);
    if (hit != u_map.end()) {
        // Existing key: overwrite the value and promote the node.
        hit->second->second = value;
        m_list.splice(m_list.begin(), m_list, hit->second);
        return;
    }

    // New key: make room by dropping the least recently used entry.
    if (m_list.size() >= static_cast<EntryList::size_type>(max_capacity)) {
        u_map.erase(m_list.back().first);
        m_list.pop_back();
    }

    // emplace_front constructs the pair in place instead of copying a temporary.
    m_list.emplace_front(key, value);
    u_map[key] = m_list.begin();
}

LFU：

#include <list>
#include <unordered_map>

using namespace std;

/// Per-key record stored in the hash map of LFUCache.
struct LFUMapValue {
    int value;                                                        // cached value
    std::list<std::pair<int, std::list<int> > >::iterator main_it;    // frequency bucket that holds the key
    std::list<int>::iterator sub_it;                                  // the key's node inside that bucket
};

/**
 * @brief Fixed-capacity LFU (least-frequently-used) cache from int keys to int values.
 *
 * m_list is a list of buckets pair<count, keys> kept in ascending count order.
 * Inside a bucket the keys are ordered from most- to least-recently touched.
 * u_map maps each key to its value and to the iterators locating it in m_list,
 * so a key can be moved to the next bucket without any traversal. The eviction
 * victim is the last key of the first bucket: lowest count, and among those
 * the one touched longest ago.
 */
class LFUCache {
public:
    /// @param capacity Maximum number of entries. A value <= 0 yields a cache that stores nothing.
    LFUCache(int capacity);

    /// Deep copy. The stored iterators are re-pointed at the copy's own lists.
    LFUCache(const LFUCache &other);
    LFUCache &operator=(const LFUCache &other);

    ~LFUCache() = default;

    /// @return The value stored under @p key (and counts one more access), or -1 if absent.
    int get(int key);

    /// Inserts @p key with access count 1, or overwrites it and counts one more access.
    /// When the cache is full, a new key first evicts the current victim.
    void put(int key, int value);

    /// Raises the access count of the key described by @p value by one,
    /// moving it to the matching bucket and updating the iterators in @p value.
    void right_move(LFUMapValue *value);

private:
    typedef std::list<std::pair<int, std::list<int> > > BucketList;

    /// Re-points main_it / sub_it of every record in u_map at m_list.
    void relink();

    int max_cap;
    int cur_cap;
    BucketList m_list;                              // pair<count, keys>, count ascending, keys newest first
    std::unordered_map<int, LFUMapValue> u_map;     // key -> record
};

LFUCache::LFUCache(int capacity) : max_cap(capacity), cur_cap(0) {
    m_list.emplace_front(1, std::list<int>());      // start with an empty count == 1 bucket
}

LFUCache::LFUCache(const LFUCache &other)
    : max_cap(other.max_cap), cur_cap(other.cur_cap),
      m_list(other.m_list), u_map(other.u_map) {
    relink();
}

LFUCache &LFUCache::operator=(const LFUCache &other) {
    if (this != &other) {
        max_cap = other.max_cap;
        cur_cap = other.cur_cap;
        m_list = other.m_list;
        u_map = other.u_map;
        relink();
    }
    return *this;
}

void LFUCache::relink() {
    for (BucketList::iterator bucket = m_list.begin(); bucket != m_list.end(); ++bucket) {
        for (std::list<int>::iterator node = bucket->second.begin();
             node != bucket->second.end(); ++node) {
            auto rec = u_map.find(*node);
            if (rec != u_map.end()) {
                rec->second.main_it = bucket;
                rec->second.sub_it = node;
            }
        }
    }
}

void LFUCache::right_move(LFUMapValue *value) {
    const BucketList::iterator cur = value->main_it;
    const std::list<int>::iterator key_node = value->sub_it;
    const int wanted = cur->first + 1;

    BucketList::iterator target = cur;
    ++target;
    const bool target_matches = (target != m_list.end() && target->first == wanted);

    if (!target_matches && cur->second.size() == 1) {
        // The key is alone in its bucket and no bucket exists for the new
        // count: bump the bucket's count in place instead of creating a node.
        cur->first = wanted;
        return;
    }

    if (!target_matches) {
        // Create the bucket for the new count right after the current one
        // (this is the end of m_list when there is no following bucket).
        target = m_list.emplace(target, wanted, std::list<int>());
    }

    // Relink the key node to the head of the target bucket. splice() keeps
    // key_node valid, so no copy of the key list is needed.
    target->second.splice(target->second.begin(), cur->second, key_node);
    value->main_it = target;
    value->sub_it = target->second.begin();

    // Drop the old bucket once its last key has left.
    if (cur->second.empty()) {
        m_list.erase(cur);
    }
}

int LFUCache::get(int key) {
    auto rec = u_map.find(key);
    if (rec == u_map.end()) {
        return -1;
    }
    right_move(&rec->second);
    return rec->second.value;
}

void LFUCache::put(int key, int value) {
    // A non-positive capacity can hold nothing.
    if (max_cap <= 0) {
        return;
    }

    auto rec = u_map.find(key);
    if (rec != u_map.end()) {
        // Existing key: overwrite and count the access.
        rec->second.value = value;
        right_move(&rec->second);
        return;
    }

    if (cur_cap >= max_cap && !m_list.empty()) {
        // Evict from the first (lowest-count) bucket, oldest key first.
        BucketList::iterator lowest = m_list.begin();
        if (!lowest->second.empty()) {
            u_map.erase(lowest->second.back());
            lowest->second.pop_back();
            --cur_cap;
        }
        // An emptied bucket is only worth keeping when it is the count == 1
        // bucket the new key is about to go into; otherwise it would linger.
        if (lowest->second.empty() && lowest->first != 1) {
            m_list.erase(lowest);
        }
    }

    // New keys always start in the count == 1 bucket at the front.
    if (m_list.empty() || m_list.front().first != 1) {
        m_list.emplace_front(1, std::list<int>());
    }
    BucketList::iterator first = m_list.begin();
    first->second.emplace_front(key);

    LFUMapValue fresh;
    fresh.value = value;
    fresh.main_it = first;
    fresh.sub_it = first->second.begin();
    u_map[key] = fresh;
    ++cur_cap;
}

作者：ck2016
連結：https://www.jianshu.com/p/1f8e36285539
來源：簡書
著作權歸作者所有。商業轉載請聯絡作者獲得授權，非商業轉載請註明出處。【作者】張昺華【出處】http://www.cnblogs.com/sky-heaven/ 【部落格園】 http://www.cnblogs.com/sky-heaven/ 【知乎】 http://www.zhihu.com/people/zhang-bing-hua 【我的作品---旋轉倒立擺】 http://v.youku.com/v_show/id_XODM5NDAzNjQw.html?spm=a2hzp.8253869.0.0&from=y1.7-2 【我的作品---自平衡自動循跡車】 http://v.youku.com/v_show/id_XODM5MzYyNTIw.html?spm=a2hzp.8253869.0.0&from=y1.7-2 【大餅教你學系列】https://edu.csdn.net/course/detail/10393 【新浪微博】張昺華--sky 【twitter】 @sky2030_ 【微信公眾號】張昺華本文版權歸作者和部落格園共有，歡迎轉載，但未經作者同意必須保留此段宣告，且在文章頁面明顯位置給出原文連線，否則保留追究法律責任的權利.

快取淘汰演算法 LRU 和 LFU【轉】

演算法流程

實現

快取淘汰演算法 LRU 和 LFU【轉】

快取淘汰算法系列(一)【轉】

快取淘汰演算法--LRU演算法

Precision,Recall,F1的介紹和計算【轉】

詳解 Redis 記憶體管理機制和實現【轉】

快取與資料庫的奔跑原理【轉】

Linux記憶體管理：Fixmaps(固定對映地址)和ioremap【轉】

Linux記憶體管理 (19)總結記憶體管理資料結構和API【轉】

Linux核心-記憶體回收邏輯和演算法（LRU）【轉】

快取淘汰演算法（LFU、LRU、ARC、FIFO、2Q）

巧記淘汰策略FIFO、LRU和LFU

工程師必須瞭解的LRU快取淘汰演算法以及python實現過程

a_lc_設計 LRU 和 LFU 快取結構（雙向連結串列+map | ）

LRU快取淘汰演算法

php中cURL會話的curl_setopt的CURLOPT_HEADER和CURLOPT_RETURNTRANSFER引數的使用【轉】

【轉】混淆矩陣和ROC曲線

【轉】Flask 上下文機制和執行緒隔離

【轉】Scala JDBC 查詢和更新MySQL

【轉】go語言筆記——切片函式常見操作，增刪改查和搜尋、排序

【轉】TCP 半連線佇列和全連線佇列滿了會發生什麼？又該如何應對？

快取淘汰演算法 LRU 和 LFU【轉】

演算法流程

實現

相關推薦