簡單無鎖佇列的實現和使用

阿新 • • 發佈：2019-02-19

無鎖佇列越來越流行，在特定的場合選用合適的無鎖佇列，可以節省鎖開銷，提高程式效率。

Linux核心中有無鎖佇列的實現，可謂簡潔而不簡單。核心判斷部分利用了整數溢位機制，這個有很多文章專門介紹，我們就不詳細講了。

原始碼裡的註釋很詳細，這裡直接給出kfifo的原始碼，大家對照註釋應該就可以理解了。原始碼原本是在Linux上實現的，為了跨平臺，增加了其他平臺下的實現。

#include <stdio.h>
#include <stdlib.h>
#include <string.h>

/*
 * Fixed-width helper names borrowed from the kernel sources.
 * __u32 must really be 32 bits wide: "unsigned long" is 64 bits on LP64
 * platforms (Linux/macOS x86-64, AArch64), so "unsigned int" is used instead.
 */
#define __u32 unsigned int
#define __u64 unsigned long long

/*
 * min()/max() helpers.
 *
 * GNU-compatible compilers get the kernel-style versions: each argument is
 * evaluated exactly once, and the pointer comparison makes the compiler warn
 * when the two operands have different types.  __typeof__ is spelled with
 * underscores because the bare "typeof" keyword is not recognised in strict
 * ISO modes (e.g. -std=c11 or -std=c++11).
 *
 * Other compilers fall back to the classic macros, which evaluate one of
 * their arguments twice -- do not pass expressions with side effects there.
 */
#if defined(__GNUC__)
#define min(x,y) ({ 		\
        __typeof__(x) _x = (x); \
        __typeof__(y) _y = (y);	\
        (void) (&_x == &_y);\
        _x < _y ? _x : _y; })

#define max(x,y) ({ 		\
        __typeof__(x) _x = (x);	\
        __typeof__(y) _y = (y);	\
        (void) (&_x == &_y);\
        _x > _y ? _x : _y; })

#else
#define max(a,b)            (((a) > (b)) ? (a) : (b))
#define min(a,b)            (((a) < (b)) ? (a) : (b))
#endif

/* Buffer size in bytes (0x1000 = 4096) that zFifo passes to kfifo_alloc(). */
#define MAX_KFIFO_SIZE 0x1000

/*
 * Byte-oriented ring buffer.
 *
 * 'in' and 'out' are free-running counters: they are only ever increased by
 * the put/get routines and are reduced to a buffer offset with
 * "& (size - 1)" at the point of use, which is why 'size' has to be a power
 * of two.  The number of stored bytes is (in - out), computed in unsigned
 * arithmetic so it stays correct when the counters wrap around.
 */
struct kfifo { 
    unsigned char *buffer; /* storage for the queued bytes (malloc'ed by kfifo_alloc) */ 
    unsigned int size; /* capacity of 'buffer' in bytes */ 
    unsigned int in; /* total bytes written so far; write offset is (in & (size - 1)) */ 
    unsigned int out; /* total bytes read so far; read offset is (out & (size - 1)) */ 
};

/**
 * fls - find last (most significant) bit set
 * @x: the word to search; its bit pattern is examined as an unsigned value
 *
 * This is defined the same way as ffs:
 * - return 32..1 to indicate bit 31..0 is the most significant bit set
 * - return 0 to indicate no bits set
 *
 * The GNU branch uses __builtin_clz instead of x86-only "bsrl" inline
 * assembly, so it also builds on non-x86 targets.  The portable branch works
 * on an unsigned copy of @x: shifting a negative int right is an arithmetic
 * shift on common compilers and would never reach zero.
 */
static inline int fls(int x)
{
    unsigned int v = (unsigned int)x;

#if defined(__GNUC__)
    /* __builtin_clz(0) is undefined, so zero is handled explicitly. */
    if (v == 0)
        return 0;
    return (int)(8 * sizeof v) - __builtin_clz(v);
#else
    int bits = 0;

    /* Count how many right shifts are needed to clear every set bit. */
    while (v != 0) {
        ++bits;
        v >>= 1;
    }
    return bits;
#endif
}
/**
 * fls64 - find last (most significant) bit set in a 64-bit value
 * @x: the value to search
 *
 * Same convention as fls():
 * - return 64..1 to indicate bit 63..0 is the most significant bit set
 * - return 0 to indicate no bits set
 *
 * The upper 32 bits are inspected first; only when they are all zero does
 * the lower half decide the result.
 */
static inline int fls64(__u64 x)
{
    __u32 upper = x >> 32;

    return upper ? fls(upper) + 32 : fls(x);
}

/*
 * fls_long - fls() for an unsigned long, whatever its width.
 * Dispatches to fls() when unsigned long is 4 bytes wide and to fls64()
 * otherwise; the test is a compile-time constant.
 */
static inline unsigned fls_long(unsigned long l)
{
    return (sizeof(l) == 4) ? fls(l) : fls64(l);
}

/*
 * roundup_pow_of_two - smallest power of two that is >= x.
 *
 * The shift count is the position of the highest set bit of (x - 1).
 * NOTE: for x == 0, or x above the largest power of two representable in an
 * unsigned long, the shift count equals the width of the type, which C
 * leaves undefined -- callers have to exclude those inputs.
 */
static inline unsigned long roundup_pow_of_two(unsigned long x)
{
    const unsigned shift = fls_long(x - 1);

    return 1UL << shift;
}

/**
 * kfifo_alloc - allocates a new FIFO and its internal buffer
 * @size: the size in bytes of the internal buffer to be allocated.
 *
 * A @size that is not a power of two is rounded up to the next power of
 * two, because the "let the indices wrap" technique used by the put/get
 * routines only works with power-of-two sizes.  A @size of 0 is passed to
 * malloc() unchanged.
 *
 * Returns the new FIFO (release it with kfifo_free()), or NULL when the
 * rounded size would not fit in an unsigned int or when memory allocation
 * fails.
 */
struct kfifo *kfifo_alloc(unsigned int size)
{
    unsigned char *buffer;
    struct kfifo *fifo;

    if (size & (size - 1)) {
        /*
         * Not a power of two.  Above 0x80000000 the next power of two is
         * 2^32, which an unsigned int cannot hold.  (The original code had a
         * stray ';' after this condition, so it rejected EVERY size that was
         * not already a power of two.)
         */
        if (size > 0x80000000)
            return NULL;
        size = roundup_pow_of_two(size);
    }

    /* The malloc casts are kept so the file also builds as C++. */
    buffer = (unsigned char *)malloc(size);
    if (!buffer)
        return NULL;

    fifo = (struct kfifo *)malloc(sizeof(struct kfifo));
    if (!fifo) {
        /* Do not leak the data buffer when the descriptor cannot be allocated. */
        free(buffer);
        return NULL;
    }

    fifo->buffer = buffer;
    fifo->size = size;
    fifo->in = fifo->out = 0;

    return fifo;
}

/**
 * kfifo_free - frees the FIFO
 * @fifo: the fifo to be freed; may be NULL, in which case nothing happens.
 *
 * Releases both the data buffer and the descriptor obtained from
 * kfifo_alloc().  Accepting NULL mirrors free() and lets callers pass the
 * result of a failed kfifo_alloc() straight through.
 */
void kfifo_free(struct kfifo *fifo)
{
    if (!fifo)
        return;

    free(fifo->buffer);
    free(fifo);
}

/*
 * Index access helpers for the one-writer/one-reader protocol.
 *
 * The kernel original places memory barriers between the index reads, the
 * data copies and the index updates; this userspace port had dropped them,
 * so neither the compiler nor the CPU was prevented from making an index
 * update visible before the corresponding bytes.  With GCC/Clang the
 * counterpart's index is now read with acquire semantics and the own index
 * is published with release semantics.  On other compilers the accesses
 * stay plain (as before), so no cross-thread ordering is guaranteed there.
 */
#if defined(__ATOMIC_ACQUIRE) && defined(__ATOMIC_RELEASE)
#define KFIFO_LOAD_ACQUIRE(ptr)       __atomic_load_n((ptr), __ATOMIC_ACQUIRE)
#define KFIFO_STORE_RELEASE(ptr, val) __atomic_store_n((ptr), (val), __ATOMIC_RELEASE)
#else
#define KFIFO_LOAD_ACQUIRE(ptr)       (*(ptr))
#define KFIFO_STORE_RELEASE(ptr, val) ((void)(*(ptr) = (val)))
#endif

/**
* __kfifo_put - puts some data into the FIFO, no locking version
* @fifo: the fifo to be used.
* @buffer: the data to be added.
* @len: the length of the data to be added.
*
* This function copies at most @len bytes from the @buffer into
* the FIFO depending on the free space, and returns the number of
* bytes copied (possibly fewer than @len, possibly 0).
*
* Note that with only one concurrent reader and one concurrent
* writer, you don't need extra locking to use these functions
* (see the note on the index helpers regarding non-GNU compilers).
*/
unsigned int __kfifo_put(struct kfifo *fifo,
                        const unsigned char *buffer, unsigned int len)
{
        unsigned int l;
        /* 'in' is only written by the producer, so a plain read is enough. */
        unsigned int in = fifo->in;
        /*
         * Acquire: the consumer's reads of the bytes it released must be
         * complete before this function overwrites them.
         */
        unsigned int out = KFIFO_LOAD_ACQUIRE(&fifo->out);
        unsigned int off = in & (fifo->size - 1);

        /* free space is size - (in - out); unsigned wrap-around keeps it exact */
        len = min(len, fifo->size - in + out);

        /* first put the data starting from the write offset to buffer end */
        l = min(len, fifo->size - off);
        memcpy(fifo->buffer + off, buffer, l);

        /* then put the rest (if any) at the beginning of the buffer */
        memcpy(fifo->buffer, buffer + l, len - l);

        /* Release: the copied bytes must be visible before the new 'in'. */
        KFIFO_STORE_RELEASE(&fifo->in, in + len);

        return len;
}

/**
* __kfifo_get - gets some data from the FIFO, no locking version
* @fifo: the fifo to be used.
* @buffer: where the data must be copied.
* @len: the size of the destination buffer.
*
* This function copies at most @len bytes from the FIFO into the
* @buffer and returns the number of copied bytes (possibly 0).
*
* Note that with only one concurrent reader and one concurrent
* writer, you don't need extra locking to use these functions
* (see the note on the index helpers regarding non-GNU compilers).
*/
unsigned int __kfifo_get(struct kfifo *fifo,
                         unsigned char *buffer, unsigned int len)
{
        unsigned int l;
        /* 'out' is only written by the consumer, so a plain read is enough. */
        unsigned int out = fifo->out;
        /*
         * Acquire: pairs with the producer's release store, so the bytes
         * counted by 'in' are visible before they are copied out.
         */
        unsigned int in = KFIFO_LOAD_ACQUIRE(&fifo->in);
        unsigned int off = out & (fifo->size - 1);

        /* never hand out more than is currently stored */
        len = min(len, in - out);

        /* first get the data from the read offset until the end of the buffer */
        l = min(len, fifo->size - off);
        memcpy(buffer, fifo->buffer + off, l);

        /* then get the rest (if any) from the beginning of the buffer */
        memcpy(buffer + l, fifo->buffer, len - l);

        /* Release: finish reading the bytes before the space is handed back. */
        KFIFO_STORE_RELEASE(&fifo->out, out + len);

        return len;
}

/**
* __kfifo_reset - discards everything stored in the FIFO, no locking version
* @fifo: the fifo to be emptied.
*
* Both counters are set back to zero; the buffer contents are left as they are.
*/
static inline void __kfifo_reset(struct kfifo *fifo)
{
        fifo->out = 0;
        fifo->in = 0;
}

/**
* __kfifo_len - number of bytes currently stored in the FIFO, no locking version
* @fifo: the fifo to be used.
*
* The difference is taken in unsigned arithmetic, so it remains correct
* after the counters have wrapped around.
*/
static inline unsigned int __kfifo_len(struct kfifo *fifo)
{
        const unsigned int written = fifo->in;
        const unsigned int consumed = fifo->out;

        return written - consumed;
}

使用的部分寫了一個類，採用了模板封裝，提供了模板型別存取的使用方法。

template <typename T>
class zFifo
{
    private:
        kfifo* _kfifo;
    public:
        zFifo()
        {
            _kfifo = kfifo_alloc(MAX_KFIFO_SIZE);
        }
        ~zFifo()
        {
            if(NULL != _kfifo)
              kfifo_free(_kfifo);
        }
        bool push(T data);
        T get();
};

// Appends a copy of `data` to the queue.
//
// Returns true only when the whole object was stored.  Returns false when
// the underlying kfifo could not be allocated or when fewer than sizeof(T)
// bytes are free.  The free space is checked up front because __kfifo_put()
// copies as many bytes as fit: without the check a truncated object could be
// written (and was previously reported as success), corrupting every later
// get().
//
// The object is transferred as raw bytes, so T should be a trivially
// copyable type (pointers, integers, plain structs).
template <typename T>
bool zFifo<T>::push(T data)
{
    if(NULL == _kfifo)
        return false;

    // free bytes = capacity - bytes currently stored
    if(_kfifo->size - __kfifo_len(_kfifo) < sizeof(T))
        return false;

    return __kfifo_put(_kfifo, (const unsigned char *)&data, sizeof(T)) == sizeof(T);
}

// Removes and returns the oldest element of the queue.
//
// When the underlying kfifo could not be allocated, or fewer than sizeof(T)
// bytes are stored, a value-initialized T is returned: a null pointer for
// pointer types and zero for arithmetic types.  The previous `return NULL`
// gave the same result for those types but did not compile for any other T.
// Checking the stored length first also avoids returning an object of which
// only some bytes were filled in.
//
// Note that an empty queue cannot be told apart from a stored null/zero
// value.  The object is transferred as raw bytes, so T should be a trivially
// copyable type.
template <typename T>
T zFifo<T>::get()
{
    if(NULL == _kfifo || __kfifo_len(_kfifo) < sizeof(T))
        return T();

    T data;
    __kfifo_get(_kfifo, (unsigned char *)&data, sizeof(T));
    return data;
}

這種庫一般都用在需要高效處理的地方，為了減少記憶體拷貝，一般都使用指標的形式操作。一個簡單的使用例子：

// Demo: pushes the address of a local int through the queue and prints the
// address before and after, so the two lines show the same pointer value.
int main()
{
    zFifo<int*> zf;
    int a = 1;
    if(!zf.push(&a))
        return 1;   // queue could not be allocated or has no room
    // The values printed are pointers: "%d" with an int* argument is
    // undefined behaviour, so "%p" with a void* cast is used instead.
    printf("a=%p\n", (void *)&a);
    int* b = NULL;
    b = zf.get();
    printf("b=%p\n", (void *)b);

    return 0;
}

需要注意的地方：

1.只有一個執行緒負責讀，另一個執行緒負責寫的時候，資料是執行緒安全的。上面的實現是基於這個原理實現的，當有多個執行緒讀或者多個執行緒寫的時候，不保證資料的正確性。
所以使用的時候，應該只用一個執行緒寫、一個執行緒讀。這在網路應用中比較常用：開一個執行緒接收資料，把資料寫入佇列；再開一個排程執行緒從佇列讀取網路資料，然後分發到處理執行緒。

2.佇列的容量由巨集MAX_KFIFO_SIZE預設定義，佇列寫滿之後，後續的資料會寫入失敗。

簡單無鎖佇列的實現和使用

無鎖佇列越來越流行，在特定的場合使用不同的無鎖佇列，可以起到節省鎖開銷，提高程式效率。 Linux核心中有無鎖佇列的實現，可謂簡潔而不簡單。核心判斷部分利用了整數溢位機制，這個有很多文章專門介紹，我們就不詳細講了。裡面註釋很詳細，直接來kfifo的原始碼，大家看原始碼註釋

lockFreeQueue 無鎖佇列實現與總結

無鎖佇列介紹　　在工程上，為了解決兩個處理器互動速度不一致的問題，我們使用佇列作為快取，生產者將資料放入佇列，消費者從佇列中取出資料。這個時候就會出現四種情況，單生產者單消費者，多生產者單消費者，單生成者多消費者，多生產者多消費者。我們知道，多執行緒往往會帶來資料不一致的情況，一般需要靠加鎖解決問題。

單生產者，單消費者無鎖佇列實現（c）

根據上面連結所說的原理實現的單生產者，單消費者無鎖佇列 bool __sync_bool_compare_and_swap (type *ptr, type oldval，type newval, ...) 函式提供原子的比較和交換，如果*ptr == oldval

Go語言無鎖佇列元件的實現 (chan/interface/select)

1. 背景 go程式碼中要實現非同步很簡單，go funcName()。但是程序需要控制協程數量在合理範圍內，對應大批量任務可以使用“協程池 + 無鎖佇列”實現。 2. golang無鎖佇列實現思路 Channel是Go中的一個核心型別，你可以把它看成一個管道，通過它併發核心單元就可以傳送或者接

多執行緒無鎖佇列的實現

一、什麼是多執行緒無鎖佇列？多執行緒無鎖佇列還是有鎖的，只不過是用了cpu層面的CAS原子操作，用到這個操作，只需要在取佇列元素和新增佇列元素的時候利用CAS原子操作，就可以保證多個執行緒對佇列元素的有序存取；二、什麼是CAS操作？ CAS = Compare &am

一個用 C++ 實現的快速無鎖佇列

在程序間傳遞資料很煩人，真心煩人。一步做錯，資料就會損壞。（相較於其他讀寫方式）即使資料排列正確，也更易出錯。一如既往的，有兩種方式處理這個問題：簡單的方式、麻煩的方式。簡單的方式使用你使用平臺提供的鎖（互斥、臨界區域，或等效）。這從概念上不難理解，使用上更簡單。你無需擔心排列問題，庫

evpp效能測試（3）: 對無鎖佇列boost::lockfree::queue和moodycamel::ConcurrentQueue做一個性能對比測試

Brief 我們使用https://github.com/Qihoo360/evpp專案中的EventLoop::QueueInLoop(...)函式來做這個效能測試。我們通過該函式能夠將一個仿函式執行體從一個執行緒排程到另一個執行緒中執行。這是一個典

無鎖佇列--基於linuxkfifo實現

一直想寫個無鎖的佇列，來提高專案後臺的效率。偶然看到linux核心的kfifo.h 實現原理。於是自己仿照了這個實現，目前linux應該是可以對外提供介面了。 #ifndef _NO_LOCK_QUEUE_H_ #define _NO_LOCK_QUEUE_H_ #i

無鎖佇列的原理與實現

最近幾天在思考無鎖佇列，看了相關文章，也讀了一些部落格，最後寫了一份程式碼，程式碼實現對在多執行緒環境下對佇列的讀和寫是不需要加鎖的。程式碼如下所示： #include <windows.h> #pragma comment(lib, "Kernel32.li

一讀一寫無鎖佇列c++實現

限制一個執行緒讀，一個執行緒寫，不加鎖的佇列，使用單鏈表實現，測試環境：centos 5.9 [[email protected] test]# cat test.cpp #include <iostream> #include <

無鎖佇列的實現

耗子叔曾經寫過一篇同名的部落格，主要參考了John D. Valois 1994年10月在拉斯維加斯的並行和分散式系統國際大會上的一篇論文——《Implementing Lock-Free Queues》。但是從目前現狀來看，這篇論文中提到的演算法是有問題的，並

【DPDK】【ring】從DPDK的ring來看x86無鎖佇列的實現

【前言】　　佇列是眾多資料結構中最常見的一種之一。曾經有人和我說過這麼一句話，叫做“程式等於資料結構+演算法”。因此在設計模組、寫程式碼時，佇列常常作為一個很常見的結構出現在模組設計中。DPDK不僅是一個加速網路IO的框架，其內部還提供眾多的功能元件，rte_ring就是DPDK內部提供的一種無鎖佇列，本篇

基於陣列的無鎖佇列(譯)

原文 1 引言最近對於注重效能的應用程式,我們有了一種能顯著提高程式效能的選擇:多執行緒.執行緒的概念實際上已經存在了很長時間.在過去,多數計算機只有一個處理器,執行緒主要用於將一個大的任務拆分成一系列更小的執行單元.以使得當其中某些執行單元因為等待資源而被阻塞的時候剩餘的執行單元能繼續執行。舉個示例,一個

Disruptor無鎖佇列淺析

近期在看作業系統相關資料的時候，閱讀到“訊號量與PV操作”，主要分三塊：互斥控制，同步控制，生產者與消費者問題。因為我日常與伺服器及訊息佇列打交道較多，對生產者與消費者問題比較感興趣，正好之前曾經研究過“Disruptor無鎖佇列”的實現原理，正好再結合PV操作重新

Boost無鎖佇列

在開發接收轉發agent時，採用了多執行緒的生產者-消費者模式，用了加互斥鎖的方式來實現執行緒同步。互斥鎖會阻塞執行緒，所以壓測時，效率並不高。所以想起用無鎖佇列來實現，效能確實提升了。首先介紹下lock-free和wait-free的區別：阻塞演算法可

深入理解dpdk rte_ring無鎖佇列

同樣用面向物件的思想來理解無鎖佇列ring。dpdk的無鎖佇列ring是借鑑了linux核心kfifo無鎖佇列。ring的實質是FIFO的環形佇列。 ring的特點：無鎖出入隊（除了cas(compare and swap)操作）多消費/生產者同時出入隊使用方法： 1.建立一個ring物件。介面：s

c語言資料結構應用-陣列佇列（無鎖佇列）在多執行緒中的使用

一、背景上篇文章《c語言資料結構實現-陣列佇列/環形佇列》講述了陣列佇列的原理與實現，本文編寫一個雙執行緒進行速度測試二、相關知識多執行緒程式設計介面: 1) 建立執行緒 pthread_create 函式 SYNOPSIS #include <

併發無鎖佇列學習（單生產者單消費者模型）

1、引言本文介紹單生產者單消費者模型的佇列。根據寫入佇列的內容是定長還是變長，分為單生產者單消費者定長佇列和單生產者單消費者變長佇列兩種。單生產者單消費者模型的佇列操作過程是不需要進行加鎖的。生產者通過寫索引控制入隊操作，消費者通過讀索引控制出佇列操作。二者

canvas 簡單的小球拋物線實現和簡單的應用

使用canvas實現簡單的小球下落 canvas可以實現一些有趣的繪畫，可以實現規則或者不規則的圖形。我們這裡的小球就是一個通過canvas的方法arc畫出的圓。我們可以使用storke和fil來實現圓的顏色和邊框，如果你還想讓圓在漂亮一些，使用createR

C++無鎖程式設計資料，無鎖佇列等

1. Lamport's Lock-Free Ring Buffer [Lamport, Comm. of ACM, 1977] 也就常說的單生產者-單消費者的ringbuffer，限制就是隻能一個讀執行緒（消費者），一個寫程序（生產者）。

簡單無鎖佇列的實現和使用

相關推薦