Windows和pthread中提供的自旋锁

Windows和POSIX中都提供了自旋锁，我们也可以通过C++11的atomic来实现自旋锁。那么系统提供的自旋锁和用atomic实现的自旋锁在性能上有什么差别？先引入实现代码：

#ifndef __spinlock_h__

#define __spinlock_h__

#include <atomic>

#ifdef _WIN32

#include <Windows.h>

class spinlock_mutex

{

public:

    static constexpr DWORD SPINLOCK_COUNT = -;

public:

    // 在初始化时，会出现资源不足的问题，这里忽略这个问题

    // 具体参考Critical Sections and Error Handling(Windows via C/C++)

    spinlock_mutex()

    {

        InitializeCriticalSectionAndSpinCount(&m_cs, SPINLOCK_COUNT);

    }

    ~spinlock_mutex()

    {

        DeleteCriticalSection(&m_cs);

    }

    void lock()

    {

        EnterCriticalSection(&m_cs);

    }

    bool try_lock()

    {

        return TryEnterCriticalSection(&m_cs) == TRUE;

    }

    void unlock()

    {

        LeaveCriticalSection(&m_cs);

    }

private:

    CRITICAL_SECTION m_cs;

};

#elif defined(_POSIX_C_SOURCE)

#include <pthread.h>

/// Lock type with lock() / try_lock() / unlock(), backed by a process-private
/// pthread_spinlock_t, so it can be used with std::lock_guard.
class spinlock_mutex
{
public:
    // Error codes returned by the pthread_spin_* calls are not handled here.
    spinlock_mutex()
    {
        pthread_spin_init(&m_cs, PTHREAD_PROCESS_PRIVATE);
    }

    ~spinlock_mutex()
    {
        pthread_spin_destroy(&m_cs);
    }

    // A copy would duplicate the raw pthread_spinlock_t member and both
    // objects would call pthread_spin_destroy on it, so copying is disabled.
    spinlock_mutex(const spinlock_mutex&) = delete;
    spinlock_mutex& operator=(const spinlock_mutex&) = delete;

    /// Acquires the spin lock, waiting until it becomes available.
    void lock()
    {
        pthread_spin_lock(&m_cs);
    }

    /// Tries to acquire the spin lock without waiting.
    /// @return true when the lock was acquired.
    bool try_lock()
    {
        // pthread_spin_trylock reports success as 0; any other value is an
        // error number (the literal was missing in the published listing).
        return pthread_spin_trylock(&m_cs) == 0;
    }

    /// Releases the spin lock.
    void unlock()
    {
        pthread_spin_unlock(&m_cs);
    }

private:
    pthread_spinlock_t m_cs;
};

#else

/// Portable fallback: a test-and-set spin lock built on std::atomic_flag.
/// Provides lock() / try_lock() / unlock(), so it works with std::lock_guard.
class spinlock_mutex
{
    // "= ATOMIC_FLAG_INIT" is the initialisation form the standard guarantees
    // to leave the flag clear; the flag being clear means "unlocked".
    std::atomic_flag flag = ATOMIC_FLAG_INIT;

public:
    spinlock_mutex() = default;

    /// Busy-waits until this thread is the one that sets the flag.
    void lock()
    {
        while (flag.test_and_set(std::memory_order_acquire))
        {
            // spin: another thread currently holds the lock
        }
    }

    /// Clears the flag, releasing the lock.
    void unlock()
    {
        flag.clear(std::memory_order_release);
    }

    /// Single acquisition attempt, never waits.
    /// @return true when the flag was clear and is now set by this call.
    bool try_lock()
    {
        return !flag.test_and_set(std::memory_order_acquire);
    }
};

#endif

#endif    // __spinlock_h__

下面给出一个简单测试，两组线程，一组用来插入，另外一组用来取出。测试结果显示：

（1）无论是Windows，还是POSIX提供的C语言版本的自旋锁，都和C++11使用atomic构建的自旋锁效率相近。

（2）在插入线程数和取出线程数相同的情况下，线程数越多，效率越低。

下面是测试代码：

#include <atomic>
#include <cassert>
#include <chrono>
#include <forward_list>
#include <future>
#include <iostream>
#include <memory>
#include <mutex>
#include <random>
#include <thread>
#include <vector>

#include "spinlock.h"

/// Singly linked node that carries one student's age.
struct student_name
{
    // NOTE(review): the default value was lost in the published listing
    // ("int age = "); 0 is presumed.
    student_name(int age = 0)
        : age(age), next(nullptr)
    {
    }

    int age;              // payload
    student_name* next;   // following node, nullptr when there is none
};

// Lock that guards every access to g_students.
spinlock_mutex g_mtx;

// Shared list of ages: producers push to the front, consumers swap it out.
std::forward_list<int> g_students;

// Statistics, all starting at zero.
std::atomic<int> g_inserts{0};            // number of completed insertions
std::atomic<int> g_drops{0};              // number of consumed elements
std::atomic<int> g_printNum{0};           // incremented together with g_drops
std::atomic<long long> g_ageInSum{0};     // sum of all ages handed to the list
std::atomic<long long> g_ageOutSum{0};    // sum of all ages taken from the list

// Consumers keep polling while this is true.
std::atomic<bool> goOn{true};

// NOTE(review): all three literals were lost in the published listing.
// The two thread counts below are placeholders - set them to the
// configuration you want to measure.
constexpr int INSERT_THREAD_NUM = 4;

constexpr int DROP_THREAD_NUM = 4;

// Reconstructed from the original remark "20,000,00 * 100 * 10 ~= MAX_INT":
// 2,000,000 items per thread, times 100, times at most 10 threads stays just
// below INT_MAX. Do not raise it when testing with up to 10 threads.
constexpr int ONE_THREAD_PRODUCE_NUM = 2000000;

/// Accounts for one consumed node and frees it.
/// @param t node to consume; it is dereferenced and then deleted, so it must
///          be non-null and must have been allocated with new.
inline void printOne(student_name* t)
{
    // Each consumed node counts once (the "1" was missing in the published
    // listing).
    g_printNum.fetch_add(1, std::memory_order_relaxed);

    g_ageOutSum.fetch_add(t->age, std::memory_order_relaxed);

    g_drops.fetch_add(1, std::memory_order_relaxed);

    delete t;
}

/// Producer: generates ONE_THREAD_PRODUCE_NUM random ages and pushes each one
/// onto g_students under g_mtx, updating g_ageInSum and g_inserts.
/// @param idNo index of this producer thread; mixed into the RNG seed.
void insert_students(int idNo)
{
    using engine_t = std::default_random_engine;

    // Seeding only from the current time gives every producer started in the
    // same instant the same sequence, so the thread index is added as well.
    const auto ticks = std::chrono::system_clock::now().time_since_epoch().count();
    engine_t dre(static_cast<engine_t::result_type>(ticks)
                 + static_cast<engine_t::result_type>(idNo));

    // NOTE(review): the bounds were lost in the published listing; 1..100 is
    // presumed from the "* 100" in the remark on ONE_THREAD_PRODUCE_NUM.
    std::uniform_int_distribution<int> ageDi(1, 100);

    for (int i = 0; i < ONE_THREAD_PRODUCE_NUM; ++i)
    {
        const int newAge = ageDi(dre);

        g_ageInSum.fetch_add(newAge, std::memory_order_relaxed);

        {
            // Hold the lock only for the push itself.
            std::lock_guard<spinlock_mutex> lock(g_mtx);
            g_students.push_front(newAge);
        }

        // Relaxed ordering: this is a plain counter - presumably chosen so the
        // bookkeeping does not impose extra ordering on the code being measured.
        g_inserts.fetch_add(1, std::memory_order_relaxed);
    }
}

void drop_students(int idNo)

{

    while (auto go = goOn.load(std::memory_order_consume))

    {

        {

            std::forward_list<int> tmp;

            {

                std::lock_guard<spinlock_mutex> lock(g_mtx);

                std::swap(g_students, tmp);

            }

            auto it = tmp.begin();

            while (it != tmp.end())

            {

                g_printNum.fetch_add(, std::memory_order_relaxed);

                g_ageOutSum.fetch_add(*it, std::memory_order_relaxed);

                g_drops.fetch_add(, std::memory_order_relaxed);

                ++it;

            }

        }

    }

}

/// Runs the benchmark: starts the producer and consumer tasks, waits for them,
/// drains whatever is left in the list and prints the elapsed time together
/// with the counters (insert/drop counts and age sums should match).
int main()
{
    // steady_clock is monotonic, so the measured interval cannot be distorted
    // by adjustments of the wall clock.
    const auto start = std::chrono::steady_clock::now();

    std::vector<std::future<void>> insert_threads;
    std::vector<std::future<void>> drop_threads;

    for (int i = 0; i < INSERT_THREAD_NUM; ++i)
    {
        insert_threads.push_back(std::async(std::launch::async, insert_students, i));
    }

    for (int i = 0; i < DROP_THREAD_NUM; ++i)
    {
        drop_threads.push_back(std::async(std::launch::async, drop_students, i));
    }

    // Wait until every producer has finished.
    for (auto& task : insert_threads)
    {
        task.get();
    }

    // NOTE(review): the sleep duration was lost in the published listing;
    // 100 ms is a placeholder. The pause is part of the measured time.
    constexpr std::chrono::milliseconds kDrainGrace(100);
    std::this_thread::sleep_for(kDrainGrace);

    // Tell the consumers to stop, then wait for them.
    goOn.store(false, std::memory_order_release);

    for (auto& task : drop_threads)
    {
        task.get();
    }

    // Consume anything still in the list after the consumers have exited.
    {
        std::forward_list<int> tmp;

        {
            std::lock_guard<spinlock_mutex> lock(g_mtx);
            std::swap(g_students, tmp);
        }

        for (const int age : tmp)
        {
            g_printNum.fetch_add(1, std::memory_order_relaxed);
            g_ageOutSum.fetch_add(age, std::memory_order_relaxed);
            g_drops.fetch_add(1, std::memory_order_relaxed);
        }
    }

    const auto end = std::chrono::steady_clock::now();
    const std::chrono::duration<double> diff = end - start;

    std::cout << "Time to insert and drop is: " << diff.count() << " s\n";
    std::cout << "insert count1: " << g_inserts.load() << '\n';
    std::cout << "drop count1: " << g_drops.load() << '\n';
    std::cout << "print num1: " << g_printNum.load() << '\n';
    std::cout << "age in1: " << g_ageInSum.load() << '\n';
    std::cout << "age out1: " << g_ageOutSum.load() << '\n';
    std::cout << std::endl;
}

关于自旋锁，还有以下内容需要说明：

（1）应用层使用spinlock的最大问题是不能像kernel那样关中断（cli/sti）。假设并发稍微多一点，线程1在lock之后、unlock之前发生了时钟中断并被切换出去，要过一段时间才会被切回来调用unlock，那么这段时间内其他调用lock的线程就只能空跑while循环，这才是最浪费CPU时间的地方。
既然不能关中断，就只能在自旋失败后sleep（让出CPU），无论哪种做法都存在很大的冲突代价。

（2）具体参考：https://www.zhihu.com/question/55764216

Windows和pthread中提供的自旋锁的更多相关文章

pthread中互斥量，锁和条件变量
互斥量 #include <pthread.h> pthread_mutex_t mutex=PTHREAD_MUTEX_INITIALIZER; int pthread_mutex_in ...
Linux中自旋锁
传统的spinlock Linux的的内核最常见的锁是自旋锁.自旋锁最多只能被一个可执行线程持有.如果一个执行线程试图获得一个被已经持有(争用)的自旋锁,那么该线程就会一直进行忙循环-旋转-等待锁重新 ...
Linux内核同步：自旋锁
linux内核--自旋锁的理解自旋锁:如果内核配置为SMP系统,自旋锁就按SMP系统上的要求来实现真正的自旋等待,但是对于UP系统,自旋锁仅做抢占和中断操作,没有实现真正的“自旋”.如果配置了CON ...
Optimistic concurrency control 死锁悲观锁乐观锁自旋锁
Optimistic concurrency control https://en.wikipedia.org/wiki/Optimistic_concurrency_control Optimist ...
spinlock自旋锁de使用
Linux内核中最常见的锁是自旋锁.一个自旋锁就是一个互斥设备,它只能有两个值:"锁定"和"解锁".如果锁可用,则"锁定"位被设置,而代码继 ...
Nginx学习之四-Nginx进程同步方式-自旋锁（spinlock）
自旋锁简介 Nginx框架使用了三种消息传递方式:共享内存.套接字.信号. Nginx主要使用了三种同步方式:原子操作.信号量.文件锁. 基于原子操作,nginx实现了一个自旋锁.自旋锁是一种非睡眠锁 ...
JAVA锁机制-可重入锁,可中断锁，公平锁，读写锁，自旋锁,
如果需要查看具体的synchronized和lock的实现原理,请参考:解决多线程安全问题-无非两个方法synchronized和lock 具体原理(百度) 在并发编程中,经常遇到多个线程访问同一个 ...
Linux 同步方法剖析--内核原子，自旋锁和相互排斥锁
在学习 Linux® 的过程中,您或许接触过并发(concurrency).临界段(critical section)和锁定,可是怎样在内核中使用这些概念呢?本文讨论了 2.6 版内核中可用的锁定机制 ...
linux 自旋锁和信号量【转】
转自:http://blog.csdn.net/xu_guo/article/details/6072823 版权声明:本文为博主原创文章,未经博主允许不得转载. 自旋锁最多只能被一个可执行线程持有( ...

随机推荐

（11）线程池（最新的concurrent.futures包去开启）
'''concurrent.futures是最新的开启线程池的包'''import timefrom concurrent.futures import ThreadPoolExecutor #开启线 ...
C++学习（二十九）（C语言部分）之顺序表
一.数据结构组织存放数据的方式精心选择的数据结构可以提升效率数据结构 1.逻辑结构一对多关系父与子一对一关系排队中多对多关系两地的路线 2.存储结构数据存放的位置关系顺序存储数据 ...
【HDOJ4109】【拓扑OR差分约束求关键路径】
http://acm.hdu.edu.cn/showproblem.php?pid=4109 Instrction Arrangement Time Limit: 2000/1000 MS (Java ...
Linux命令速查手册
Others make 通过外部编译器的,比如linux中的gcc集来编译源码获取Makefile文件的命令触发编译 curl -X GET/POST -I 获取head curl有cache 查看 ...
jsp的服务器响应，out.println 与response.setIntHeader的报错解决方案，附：导入jar包的方法
在九大内置对象中,笔者认为用的最多的就是out.println 与response.setIntHeader,今天刚写了一个服务器响应的代码,也总是这两个报错.具体请看图. 先来说说response. ...
Redis 5.0.0 releases notes
Redis 5.0 release notes ======================= ---------------------------------------------------- ...
【BZOJ3144】【HNOI2013】切糕
总算做了一道2011以后的省选题了……原题: 图片题面好评! P,Q,R≤40,0≤D≤R,给出的所有的不和谐值不超过1000. 文本样例好评! 恩这个是听妹主席讲过后会写的,首先把每个点拆成链,那么 ...
【java编程】Java魔法类：Unsafe应用解析
转载来源:https://tech.meituan.com/2019/02/14/talk-about-java-magic-class-unsafe.html 前言 Unsafe是位于sun.mis ...
oracle之rman备份
rman必须在oracle的归档模式下才能进行查看数据库是否为归档状态,在oracle数据库的命令行输入 archive log list; 首先关闭数据库 shutdown immediate; ...
makefile——小试牛刀
//a.h,包含头文件stdio.h,并且定义一个函数print #include<stdio.h> void print(); //b.c,包含头文件a.h,然后就可以写print函数的 ...

Windows和pthread中提供的自旋锁

Windows和pthread中提供的自旋锁的更多相关文章

随机推荐

热门专题