关于x86_64架构下atomic、mutex、rwlock的性能对比-embeddedlwp-ChinaUnix博客

Wanpeng Li(李万鹏)

首页　| 　博文目录　| 　关于我

embeddedlwp

博客访问： 578760
博文数量： 168
博客积分： 62
博客等级：民兵
技术积分： 442
用户组：普通用户
注册时间： 2011-04-30 11:45

文章分类

全部博文（168）

未分配的博文（168）

文章存档

2016年（2）

2015年（19）

2014年（98）

2013年（22）

2012年（6）

2011年（21）

我的朋友

相关博文

关于x86_64架构下atomic、mutex、rwlock的性能对比

分类： LINUX

2014-09-23 08:27:04

原文地址：关于x86_64架构下atomic、mutex、rwlock的性能对比作者：瀚海书香

这里以多线程操作long类型变量，进行加法运算1亿次的时间作为性能对比的标准。

测试环境：SLES 11 SP2操作系统，3.0.80内核，CPU为Xeon 5506（2 sockets，每个socket 4 cores，每个core 1 thread，共8个核心）

由于glibc没有提供针对64位类型的atomic操作库，这里将内核中的实现代码移植到了应用层：
atomic64.h

点击(此处)折叠或打开

#ifndef __HI_ATOMIC64_H__
#define __HI_ATOMIC64_H__
#include <stdio.h>
#include <getopt.h>
#include <limits.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <pthread.h>
#include <sys/time.h>
#include <arpa/inet.h>
#include <fcntl.h>
#include <signal.h>
#include <errno.h>
#include <sys/time.h>
/* Adapted from the Linux kernel's x86_64 atomic64 implementation. */
#ifdef __x86_64__
#define LOCK_PREFIX "lock ;"
/*
 * atomic64_t - counter type operated on by the atomic64_* helpers in this
 * header. The value is kept in the single member `counter`.
 */
typedef struct {
long long counter;
} atomic64_t;
/**
 * atomic64_read - read atomic64 variable
 * @v: pointer of type atomic64_t
 *
 * Atomically reads the value of @v.
 * Doesn't imply a read memory barrier.
 *
 * The load is done through a volatile-qualified view of the structure, so
 * the counter is always accessed with its declared type instead of being
 * reinterpreted through a pointer to a different integer type.
 *
 * Return: the current value of the counter, converted to long.
 */
static inline long atomic64_read(const atomic64_t *v)
{
	const volatile atomic64_t *vv = v;

	return (long)vv->counter;
}
/**
 * atomic64_set - set atomic64 variable
 * @v: pointer to type atomic64_t
 * @i: required value
 *
 * Atomically sets the value of @v to @i.
 *
 * The store goes through a volatile-qualified view of the structure,
 * mirroring the volatile load in atomic64_read(), so the compiler has to
 * emit the store instead of dropping or merging it.
 */
static inline void atomic64_set(atomic64_t *v, long i)
{
	volatile atomic64_t *vv = v;

	vv->counter = i;
}
/**
 * atomic64_add - add integer to atomic64 variable
 * @i: integer value to add
 * @v: pointer to type atomic64_t
 *
 * Atomically adds @i to @v using a LOCK-prefixed addq.
 *
 * Spelled with __asm__/__volatile__ so that the header also compiles in
 * strict ISO modes (-std=c99, -std=c11), where the plain `asm` keyword is
 * not available. The counter is a single read-write memory operand ("+m").
 */
static inline void atomic64_add(long i, atomic64_t *v)
{
	__asm__ __volatile__(LOCK_PREFIX "addq %1,%0"
			     : "+m" (v->counter)
			     : "er" (i));
}
/**
 * atomic64_sub - subtract the atomic64 variable
 * @i: integer value to subtract
 * @v: pointer to type atomic64_t
 *
 * Atomically subtracts @i from @v using a LOCK-prefixed subq.
 *
 * Spelled with __asm__/__volatile__ so that the header also compiles in
 * strict ISO modes (-std=c99, -std=c11), where the plain `asm` keyword is
 * not available. The counter is a single read-write memory operand ("+m").
 */
static inline void atomic64_sub(long i, atomic64_t *v)
{
	__asm__ __volatile__(LOCK_PREFIX "subq %1,%0"
			     : "+m" (v->counter)
			     : "er" (i));
}
#else /* __x86_64__ */
/* FIXME:
 * Only x86_64 is implemented. This program is only expected to run on
 * x86_64 machines for the foreseeable future, so other CPU architectures
 * are deliberately _not_ handled here.
 */
#endif
#endif

测试代码performance.c

点击(此处)折叠或打开

/*******************************************************************************
This program is free software; you can redistribute it and/or modify it
under the terms and conditions of the GNU General Public License,
version 2, as published by the Free Software Foundation.
This program is distributed in the hope it will be useful, but WITHOUT
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
more details.
You should have received a copy of the GNU General Public License along with
this program; if not, write to the Free Software Foundation, Inc.,
51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
The full GNU General Public License is included in this distribution in
the file called "COPYING".
Date: 2014-04-15 21:27:57 CST
Contact Information:
Tony <tingw.liu@gmail.com>
Home, Qingdao, China.
*******************************************************************************/
#include "atomic64.h"
/* Counter incremented by add_func() through atomic64_add(). */
atomic64_t num;
/* Counter incremented by add_func_mutex() and add_func_rwlock(). */
long mutexnum = 0;
/* Limit taken from argv[2]; a worker stops once its counter exceeds it. */
long maxnum;
/* Buffer handed to gettimeofday(). */
struct timeval tv;
/* Start timestamp in microseconds, computed in main(). */
long starttime;
/*
 * gettimeofday() is called on the single global `tv`, which every thread
 * shares; this lock serializes the threads' use of that buffer.
 */
static pthread_mutex_t timelock = PTHREAD_MUTEX_INITIALIZER;
#define TIME_LOCK() pthread_mutex_lock(&timelock)
#define TIME_UNLOCK() pthread_mutex_unlock(&timelock)
/* Lock taken around the counter update in the mutex variant. */
static pthread_mutex_t numlock = PTHREAD_MUTEX_INITIALIZER;
#define MUTEX_LOCK() pthread_mutex_lock(&numlock)
#define MUTEX_UNLOCK() pthread_mutex_unlock(&numlock)
/* Lock taken (always as a write lock) in the rwlock variant. */
static pthread_rwlock_t rwnumlock = PTHREAD_RWLOCK_INITIALIZER;
#define RW_LOCK() pthread_rwlock_wrlock(&rwnumlock)
/* No trailing ';' in the expansion, so the macro is usable as an expression. */
#define RW_UNLOCK() pthread_rwlock_unlock(&rwnumlock)
/*
 * add_func - worker for the atomic variant of the benchmark.
 * @arg: unused.
 *
 * Keeps adding 1 to the global `num` with atomic64_add(). As soon as the
 * value read back exceeds `maxnum`, prints the number of microseconds
 * elapsed since `starttime` and stops.
 *
 * Return: always NULL.
 */
static void *add_func(void *arg)
{
	long stoptime;

	(void)arg;
	while (1) {
		atomic64_add(1, &num);
		if (atomic64_read(&num) <= maxnum)
			continue;

		/*
		 * `tv` is shared by all threads: convert it to microseconds
		 * before dropping the lock, otherwise another thread could
		 * overwrite it between gettimeofday() and the read.
		 */
		TIME_LOCK();
		gettimeofday(&tv, 0);
		stoptime = (long)tv.tv_sec * 1000000L + (long)tv.tv_usec;
		TIME_UNLOCK();
		printf("Used %ld microseconds\n", stoptime - starttime);
		break;
	}
	return NULL;
}
/*
 * add_func_rwlock - worker for the rwlock variant of the benchmark.
 * @arg: unused.
 *
 * Keeps incrementing the global `mutexnum` while holding the write lock.
 * As soon as the incremented value exceeds `maxnum`, prints the number of
 * microseconds elapsed since `starttime` and stops.
 *
 * Return: always NULL.
 */
static void *add_func_rwlock(void *arg)
{
	long stoptime;
	int done;

	(void)arg;
	while (1) {
		RW_LOCK();
		done = (++mutexnum > maxnum);
		RW_UNLOCK();
		if (!done)
			continue;

		/*
		 * `tv` is shared by all threads: convert it to microseconds
		 * before dropping the lock, otherwise another thread could
		 * overwrite it between gettimeofday() and the read.
		 */
		TIME_LOCK();
		gettimeofday(&tv, 0);
		stoptime = (long)tv.tv_sec * 1000000L + (long)tv.tv_usec;
		TIME_UNLOCK();
		printf("Used %ld microseconds\n", stoptime - starttime);
		break;
	}
	return NULL;
}
/*
 * add_func_mutex - worker for the mutex variant of the benchmark.
 * @arg: unused.
 *
 * Keeps incrementing the global `mutexnum` while holding the mutex. As
 * soon as the incremented value exceeds `maxnum`, prints the number of
 * microseconds elapsed since `starttime` and stops.
 *
 * Return: always NULL.
 */
static void *add_func_mutex(void *arg)
{
	long stoptime;
	int done;

	(void)arg;
	while (1) {
		MUTEX_LOCK();
		done = (++mutexnum > maxnum);
		MUTEX_UNLOCK();
		if (!done)
			continue;

		/*
		 * `tv` is shared by all threads: convert it to microseconds
		 * before dropping the lock, otherwise another thread could
		 * overwrite it between gettimeofday() and the read.
		 */
		TIME_LOCK();
		gettimeofday(&tv, 0);
		stoptime = (long)tv.tv_sec * 1000000L + (long)tv.tv_usec;
		TIME_UNLOCK();
		printf("Used %ld microseconds\n", stoptime - starttime);
		break;
	}
	return NULL;
}
/* Values accepted for the "type" command-line argument. */
enum {
	ATOMIC_TYPE = 0,
	MUTEX_TYPE = 1,
	RW_TYPE = 2
};
/* Print the command-line synopsis to stderr. */
static void usage(const char *prog)
{
	fprintf(stderr,
		"Usage: %s threadnum maxnum type[0-atomic, 1-mutex, 2-rwlock]\n",
		prog);
}

/*
 * Parse @s as a base-10 integer in [@min, @max] and store it in @out.
 * Returns 0 on success, -1 if @s is empty, has trailing characters or is
 * out of range.
 */
static int parse_arg(const char *s, long min, long max, long *out)
{
	char *end;
	long val;

	errno = 0;
	val = strtol(s, &end, 10);
	if (end == s || *end != '\0' || errno == ERANGE)
		return -1;
	if (val < min || val > max)
		return -1;
	*out = val;
	return 0;
}

/*
 * main - parse the command line, run the selected benchmark and wait for it.
 *
 * Arguments: threadnum (>= 1), maxnum (>= 0) and type (0 - atomic,
 * 1 - mutex, 2 - rwlock). Starts threadnum workers of the selected type,
 * each of which prints its elapsed time when the shared counter exceeds
 * maxnum, then joins them all.
 *
 * Return: 0 once every worker has finished. Exits with EXIT_FAILURE on
 * invalid arguments, allocation failure or thread creation failure.
 */
int main(int argc, char **argv)
{
	void *(*worker)(void *);
	pthread_t *threads;
	long nthreads, limit, kind;
	int threadnum, i, rc;

	if (argc != 4) {
		usage(argv[0]);
		exit(EXIT_FAILURE);
	}
	/*
	 * Every worker may bump the counter once more after the limit has
	 * been crossed, so keep threadnum of headroom below LONG_MAX to stop
	 * the counter from overflowing.
	 */
	if (parse_arg(argv[1], 1, INT_MAX, &nthreads) != 0 ||
	    parse_arg(argv[2], 0, LONG_MAX - nthreads, &limit) != 0 ||
	    parse_arg(argv[3], ATOMIC_TYPE, RW_TYPE, &kind) != 0) {
		usage(argv[0]);
		exit(EXIT_FAILURE);
	}
	threadnum = (int)nthreads;
	maxnum = limit;

	switch ((int)kind) {
	case ATOMIC_TYPE:
		worker = add_func;
		break;
	case MUTEX_TYPE:
		worker = add_func_mutex;
		break;
	default:	/* RW_TYPE: the range was checked by parse_arg() */
		worker = add_func_rwlock;
		break;
	}

	threads = calloc((size_t)threadnum, sizeof *threads);
	if (threads == NULL) {
		perror("calloc");
		exit(EXIT_FAILURE);
	}

	printf("Use %d threads add num from 0 to %ld\n", threadnum, maxnum);
	gettimeofday(&tv, 0);
	starttime = (long)tv.tv_sec * 1000000L + (long)tv.tv_usec;
	atomic64_set(&num, 0);

	for (i = 0; i < threadnum; i++) {
		/* NULL attributes: the workers use the default thread attributes. */
		rc = pthread_create(&threads[i], NULL, worker, NULL);
		if (rc != 0) {
			fprintf(stderr, "pthread_create: %s\n", strerror(rc));
			exit(EXIT_FAILURE);
		}
	}

	/* Wait for every worker to print its result before exiting. */
	for (i = 0; i < threadnum; i++) {
		rc = pthread_join(threads[i], NULL);
		if (rc != 0)
			fprintf(stderr, "pthread_join: %s\n", strerror(rc));
	}

	free(threads);
	return 0;
}

运行结果这里就不详细列出来了，可以直接看这个曲线图。

横坐标是线程数，纵坐标是运算1亿次耗费的微秒数。
从这个图中可以看出，对于频繁写操作的情况，性能排序为 atomic > mutex > rwlock。
对于同一种同步类型，耗时并不是随着线程数的增加而一直增加；不过因为测试机器只有8个核心，所以没有测试更多线程的情况。

欢迎转载，转载请注明出处：http://forever.blog.chinaunix.net

阅读(1188) | 评论(0) | 转发(0) |

上一篇：ubuntu 12.04下如何将物理网卡加入bridge连接外网

下一篇：F2FS文件系统架构与原理分析(一)——设计背景与功能

给主人留下些什么吧！~~

感谢所有关心和支持过ChinaUnix的朋友们

16024965号-6