mirror of
https://github.com/MariaDB/server.git
synced 2025-08-08 11:22:35 +03:00
amd64 atomic ops
lock-free alloc (WL#3229), lock-free hash (WL#3230) bit functions made inline include/Makefile.am: lf.h added mysys/Makefile.am: lf_hash.c lf_dynarray.c lf_alloc-pin.c include/atomic/nolock.h: amd64 atomic ops include/atomic/rwlock.h: s/rw_lock/mutex/g include/atomic/x86-gcc.h: amd64 atomic ops try PAUSE include/my_global.h: STATIC_INLINE mysys/mf_keycache.c: make bit functions inline mysys/my_atomic.c: STATIC_INLINE mysys/my_bitmap.c: make bit functions inline sql/ha_myisam.cc: make bit functions inline sql/item_func.cc: make bit functions inline include/my_atomic.h: STATIC_INLINE mysys/my_bit.c: make bit functions inline sql/sql_select.cc: make bit functions inline storage/myisam/mi_create.c: make bit functions inline storage/myisam/mi_test2.c: make bit functions inline storage/myisam/myisamchk.c: make bit functions inline mysys/my_init.c: thread_size moved to mysys sql/mysql_priv.h: thread_size moved to mysys sql/set_var.cc: thread_size moved to mysys include/my_sys.h: thread_size moved to mysys sql/mysqld.cc: thread_size moved to mysys sql/sql_parse.cc: thread_size moved to mysys sql/sql_test.cc: thread_size moved to mysys include/lf.h: dylf_dynarray refactored to remove 65536 elements limit mysys/lf_alloc-pin.c: dylf_dynarray refactored to remove 65536 elements limit mysys/lf_dynarray.c: dylf_dynarray refactored to remove 65536 elements limit mysys/lf_hash.c: dylf_dynarray refactored to remove 65536 elements limit unittest/mysys/my_atomic-t.c: fix to commit (remove debug code)
This commit is contained in:
@@ -14,13 +14,20 @@
|
||||
along with this program; if not, write to the Free Software
|
||||
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */
|
||||
|
||||
#include <my_global.h>
|
||||
//#define MY_ATOMIC_MODE_RWLOCKS
|
||||
//#define MY_ATOMIC_MODE_DUMMY
|
||||
|
||||
#include <tap.h>
|
||||
|
||||
#include <my_global.h>
|
||||
#include <my_sys.h>
|
||||
#include <my_atomic.h>
|
||||
#include <lf.h>
|
||||
|
||||
int32 a32,b32,c32;
|
||||
volatile uint32 a32,b32,c32;
|
||||
my_atomic_rwlock_t rwl;
|
||||
LF_ALLOCATOR lf_allocator;
|
||||
LF_HASH lf_hash;
|
||||
|
||||
pthread_attr_t thr_attr;
|
||||
pthread_mutex_t mutex;
|
||||
@@ -30,9 +37,9 @@ int N;
|
||||
/* add and sub a random number in a loop. Must get 0 at the end */
|
||||
pthread_handler_t test_atomic_add_handler(void *arg)
|
||||
{
|
||||
int m=*(int *)arg;
|
||||
int m=(*(int *)arg)/2;
|
||||
int32 x;
|
||||
for (x=((int)(&m)); m ; m--)
|
||||
for (x=((int)(intptr)(&m)); m ; m--)
|
||||
{
|
||||
x=x*m+0x87654321;
|
||||
my_atomic_rwlock_wrlock(&rwl);
|
||||
@@ -61,15 +68,9 @@ pthread_handler_t test_atomic_add_handler(void *arg)
|
||||
pthread_handler_t test_atomic_swap_handler(void *arg)
|
||||
{
|
||||
int m=*(int *)arg;
|
||||
int32 x;
|
||||
uint32 x=my_atomic_add32(&b32, 1);
|
||||
|
||||
my_atomic_rwlock_wrlock(&rwl);
|
||||
x=my_atomic_add32(&b32, 1);
|
||||
my_atomic_rwlock_wrunlock(&rwl);
|
||||
|
||||
my_atomic_rwlock_wrlock(&rwl);
|
||||
my_atomic_add32(&a32, x);
|
||||
my_atomic_rwlock_wrunlock(&rwl);
|
||||
|
||||
for (; m ; m--)
|
||||
{
|
||||
@@ -98,29 +99,29 @@ pthread_handler_t test_atomic_swap_handler(void *arg)
|
||||
|
||||
/*
|
||||
same as test_atomic_add_handler, but my_atomic_add32 is emulated with
|
||||
(slower) my_atomic_cas32
|
||||
my_atomic_cas32 - notice that the slowdown is proportional to the
|
||||
number of CPUs
|
||||
*/
|
||||
pthread_handler_t test_atomic_cas_handler(void *arg)
|
||||
{
|
||||
int m=*(int *)arg, ok;
|
||||
int32 x,y;
|
||||
for (x=((int)(&m)); m ; m--)
|
||||
int m=(*(int *)arg)/2, ok=0;
|
||||
int32 x, y;
|
||||
for (x=((int)(intptr)(&m)); m ; m--)
|
||||
{
|
||||
my_atomic_rwlock_wrlock(&rwl);
|
||||
y=my_atomic_load32(&a32);
|
||||
my_atomic_rwlock_wrunlock(&rwl);
|
||||
|
||||
x=x*m+0x87654321;
|
||||
do {
|
||||
my_atomic_rwlock_wrlock(&rwl);
|
||||
ok=my_atomic_cas32(&a32, &y, y+x);
|
||||
my_atomic_rwlock_wrunlock(&rwl);
|
||||
} while (!ok);
|
||||
} while (!ok) ;
|
||||
do {
|
||||
my_atomic_rwlock_wrlock(&rwl);
|
||||
ok=my_atomic_cas32(&a32, &y, y-x);
|
||||
my_atomic_rwlock_wrunlock(&rwl);
|
||||
} while (!ok);
|
||||
} while (!ok) ;
|
||||
}
|
||||
pthread_mutex_lock(&mutex);
|
||||
N--;
|
||||
@@ -129,6 +130,128 @@ pthread_handler_t test_atomic_cas_handler(void *arg)
|
||||
return 0;
|
||||
}
|
||||
|
||||
/*
|
||||
pin allocator - alloc and release an element in a loop
|
||||
*/
|
||||
pthread_handler_t test_lf_pinbox(void *arg)
|
||||
{
|
||||
int m=*(int *)arg;
|
||||
int32 x=0;
|
||||
LF_PINS *pins;
|
||||
|
||||
pins=lf_pinbox_get_pins(&lf_allocator.pinbox);
|
||||
|
||||
for (x=((int)(intptr)(&m)); m ; m--)
|
||||
{
|
||||
lf_pinbox_put_pins(pins);
|
||||
pins=lf_pinbox_get_pins(&lf_allocator.pinbox);
|
||||
}
|
||||
lf_pinbox_put_pins(pins);
|
||||
pthread_mutex_lock(&mutex);
|
||||
N--;
|
||||
if (!N)
|
||||
pthread_cond_signal(&cond);
|
||||
pthread_mutex_unlock(&mutex);
|
||||
return 0;
|
||||
}
|
||||
|
||||
typedef union {
|
||||
int32 data;
|
||||
void *not_used; /* to guarantee sizeof(TLA) >= sizeof(void *) */
|
||||
} TLA;
|
||||
|
||||
pthread_handler_t test_lf_alloc(void *arg)
|
||||
{
|
||||
int m=(*(int *)arg)/2;
|
||||
int32 x,y=0;
|
||||
LF_PINS *pins;
|
||||
|
||||
pins=lf_alloc_get_pins(&lf_allocator);
|
||||
|
||||
for (x=((int)(intptr)(&m)); m ; m--)
|
||||
{
|
||||
TLA *node1, *node2;
|
||||
x=x*m+0x87654321;
|
||||
node1=(TLA *)lf_alloc_new(pins);
|
||||
node1->data=x;
|
||||
y+=node1->data;
|
||||
node1->data=0;
|
||||
node2=(TLA *)lf_alloc_new(pins);
|
||||
node2->data=x;
|
||||
y-=node2->data;
|
||||
node2->data=0;
|
||||
lf_alloc_free(pins, node1);
|
||||
lf_alloc_free(pins, node2);
|
||||
}
|
||||
lf_alloc_put_pins(pins);
|
||||
my_atomic_rwlock_wrlock(&rwl);
|
||||
my_atomic_add32(&a32, y);
|
||||
my_atomic_rwlock_wrunlock(&rwl);
|
||||
pthread_mutex_lock(&mutex);
|
||||
N--;
|
||||
if (!N)
|
||||
{
|
||||
diag("%d mallocs, %d pins in stack",
|
||||
lf_allocator.mallocs, lf_allocator.pinbox.pins_in_stack);
|
||||
#ifdef MY_LF_EXTRA_DEBUG
|
||||
a32|=lf_allocator.mallocs - lf_alloc_in_pool(&lf_allocator);
|
||||
#endif
|
||||
pthread_cond_signal(&cond);
|
||||
}
|
||||
pthread_mutex_unlock(&mutex);
|
||||
return 0;
|
||||
}
|
||||
|
||||
#define N_TLH 1000
|
||||
pthread_handler_t test_lf_hash(void *arg)
|
||||
{
|
||||
int m=(*(int *)arg)/(2*N_TLH);
|
||||
int32 x,y,z,sum=0, ins=0;
|
||||
LF_PINS *pins;
|
||||
|
||||
pins=lf_hash_get_pins(&lf_hash);
|
||||
|
||||
for (x=((int)(intptr)(&m)); m ; m--)
|
||||
{
|
||||
int i;
|
||||
y=x;
|
||||
for (i=0; i < N_TLH; i++)
|
||||
{
|
||||
x=x*(m+i)+0x87654321;
|
||||
z=(x<0) ? -x : x;
|
||||
if (lf_hash_insert(&lf_hash, pins, &z))
|
||||
{
|
||||
sum+=z;
|
||||
ins++;
|
||||
}
|
||||
}
|
||||
for (i=0; i < N_TLH; i++)
|
||||
{
|
||||
y=y*(m+i)+0x87654321;
|
||||
z=(y<0) ? -y : y;
|
||||
if (lf_hash_delete(&lf_hash, pins, (uchar *)&z, sizeof(z)))
|
||||
sum-=z;
|
||||
}
|
||||
}
|
||||
lf_hash_put_pins(pins);
|
||||
my_atomic_rwlock_wrlock(&rwl);
|
||||
my_atomic_add32(&a32, sum);
|
||||
my_atomic_add32(&b32, ins);
|
||||
my_atomic_rwlock_wrunlock(&rwl);
|
||||
pthread_mutex_lock(&mutex);
|
||||
N--;
|
||||
if (!N)
|
||||
{
|
||||
diag("%d mallocs, %d pins in stack, %d hash size, %d inserts",
|
||||
lf_hash.alloc.mallocs, lf_hash.alloc.pinbox.pins_in_stack,
|
||||
lf_hash.size, b32);
|
||||
a32|=lf_hash.count;
|
||||
pthread_cond_signal(&cond);
|
||||
}
|
||||
pthread_mutex_unlock(&mutex);
|
||||
return 0;
|
||||
}
|
||||
|
||||
void test_atomic(const char *test, pthread_handler handler, int n, int m)
|
||||
{
|
||||
pthread_t t;
|
||||
@@ -141,23 +264,24 @@ void test_atomic(const char *test, pthread_handler handler, int n, int m)
|
||||
diag("Testing %s with %d threads, %d iterations... ", test, n, m);
|
||||
for (N=n ; n ; n--)
|
||||
pthread_create(&t, &thr_attr, handler, &m);
|
||||
|
||||
pthread_mutex_lock(&mutex);
|
||||
while (N)
|
||||
pthread_cond_wait(&cond, &mutex);
|
||||
pthread_mutex_unlock(&mutex);
|
||||
now=my_getsystime()-now;
|
||||
ok(a32 == 0, "tested %s in %g secs", test, ((double)now)/1e7);
|
||||
ok(a32 == 0, "tested %s in %g secs (%d)", test, ((double)now)/1e7, a32);
|
||||
}
|
||||
|
||||
int main()
|
||||
{
|
||||
int err;
|
||||
|
||||
diag("N CPUs: %d", my_getncpus());
|
||||
my_init();
|
||||
|
||||
diag("N CPUs: %d, atomic ops: %s", my_getncpus(), MY_ATOMIC_MODE);
|
||||
err= my_atomic_initialize();
|
||||
|
||||
plan(4);
|
||||
plan(7);
|
||||
ok(err == 0, "my_atomic_initialize() returned %d", err);
|
||||
|
||||
pthread_attr_init(&thr_attr);
|
||||
@@ -165,15 +289,31 @@ int main()
|
||||
pthread_mutex_init(&mutex, 0);
|
||||
pthread_cond_init(&cond, 0);
|
||||
my_atomic_rwlock_init(&rwl);
|
||||
lf_alloc_init(&lf_allocator, sizeof(TLA));
|
||||
lf_hash_init(&lf_hash, sizeof(int), LF_HASH_UNIQUE, 0, sizeof(int), 0,
|
||||
&my_charset_bin);
|
||||
|
||||
test_atomic("my_atomic_add32", test_atomic_add_handler, 100,1000000);
|
||||
test_atomic("my_atomic_swap32", test_atomic_swap_handler, 100,1000000);
|
||||
test_atomic("my_atomic_cas32", test_atomic_cas_handler, 100,1000000);
|
||||
#ifdef MY_ATOMIC_MODE_RWLOCKS
|
||||
#define CYCLES 10000
|
||||
#else
|
||||
#define CYCLES 1000000
|
||||
#endif
|
||||
#define THREADS 100
|
||||
|
||||
test_atomic("my_atomic_add32", test_atomic_add_handler, THREADS,CYCLES);
|
||||
test_atomic("my_atomic_swap32", test_atomic_swap_handler, THREADS,CYCLES);
|
||||
test_atomic("my_atomic_cas32", test_atomic_cas_handler, THREADS,CYCLES);
|
||||
test_atomic("lf_pinbox", test_lf_pinbox, THREADS,CYCLES);
|
||||
test_atomic("lf_alloc", test_lf_alloc, THREADS,CYCLES);
|
||||
test_atomic("lf_hash", test_lf_hash, THREADS,CYCLES);
|
||||
|
||||
lf_hash_end(&lf_hash);
|
||||
lf_alloc_end(&lf_allocator);
|
||||
pthread_mutex_destroy(&mutex);
|
||||
pthread_cond_destroy(&cond);
|
||||
pthread_attr_destroy(&thr_attr);
|
||||
my_atomic_rwlock_destroy(&rwl);
|
||||
my_end(0);
|
||||
return exit_status();
|
||||
}
|
||||
|
||||
|
Reference in New Issue
Block a user