mirror of
https://github.com/MariaDB/server.git
synced 2025-08-07 00:04:31 +03:00
MDEV-4506: Parallel replication of group-committed transactions: Intermediate commit
First very rough sketch. We spawn and retire a pool of slave threads. Test main.alias works, most likely not much else does.
This commit is contained in:
509
sql/rpl_parallel.cc
Normal file
509
sql/rpl_parallel.cc
Normal file
@@ -0,0 +1,509 @@
|
||||
#include "my_global.h"
|
||||
#include "rpl_parallel.h"
|
||||
#include "slave.h"
|
||||
#include "rpl_mi.h"
|
||||
|
||||
|
||||
struct rpl_parallel_thread_pool global_rpl_thread_pool;
|
||||
|
||||
|
||||
static void
|
||||
rpt_handle_event(rpl_parallel_thread::queued_event *qev,
|
||||
THD *thd,
|
||||
struct rpl_parallel_thread *rpt)
|
||||
{
|
||||
int err;
|
||||
|
||||
/* ToDo: Access to thd, and what about rli, split out a parallel part? */
|
||||
err= apply_event_and_update_pos(qev->ev, thd, qev->rli, rpt);
|
||||
/* ToDo: error handling. */
|
||||
/* ToDo: also free qev->ev, or hold on to it for a bit if necessary. */
|
||||
}
|
||||
|
||||
|
||||
pthread_handler_t
|
||||
handle_rpl_parallel_thread(void *arg)
|
||||
{
|
||||
THD *thd;
|
||||
const char* old_msg;
|
||||
struct rpl_parallel_thread::queued_event *events;
|
||||
bool group_standalone= true;
|
||||
bool in_event_group= false;
|
||||
|
||||
struct rpl_parallel_thread *rpt= (struct rpl_parallel_thread *)arg;
|
||||
|
||||
my_thread_init();
|
||||
thd = new THD;
|
||||
thd->thread_stack = (char*)&thd;
|
||||
mysql_mutex_lock(&LOCK_thread_count);
|
||||
thd->thread_id= thd->variables.pseudo_thread_id= thread_id++;
|
||||
threads.append(thd);
|
||||
mysql_mutex_unlock(&LOCK_thread_count);
|
||||
set_current_thd(thd);
|
||||
pthread_detach_this_thread();
|
||||
thd->init_for_queries();
|
||||
thd->variables.binlog_annotate_row_events= 0;
|
||||
init_thr_lock();
|
||||
thd->store_globals();
|
||||
thd->system_thread= SYSTEM_THREAD_SLAVE_SQL;
|
||||
thd->security_ctx->skip_grants();
|
||||
thd->variables.max_allowed_packet= slave_max_allowed_packet;
|
||||
thd->slave_thread= 1;
|
||||
thd->enable_slow_log= opt_log_slow_slave_statements;
|
||||
thd->variables.log_slow_filter= global_system_variables.log_slow_filter;
|
||||
set_slave_thread_options(thd);
|
||||
thd->client_capabilities = CLIENT_LOCAL_FILES;
|
||||
thd_proc_info(thd, "Waiting for work from main SQL threads");
|
||||
thd->set_time();
|
||||
thd->variables.lock_wait_timeout= LONG_TIMEOUT;
|
||||
|
||||
mysql_mutex_lock(&rpt->LOCK_rpl_thread);
|
||||
rpt->thd= thd;
|
||||
|
||||
while (rpt->delay_start)
|
||||
mysql_cond_wait(&rpt->COND_rpl_thread, &rpt->LOCK_rpl_thread);
|
||||
|
||||
rpt->running= true;
|
||||
|
||||
while (!rpt->stop && !thd->killed)
|
||||
{
|
||||
rpl_parallel_thread *list;
|
||||
|
||||
old_msg= thd->proc_info;
|
||||
thd->enter_cond(&rpt->COND_rpl_thread, &rpt->LOCK_rpl_thread,
|
||||
"Waiting for work from SQL thread");
|
||||
while (!rpt->stop && !thd->killed && !(events= rpt->event_queue))
|
||||
mysql_cond_wait(&rpt->COND_rpl_thread, &rpt->LOCK_rpl_thread);
|
||||
rpt->free= false;
|
||||
rpt->event_queue= rpt->last_in_queue= NULL;
|
||||
thd->exit_cond(old_msg);
|
||||
|
||||
more_events:
|
||||
while (events)
|
||||
{
|
||||
struct rpl_parallel_thread::queued_event *next= events->next;
|
||||
Log_event_type event_type= events->ev->get_type_code();
|
||||
if (event_type == GTID_EVENT)
|
||||
{
|
||||
group_standalone=
|
||||
(0 != (static_cast<Gtid_log_event *>(events->ev)->flags2 &
|
||||
Gtid_log_event::FL_STANDALONE));
|
||||
in_event_group= true;
|
||||
}
|
||||
else
|
||||
{
|
||||
if (group_standalone)
|
||||
{
|
||||
if (!Log_event::is_part_of_group(event_type))
|
||||
in_event_group= false;
|
||||
}
|
||||
else if (event_type == XID_EVENT)
|
||||
in_event_group= false;
|
||||
else if (event_type == QUERY_EVENT)
|
||||
{
|
||||
Query_log_event *query= static_cast<Query_log_event *>(events->ev);
|
||||
if (!strcmp("COMMIT", query->query) ||
|
||||
!strcmp("ROLLBACK", query->query))
|
||||
in_event_group= false;
|
||||
}
|
||||
}
|
||||
rpt_handle_event(events, thd, rpt);
|
||||
free(events);
|
||||
events= next;
|
||||
}
|
||||
|
||||
mysql_mutex_lock(&rpt->LOCK_rpl_thread);
|
||||
if ((events= rpt->event_queue) != NULL)
|
||||
{
|
||||
rpt->event_queue= rpt->last_in_queue= NULL;
|
||||
mysql_mutex_unlock(&rpt->LOCK_rpl_thread);
|
||||
goto more_events;
|
||||
}
|
||||
|
||||
if (!in_event_group)
|
||||
{
|
||||
rpt->current_entry= NULL;
|
||||
if (!rpt->free)
|
||||
{
|
||||
mysql_mutex_lock(&rpt->pool->LOCK_rpl_thread_pool);
|
||||
list= rpt->pool->free_list;
|
||||
rpt->next= list;
|
||||
rpt->pool->free_list= list;
|
||||
if (!list)
|
||||
mysql_cond_signal(&rpt->pool->COND_rpl_thread_pool);
|
||||
mysql_mutex_unlock(&rpt->pool->LOCK_rpl_thread_pool);
|
||||
rpt->free= true;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
rpt->running= false;
|
||||
mysql_mutex_unlock(&rpt->LOCK_rpl_thread);
|
||||
|
||||
return NULL;
|
||||
}
|
||||
|
||||
|
||||
int
|
||||
rpl_parallel_change_thread_count(rpl_parallel_thread_pool *pool,
|
||||
uint32 new_count, bool skip_check)
|
||||
{
|
||||
uint32 i;
|
||||
rpl_parallel_thread **new_list= NULL;
|
||||
rpl_parallel_thread *new_free_list= NULL;
|
||||
|
||||
/*
|
||||
Allocate the new list of threads up-front.
|
||||
That way, if we fail half-way, we only need to free whatever we managed
|
||||
to allocate, and will not be left with a half-functional thread pool.
|
||||
*/
|
||||
if (new_count &&
|
||||
!(new_list= (rpl_parallel_thread **)my_malloc(new_count*sizeof(*new_list),
|
||||
MYF(MY_WME))))
|
||||
{
|
||||
my_error(ER_OUTOFMEMORY, MYF(0), (int(new_count*sizeof(*new_list))));
|
||||
goto err;;
|
||||
}
|
||||
|
||||
for (i= 0; i < new_count; ++i)
|
||||
{
|
||||
pthread_t th;
|
||||
|
||||
if (!(new_list[i]= (rpl_parallel_thread *)my_malloc(sizeof(*(new_list[i])),
|
||||
MYF(MY_WME))))
|
||||
{
|
||||
my_error(ER_OUTOFMEMORY, MYF(0), sizeof(*(new_list[i])));
|
||||
goto err;
|
||||
}
|
||||
new_list[i]->delay_start= true;
|
||||
new_list[i]->running= false;
|
||||
new_list[i]->stop= false;
|
||||
new_list[i]->free= false;
|
||||
mysql_mutex_init(key_LOCK_rpl_thread, &new_list[i]->LOCK_rpl_thread,
|
||||
MY_MUTEX_INIT_SLOW);
|
||||
mysql_cond_init(key_COND_rpl_thread, &new_list[i]->COND_rpl_thread, NULL);
|
||||
new_list[i]->pool= pool;
|
||||
new_list[i]->current_entry= NULL;
|
||||
new_list[i]->event_queue= NULL;
|
||||
new_list[i]->last_in_queue= NULL;
|
||||
if (mysql_thread_create(key_rpl_parallel_thread, &th, NULL,
|
||||
handle_rpl_parallel_thread, new_list[i]))
|
||||
{
|
||||
my_error(ER_OUT_OF_RESOURCES, MYF(0));
|
||||
my_free(new_list[i]);
|
||||
goto err;
|
||||
}
|
||||
new_list[i]->next= new_free_list;
|
||||
new_free_list= new_list[i];
|
||||
}
|
||||
|
||||
if (!skip_check)
|
||||
{
|
||||
mysql_mutex_lock(&LOCK_active_mi);
|
||||
if (master_info_index->give_error_if_slave_running())
|
||||
{
|
||||
mysql_mutex_unlock(&LOCK_active_mi);
|
||||
goto err;
|
||||
}
|
||||
if (pool->changing)
|
||||
{
|
||||
mysql_mutex_unlock(&LOCK_active_mi);
|
||||
my_error(ER_CHANGE_SLAVE_PARALLEL_THREADS_ACTIVE, MYF(0));
|
||||
goto err;
|
||||
}
|
||||
pool->changing= true;
|
||||
mysql_mutex_unlock(&LOCK_active_mi);
|
||||
}
|
||||
|
||||
for (i= 0; i < pool->count; ++i)
|
||||
{
|
||||
rpl_parallel_thread *rpt= pool->get_thread(NULL);
|
||||
rpt->stop= true;
|
||||
mysql_mutex_unlock(&rpt->LOCK_rpl_thread);
|
||||
}
|
||||
|
||||
for (i= 0; i < pool->count; ++i)
|
||||
{
|
||||
rpl_parallel_thread *rpt= pool->threads[i];
|
||||
mysql_mutex_lock(&rpt->LOCK_rpl_thread);
|
||||
while (rpt->running)
|
||||
mysql_cond_wait(&rpt->COND_rpl_thread, &rpt->LOCK_rpl_thread);
|
||||
mysql_mutex_unlock(&rpt->LOCK_rpl_thread);
|
||||
delete rpt;
|
||||
}
|
||||
|
||||
my_free(pool->threads);
|
||||
pool->threads= new_list;
|
||||
pool->free_list= new_free_list;
|
||||
pool->count= new_count;
|
||||
for (i= 0; i < pool->count; ++i)
|
||||
{
|
||||
mysql_mutex_lock(&pool->threads[i]->LOCK_rpl_thread);
|
||||
pool->threads[i]->delay_start= false;
|
||||
mysql_cond_signal(&pool->threads[i]->COND_rpl_thread);
|
||||
mysql_mutex_unlock(&pool->threads[i]->LOCK_rpl_thread);
|
||||
}
|
||||
|
||||
if (!skip_check)
|
||||
{
|
||||
mysql_mutex_lock(&LOCK_active_mi);
|
||||
pool->changing= false;
|
||||
mysql_mutex_unlock(&LOCK_active_mi);
|
||||
}
|
||||
return 0;
|
||||
|
||||
err:
|
||||
if (new_list)
|
||||
{
|
||||
while (new_free_list)
|
||||
{
|
||||
rpl_parallel_thread *next= new_free_list->next;
|
||||
mysql_mutex_lock(&new_free_list->LOCK_rpl_thread);
|
||||
new_free_list->delay_start= false;
|
||||
new_free_list->stop= true;
|
||||
while (!new_free_list->running)
|
||||
mysql_cond_wait(&new_free_list->COND_rpl_thread,
|
||||
&new_free_list->LOCK_rpl_thread);
|
||||
while (new_free_list->running)
|
||||
mysql_cond_wait(&new_free_list->COND_rpl_thread,
|
||||
&new_free_list->LOCK_rpl_thread);
|
||||
my_free(new_free_list);
|
||||
new_free_list= next;
|
||||
}
|
||||
my_free(new_list);
|
||||
}
|
||||
if (!skip_check)
|
||||
{
|
||||
mysql_mutex_lock(&LOCK_active_mi);
|
||||
pool->changing= false;
|
||||
mysql_mutex_unlock(&LOCK_active_mi);
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
||||
|
||||
rpl_parallel_thread_pool::rpl_parallel_thread_pool()
|
||||
: count(0), threads(0), free_list(0), changing(false), inited(false)
|
||||
{
|
||||
}
|
||||
|
||||
|
||||
int
|
||||
rpl_parallel_thread_pool::init(uint32 size)
|
||||
{
|
||||
count= 0;
|
||||
threads= NULL;
|
||||
free_list= NULL;
|
||||
|
||||
mysql_mutex_init(key_LOCK_rpl_thread_pool, &LOCK_rpl_thread_pool,
|
||||
MY_MUTEX_INIT_SLOW);
|
||||
mysql_cond_init(key_COND_rpl_thread_pool, &COND_rpl_thread_pool, NULL);
|
||||
changing= false;
|
||||
inited= true;
|
||||
|
||||
return rpl_parallel_change_thread_count(this, size, true);
|
||||
}
|
||||
|
||||
|
||||
void
|
||||
rpl_parallel_thread_pool::destroy()
|
||||
{
|
||||
if (!inited)
|
||||
return;
|
||||
rpl_parallel_change_thread_count(this, 0, true);
|
||||
mysql_mutex_destroy(&LOCK_rpl_thread_pool);
|
||||
mysql_cond_destroy(&COND_rpl_thread_pool);
|
||||
}
|
||||
|
||||
|
||||
struct rpl_parallel_thread *
|
||||
rpl_parallel_thread_pool::get_thread(rpl_parallel_entry *entry)
|
||||
{
|
||||
rpl_parallel_thread *rpt;
|
||||
|
||||
mysql_mutex_lock(&LOCK_rpl_thread_pool);
|
||||
while ((rpt= free_list) == NULL)
|
||||
mysql_cond_wait(&COND_rpl_thread_pool, &LOCK_rpl_thread_pool);
|
||||
free_list= rpt->next;
|
||||
mysql_mutex_lock(&rpt->LOCK_rpl_thread);
|
||||
mysql_mutex_unlock(&LOCK_rpl_thread_pool);
|
||||
rpt->current_entry= entry;
|
||||
|
||||
return rpt;
|
||||
}
|
||||
|
||||
|
||||
rpl_parallel::rpl_parallel() :
|
||||
current(NULL)
|
||||
{
|
||||
my_hash_init(&domain_hash, &my_charset_bin, 32,
|
||||
offsetof(rpl_parallel_entry, domain_id), sizeof(uint32),
|
||||
NULL, NULL, HASH_UNIQUE);
|
||||
}
|
||||
|
||||
|
||||
rpl_parallel::~rpl_parallel()
|
||||
{
|
||||
my_hash_free(&domain_hash);
|
||||
}
|
||||
|
||||
|
||||
rpl_parallel_entry *
|
||||
rpl_parallel::find(uint32 domain_id)
|
||||
{
|
||||
struct rpl_parallel_entry *e;
|
||||
|
||||
if (!(e= (rpl_parallel_entry *)my_hash_search(&domain_hash,
|
||||
(const uchar *)&domain_id, 0)))
|
||||
{
|
||||
/* Allocate a new, empty one. */
|
||||
if (!(e= (struct rpl_parallel_entry *)my_malloc(sizeof(*e), MYF(0))))
|
||||
return NULL;
|
||||
e->domain_id= domain_id;
|
||||
e->last_server_id= 0;
|
||||
e->last_seq_no= 0;
|
||||
e->last_commit_id= 0;
|
||||
e->active= false;
|
||||
e->rpl_thread= NULL;
|
||||
if (my_hash_insert(&domain_hash, (uchar *)e))
|
||||
{
|
||||
my_free(e);
|
||||
return NULL;
|
||||
}
|
||||
}
|
||||
|
||||
return e;
|
||||
}
|
||||
|
||||
|
||||
bool
|
||||
rpl_parallel::do_event(Relay_log_info *rli, Log_event *ev, THD *parent_thd)
|
||||
{
|
||||
rpl_parallel_entry *e;
|
||||
rpl_parallel_thread *cur_thread;
|
||||
rpl_parallel_thread::queued_event *qev;
|
||||
|
||||
if (!(qev= (rpl_parallel_thread::queued_event *)my_malloc(sizeof(*qev),
|
||||
MYF(0))))
|
||||
{
|
||||
my_error(ER_OUT_OF_RESOURCES, MYF(0));
|
||||
return true;
|
||||
}
|
||||
qev->ev= ev;
|
||||
qev->rli= rli;
|
||||
qev->next= NULL;
|
||||
|
||||
if (ev->get_type_code() == GTID_EVENT)
|
||||
{
|
||||
Gtid_log_event *gtid_ev= static_cast<Gtid_log_event *>(ev);
|
||||
|
||||
if (!(e= find(gtid_ev->domain_id)))
|
||||
{
|
||||
my_error(ER_OUT_OF_RESOURCES, MYF(0));
|
||||
return true;
|
||||
}
|
||||
|
||||
/* Check if we already have a worker thread for this entry. */
|
||||
cur_thread= e->rpl_thread;
|
||||
if (cur_thread)
|
||||
{
|
||||
mysql_mutex_lock(&cur_thread->LOCK_rpl_thread);
|
||||
if (cur_thread->current_entry != e)
|
||||
{
|
||||
/* Not ours anymore, we need to grab a new one. */
|
||||
mysql_mutex_unlock(&cur_thread->LOCK_rpl_thread);
|
||||
e->rpl_thread= cur_thread= NULL;
|
||||
}
|
||||
}
|
||||
|
||||
if (!cur_thread)
|
||||
{
|
||||
/*
|
||||
Nothing else is currently running in this domain. We can spawn a new
|
||||
thread to do this event group in parallel with anything else that might
|
||||
be running in other domains.
|
||||
*/
|
||||
if (gtid_ev->flags & Gtid_log_event::FL_GROUP_COMMIT_ID)
|
||||
{
|
||||
e->last_server_id= gtid_ev->server_id;
|
||||
e->last_seq_no= gtid_ev->seq_no;
|
||||
e->last_commit_id= gtid_ev->commit_id;
|
||||
}
|
||||
else
|
||||
{
|
||||
e->last_server_id= 0;
|
||||
e->last_seq_no= 0;
|
||||
e->last_commit_id= 0;
|
||||
}
|
||||
cur_thread= e->rpl_thread= global_rpl_thread_pool.get_thread(e);
|
||||
e->rpl_thread->wait_for= NULL; /* ToDo */
|
||||
/* get_thread() returns with the LOCK_rpl_thread locked. */
|
||||
}
|
||||
else if ((gtid_ev->flags & Gtid_log_event::FL_GROUP_COMMIT_ID) &&
|
||||
e->last_commit_id == gtid_ev->commit_id)
|
||||
{
|
||||
/*
|
||||
We are already executing something else in this domain. But the two
|
||||
event groups were committed together in the same group commit on the
|
||||
master, so we can still do them in parallel here on the slave.
|
||||
|
||||
However, the commit of this event must wait for the commit of the prior
|
||||
event, to preserve binlog commit order and visibility across all
|
||||
servers in the replication hierarchy.
|
||||
*/
|
||||
rpl_parallel_thread *rpt= global_rpl_thread_pool.get_thread(e);
|
||||
rpt->wait_for= cur_thread; /* ToDo */
|
||||
mysql_mutex_unlock(&cur_thread->LOCK_rpl_thread);
|
||||
e->rpl_thread= cur_thread= rpt;
|
||||
/* get_thread() returns with the LOCK_rpl_thread locked. */
|
||||
}
|
||||
else
|
||||
{
|
||||
/*
|
||||
We are still executing the previous event group for this replication
|
||||
domain, and we have to wait for that to finish before we can start on
|
||||
the next one. So just re-use the thread.
|
||||
*/
|
||||
}
|
||||
|
||||
current= e;
|
||||
}
|
||||
else
|
||||
{
|
||||
if (!current)
|
||||
{
|
||||
/* We have no domain_id yet, just run non-parallel. */
|
||||
rpt_handle_event(qev, parent_thd, NULL);
|
||||
return false;
|
||||
}
|
||||
cur_thread= current->rpl_thread;
|
||||
if (cur_thread)
|
||||
{
|
||||
mysql_mutex_lock(&cur_thread->LOCK_rpl_thread);
|
||||
if (cur_thread->current_entry != current)
|
||||
{
|
||||
/* Not ours anymore, we need to grab a new one. */
|
||||
mysql_mutex_unlock(&cur_thread->LOCK_rpl_thread);
|
||||
cur_thread= NULL;
|
||||
}
|
||||
}
|
||||
if (!cur_thread)
|
||||
{
|
||||
cur_thread= current->rpl_thread=
|
||||
global_rpl_thread_pool.get_thread(current);
|
||||
cur_thread->wait_for= NULL; /* ToDo */
|
||||
}
|
||||
}
|
||||
/*
|
||||
Queue the event for processing.
|
||||
*/
|
||||
if (cur_thread->last_in_queue)
|
||||
cur_thread->last_in_queue->next= qev;
|
||||
else
|
||||
cur_thread->event_queue= qev;
|
||||
cur_thread->last_in_queue= qev;
|
||||
mysql_cond_signal(&cur_thread->COND_rpl_thread);
|
||||
mysql_mutex_unlock(&cur_thread->LOCK_rpl_thread);
|
||||
|
||||
return false;
|
||||
}
|
Reference in New Issue
Block a user