mirror of
https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
synced 2025-04-18 21:44:02 +03:00
This patch improves the handling of NULLs in textual fields in ColumnStore. Previously, empty strings were treated as NULLs, which was a problem whenever the data schema allows empty strings. It was also one of the major reasons for behavioral differences between ColumnStore and the other engines in the MariaDB family. In addition, this patch fixes some other bugs and incorrect behavior, for example the comparison "column <= ''", which evaluated to constant True for all purposes before this patch.
1005 lines
28 KiB
C++
1005 lines
28 KiB
C++
/* Copyright (C) 2014 InfiniDB, Inc.
|
|
Copyright (C) 2019 MariaDB Corporation
|
|
|
|
This program is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU General Public License
|
|
as published by the Free Software Foundation; version 2 of
|
|
the License.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
|
|
MA 02110-1301, USA. */
|
|
|
|
/*
|
|
* $Id: ha_mcs_dml.cpp 9711 2013-07-23 21:01:27Z chao $
|
|
*/
|
|
|
|
#define PREFER_MY_CONFIG_H
|
|
#include <my_config.h>
|
|
#include <string>
|
|
#include <iostream>
|
|
#include <stack>
|
|
#include <tr1/unordered_map>
|
|
#include <tr1/unordered_set>
|
|
#include <fstream>
|
|
#include <sstream>
|
|
#include <cerrno>
|
|
#include <cstring>
|
|
using namespace std;
|
|
|
|
#include <boost/shared_ptr.hpp>
|
|
using namespace boost;
|
|
|
|
#include "idb_mysql.h"
|
|
|
|
#define NEED_CALPONT_INTERFACE
|
|
#include "ha_mcs_impl.h"
|
|
|
|
#include "ha_mcs_impl_if.h"
|
|
using namespace cal_impl_if;
|
|
|
|
#include "vendordmlstatement.h"
|
|
#include "calpontdmlpackage.h"
|
|
#include "calpontdmlfactory.h"
|
|
using namespace dmlpackage;
|
|
|
|
#include "dmlpackageprocessor.h"
|
|
using namespace dmlpackageprocessor;
|
|
|
|
#include "dataconvert.h"
|
|
using namespace dataconvert;
|
|
|
|
#include "bytestream.h"
|
|
using namespace messageqcpp;
|
|
|
|
#include "configcpp.h"
|
|
using namespace config;
|
|
|
|
#include "calpontsystemcatalog.h"
|
|
using namespace execplan;
|
|
|
|
#include "resourcemanager.h"
|
|
using namespace joblist;
|
|
//#include "stopwatch.h"
|
|
// using namespace logging;
|
|
|
|
#include "dbrm.h"
|
|
|
|
#include "ha_mcs_datatype.h"
|
|
|
|
#include "nullstring.h"
|
|
|
|
namespace
|
|
{
|
|
// Row-count threshold compared against the pending batch size when
// ci.isCacheInsert is set; see ha_mcs_impl_write_row_().
#define BATCH_INSERT_GROUP_ROWS_FOR_CACHE 100000
|
|
// Row-count threshold compared against the pending batch size for non-cache
// inserts. 0 means "not loaded yet": ha_mcs_impl_write_row_() fills it from
// ResourceManager::instance()->getRowsPerBatch() the first time it sees 0.
uint64_t fBatchInsertGroupRows = 0; // ResourceManager::instance()->getRowsPerBatch();
|
|
// HDFS is never used nowadays, so don't bother
|
|
// Kept as a flag (instead of querying ResourceManager) so the HDFS-specific
// branches in this file stay compilable while being switched off.
bool useHdfs = false; // ResourceManager::instance()->useHdfs();
|
|
|
|
// convenience fcn
|
|
inline uint32_t tid2sid(const uint32_t tid)
|
|
{
|
|
return execplan::CalpontSystemCatalog::idb_tid2sid(tid);
|
|
}
|
|
|
|
// StopWatch timer;
|
|
// Appends the current row of `table` to the per-column value lists kept in `ci`.
//
// For every field, in table order:
//   * one NullString is pushed onto ci.tableValuesMap[<column position>];
//   * ci.nullValuesBitset[<column position>] records whether the field is NULL;
//   * the field name is appended to ci.colNameList.
//
// Empty strings are stored as (non-NULL) empty values; only fields reporting
// is_null() are stored as NULL.
//
// Returns the number of values accumulated so far for column 0.
uint32_t buildValueList(TABLE* table, cal_connection_info& ci)
{
  // Scratch storage handed to Field::val_str() for everything that is not a
  // floating point field.
  char scratch[1024];
  String fieldText(scratch, sizeof(scratch), &my_charset_bin);

  // Pushed (by copy) for every NULL field.
  NullString nullValue;

  ci.nullValuesBitset.reset();

  int col = 0;

  for (Field** cursor = table->field; *cursor; ++cursor, ++col)
  {
    Field* const fld = *cursor;

    if (fld->is_null())
    {
      ci.tableValuesMap[col].push_back(nullValue);
      ci.nullValuesBitset[col] = true;
    }
    else
    {
      bitmap_set_bit(table->read_set, fld->field_index);
      ci.nullValuesBitset[col] = false;

      if (fld->result_type() == REAL_RESULT)
      {
        // @bug 3798 get real value for float/double type
        const double realValue = fld->val_real();
        const unsigned bufLen = 1024 + 1 + 1 + 1;  // 1 for leading zero, 1 for dp, 1 for null
        char digits[bufLen] = {0};
        snprintf(digits, bufLen, "%.1024f", realValue);

        NullString formatted(digits, strlen(digits));
        ci.tableValuesMap[col].push_back(formatted);
      }
      else
      {
        // Every other data type is fetched through its string representation.
        fld->val_str(&fieldText, &fieldText);

        string text(fieldText.ptr(), fieldText.length());
        NullString textValue(text);
        ci.tableValuesMap[col].push_back(textValue);
      }
    }

    ci.colNameList.push_back(fld->field_name.str);
  }

  return ci.tableValuesMap[0].size();
}
|
|
|
|
// Sends a session-level command (the callers in this file use "COMMIT",
// "ROLLBACK" and "CLEANUP") to DMLProc and waits for the reply.
//
// thd          - server thread; supplies the session id and the autocommit
//                flags and receives any error that is raised.
// dmlStatement - command text. The special value "LOGGING" sends the text of
//                the query thd is currently executing ("<Replication event>"
//                when there is none) with logging switched off and `schema`
//                attached to the package.
// ci           - connection info. ci.dmlProc is used for the exchange and is
//                always deleted and reset to NULL before returning.
// schema       - schema name, only used in the "LOGGING" case.
//
// Returns 0 on success and 1 on failure; on failure an error is raised on thd.
int ProcessCommandStatement(THD* thd, string& dmlStatement, cal_connection_info& ci, std::string schema = "")
{
  int rc = 0;

  const ulong sessionID = tid2sid(thd->thread_id);

  //@Bug 2721 and 2722. Log the statement before issuing commit/rollback
  const bool logOnly = (dmlStatement == "LOGGING");
  std::string statementText;

  if (logOnly)
  {
    const char* queryText = idb_mysql_query_str(thd);
    statementText = queryText ? queryText : "<Replication event>";
  }
  else
  {
    statementText = dmlStatement;
  }

  VendorDMLStatement cmdStmt(statementText, DML_COMMAND, sessionID);

  if (logOnly)
    cmdStmt.set_Logging(false);

  // Owned through a smart pointer so the package is released even if
  // serialising it throws.
  boost::shared_ptr<CalpontDMLPackage> dmlPackage(
      CalpontDMLFactory::makeCalpontDMLPackageFromMysqlBuffer(cmdStmt));

  if (!dmlPackage)
  {
    // The factory could not build a package: report it instead of
    // dereferencing a null pointer. The connection is still torn down so the
    // "ci.dmlProc is NULL on return" postcondition holds on every path.
    rc = 1;
    thd->get_stmt_da()->set_overwrite_status(true);
    thd->raise_error_printf(ER_INTERNAL_ERROR, "Calpont DML package cannot build. ");
    delete ci.dmlProc;
    ci.dmlProc = NULL;
    return rc;
  }

  if (logOnly)
  {
    dmlPackage->set_Logging(false);
    dmlPackage->set_SchemaName(schema);
  }

  dmlPackage->setTableOid(ci.tableOid);

  if (!ci.singleInsert)
  {
    dmlPackage->set_isBatchInsert(true);
  }

  // Autocommit is reported as on when the session is neither in
  // NOT_AUTOCOMMIT mode nor inside an explicit BEGIN, or when HDFS is in use.
  if (useHdfs || !(thd->variables.option_bits & (OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN)))
    dmlPackage->set_isAutocommitOn(true);

  ByteStream bytestream;
  bytestream << static_cast<uint32_t>(sessionID);
  dmlPackage->write(bytestream);
  dmlPackage.reset();  // the serialised form is all that is needed from here on

  ByteStream::byte b = 0;
  string errormsg;
  ByteStream::octbyte rows = 0;

  try
  {
    ci.dmlProc->write(bytestream);
    bytestream = ci.dmlProc->read();

    if (bytestream.length() == 0)
    {
      // An empty reply means the peer went away.
      rc = 1;
      thd->killed = KILL_QUERY;
      thd->get_stmt_da()->set_overwrite_status(true);
      thd->raise_error_printf(ER_INTERNAL_ERROR, "Lost connection to DMLProc [1]");
    }
    else
    {
      // Reply layout: status byte, row count, error message.
      bytestream >> b;
      bytestream >> rows;
      bytestream >> errormsg;
    }
  }
  catch (runtime_error&)
  {
    rc = 1;
    thd->killed = KILL_QUERY;
    thd->get_stmt_da()->set_overwrite_status(true);
    thd->raise_error_printf(ER_INTERNAL_ERROR, "Lost connection to DMLProc [2]");
  }
  catch (...)
  {
    rc = 1;
    thd->killed = KILL_QUERY;
    thd->get_stmt_da()->set_overwrite_status(true);
    thd->raise_error_printf(ER_INTERNAL_ERROR, "Caught unknown error");
  }

  // Report the error sent by DMLProc unless an error has already been recorded
  // for this statement.
  if ((b != 0) && (!thd->get_stmt_da()->is_set()))
  {
    rc = 1;
    thd->killed = KILL_QUERY;
    thd->raise_error_printf(ER_INTERNAL_ERROR, errormsg.c_str());
  }

  delete ci.dmlProc;
  ci.dmlProc = NULL;
  return rc;
}
|
|
|
|
// Packages the rows accumulated in ci (ci.colNameList, ci.tableValuesMap,
// ci.nullValuesBitset) into an INSERT DML package, sends it to DMLProc and
// interprets the reply.
//
// table     - target table; supplies the table and schema names.
// size      - number of rows in this batch.
// ci        - connection info. ci.tableValuesMap and ci.colNameList are cleared
//             right after the package has been requested. ci.dmlProc is
//             replaced by a fresh client when the first batch has to be
//             resent. ci.rc is updated when the outcome is non-zero.
// lastBatch - true when this is the final batch of the statement.
//
// Returns 0 on success, -1 when the package cannot be built or the connection
// to DMLProc is lost, otherwise the status byte reported by DMLProc. An
// IDBRANGE_WARNING status is turned into 0 (plus a warning) unless the session
// is in strict mode.
int doProcessInsertValues(TABLE* table, uint32_t size, cal_connection_info& ci, bool lastBatch = false)
{
  THD* thd = current_thd;
  uint32_t sessionID = tid2sid(thd->thread_id);

  int rc = 0;

  char* query_char = idb_mysql_query_str(thd);
  std::string query_str;

  if (!query_char)
  {
    query_str = "<Replication event>";
  }
  else
  {
    query_str = query_char;
  }

  VendorDMLStatement dmlStmts(query_str, DML_INSERT, table->s->table_name.str, table->s->db.str, size,
                              ci.colNameList.size(), ci.colNameList, ci.tableValuesMap, ci.nullValuesBitset,
                              sessionID);

  CalpontDMLPackage* pDMLPackage = CalpontDMLFactory::makeCalpontDMLPackageFromMysqlBuffer(dmlStmts);

  //@Bug 2466 Move the clean up earlier to avoid the second insert in another session to get the data
  ci.tableValuesMap.clear();
  ci.colNameList.clear();

  // The package must be validated before it is touched for the first time.
  if (!pDMLPackage)
  {
    rc = -1;
    string emsg("Calpont DML package cannot build. ");
    thd->get_stmt_da()->set_overwrite_status(true);
    thd->raise_error_printf(ER_INTERNAL_ERROR, emsg.c_str());
    return rc;
  }

  pDMLPackage->set_isCacheInsert(ci.isCacheInsert);

  //@Bug 2721 and 2722 log batch insert statement only once in the debug file.
  if (((ci.isLoaddataInfile) || ((ci.rowsHaveInserted + size) < ci.bulkInsertRows)) &&
      (ci.rowsHaveInserted > 0))
  {
    // Intermediate batch: neither the start nor the end of the statement.
    pDMLPackage->set_Logging(false);
    pDMLPackage->set_Logending(false);
  }
  else if (((ci.isLoaddataInfile) || ((ci.rowsHaveInserted + size) < ci.bulkInsertRows)) &&
           (ci.rowsHaveInserted == 0))
  {
    // First batch: log the statement, but not its end.
    pDMLPackage->set_Logging(true);
    pDMLPackage->set_Logending(false);
  }

  if (ci.singleInsert)
  {
    pDMLPackage->set_Logging(true);
    pDMLPackage->set_Logending(true);
  }
  else
  {
    pDMLPackage->set_isBatchInsert(true);
  }

  if (thd->is_strict_mode())
  {
    pDMLPackage->set_isWarnToError(true);
  }

  pDMLPackage->setTableOid(ci.tableOid);

  if (lastBatch)
  {
    pDMLPackage->set_Logending(true);

    // The statement itself was already logged with an earlier batch.
    if (ci.rowsHaveInserted > 0)
      pDMLPackage->set_Logging(false);
  }

  std::string name = table->s->table_name.str;
  pDMLPackage->set_TableName(name);
  name = table->s->db.str;
  pDMLPackage->set_SchemaName(name);

  const char* timeZone = thd->variables.time_zone->get_name()->ptr();
  // Initialised so a failed conversion cannot leak an indeterminate value into
  // the package.
  long timeZoneOffset = 0;
  dataconvert::timeZoneToOffset(timeZone, strlen(timeZone), &timeZoneOffset);
  pDMLPackage->set_TimeZone(timeZoneOffset);

  if (thd->lex->sql_command == SQLCOM_INSERT_SELECT)
    pDMLPackage->set_isInsertSelect(true);

  // Carry session autocommit info in the pkg to use in DMLProc
  if (!(thd->variables.option_bits & (OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN)))
  {
    pDMLPackage->set_isAutocommitOn(true);
  }
  else if (useHdfs)
  {
    pDMLPackage->set_isAutocommitOn(true);
  }

  ByteStream bytestream, bytestreamRcv;
  bytestream << sessionID;

  pDMLPackage->write(bytestream);
  delete pDMLPackage;

  // Reply layout: status byte, row count, error message.
  ByteStream::byte b = 0;
  string errormsg;
  ByteStream::octbyte rows = 0;

  try
  {
    ci.dmlProc->write(bytestream);
    bytestreamRcv = ci.dmlProc->read();

    if (bytestreamRcv.length() == 0)
    {
      // check if it is first batch and DMLProc restarted. Only this case, get a new client and resend
      if (ci.rowsHaveInserted == 0)
      {
        delete ci.dmlProc;
        ci.dmlProc = new MessageQueueClient("DMLProc");

        try
        {
          ci.dmlProc->write(bytestream);
          bytestreamRcv = ci.dmlProc->read();

          if (bytestreamRcv.length() == 0)
          {
            rc = -1;
            b = 1;
            errormsg = "Lost connection to DMLProc [3]";
          }
          else
          {
            bytestreamRcv >> b;
            bytestreamRcv >> rows;
            bytestreamRcv >> errormsg;
            rc = b;
          }
        }
        catch (runtime_error&)
        {
          rc = -1;
          thd->get_stmt_da()->set_overwrite_status(true);
          errormsg = "Lost connection to DMLProc [4]";
          b = 1;
        }
      }
    }
    else
    {
      bytestreamRcv >> b;
      bytestreamRcv >> rows;
      bytestreamRcv >> errormsg;
      rc = b;
    }
  }
  catch (std::exception& rex)
  {
    // check if it is first batch and DMLProc restarted. Only this case, get a new client and resend
    if (ci.rowsHaveInserted == 0)
    {
      delete ci.dmlProc;
      ci.dmlProc = new MessageQueueClient("DMLProc");

      try
      {
        ci.dmlProc->write(bytestream);
        bytestreamRcv = ci.dmlProc->read();

        if (bytestreamRcv.length() == 0)
        {
          rc = -1;
          b = 1;
          errormsg = string("Lost connection to DMLProc after getting a new client [1:") + rex.what() + "]";
        }
        else
        {
          bytestreamRcv >> b;
          bytestreamRcv >> rows;
          bytestreamRcv >> errormsg;
          rc = b;
        }
      }
      catch (std::exception& rrex)
      {
        rc = -1;
        thd->get_stmt_da()->set_overwrite_status(true);
        errormsg = string("Lost connection to DMLProc after getting a new client [2:") + rex.what() +
                   " then " + rrex.what() + "]";
        b = 1;
      }
    }
    else  // really lost connection
    {
      rc = -1;
      thd->get_stmt_da()->set_overwrite_status(true);
      errormsg = string("Lost connection to DMLProc really [1:") + rex.what() + "]";
      b = 1;
    }
  }
  catch (...)
  {
    rc = -1;
    thd->get_stmt_da()->set_overwrite_status(true);
    errormsg = "Unknown error caught";
    b = 1;
  }

  // Anything other than success or a range warning is a hard error.
  if ((b != 0) && (b != dmlpackageprocessor::DMLPackageProcessor::IDBRANGE_WARNING))
  {
    thd->get_stmt_da()->set_overwrite_status(true);
    thd->raise_error_printf(ER_INTERNAL_ERROR, errormsg.c_str());
  }

  if (b == dmlpackageprocessor::DMLPackageProcessor::IDBRANGE_WARNING)
  {
    // Outside strict mode a range warning does not fail the statement.
    if (!thd->is_strict_mode())
    {
      rc = 0;
    }

    push_warning(thd, Sql_condition::WARN_LEVEL_WARN, ER_WARN_DATA_OUT_OF_RANGE, errormsg.c_str());
  }

  // Remember the failure for the code that finishes the statement.
  if (rc != 0)
    ci.rc = rc;

  if (b == dmlpackageprocessor::DMLPackageProcessor::ACTIVE_TRANSACTION_ERROR)
    rc = b;

  return rc;
}
|
|
|
|
} // namespace
|
|
|
|
// Finishes a batch insert: sends whatever rows are still pending in
// ci.tableValuesMap to DMLProc and then commits or rolls back as appropriate.
//
// table - target table of the insert.
// ci    - connection info carrying the pending rows, the running row counter
//         (ci.rowsHaveInserted) and the error saved by earlier batches (ci.rc).
// abort - true when the statement is being aborted.
//
// Returns:
//   * 0 immediately when there is nothing pending and nothing was inserted;
//   * the saved ci.rc (which is then reset to 0) after rolling back, when an
//     earlier batch failed or `abort` is set;
//   * ACTIVE_TRANSACTION_ERROR as reported by the final batch, without
//     committing or rolling back;
//   * otherwise the larger of the final batch status and the commit/rollback
//     status.
int ha_mcs_impl_write_last_batch(TABLE* table, cal_connection_info& ci, bool abort)
{
  int rc = 0;
  THD* thd = current_thd;
  std::string command;
  const uint32_t size = ci.tableValuesMap[0].size();
  std::string schema(table->s->db.str);

  //@Bug 6112. if no row to be insert and no rows have been inserted, no need to send to DMLProc
  if ((size == 0) && (ci.rowsHaveInserted == 0))
    return rc;

  //@Bug 2715 Check the saved error code.
  //@Bug 4516 always send the last package to allow DMLProc receive all messages from WES
  if ((ci.rc != 0) || abort)
  {
    //@Bug 5285. abort is different from error, dmlproc only clean up when erroring out
    // The status of this call is not used directly: a failure is recorded in
    // ci.rc by doProcessInsertValues() and picked up below.
    if (abort)
      doProcessInsertValues(table, size, ci, true);

    //@Bug 2722 Log the statement into datamod log
    //@Bug 4605 if error, rollback and no need to check whether the session is autocommit off
    command = "ROLLBACK";
    ProcessCommandStatement(thd, command, ci, schema);

    // The caller gets the saved error, not the rollback status.
    rc = ci.rc;
    ci.rc = 0;

    if (size > 0)
    {
      ci.tableValuesMap.clear();
      ci.colNameList.clear();
    }

    return rc;
  }

  // From here on `abort` is known to be false and no earlier batch failed.
  rc = doProcessInsertValues(table, size, ci, true);

  if (rc == dmlpackageprocessor::DMLPackageProcessor::ACTIVE_TRANSACTION_ERROR)
    return rc;

  //@Bug 4605
  int rc1 = 0;

  if ((rc == 0) && (!(thd->variables.option_bits & (OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN))))
  {
    // Autocommit session: make the inserted rows permanent right away.
    ci.rowsHaveInserted += size;
    command = "COMMIT";
    rc1 = ProcessCommandStatement(thd, command, ci, schema);
  }
  else if (useHdfs)
  {
    ci.rowsHaveInserted += size;
    command = "COMMIT";
    rc1 = ProcessCommandStatement(thd, command, ci, schema);
  }
  else if (rc != 0)
  {
    command = "ROLLBACK";
    rc1 = ProcessCommandStatement(thd, command, ci, schema);
  }

  rc = max(rc, rc1);

  return rc;
}
|
|
|
|
int ha_mcs_impl_write_row_(const uchar* buf, TABLE* table, cal_connection_info& ci, ha_rows& rowsInserted)
|
|
{
|
|
int rc = 0;
|
|
// timer.start( "buildValueList");
|
|
ci.colNameList.clear();
|
|
THD* thd = current_thd;
|
|
uint32_t size = 0;
|
|
std::string schema;
|
|
schema = table->s->db.str;
|
|
|
|
//@Bug 2086 Added syntax check for '\0'
|
|
try
|
|
{
|
|
size = buildValueList(table, ci);
|
|
}
|
|
catch (runtime_error& rex)
|
|
{
|
|
rc = 1;
|
|
ci.rc = rc; //@Bug 2790 Save the error infomation.
|
|
thd->get_stmt_da()->set_overwrite_status(true);
|
|
thd->raise_error_printf(ER_INTERNAL_ERROR, rex.what());
|
|
return rc;
|
|
}
|
|
|
|
if (fBatchInsertGroupRows == 0)
|
|
{
|
|
fBatchInsertGroupRows = ResourceManager::instance()->getRowsPerBatch();
|
|
}
|
|
|
|
// timer.stop( "buildValueList");
|
|
if (ci.singleInsert // Single insert
|
|
|| ((ci.bulkInsertRows > 0) && (((ci.rowsHaveInserted + size) >= ci.bulkInsertRows) ||
|
|
((!ci.isCacheInsert && size >= fBatchInsertGroupRows) ||
|
|
(ci.isCacheInsert && size >= BATCH_INSERT_GROUP_ROWS_FOR_CACHE))))
|
|
// Insert with mutilple value case: processed batch by batch. Last batch is sent also.
|
|
|| ((ci.bulkInsertRows == 0) &&
|
|
((!ci.isCacheInsert && size >= fBatchInsertGroupRows) ||
|
|
(ci.isCacheInsert &&
|
|
size >= BATCH_INSERT_GROUP_ROWS_FOR_CACHE)))) // Load data in file is processed batch by batch
|
|
{
|
|
// timer.start( "DMLProc takes");
|
|
// cout <<" sending a batch to DMLProc ... The size is " << size << " the current bulkInsertRows = " <<
|
|
// ci.bulkInsertRows << endl; Build dmlpackage
|
|
if ((ci.bulkInsertRows > 0) && ((ci.rowsHaveInserted + size) >= ci.bulkInsertRows))
|
|
{
|
|
rc = doProcessInsertValues(table, size, ci, true);
|
|
}
|
|
else
|
|
{
|
|
rc = doProcessInsertValues(table, size, ci);
|
|
}
|
|
|
|
if (rc == 0)
|
|
rowsInserted = size;
|
|
else
|
|
ci.rc = rc;
|
|
|
|
//@Bug 2481. The current active transaction needs to be released if autocommit is on
|
|
//@Bug 2438 Added a check for batchinsert's last batch to send commit if autocommit is on
|
|
std::string command;
|
|
|
|
if (ci.singleInsert || ((ci.bulkInsertRows > 0) && ((ci.rowsHaveInserted + size) >= ci.bulkInsertRows)))
|
|
{
|
|
if (thd->killed > 0)
|
|
{
|
|
command = "ROLLBACK";
|
|
rc = ProcessCommandStatement(thd, command, ci, schema);
|
|
}
|
|
else if (rc != dmlpackageprocessor::DMLPackageProcessor::ACTIVE_TRANSACTION_ERROR)
|
|
{
|
|
//@Bug 4605
|
|
int rc1 = 0;
|
|
if (rc != 0)
|
|
{
|
|
command = "ROLLBACK";
|
|
rc1 = ProcessCommandStatement(thd, command, ci, schema);
|
|
}
|
|
else if ((rc == 0) && (!(thd->variables.option_bits & (OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN))))
|
|
{
|
|
command = "COMMIT";
|
|
rc1 = ProcessCommandStatement(thd, command, ci, schema);
|
|
}
|
|
else if (useHdfs)
|
|
{
|
|
command = "COMMIT";
|
|
rc1 = ProcessCommandStatement(thd, command, ci, schema);
|
|
}
|
|
rc = max(rc, rc1);
|
|
}
|
|
}
|
|
|
|
// timer.stop( "DMLProc takes");
|
|
// timer.finish();
|
|
return rc;
|
|
}
|
|
else
|
|
{
|
|
return rc;
|
|
}
|
|
}
|
|
|
|
int ha_mcs_impl_write_batch_row_(const uchar* buf, TABLE* table, cal_impl_if::cal_connection_info& ci,
|
|
long timeZone)
|
|
{
|
|
ByteStream rowData;
|
|
int rc = 0;
|
|
// std::ostringstream data;
|
|
bool nullVal = false;
|
|
const uchar* bufHdr =
|
|
buf; // bit flag indicating a field is null. Only those fields that are nullable are represented.
|
|
int32_t headerByte = 0; // Current byte in the bufHdr
|
|
int32_t headerBit = 0; // current bit in the bufHdr current byte.
|
|
uint16_t colpos = 0;
|
|
buf = buf + ci.headerLength; // Number of bytes used for null bits.
|
|
//@Bug 6122 if all columns have not null constraint, there is no information in the header
|
|
char nullBits = *bufHdr++;
|
|
|
|
if (!ci.useXbit)
|
|
{
|
|
// Skip the first bit. For some reason, mysql reserves the first bit of the first byte, unless there's a
|
|
// varchar column in the table.
|
|
nullBits = nullBits >> 1;
|
|
++headerBit;
|
|
}
|
|
|
|
while (colpos < ci.columnTypes.size()) // test bitmap for null values
|
|
{
|
|
uint8_t numLoop = 7;
|
|
|
|
if ((ci.useXbit) || (colpos > 6))
|
|
numLoop++;
|
|
|
|
for (uint8_t i = 0; i < numLoop; i++)
|
|
{
|
|
if (colpos == ci.columnTypes.size())
|
|
break;
|
|
|
|
// if a column has not null constraint, it will not be in the bit map
|
|
if (ci.columnTypes[colpos].constraintType != CalpontSystemCatalog::NOTNULL_CONSTRAINT)
|
|
{
|
|
if (ci.headerLength > 0 && headerByte >= ci.headerLength)
|
|
{
|
|
// We've used more null bits than allowed. Something is seriously wrong.
|
|
std::string errormsg = "Null bit header is wrong size";
|
|
setError(current_thd, ER_INTERNAL_ERROR, errormsg);
|
|
return -1;
|
|
}
|
|
|
|
nullVal = nullBits & 0x01;
|
|
nullBits = nullBits >> 1;
|
|
++headerBit;
|
|
|
|
if (headerBit == 8)
|
|
{
|
|
nullBits = *bufHdr++;
|
|
headerBit = 0;
|
|
++headerByte;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
nullVal = false;
|
|
}
|
|
|
|
const CalpontSystemCatalog::ColType& colType = ci.columnTypes[colpos];
|
|
const datatypes::TypeHandler* h = colType.typeHandler();
|
|
if (h) // QQ: error reporting
|
|
{
|
|
datatypes::ColBatchWriter writer(ci.filePtr, ci.delimiter, ci.enclosed_by);
|
|
Field* fieldPtr = table->field[colpos];
|
|
uint32_t mbmaxlen =
|
|
(fieldPtr->charset() && fieldPtr->charset()->mbmaxlen) ? fieldPtr->charset()->mbmaxlen : 0;
|
|
datatypes::WriteBatchFieldMariaDB field(fieldPtr, colType, mbmaxlen, timeZone);
|
|
idbassert(table == table->field[colpos]->table);
|
|
buf += h->ColWriteBatch(&field, buf, nullVal, writer);
|
|
}
|
|
colpos++;
|
|
}
|
|
}
|
|
|
|
rc = fprintf(ci.filePtr, "\n"); //@bug 6077 check whether the pipe is still open
|
|
|
|
if (rc < 0)
|
|
rc = -1;
|
|
else
|
|
rc = 0;
|
|
|
|
return rc;
|
|
}
|
|
|
|
std::string ha_mcs_impl_viewtablelock(cal_impl_if::cal_connection_info& ci,
|
|
execplan::CalpontSystemCatalog::TableName& tablename)
|
|
{
|
|
THD* thd = current_thd;
|
|
ulong sessionID = tid2sid(thd->thread_id);
|
|
CalpontDMLPackage* pDMLPackage;
|
|
std::string dmlStatement("VIEWTABLELOCK");
|
|
VendorDMLStatement cmdStmt(dmlStatement, DML_COMMAND, sessionID);
|
|
pDMLPackage = CalpontDMLFactory::makeCalpontDMLPackageFromMysqlBuffer(cmdStmt);
|
|
if (lower_case_table_names)
|
|
{
|
|
boost::algorithm::to_lower(tablename.schema);
|
|
boost::algorithm::to_lower(tablename.table);
|
|
}
|
|
pDMLPackage->set_SchemaName(tablename.schema);
|
|
pDMLPackage->set_TableName(tablename.table);
|
|
|
|
ByteStream bytestream;
|
|
bytestream << static_cast<uint32_t>(sessionID);
|
|
pDMLPackage->write(bytestream);
|
|
delete pDMLPackage;
|
|
|
|
ByteStream::byte b = 0;
|
|
ByteStream::octbyte rows;
|
|
std::string errorMsg;
|
|
std::string tableLockInfo;
|
|
// int dmlRowCount = 0;
|
|
|
|
try
|
|
{
|
|
ci.dmlProc->write(bytestream);
|
|
bytestream = ci.dmlProc->read();
|
|
|
|
if (bytestream.length() == 0)
|
|
{
|
|
thd->get_stmt_da()->set_overwrite_status(true);
|
|
thd->raise_error_printf(ER_INTERNAL_ERROR, "Lost connection to DMLProc [5]");
|
|
}
|
|
else
|
|
{
|
|
bytestream >> b;
|
|
bytestream >> rows;
|
|
bytestream >> errorMsg;
|
|
bytestream >> tableLockInfo;
|
|
}
|
|
}
|
|
catch (runtime_error&)
|
|
{
|
|
thd->get_stmt_da()->set_overwrite_status(true);
|
|
thd->raise_error_printf(ER_INTERNAL_ERROR, "Lost connection to DMLProc [6]");
|
|
}
|
|
catch (...)
|
|
{
|
|
thd->get_stmt_da()->set_overwrite_status(true);
|
|
thd->raise_error_printf(ER_INTERNAL_ERROR, "Caught unknown error");
|
|
}
|
|
|
|
if (b != 0)
|
|
tableLockInfo = errorMsg;
|
|
|
|
return tableLockInfo;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Clear the table lock associated with the specified table lock id.
|
|
// Any bulk rollback that is pending will be applied before the table
|
|
// lock is released.
|
|
//------------------------------------------------------------------------------
|
|
std::string ha_mcs_impl_cleartablelock(cal_impl_if::cal_connection_info& ci, uint64_t tableLockID)
|
|
{
|
|
execplan::CalpontSystemCatalog::TableName tblName;
|
|
THD* thd = current_thd;
|
|
ulong sessionID = tid2sid(thd->thread_id);
|
|
std::string tableLockInfo;
|
|
BRM::TableLockInfo lockInfo;
|
|
|
|
// Perform preliminary setup. CalpontDMLPackage expects schema and table
|
|
// name to be provided, so we get the table OID for the specified table
|
|
// lock, and then get the table name for the applicable table OID.
|
|
std::string prelimTask;
|
|
|
|
try
|
|
{
|
|
BRM::DBRM brm;
|
|
prelimTask = "getting table locks from BRM.";
|
|
bool getLockInfo = brm.getTableLockInfo(tableLockID, &lockInfo);
|
|
|
|
if (!getLockInfo)
|
|
{
|
|
tableLockInfo = "No table lock found for specified table lock ID";
|
|
return tableLockInfo;
|
|
}
|
|
|
|
boost::shared_ptr<execplan::CalpontSystemCatalog> csc =
|
|
execplan::CalpontSystemCatalog::makeCalpontSystemCatalog(sessionID);
|
|
csc->identity(execplan::CalpontSystemCatalog::FE);
|
|
|
|
prelimTask = "getting table name from system catalog.";
|
|
tblName = csc->tableName(lockInfo.tableOID);
|
|
}
|
|
catch (std::exception& ex)
|
|
{
|
|
std::string eMsg(ex.what());
|
|
eMsg += " Error ";
|
|
eMsg += prelimTask;
|
|
|
|
thd->get_stmt_da()->set_overwrite_status(true);
|
|
thd->raise_error_printf(ER_INTERNAL_ERROR, eMsg.c_str());
|
|
return tableLockInfo;
|
|
}
|
|
catch (...)
|
|
{
|
|
std::string eMsg(" Error ");
|
|
eMsg += prelimTask;
|
|
|
|
thd->get_stmt_da()->set_overwrite_status(true);
|
|
thd->raise_error_printf(ER_INTERNAL_ERROR, eMsg.c_str());
|
|
return tableLockInfo;
|
|
}
|
|
|
|
std::string dmlStatement("CLEARTABLELOCK");
|
|
VendorDMLStatement cmdStmt(dmlStatement, DML_COMMAND, sessionID);
|
|
CalpontDMLPackage* pDMLPackage = CalpontDMLFactory::makeCalpontDMLPackageFromMysqlBuffer(cmdStmt);
|
|
pDMLPackage->set_SchemaName(tblName.schema);
|
|
pDMLPackage->set_TableName(tblName.table);
|
|
|
|
// Table lock ID is passed in the SQL statement attribute
|
|
std::ostringstream lockIDString;
|
|
lockIDString << tableLockID;
|
|
pDMLPackage->set_SQLStatement(lockIDString.str());
|
|
|
|
ByteStream bytestream;
|
|
bytestream << static_cast<uint32_t>(sessionID);
|
|
pDMLPackage->write(bytestream);
|
|
delete pDMLPackage;
|
|
|
|
ByteStream::byte b = 0;
|
|
ByteStream::octbyte rows;
|
|
std::string errorMsg;
|
|
|
|
try
|
|
{
|
|
ci.dmlProc->write(bytestream);
|
|
bytestream = ci.dmlProc->read();
|
|
|
|
if (bytestream.length() == 0)
|
|
{
|
|
thd->get_stmt_da()->set_overwrite_status(true);
|
|
thd->raise_error_printf(ER_INTERNAL_ERROR, "Lost connection to DMLProc [7]");
|
|
}
|
|
else
|
|
{
|
|
bytestream >> b;
|
|
bytestream >> rows;
|
|
bytestream >> errorMsg;
|
|
bytestream >> tableLockInfo;
|
|
}
|
|
}
|
|
catch (runtime_error&)
|
|
{
|
|
thd->get_stmt_da()->set_overwrite_status(true);
|
|
thd->raise_error_printf(ER_INTERNAL_ERROR, "Lost connection to DMLProc [8]");
|
|
}
|
|
catch (...)
|
|
{
|
|
thd->get_stmt_da()->set_overwrite_status(true);
|
|
thd->raise_error_printf(ER_INTERNAL_ERROR, "Caught unknown error");
|
|
}
|
|
|
|
//@Bug 2606. Send error message back to sql session
|
|
if (b != 0)
|
|
tableLockInfo = errorMsg;
|
|
|
|
return tableLockInfo;
|
|
}
|
|
|
|
// Sends "COMMIT" for the session of `thd` to DMLProc.
//
// Nothing is sent (and 0 is returned) for a slave thread for which
// get_replication_slave() reports false. `hton` and `all` are not used.
//
// Returns the status of ProcessCommandStatement().
int ha_mcs_impl_commit_(handlerton* hton, THD* thd, bool all, cal_connection_info& ci)
{
  const bool skipOnSlave = thd->slave_thread && !get_replication_slave(thd);

  if (skipOnSlave)
    return 0;

#ifdef INFINIDB_DEBUG
  cout << "COMMIT" << endl;
#endif

  std::string commitCmd("COMMIT");
  return ProcessCommandStatement(thd, commitCmd, ci);
}
|
|
|
|
// Sends "ROLLBACK" for the session of `thd` to DMLProc.
//
// With HDFS enabled nothing is sent; a warning (code 1196) is pushed instead
// and 0 is returned. `hton` and `all` are not used.
//
// Returns the status of ProcessCommandStatement() otherwise.
int ha_mcs_impl_rollback_(handlerton* hton, THD* thd, bool all, cal_connection_info& ci)
{
#ifdef INFINIDB_DEBUG
  cout << "ROLLBACK" << endl;
#endif

  if (!useHdfs)
  {
    std::string rollbackCmd("ROLLBACK");
    return ProcessCommandStatement(thd, rollbackCmd, ci);
  }

  const string warning("Some non-transactional changed tables couldn't be rolled back");
  push_warning(thd, Sql_condition::WARN_LEVEL_WARN, 1196, warning.c_str());
  return 0;
}
|
|
|
|
// Tells DMLProc to clean up after the session of `thd` by sending "CLEANUP".
//
// Does nothing and returns 0 when the session has no DMLProc connection.
// `hton` is not used.
//
// Returns the status of ProcessCommandStatement() otherwise.
int ha_mcs_impl_close_connection_(handlerton* hton, THD* thd, cal_connection_info& ci)
{
  int status = 0;

#ifdef INFINIDB_DEBUG
  cout << "Close connection session ID " << thd->thread_id << endl;
#endif

  if (ci.dmlProc)
  {
    // @bug 1622. remove calpontsystemcatalog and close the socket when session quit.
    // @info when Calpont process a select query, an alter table phase is involved in
    // the vtable design, which will auto start a transaction. when autocommit on (by default), rollback is
    // automatically called when session quit. rollback can also be called by user explicitly to rollback a
    // transaction. Under either situation, system catalog cache for this session should be removed
    std::string cleanupCmd("CLEANUP");
    status = ProcessCommandStatement(thd, cleanupCmd, ci);
  }

  return status;
}
|
|
|