mirror of
https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
synced 2025-04-23 07:05:36 +03:00
3766 lines
91 KiB
C++
3766 lines
91 KiB
C++
/* Copyright (C) 2014 InfiniDB, Inc.
|
|
Copyright (C) 2019 MariaDB Corporation
|
|
|
|
This program is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU General Public License
|
|
as published by the Free Software Foundation; version 2 of
|
|
the License.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
|
|
MA 02110-1301, USA. */
|
|
|
|
/****************************************************************************
|
|
* $Id: dataconvert.cpp 3901 2013-06-17 20:59:13Z rdempsey $
|
|
*
|
|
*
|
|
****************************************************************************/
|
|
|
|
#include <string>
|
|
#include <cmath>
|
|
#include <errno.h>
|
|
#include <ctime>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <type_traits>
|
|
#include <chrono>
|
|
#include "mcs_decimal.h"
|
|
using namespace std;
|
|
#include <boost/algorithm/string/case_conv.hpp>
|
|
#include <boost/algorithm/string.hpp>
|
|
using namespace boost::algorithm;
|
|
#include <boost/tokenizer.hpp>
|
|
#include "calpontselectexecutionplan.h"
|
|
#include "columnresult.h"
|
|
|
|
#include "joblisttypes.h"
|
|
|
|
#define DATACONVERT_DLLEXPORT
|
|
#include "dataconvert.h"
|
|
#undef DATACONVERT_DLLEXPORT
|
|
|
|
using namespace logging;
|
|
|
|
namespace
|
|
{
|
|
// Parse `s` into `t` through an input string stream after applying the base
// manipulator `f` (for example std::dec or std::hex).
// Returns true when the extraction succeeded and false when the stream
// reported a failure. Characters left over after the parsed value are ignored.
template <class T>
bool from_string(T& t, const std::string& s, std::ios_base& (*f)(std::ios_base&))
{
  std::istringstream parser(s);
  parser >> f;
  parser >> t;
  return !parser.fail();
}
|
|
|
|
bool number_value(const string& data)
|
|
{
|
|
for (unsigned int i = 0; i < strlen(data.c_str()); i++)
|
|
{
|
|
if (data[i] > '9' || data[i] < '0')
|
|
{
|
|
if (data[i] != '+' && data[i] != '-' && data[i] != '.' && data[i] != ' ' && data[i] != 'E' &&
|
|
data[i] != 'e')
|
|
{
|
|
throw QueryDataExcept("value is not numerical.", formatErr);
|
|
}
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
} // namespace
|
|
|
|
namespace dataconvert
|
|
{
|
|
// LE stands for Little Endian
// Read an unsigned 32-bit integer from the four bytes starting at `ptr`.
// The bytes are copied as stored (no byte swapping is performed), so the result
// is the little-endian interpretation only on a little-endian host.
// memcpy is used instead of a pointer cast so that `ptr` does not have to be
// aligned for uint32_t and no aliasing rule is violated.
uint32_t getUInt32LE(const char* ptr)
{
  uint32_t value;
  memcpy(&value, ptr, sizeof(value));
  return value;
}
|
|
|
|
// Read a signed 32-bit integer from the four bytes starting at `ptr`.
// The bytes are copied as stored (no byte swapping is performed), so the result
// is the little-endian interpretation only on a little-endian host.
// memcpy is used instead of a pointer cast so that `ptr` does not have to be
// aligned for int32_t and no aliasing rule is violated.
int32_t getSInt32LE(const char* ptr)
{
  int32_t value;
  memcpy(&value, ptr, sizeof(value));
  return value;
}
|
|
|
|
// Read an unsigned 64-bit integer from the eight bytes starting at `ptr`.
// The bytes are copied as stored (no byte swapping is performed), so the result
// is the little-endian interpretation only on a little-endian host.
// memcpy is used instead of a pointer cast so that `ptr` does not have to be
// aligned for uint64_t and no aliasing rule is violated.
uint64_t getUInt64LE(const char* ptr)
{
  uint64_t value;
  memcpy(&value, ptr, sizeof(value));
  return value;
}
|
|
|
|
// Read a signed 64-bit integer from the eight bytes starting at `ptr`.
// The bytes are copied as stored (no byte swapping is performed), so the result
// is the little-endian interpretation only on a little-endian host.
// memcpy is used instead of a pointer cast so that `ptr` does not have to be
// aligned for int64_t and no aliasing rule is violated.
int64_t getSInt64LE(const char* ptr)
{
  int64_t value;
  memcpy(&value, ptr, sizeof(value));
  return value;
}
|
|
|
|
template <typename T>
|
|
void number_int_value(const string& data, cscDataType typeCode, const datatypes::TypeAttributesStd& ct,
|
|
bool& pushwarning, bool noRoundup, T& intVal, bool* saturate)
|
|
{
|
|
// copy of the original input
|
|
string valStr(data);
|
|
|
|
// in case, the values are in parentheses
|
|
string::size_type x = valStr.find('(');
|
|
string::size_type y = valStr.find(')');
|
|
|
|
while (x < string::npos)
|
|
{
|
|
// erase y first
|
|
if (y == string::npos)
|
|
throw QueryDataExcept("'(' is not matched.", formatErr);
|
|
|
|
valStr.erase(y, 1);
|
|
valStr.erase(x, 1);
|
|
x = valStr.find('(');
|
|
y = valStr.find(')');
|
|
}
|
|
|
|
if (y != string::npos)
|
|
throw QueryDataExcept("')' is not matched.", formatErr);
|
|
|
|
if (boost::iequals(valStr, "true"))
|
|
{
|
|
intVal = 1;
|
|
return;
|
|
}
|
|
if (boost::iequals(valStr, "false"))
|
|
{
|
|
intVal = 0;
|
|
return;
|
|
}
|
|
|
|
// convert to fixed-point notation if input is in scientific notation
|
|
if (valStr.find('E') < string::npos || valStr.find('e') < string::npos)
|
|
{
|
|
size_t epos = valStr.find('E');
|
|
|
|
if (epos == string::npos)
|
|
epos = valStr.find('e');
|
|
|
|
// get the coefficient
|
|
string coef = valStr.substr(0, epos);
|
|
// get the exponent
|
|
string exp = valStr.substr(epos + 1);
|
|
bool overflow = false;
|
|
T exponent = dataconvert::string_to_ll<T>(exp, overflow);
|
|
|
|
// if the exponent can not be held in 64 or 128 bits, not supported or saturated.
|
|
if (overflow)
|
|
throw QueryDataExcept("value is invalid.", formatErr);
|
|
|
|
// find the optional "." point
|
|
size_t dpos = coef.find('.');
|
|
|
|
if (dpos != string::npos)
|
|
{
|
|
// move "." to the end by mutiply 10 ** (# of fraction digits)
|
|
coef.erase(dpos, 1);
|
|
exponent -= coef.length() - dpos;
|
|
}
|
|
|
|
if (exponent >= 0)
|
|
{
|
|
coef.resize(coef.length() + exponent, '0');
|
|
}
|
|
else
|
|
{
|
|
size_t bpos = coef.find_first_of("0123456789");
|
|
size_t epos = coef.length();
|
|
size_t mpos = -exponent;
|
|
dpos = epos - mpos;
|
|
int64_t padding = (int64_t)mpos - (int64_t)(epos - bpos);
|
|
|
|
if (padding > 0)
|
|
{
|
|
coef.insert(bpos, padding, '0');
|
|
dpos = bpos;
|
|
}
|
|
|
|
coef.insert(dpos, ".");
|
|
}
|
|
|
|
valStr = coef;
|
|
}
|
|
|
|
// apply the scale
|
|
if (ct.scale != 0)
|
|
{
|
|
uint64_t scale = (uint64_t)(ct.scale < 0) ? (-ct.scale) : (ct.scale);
|
|
size_t dpos = valStr.find('.');
|
|
string intPart = valStr.substr(0, dpos);
|
|
string leftStr;
|
|
|
|
if (ct.scale > 0)
|
|
{
|
|
if (dpos != string::npos)
|
|
{
|
|
// decimal point exist, prepare "#scale" digits in fraction part
|
|
++dpos;
|
|
string frnStr = valStr.substr(dpos, scale);
|
|
|
|
if (frnStr.length() < scale)
|
|
frnStr.resize(scale, '0'); // padding digit 0, not null.
|
|
|
|
// effectly shift "#scale" digits to left.
|
|
intPart += frnStr;
|
|
leftStr = valStr.substr(dpos);
|
|
leftStr.erase(0, scale);
|
|
}
|
|
else
|
|
{
|
|
// no decimal point, shift "#scale" digits to left.
|
|
intPart.resize(intPart.length() + scale, '0'); // padding digit 0, not null.
|
|
}
|
|
}
|
|
else // if (ct.scale < 0) -- in ct.scale != 0 block
|
|
{
|
|
if (dpos != string::npos)
|
|
{
|
|
// decimal point exist, get the fraction part
|
|
++dpos;
|
|
leftStr = valStr.substr(dpos);
|
|
}
|
|
}
|
|
|
|
valStr = intPart;
|
|
|
|
if (leftStr.length() > 0)
|
|
valStr += "." + leftStr;
|
|
}
|
|
|
|
// now, convert to long long int
|
|
string intStr(valStr);
|
|
string frnStr = "";
|
|
size_t dp = valStr.find('.');
|
|
int roundup = 0;
|
|
|
|
if (dp != string::npos)
|
|
{
|
|
// Check if need round up
|
|
int frac1 = dataconvert::string_to_ll<int64_t>(valStr.substr(dp + 1, 1), pushwarning);
|
|
|
|
if ((!noRoundup) && frac1 >= 5)
|
|
roundup = 1;
|
|
|
|
intStr.erase(dp);
|
|
frnStr = valStr.substr(dp + 1);
|
|
|
|
if (intStr.length() == 0)
|
|
intStr = "0";
|
|
else if ((intStr.length() == 1) && ((intStr[0] == '+') || (intStr[0] == '-')))
|
|
{
|
|
intStr.insert(1, 1, '0');
|
|
}
|
|
}
|
|
|
|
intVal = dataconvert::string_to_ll<T>(intStr, pushwarning);
|
|
//@Bug 3350 negative value round up.
|
|
intVal += intVal >= 0 ? roundup : -roundup;
|
|
bool dummy = false;
|
|
T frnVal = (frnStr.length() > 0) ? dataconvert::string_to_ll<T>(frnStr, dummy) : 0;
|
|
|
|
if (frnVal != 0)
|
|
pushwarning = true;
|
|
|
|
switch (typeCode)
|
|
{
|
|
case datatypes::SystemCatalog::TINYINT:
|
|
if (intVal < MIN_TINYINT)
|
|
{
|
|
intVal = MIN_TINYINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
else if (intVal > MAX_TINYINT)
|
|
{
|
|
intVal = MAX_TINYINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
|
|
break;
|
|
|
|
case datatypes::SystemCatalog::SMALLINT:
|
|
if (intVal < MIN_SMALLINT)
|
|
{
|
|
intVal = MIN_SMALLINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
else if (intVal > MAX_SMALLINT)
|
|
{
|
|
intVal = MAX_SMALLINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
|
|
break;
|
|
|
|
case datatypes::SystemCatalog::MEDINT:
|
|
if (intVal < MIN_MEDINT)
|
|
{
|
|
intVal = MIN_MEDINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
else if (intVal > MAX_MEDINT)
|
|
{
|
|
intVal = MAX_MEDINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
|
|
break;
|
|
|
|
case datatypes::SystemCatalog::INT:
|
|
if (intVal < MIN_INT)
|
|
{
|
|
intVal = MIN_INT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
else if (intVal > MAX_INT)
|
|
{
|
|
intVal = MAX_INT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
|
|
break;
|
|
|
|
case datatypes::SystemCatalog::BIGINT:
|
|
if (intVal < MIN_BIGINT)
|
|
{
|
|
intVal = MIN_BIGINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
|
|
break;
|
|
|
|
case datatypes::SystemCatalog::DECIMAL:
|
|
case datatypes::SystemCatalog::UDECIMAL:
|
|
if (LIKELY(ct.colWidth == 16))
|
|
{
|
|
int128_t tmp;
|
|
utils::int128Min(tmp);
|
|
if (intVal < tmp + 2) // + 2 for NULL and EMPTY values
|
|
{
|
|
intVal = tmp + 2;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
}
|
|
else if (ct.colWidth == 8)
|
|
{
|
|
if (intVal < MIN_BIGINT)
|
|
{
|
|
intVal = MIN_BIGINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
}
|
|
else if (ct.colWidth == 4)
|
|
{
|
|
if (intVal < MIN_INT)
|
|
{
|
|
intVal = MIN_INT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
else if (intVal > MAX_INT)
|
|
{
|
|
intVal = MAX_INT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
}
|
|
else if (ct.colWidth == 2)
|
|
{
|
|
if (intVal < MIN_SMALLINT)
|
|
{
|
|
intVal = MIN_SMALLINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
else if (intVal > MAX_SMALLINT)
|
|
{
|
|
intVal = MAX_SMALLINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
}
|
|
else if (ct.colWidth == 1)
|
|
{
|
|
if (intVal < MIN_TINYINT)
|
|
{
|
|
intVal = MIN_TINYINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
else if (intVal > MAX_TINYINT)
|
|
{
|
|
intVal = MAX_TINYINT;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
}
|
|
|
|
break;
|
|
|
|
default: break;
|
|
}
|
|
|
|
// @ bug 3285 make sure the value is in precision range for decimal data type
|
|
if ((typeCode == datatypes::SystemCatalog::DECIMAL) || (typeCode == datatypes::SystemCatalog::UDECIMAL) ||
|
|
(ct.scale > 0))
|
|
{
|
|
auto precision =
|
|
ct.precision == rowgroup::MagicPrecisionForCountAgg ? datatypes::INT128MAXPRECISION : ct.precision;
|
|
if (precision > datatypes::INT128MAXPRECISION || precision < 0)
|
|
{
|
|
throw QueryDataExcept("Unsupported precision " + std::to_string(precision) + " converting DECIMAL ",
|
|
dataTypeErr);
|
|
}
|
|
|
|
T rangeUp = dataconvert::decimalRangeUp<T>(precision);
|
|
T rangeLow = -rangeUp;
|
|
|
|
if (intVal > rangeUp)
|
|
{
|
|
intVal = rangeUp;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
else if (intVal < rangeLow)
|
|
{
|
|
intVal = rangeLow;
|
|
pushwarning = true;
|
|
|
|
if (saturate)
|
|
*saturate = true;
|
|
}
|
|
}
|
|
}
|
|
|
|
// Explicit template instantiation
|
|
template void number_int_value<int64_t>(const std::string& data, cscDataType typeCode,
|
|
const datatypes::TypeAttributesStd& ct, bool& pushwarning,
|
|
bool noRoundup, int64_t& intVal, bool* saturate);
|
|
|
|
template void number_int_value<int128_t>(const std::string& data, cscDataType typeCode,
|
|
const datatypes::TypeAttributesStd& ct, bool& pushwarning,
|
|
bool noRoundup, int128_t& intVal, bool* saturate);
|
|
|
|
/**
 * Convert the textual number in `data` into an unsigned 64-bit integer.
 *
 * Matched parentheses are removed (an unmatched one throws), scientific
 * notation is expanded to fixed-point text, the fraction is dropped (a non-zero
 * fraction sets `pushwarning`; no rounding is done) and the result is capped at
 * the maximum of the unsigned type named by `typeCode`.
 *
 * `ct` and `noRoundup` are not read by this function.
 *
 * @return the converted, possibly capped, value
 * @throws QueryDataExcept (formatErr) for unmatched parentheses or an exponent
 *         that does not fit in 64 bits
 */
uint64_t number_uint_value(const string& data, cscDataType typeCode, const datatypes::TypeAttributesStd& ct,
                           bool& pushwarning, bool noRoundup)
{
  // private, editable copy of the input
  string text(data);

  // remove parentheses one pair at a time
  string::size_type openPos = text.find('(');
  string::size_type closePos = text.find(')');

  for (; openPos != string::npos; openPos = text.find('('), closePos = text.find(')'))
  {
    if (closePos == string::npos)
      throw QueryDataExcept("'(' is not matched.", formatErr);

    // the closing one goes first
    text.erase(closePos, 1);
    text.erase(openPos, 1);
  }

  if (closePos != string::npos)
    throw QueryDataExcept("')' is not matched.", formatErr);

  // expand scientific notation; an upper-case 'E' wins over a lower-case 'e'
  size_t expMark = text.find('E');

  if (expMark == string::npos)
    expMark = text.find('e');

  if (expMark != string::npos)
  {
    string mantissa = text.substr(0, expMark);
    const string expText = text.substr(expMark + 1);

    bool expOverflow = false;
    int64_t exponent = dataconvert::string_to_ll<int64_t>(expText, expOverflow);

    // an exponent that does not fit in 64 bits is rejected
    if (expOverflow)
      throw QueryDataExcept("value is invalid.", formatErr);

    // drop the optional '.' and compensate through the exponent
    size_t pointPos = mantissa.find('.');

    if (pointPos != string::npos)
    {
      mantissa.erase(pointPos, 1);
      exponent -= mantissa.length() - pointPos;
    }

    if (exponent < 0)
    {
      // the point lands inside (or in front of) the digits
      const size_t firstDigit = mantissa.find_first_of("0123456789");
      const size_t mantissaLen = mantissa.length();
      const size_t shift = static_cast<size_t>(-exponent);
      const int64_t zerosNeeded =
          static_cast<int64_t>(shift) - static_cast<int64_t>(mantissaLen - firstDigit);

      pointPos = mantissaLen - shift;

      if (zerosNeeded > 0)
      {
        mantissa.insert(firstDigit, zerosNeeded, '0');
        pointPos = firstDigit;
      }

      mantissa.insert(pointPos, ".");
    }
    else
    {
      // pad with trailing zeros
      mantissa.append(static_cast<size_t>(exponent), '0');
    }

    text = mantissa;
  }

  // split into integer and fraction text
  string wholePart(text);
  string fractionPart;
  const size_t dot = text.find('.');

  if (dot != string::npos)
  {
    wholePart.erase(dot);
    fractionPart = text.substr(dot + 1);

    if (wholePart.empty())
    {
      wholePart = "0";
    }
    else if (wholePart.length() == 1 && (wholePart[0] == '+' || wholePart[0] == '-'))
    {
      // a lone sign gets a zero digit
      wholePart += '0';
    }
  }

  uint64_t uintVal = dataconvert::string_to_ull(wholePart, pushwarning);

  // a non-zero fraction is dropped with a warning
  bool ignored = false;

  if (!fractionPart.empty() && dataconvert::string_to_ull(fractionPart, ignored) != 0)
    pushwarning = true;

  // cap the value at `limit`, flagging the adjustment
  const auto capAt = [&uintVal, &pushwarning](uint64_t limit)
  {
    if (uintVal > limit)
    {
      uintVal = limit;
      pushwarning = true;
    }
  };

  switch (typeCode)
  {
    case datatypes::SystemCatalog::UTINYINT: capAt(MAX_UTINYINT); break;

    case datatypes::SystemCatalog::USMALLINT: capAt(MAX_USMALLINT); break;

    case datatypes::SystemCatalog::UMEDINT: capAt(MAX_UMEDINT); break;

    case datatypes::SystemCatalog::UINT: capAt(MAX_UINT); break;

    case datatypes::SystemCatalog::UBIGINT: capAt(MAX_UBIGINT); break;

    default: break;
  }

  return uintVal;
}
|
|
|
|
/**
 * This function reads a decimal value from a string. It will stop processing
 * in 3 cases:
 *   1) end of input string (null-terminated)
 *   2) non-digit hit
 *   3) max characters read (if max != 0 then at most max characters read)
 *
 * It's up to the caller to figure out whether an error occurred based on
 * their definition of an error and how many characters were read
 *
 * @param str    in/out cursor; left pointing at the first character not consumed
 * @param value  receives the parsed number (0 when no digit was read). A digit
 *               run too large for int32_t yields INT32_MAX instead of
 *               overflowing; the digits are still consumed and counted.
 * @param max    maximum number of characters to read, 0 for no limit
 * @return number of digit characters consumed
 */
uint32_t readDecimal(const char*& str, int32_t& value, uint32_t max = 0)
{
  value = 0;
  uint32_t numread = 0;

  // isdigit() requires a value representable as unsigned char
  while ((!max || numread < max) && *str && isdigit(static_cast<unsigned char>(*str)))
  {
    const int32_t digit = (*str) - '0';

    // value * 10 + digit would exceed INT32_MAX: saturate rather than overflow
    if (value > (INT32_MAX - digit) / 10)
      value = INT32_MAX;
    else
      value = value * 10 + digit;

    ++numread;
    ++str;
  }

  return numread;
}
|
|
|
|
bool mysql_str_to_datetime(const string& input, DateTime& output, bool& isDate)
|
|
{
|
|
/**
|
|
* First we are going to identify the stop/start of the date portion.
|
|
* The rules are:
|
|
* - Date portion must come before anything else
|
|
* - Date portion may only contain numbers and '-'
|
|
* - Date portion ends with ' ', 'T', or '\0'
|
|
* - Date portion always starts with Year
|
|
* - Without date separators ('-'):
|
|
* YYMMDD
|
|
* YYYYMMDD
|
|
* - With date separators there are no specific field length
|
|
* requirements
|
|
*/
|
|
int32_t datesepct = 0;
|
|
uint32_t dtend = 0;
|
|
|
|
for (; dtend < input.length(); ++dtend)
|
|
{
|
|
char c = input[dtend];
|
|
|
|
if (isdigit(c))
|
|
{
|
|
continue;
|
|
}
|
|
// else if( dtend != 0 && c == '-' )
|
|
else if (dtend != 0 && ispunct(c))
|
|
{
|
|
++datesepct;
|
|
}
|
|
else if (c == 'T' || c == ' ')
|
|
{
|
|
break;
|
|
}
|
|
else
|
|
{
|
|
// some other character showed up
|
|
output.reset();
|
|
return false;
|
|
}
|
|
}
|
|
|
|
int32_t year = -1;
|
|
int32_t mon = -1;
|
|
int32_t day = -1;
|
|
const char* ptr = input.c_str();
|
|
|
|
if (datesepct == 0)
|
|
{
|
|
if (dtend == 6 || dtend == 12)
|
|
{
|
|
readDecimal(ptr, year, 2);
|
|
readDecimal(ptr, mon, 2);
|
|
readDecimal(ptr, day, 2);
|
|
year += 2000;
|
|
|
|
if (year > 2069)
|
|
year -= 100;
|
|
|
|
if (dtend == 12)
|
|
dtend -= 6;
|
|
}
|
|
else if (dtend == 8 || dtend == 14)
|
|
{
|
|
readDecimal(ptr, year, 4);
|
|
readDecimal(ptr, mon, 2);
|
|
readDecimal(ptr, day, 2);
|
|
|
|
if (dtend == 14)
|
|
dtend -= 6;
|
|
}
|
|
else
|
|
{
|
|
output.reset();
|
|
return false;
|
|
}
|
|
}
|
|
else if (datesepct == 2)
|
|
{
|
|
uint32_t numread = readDecimal(ptr, year);
|
|
|
|
if (numread == 2)
|
|
{
|
|
// special handling if we read a 2-byte year
|
|
year += 2000;
|
|
|
|
if (year > 2069)
|
|
year -= 100;
|
|
}
|
|
|
|
++ptr; // skip one separator
|
|
readDecimal(ptr, mon);
|
|
++ptr; // skip one separator
|
|
readDecimal(ptr, day); // skip two separators
|
|
}
|
|
else
|
|
{
|
|
output.reset();
|
|
return false;
|
|
}
|
|
|
|
if (!isDateValid(day, mon, year))
|
|
{
|
|
output.reset();
|
|
return false;
|
|
}
|
|
|
|
output.year = year;
|
|
output.month = mon;
|
|
output.day = day;
|
|
|
|
/**
|
|
* Now we need to deal with the time portion.
|
|
* The rules are:
|
|
* - Time portion may be empty
|
|
* - Time portion may start with 'T'
|
|
* - Time portion always ends with '\0'
|
|
* - Time portion always starts with hour
|
|
* - Without time separators (':'):
|
|
* HHMMSS
|
|
* - All Times can end with option .[microseconds]
|
|
* - With time separators there are no specific field length
|
|
* requirements
|
|
*/
|
|
while (input[dtend] == ' ' && dtend < input.length())
|
|
{
|
|
++dtend;
|
|
}
|
|
|
|
if (dtend == input.length())
|
|
{
|
|
isDate = true;
|
|
return true;
|
|
}
|
|
|
|
uint32_t timesep_ct = 0;
|
|
bool has_usec = false;
|
|
uint32_t len_before_msec = 0;
|
|
uint32_t tmstart = (input[dtend] == ' ' || input[dtend] == 'T') ? dtend + 1 : dtend;
|
|
uint32_t tmend = tmstart;
|
|
|
|
for (; tmend < input.length(); ++tmend)
|
|
{
|
|
char c = input[tmend];
|
|
|
|
if (isdigit(c))
|
|
{
|
|
// digits always ok
|
|
continue;
|
|
}
|
|
// else if( c == ':' )
|
|
// {
|
|
// timesep_ct++;
|
|
// }
|
|
// else if( c == '.' )
|
|
// {
|
|
// len_before_msec = ( tmend - tmstart );
|
|
// has_usec = true;
|
|
// }
|
|
else if (ispunct(c))
|
|
{
|
|
if (c == '.' && timesep_ct == 2)
|
|
{
|
|
len_before_msec = (tmend - tmstart);
|
|
has_usec = true;
|
|
}
|
|
else
|
|
{
|
|
timesep_ct++;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// some other character showed up
|
|
output.reset();
|
|
return false;
|
|
}
|
|
}
|
|
|
|
if (!len_before_msec)
|
|
len_before_msec = (tmend - tmstart);
|
|
|
|
int32_t hour = -1;
|
|
int32_t min = 0;
|
|
int32_t sec = 0;
|
|
int32_t usec = 0;
|
|
const char* tstart = input.c_str() + tmstart;
|
|
|
|
if (timesep_ct == 2)
|
|
{
|
|
readDecimal(tstart, hour);
|
|
++tstart; // skip one separator
|
|
readDecimal(tstart, min);
|
|
++tstart; // skip one separator
|
|
readDecimal(tstart, sec);
|
|
}
|
|
else if (timesep_ct == 1)
|
|
{
|
|
readDecimal(tstart, hour);
|
|
++tstart; // skip one separator
|
|
readDecimal(tstart, min);
|
|
}
|
|
else if (timesep_ct == 0 && len_before_msec == 6)
|
|
{
|
|
readDecimal(tstart, hour, 2);
|
|
readDecimal(tstart, min, 2);
|
|
readDecimal(tstart, sec, 2);
|
|
}
|
|
else if (timesep_ct == 0 && len_before_msec == 4)
|
|
{
|
|
readDecimal(tstart, hour, 2);
|
|
readDecimal(tstart, min, 2);
|
|
}
|
|
else if (timesep_ct == 0 && len_before_msec == 2)
|
|
{
|
|
readDecimal(tstart, hour, 2);
|
|
}
|
|
else
|
|
{
|
|
output.reset();
|
|
return false;
|
|
}
|
|
|
|
if (has_usec)
|
|
{
|
|
++tstart; // skip '.' character. We could error check if we wanted to
|
|
uint32_t numread = readDecimal(tstart, usec);
|
|
|
|
if (numread > 6 || numread < 1)
|
|
{
|
|
// don't allow more than 6 digits when specifying microseconds
|
|
output.reset();
|
|
return false;
|
|
}
|
|
|
|
// usec have to be scaled up so that it always represents microseconds
|
|
for (int i = numread; i < 6; i++)
|
|
usec *= 10;
|
|
}
|
|
|
|
if (!isDateTimeValid(hour, min, sec, usec))
|
|
{
|
|
output.reset();
|
|
return false;
|
|
}
|
|
|
|
output.hour = hour;
|
|
output.minute = min;
|
|
output.second = sec;
|
|
output.msecond = usec;
|
|
isDate = false;
|
|
return true;
|
|
}
|
|
|
|
bool mysql_str_to_time(const string& input, Time& output, long decimals)
|
|
{
|
|
uint32_t dtend = 0;
|
|
bool isNeg = false;
|
|
|
|
/**
|
|
* We need to deal with the time portion.
|
|
* The rules are:
|
|
* - Time portion always ends with '\0'
|
|
* - Time portion always starts with hour
|
|
* - Without time separators (':'):
|
|
* HHMMSS
|
|
* - All Times can end with option .[microseconds]
|
|
* - With time separators there are no specific field length
|
|
* requirements
|
|
*/
|
|
while (input[dtend] == ' ' && dtend < input.length())
|
|
{
|
|
++dtend;
|
|
}
|
|
|
|
if (dtend == input.length())
|
|
{
|
|
return false;
|
|
}
|
|
|
|
uint32_t timesep_ct = 0;
|
|
bool has_usec = false;
|
|
uint32_t len_before_msec = 0;
|
|
uint32_t tmstart = dtend;
|
|
uint32_t tmend = tmstart;
|
|
|
|
for (; tmend < input.length(); ++tmend)
|
|
{
|
|
char c = input[tmend];
|
|
|
|
if (isdigit(c))
|
|
{
|
|
// digits always ok
|
|
continue;
|
|
}
|
|
// else if( c == ':' )
|
|
// {
|
|
// timesep_ct++;
|
|
// }
|
|
// else if( c == '.' )
|
|
// {
|
|
// len_before_msec = ( tmend - tmstart );
|
|
// has_usec = true;
|
|
// }
|
|
else if (ispunct(c))
|
|
{
|
|
if (c == '.' && timesep_ct == 2)
|
|
{
|
|
len_before_msec = (tmend - tmstart);
|
|
has_usec = true;
|
|
}
|
|
else if (c == '-' && (tmend == tmstart))
|
|
{
|
|
isNeg = true;
|
|
++tmstart;
|
|
}
|
|
else
|
|
{
|
|
timesep_ct++;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// some other character showed up
|
|
output.reset();
|
|
return false;
|
|
}
|
|
}
|
|
|
|
if (!len_before_msec)
|
|
len_before_msec = (tmend - tmstart);
|
|
|
|
int32_t hour = -1;
|
|
int32_t min = 0;
|
|
int32_t sec = 0;
|
|
int32_t usec = 0;
|
|
const char* tstart = input.c_str() + tmstart;
|
|
|
|
if (timesep_ct == 2)
|
|
{
|
|
readDecimal(tstart, hour);
|
|
++tstart; // skip one separator
|
|
readDecimal(tstart, min);
|
|
++tstart; // skip one separator
|
|
readDecimal(tstart, sec);
|
|
}
|
|
else if (timesep_ct == 1)
|
|
{
|
|
readDecimal(tstart, hour);
|
|
++tstart; // skip one separator
|
|
readDecimal(tstart, min);
|
|
}
|
|
else if (timesep_ct == 0 && len_before_msec == 6)
|
|
{
|
|
readDecimal(tstart, hour, 2);
|
|
readDecimal(tstart, min, 2);
|
|
readDecimal(tstart, sec, 2);
|
|
}
|
|
else if (timesep_ct == 0 && len_before_msec == 4)
|
|
{
|
|
readDecimal(tstart, hour, 2);
|
|
readDecimal(tstart, min, 2);
|
|
}
|
|
else if (timesep_ct == 0 && len_before_msec == 2)
|
|
{
|
|
readDecimal(tstart, hour, 2);
|
|
}
|
|
else
|
|
{
|
|
output.reset();
|
|
return false;
|
|
}
|
|
|
|
if (has_usec)
|
|
{
|
|
++tstart; // skip '.' character. We could error check if we wanted to
|
|
uint32_t numread = readDecimal(tstart, usec);
|
|
|
|
if (numread > 6 || numread < 1)
|
|
{
|
|
// don't allow more than 6 digits when specifying microseconds
|
|
output.reset();
|
|
return false;
|
|
}
|
|
|
|
// usec have to be scaled up so that it always represents microseconds
|
|
for (int i = numread; i < 6; i++)
|
|
usec *= 10;
|
|
}
|
|
|
|
if (!isTimeValid(hour, min, sec, usec))
|
|
{
|
|
// Emulate MariaDB's time saturation
|
|
// TODO: msec saturation
|
|
if ((hour > 838) && !isNeg)
|
|
{
|
|
output.hour = 838;
|
|
output.minute = 59;
|
|
output.second = 59;
|
|
output.msecond = exp10(decimals) - 1;
|
|
output.is_neg = 0;
|
|
}
|
|
else if ((hour < -838) || ((hour > 838) && isNeg))
|
|
{
|
|
output.hour = -838;
|
|
output.minute = 59;
|
|
output.second = 59;
|
|
output.msecond = exp10(decimals) - 1;
|
|
output.is_neg = -1;
|
|
}
|
|
// If neither of the above match then we return a 0 time
|
|
else
|
|
{
|
|
output.reset();
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
output.hour = isNeg ? 0 - hour : hour;
|
|
output.minute = min;
|
|
output.second = sec;
|
|
output.msecond = usec;
|
|
output.is_neg = isNeg;
|
|
return true;
|
|
}
|
|
|
|
bool stringToDateStruct(const string& data, Date& date)
|
|
{
|
|
bool isDate;
|
|
DateTime dt;
|
|
|
|
if (!mysql_str_to_datetime(data, dt, isDate))
|
|
return false;
|
|
|
|
date.year = dt.year;
|
|
date.month = dt.month;
|
|
date.day = dt.day;
|
|
return true;
|
|
}
|
|
|
|
bool stringToDatetimeStruct(const string& data, DateTime& dtime, bool* date)
|
|
{
|
|
bool isDate;
|
|
|
|
if (!mysql_str_to_datetime(data, dtime, isDate))
|
|
return false;
|
|
|
|
if (isDate)
|
|
{
|
|
if (date)
|
|
*date = true;
|
|
|
|
dtime.hour = 0;
|
|
dtime.minute = 0;
|
|
dtime.second = 0;
|
|
dtime.msecond = 0;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
bool stringToTimeStruct(const string& data, Time& dtime, long decimals)
|
|
{
|
|
if (!mysql_str_to_time(data, dtime, decimals))
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
bool stringToTimestampStruct(const string& data, TimeStamp& timeStamp, long timeZone)
|
|
{
|
|
// special handling for 0000-00-00 00:00:00
|
|
// "0" is sent by the server when checking for default value
|
|
// in the DDL. This is equivalent of 0000-00-00 00:00:00
|
|
if (data.substr(0, 19) == "0000-00-00 00:00:00" || data == "0")
|
|
{
|
|
timeStamp.second = 0;
|
|
timeStamp.msecond = 0;
|
|
return true;
|
|
}
|
|
|
|
// for alter table add column <columnname> timestamp,
|
|
// if the table is non-empty, then columnstore will apply
|
|
// default value to populate the new column
|
|
if (data == "current_timestamp() ON UPDATE current_timestamp()")
|
|
{
|
|
struct timeval tv;
|
|
gettimeofday(&tv, 0);
|
|
timeStamp.second = tv.tv_sec;
|
|
timeStamp.msecond = tv.tv_usec;
|
|
return true;
|
|
}
|
|
|
|
bool isDate;
|
|
|
|
DateTime dtime;
|
|
|
|
if (!mysql_str_to_datetime(data, dtime, isDate))
|
|
{
|
|
timeStamp.reset();
|
|
return false;
|
|
}
|
|
|
|
if (isDate)
|
|
{
|
|
dtime.hour = 0;
|
|
dtime.minute = 0;
|
|
dtime.second = 0;
|
|
dtime.msecond = 0;
|
|
}
|
|
|
|
MySQLTime m_time;
|
|
m_time.year = dtime.year;
|
|
m_time.month = dtime.month;
|
|
m_time.day = dtime.day;
|
|
m_time.hour = dtime.hour;
|
|
m_time.minute = dtime.minute;
|
|
m_time.second = dtime.second;
|
|
m_time.second_part = dtime.msecond;
|
|
|
|
bool isValid = true;
|
|
int64_t seconds = mySQLTimeToGmtSec(m_time, timeZone, isValid);
|
|
|
|
if (!isValid)
|
|
{
|
|
timeStamp.reset();
|
|
return false;
|
|
}
|
|
|
|
timeStamp.second = seconds;
|
|
timeStamp.msecond = m_time.second_part;
|
|
|
|
return true;
|
|
}
|
|
|
|
// Convert the text `dataOrig` into a BIT value.
//
// The first '(' and the first ')' are replaced by spaces, then the text is run
// through number_int_value(). When that yields a non-zero number, the text is
// parsed as a bool and returned inside a boost::any; a text that cannot be
// extracted as a bool throws QueryDataExcept (formatErr).
// When the number is zero an empty boost::any is returned.
// NOTE(review): returning an empty any (rather than `false`) for zero looks
// unintentional - confirm against the callers before changing it.
boost::any DataConvert::StringToBit(const datatypes::TypeAttributesStd& colType,
                                    const datatypes::ConvertFromStringParam& prm, const std::string& dataOrig,
                                    bool& pushWarning)
{
  std::string data(dataOrig);

  // find() returns size_type; keeping it in a narrower unsigned int would
  // truncate npos, so compare against npos in the full-width type
  std::string::size_type pos = data.find('(');

  if (pos != std::string::npos)
  {
    data[pos] = ' ';
  }

  pos = data.find(')');

  if (pos != std::string::npos)
  {
    data[pos] = ' ';
  }

  int64_t tmp = 0;

  number_int_value(data, datatypes::SystemCatalog::BIT, colType, pushWarning, prm.noRoundup(), tmp);

  if (tmp)
  {
    bool bitvalue;

    if (from_string<bool>(bitvalue, data, std::dec))
    {
      boost::any value = bitvalue;
      return value;
    }
    else
    {
      throw QueryDataExcept("range, valid value or conversion error on BIT type.", formatErr);
    }
  }
  return boost::any();
}
|
|
|
|
// Convert `data` into a signed DECIMAL value stored as a scaled integer.
// The integer type placed in the returned boost::any depends on the column
// width: 16 -> int128_t, 8 -> long long, 4 -> int, 2 -> short, 1 -> char.
// Any other width returns an empty boost::any without parsing `data`.
boost::any DataConvert::StringToSDecimal(const datatypes::TypeAttributesStd& colType,
                                         const datatypes::ConvertFromStringParam& prm,
                                         const std::string& data, bool& pushWarning)
{
  const cscDataType kind = datatypes::SystemCatalog::DECIMAL;

  switch (colType.colWidth)
  {
    case 16:
    {
      int128_t wide;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), wide);
      return boost::any(static_cast<int128_t>(wide));
    }

    case 8:
    {
      int64_t parsed;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), parsed);
      return boost::any(static_cast<long long>(parsed));
    }

    case 4:
    {
      int64_t parsed;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), parsed);
      return boost::any(static_cast<int>(parsed));
    }

    case 2:
    {
      int64_t parsed;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), parsed);
      return boost::any(static_cast<short>(parsed));
    }

    case 1:
    {
      int64_t parsed;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), parsed);
      return boost::any(static_cast<char>(parsed));
    }

    default: break;
  }

  // unsupported column width
  return boost::any();
}
|
|
|
|
// Convert `data` into an unsigned DECIMAL value stored as a scaled integer.
// UDECIMAL numbers may not be negative: a negative result that is not one of
// the NULL / EMPTY marker values for the width is replaced by 0 and
// `pushWarning` is set.
// The integer type placed in the returned boost::any depends on the column
// width: 16 -> int128_t, 8 -> long long, 4 -> int, 2 -> short, 1 -> signed char.
// Any other width returns an empty boost::any without parsing `data`.
boost::any DataConvert::StringToUDecimal(const datatypes::TypeAttributesStd& colType,
                                         const datatypes::ConvertFromStringParam& prm,
                                         const std::string& data, bool& pushWarning)
{
  const cscDataType kind = datatypes::SystemCatalog::UDECIMAL;

  switch (colType.colWidth)
  {
    case 16:
    {
      int128_t wide;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), wide);

      if (wide < 0 && !(datatypes::Decimal::isWideDecimalNullValue(wide) ||
                        datatypes::Decimal::isWideDecimalEmptyValue(wide)))
      {
        wide = 0;
        pushWarning = true;
      }

      return boost::any(wide);
    }

    case 8:
    {
      int64_t parsed;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), parsed);
      long long stored = static_cast<long long>(parsed);

      if (stored < 0 && !(stored == static_cast<long long>(joblist::BIGINTEMPTYROW) ||
                          stored == static_cast<long long>(joblist::BIGINTNULL)))
      {
        stored = 0;
        pushWarning = true;
      }

      return boost::any(stored);
    }

    case 4:
    {
      int64_t parsed;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), parsed);
      int stored = static_cast<int>(parsed);

      if (stored < 0 && !(stored == static_cast<int>(joblist::INTEMPTYROW) ||
                          stored == static_cast<int>(joblist::INTNULL)))
      {
        stored = 0;
        pushWarning = true;
      }

      return boost::any(stored);
    }

    case 2:
    {
      int64_t parsed;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), parsed);
      short stored = static_cast<short>(parsed);

      if (stored < 0 && !(stored == static_cast<int16_t>(joblist::SMALLINTEMPTYROW) ||
                          stored == static_cast<int16_t>(joblist::SMALLINTNULL)))
      {
        stored = 0;
        pushWarning = true;
      }

      return boost::any(stored);
    }

    case 1:
    {
      int64_t parsed;
      number_int_value(data, kind, colType, pushWarning, prm.noRoundup(), parsed);
      signed char stored = static_cast<signed char>(parsed);

      if (stored < 0 && !(stored == static_cast<int8_t>(joblist::TINYINTEMPTYROW) ||
                          stored == static_cast<int8_t>(joblist::TINYINTNULL)))
      {
        stored = 0;
        pushWarning = true;
      }

      return boost::any(stored);
    }

    default: break;
  }

  // unsupported column width
  return boost::any();
}
|
|
|
|
// Convert a textual number into a FLOAT / UFLOAT column value.
//
// The first '(' and the first ')' are removed, the text is checked with
// number_value() and then parsed with strtof().  When strtof() reports ERANGE
// the result is saturated to MAX_FLOAT / MIN_FLOAT (overflow) or 0 (underflow)
// and pushWarning is set.  For UFLOAT a negative result is replaced by 0 and
// pushWarning is set.
//
// Returns a boost::any holding a float.
// Throws QueryDataExcept(formatErr) when number_value() rejects the text.
boost::any DataConvert::StringToFloat(cscDataType typeCode, const std::string& dataOrig, bool& pushWarning)
{
  std::string data(dataOrig);

  string::size_type x = data.find('(');

  if (x < string::npos)
    data.erase(x, 1);

  x = data.find(')');

  if (x < string::npos)
    data.erase(x, 1);

  if (!number_value(data))
    throw QueryDataExcept("range, valid value or conversion error on FLOAT type.", formatErr);

  errno = 0;
  float floatvalue = strtof(data.c_str(), 0);

  if (errno == ERANGE)
  {
    pushWarning = true;

    if (abs(floatvalue) == HUGE_VALF)
    {
      if (floatvalue > 0)
        floatvalue = MAX_FLOAT;
      else
        floatvalue = MIN_FLOAT;
    }
    else
      floatvalue = 0;
  }

  if (floatvalue < 0.0 && typeCode == datatypes::SystemCatalog::UFLOAT &&
      floatvalue != static_cast<float>(joblist::FLOATEMPTYROW) &&
      floatvalue != static_cast<float>(joblist::FLOATNULL))
  {
    // Clamp the parsed number itself.  Previously a double 0.0 was stored in the
    // result and immediately overwritten by the negative input, so the warning
    // was raised but the negative value was still returned.
    floatvalue = 0;
    pushWarning = true;
  }

  boost::any value = floatvalue;
  return value;
}
|
|
|
|
// Convert a textual number into a DOUBLE / UDOUBLE column value.
//
// The first '(' and the first ')' are removed, the text is checked with
// number_value() and then parsed with strtod().  When strtod() reports ERANGE
// the result is saturated to MAX_DOUBLE / MIN_DOUBLE (overflow) or 0
// (underflow) and pushWarning is set.  For UDOUBLE a negative result is
// replaced by 0 and pushWarning is set.
//
// Returns a boost::any that always holds a double.
// Throws QueryDataExcept(formatErr) when number_value() rejects the text.
boost::any DataConvert::StringToDouble(cscDataType typeCode, const std::string& dataOrig, bool& pushWarning)
{
  std::string data(dataOrig);

  string::size_type x = data.find('(');

  if (x < string::npos)
    data.erase(x, 1);

  x = data.find(')');

  if (x < string::npos)
    data.erase(x, 1);

  if (!number_value(data))
  {
    throw QueryDataExcept("range, valid value or conversion error on DOUBLE type.", formatErr);
  }

  errno = 0;
  double doublevalue = strtod(data.c_str(), 0);

  if (errno == ERANGE)
  {
    pushWarning = true;

    // All adjustments are applied to doublevalue so the stored type stays
    // double; the underflow path used to store an int 0 in the result.
    if (abs(doublevalue) == HUGE_VAL)
    {
      if (doublevalue > 0)
        doublevalue = MAX_DOUBLE;
      else
        doublevalue = MIN_DOUBLE;
    }
    else
      doublevalue = 0;
  }

  if (doublevalue < 0.0 && typeCode == datatypes::SystemCatalog::UDOUBLE &&
      doublevalue != static_cast<double>(joblist::DOUBLEEMPTYROW) &&
      doublevalue != static_cast<double>(joblist::DOUBLENULL))
  {
    // Previously this zeroed doublevalue after the result had already been
    // assigned, so the negative number was still returned.
    doublevalue = 0.0;
    pushWarning = true;
  }

  boost::any value = doublevalue;
  return value;
}
|
|
|
|
// Fit a string to the column width.
//
// Input longer than colType.colWidth bytes is cut to that width and
// pushWarning is assigned the result of Charset::test_if_important_data() on
// the removed tail.  Input shorter than the width is padded with NUL bytes.
// Returns a boost::any holding the resulting std::string.
boost::any DataConvert::StringToString(const datatypes::TypeAttributesStd& colType,
                                       const std::string& dataOrig, bool& pushWarning)
{
  std::string text(dataOrig);
  const unsigned int width = (unsigned int)colType.colWidth;

  if (text.length() <= width)
  {
    // Pad null character to the string
    if (width > text.length())
      text.resize(colType.colWidth, 0);

    return boost::any(text);
  }

  // Too long: decide about the warning from the tail, then truncate.
  // TODO: charsetNumber should be moved to TypeStdAttributes ASAP
  const execplan::CalpontSystemCatalog::ColType& fullType =
      static_cast<const execplan::CalpontSystemCatalog::ColType&>(colType);
  datatypes::Charset charset(fullType.charsetNumber);

  const char* keptEnd = text.data() + colType.colWidth;
  const char* fullEnd = text.data() + text.length();
  pushWarning = charset.test_if_important_data(keptEnd, fullEnd);

  return boost::any(text.substr(0, colType.colWidth));
}
|
|
|
|
// Parse a date string into the packed 32-bit date representation.
// When stringToDateStruct() fails, a uint32_t 0 is returned and pushWarning is set.
boost::any DataConvert::StringToDate(const std::string& data, bool& pushWarning)
{
  Date parsed;

  if (!stringToDateStruct(data, parsed))
  {
    pushWarning = true;
    return boost::any((uint32_t)0);
  }

  return boost::any(getUInt32LE((const char*)&parsed));
}
|
|
|
|
// Parse a datetime string into the packed 64-bit datetime representation.
// When stringToDatetimeStruct() fails, a uint64_t 0 is returned and pushWarning is set.
boost::any DataConvert::StringToDatetime(const std::string& data, bool& pushWarning)
{
  DateTime parsed;

  // QQ (carried over from the original): why is the third argument 0?
  const bool ok = stringToDatetimeStruct(data, parsed, 0);

  if (!ok)
  {
    pushWarning = true;
    return boost::any((uint64_t)0);
  }

  return boost::any(getUInt64LE((const char*)&parsed));
}
|
|
|
|
// Parse a time string into the packed 64-bit time representation.
// A failed parse only sets pushWarning; whatever stringToTimeStruct() left in
// the Time struct is still packed and returned.
boost::any DataConvert::StringToTime(const datatypes::TypeAttributesStd& colType, const std::string& data,
                                     bool& pushWarning)
{
  Time parsed;
  const bool ok = stringToTimeStruct(data, parsed, colType.precision);

  if (!ok)
    pushWarning = true;

  return boost::any(getSInt64LE((const char*)&parsed));
}
|
|
|
|
// Parse a timestamp string, interpreted in prm.timeZone(), into the packed
// 64-bit timestamp representation.
// A failed parse only sets pushWarning; whatever stringToTimestampStruct()
// left in the TimeStamp struct is still packed and returned.
boost::any DataConvert::StringToTimestamp(const datatypes::ConvertFromStringParam& prm,
                                          const std::string& data, bool& pushWarning)
{
  TimeStamp parsed;
  const bool ok = stringToTimestampStruct(data, parsed, prm.timeZone());

  if (!ok)
    pushWarning = true;

  return boost::any(getUInt64LE((const char*)&parsed));
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert date32 parquet data to binary date. Used by BulkLoad.
|
|
//------------------------------------------------------------------------------
|
|
int32_t DataConvert::convertArrowColumnDate(int32_t dayVal, int& status)
|
|
{
|
|
int inYear;
|
|
int inMonth;
|
|
int inDay;
|
|
int32_t value = 0;
|
|
|
|
int64_t secondsSinceEpoch = dayVal;
|
|
secondsSinceEpoch *= 86400;
|
|
std::chrono::seconds duration(secondsSinceEpoch);
|
|
|
|
std::chrono::system_clock::time_point timePoint(duration);
|
|
|
|
std::time_t ttime = std::chrono::system_clock::to_time_t(timePoint);
|
|
std::tm* timeInfo = std::localtime(&ttime);
|
|
|
|
inYear = timeInfo->tm_year + 1900;
|
|
inMonth = timeInfo->tm_mon + 1;
|
|
inDay = timeInfo->tm_mday;
|
|
|
|
if (isDateValid(inDay, inMonth, inYear))
|
|
{
|
|
Date aDay;
|
|
aDay.year = inYear;
|
|
aDay.month = inMonth;
|
|
aDay.day = inDay;
|
|
memcpy(&value, &aDay, 4);
|
|
}
|
|
else
|
|
{
|
|
status = -1;
|
|
}
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert date string to binary date. Used by BulkLoad.
|
|
//------------------------------------------------------------------------------
|
|
int32_t DataConvert::convertColumnDate(const char* dataOrg, CalpontDateTimeFormat dateFormat, int& status,
|
|
unsigned int dataOrgLen)
|
|
{
|
|
status = 0;
|
|
const char* p;
|
|
p = dataOrg;
|
|
char fld[10];
|
|
int32_t value = 0;
|
|
|
|
if (dateFormat != CALPONTDATE_ENUM)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
// @bug 5787: allow for leading blanks
|
|
unsigned int dataLen = dataOrgLen;
|
|
|
|
if ((dataOrgLen > 0) && (dataOrg[0] == ' '))
|
|
{
|
|
unsigned nblanks = 0;
|
|
|
|
for (unsigned nn = 0; nn < dataOrgLen; nn++)
|
|
{
|
|
if (dataOrg[nn] == ' ')
|
|
nblanks++;
|
|
else
|
|
break;
|
|
}
|
|
|
|
p = dataOrg + nblanks;
|
|
dataLen = dataOrgLen - nblanks;
|
|
}
|
|
|
|
if (dataLen < 10)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
int inYear, inMonth, inDay;
|
|
memcpy(fld, p, 4);
|
|
fld[4] = '\0';
|
|
|
|
inYear = strtol(fld, 0, 10);
|
|
|
|
memcpy(fld, p + 5, 2);
|
|
fld[2] = '\0';
|
|
|
|
inMonth = strtol(fld, 0, 10);
|
|
|
|
memcpy(fld, p + 8, 2);
|
|
fld[2] = '\0';
|
|
|
|
inDay = strtol(fld, 0, 10);
|
|
|
|
if (isDateValid(inDay, inMonth, inYear))
|
|
{
|
|
Date aDay;
|
|
aDay.year = inYear;
|
|
aDay.month = inMonth;
|
|
aDay.day = inDay;
|
|
memcpy(&value, &aDay, 4);
|
|
}
|
|
else
|
|
{
|
|
status = -1;
|
|
}
|
|
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Verify that specified date is valid
|
|
//------------------------------------------------------------------------------
|
|
bool DataConvert::isColumnDateValid(int32_t date)
|
|
{
|
|
Date d;
|
|
void* dp = static_cast<void*>(&d);
|
|
memcpy(dp, &date, sizeof(int32_t));
|
|
return (isDateValid(d.day, d.month, d.year));
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert timestamp parquet data to binary datetime(millisecond). Used by BulkLoad.
|
|
//------------------------------------------------------------------------------
|
|
int64_t DataConvert::convertArrowColumnDatetime(int64_t timeVal, int& status)
|
|
{
|
|
int64_t value = 0;
|
|
int inYear;
|
|
int inMonth;
|
|
int inDay;
|
|
int inHour;
|
|
int inMinute;
|
|
int inSecond;
|
|
int inMicrosecond;
|
|
|
|
std::chrono::milliseconds duration(timeVal);
|
|
std::chrono::system_clock::time_point timePoint(duration);
|
|
|
|
std::time_t ttime = std::chrono::system_clock::to_time_t(timePoint);
|
|
std::tm* timeInfo = std::gmtime(&ttime);
|
|
|
|
inYear = timeInfo->tm_year + 1900;
|
|
inMonth = timeInfo->tm_mon + 1;
|
|
inDay = timeInfo->tm_mday;
|
|
inHour = timeInfo->tm_hour;
|
|
inMinute = timeInfo->tm_min;
|
|
inSecond = timeInfo->tm_sec;
|
|
inMicrosecond = duration.count() % 1000;
|
|
if (isDateValid(inDay, inMonth, inYear) && isDateTimeValid(inHour, inMinute, inSecond, inMicrosecond))
|
|
{
|
|
DateTime aDatetime;
|
|
aDatetime.year = inYear;
|
|
aDatetime.month = inMonth;
|
|
aDatetime.day = inDay;
|
|
aDatetime.hour = inHour;
|
|
aDatetime.minute = inMinute;
|
|
aDatetime.second = inSecond;
|
|
aDatetime.msecond = inMicrosecond;
|
|
|
|
memcpy(&value, &aDatetime, 8);
|
|
}
|
|
else
|
|
{
|
|
status = -1;
|
|
}
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert timestamp parquet data to binary datetime(millisecond). Used by BulkLoad.
|
|
//------------------------------------------------------------------------------
|
|
int64_t DataConvert::convertArrowColumnDatetimeUs(int64_t timeVal, int& status)
|
|
{
|
|
int64_t value = 0;
|
|
int inYear;
|
|
int inMonth;
|
|
int inDay;
|
|
int inHour;
|
|
int inMinute;
|
|
int inSecond;
|
|
int inMicrosecond;
|
|
|
|
std::chrono::microseconds duration(timeVal);
|
|
std::chrono::system_clock::time_point timePoint(duration);
|
|
|
|
std::time_t ttime = std::chrono::system_clock::to_time_t(timePoint);
|
|
std::tm* timeInfo = std::gmtime(&ttime);
|
|
|
|
inYear = timeInfo->tm_year + 1900;
|
|
inMonth = timeInfo->tm_mon + 1;
|
|
inDay = timeInfo->tm_mday;
|
|
inHour = timeInfo->tm_hour;
|
|
inMinute = timeInfo->tm_min;
|
|
inSecond = timeInfo->tm_sec;
|
|
inMicrosecond = duration.count() % 1000000;
|
|
if (isDateValid(inDay, inMonth, inYear) && isDateTimeValid(inHour, inMinute, inSecond, inMicrosecond))
|
|
{
|
|
DateTime aDatetime;
|
|
aDatetime.year = inYear;
|
|
aDatetime.month = inMonth;
|
|
aDatetime.day = inDay;
|
|
aDatetime.hour = inHour;
|
|
aDatetime.minute = inMinute;
|
|
aDatetime.second = inSecond;
|
|
aDatetime.msecond = inMicrosecond;
|
|
|
|
memcpy(&value, &aDatetime, 8);
|
|
}
|
|
else
|
|
{
|
|
status = -1;
|
|
}
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert date/time string to binary date/time. Used by BulkLoad.
|
|
//------------------------------------------------------------------------------
|
|
int64_t DataConvert::convertColumnDatetime(const char* dataOrg, CalpontDateTimeFormat datetimeFormat,
|
|
int& status, unsigned int dataOrgLen)
|
|
{
|
|
status = 0;
|
|
const char* p;
|
|
p = dataOrg;
|
|
char fld[10];
|
|
int64_t value = 0;
|
|
|
|
if (datetimeFormat != CALPONTDATETIME_ENUM)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
// @bug 5787: allow for leading blanks
|
|
unsigned int dataLen = dataOrgLen;
|
|
|
|
if ((dataOrgLen > 0) && (dataOrg[0] == ' '))
|
|
{
|
|
unsigned nblanks = 0;
|
|
|
|
for (unsigned nn = 0; nn < dataOrgLen; nn++)
|
|
{
|
|
if (dataOrg[nn] == ' ')
|
|
nblanks++;
|
|
else
|
|
break;
|
|
}
|
|
|
|
p = dataOrg + nblanks;
|
|
dataLen = dataOrgLen - nblanks;
|
|
}
|
|
|
|
if (dataLen < 10)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
int inYear, inMonth, inDay, inHour, inMinute, inSecond, inMicrosecond;
|
|
memcpy(fld, p, 4);
|
|
fld[4] = '\0';
|
|
|
|
inYear = strtol(fld, 0, 10);
|
|
|
|
memcpy(fld, p + 5, 2);
|
|
fld[2] = '\0';
|
|
|
|
inMonth = strtol(fld, 0, 10);
|
|
|
|
memcpy(fld, p + 8, 2);
|
|
fld[2] = '\0';
|
|
|
|
inDay = strtol(fld, 0, 10);
|
|
|
|
inHour = 0;
|
|
inMinute = 0;
|
|
inSecond = 0;
|
|
inMicrosecond = 0;
|
|
|
|
if (dataLen > 12)
|
|
{
|
|
// For backwards compatability we still allow leading blank
|
|
if ((!isdigit(p[11]) && (p[11] != ' ')) || !isdigit(p[12]))
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
memcpy(fld, p + 11, 2);
|
|
fld[2] = '\0';
|
|
|
|
inHour = strtol(fld, 0, 10);
|
|
|
|
if (dataLen > 15)
|
|
{
|
|
if (!isdigit(p[14]) || !isdigit(p[15]))
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
memcpy(fld, p + 14, 2);
|
|
fld[2] = '\0';
|
|
|
|
inMinute = strtol(fld, 0, 10);
|
|
|
|
if (dataLen > 18)
|
|
{
|
|
if (!isdigit(p[17]) || !isdigit(p[18]))
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
memcpy(fld, p + 17, 2);
|
|
fld[2] = '\0';
|
|
|
|
inSecond = strtol(fld, 0, 10);
|
|
|
|
if (dataLen > 20)
|
|
{
|
|
unsigned int microFldLen = dataLen - 20;
|
|
|
|
if (microFldLen > (sizeof(fld) - 1))
|
|
microFldLen = sizeof(fld) - 1;
|
|
|
|
memcpy(fld, p + 20, microFldLen);
|
|
fld[microFldLen] = '\0';
|
|
inMicrosecond = strtol(fld, 0, 10);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
if (isDateValid(inDay, inMonth, inYear) && isDateTimeValid(inHour, inMinute, inSecond, inMicrosecond))
|
|
{
|
|
DateTime aDatetime;
|
|
aDatetime.year = inYear;
|
|
aDatetime.month = inMonth;
|
|
aDatetime.day = inDay;
|
|
aDatetime.hour = inHour;
|
|
aDatetime.minute = inMinute;
|
|
aDatetime.second = inSecond;
|
|
aDatetime.msecond = inMicrosecond;
|
|
|
|
memcpy(&value, &aDatetime, 8);
|
|
}
|
|
else
|
|
{
|
|
status = -1;
|
|
}
|
|
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert timestamp parquet data to binary timestamp. Used by BulkLoad.
|
|
//------------------------------------------------------------------------------
|
|
int64_t DataConvert::convertArrowColumnTimestamp(int64_t timeVal, int& status)
|
|
{
|
|
int64_t value = 0;
|
|
int inYear;
|
|
int inMonth;
|
|
int inDay;
|
|
int inHour;
|
|
int inMinute;
|
|
int inSecond;
|
|
int inMicrosecond;
|
|
|
|
std::chrono::milliseconds duration(timeVal);
|
|
std::chrono::system_clock::time_point timePoint(duration);
|
|
|
|
std::time_t ttime = std::chrono::system_clock::to_time_t(timePoint);
|
|
std::tm* timeInfo = std::gmtime(&ttime);
|
|
|
|
inYear = timeInfo->tm_year + 1900;
|
|
inMonth = timeInfo->tm_mon + 1;
|
|
inDay = timeInfo->tm_mday;
|
|
inHour = timeInfo->tm_hour;
|
|
inMinute = timeInfo->tm_min;
|
|
inSecond = timeInfo->tm_sec;
|
|
inMicrosecond = duration.count() % 1000;
|
|
if (isDateValid(inDay, inMonth, inYear) && isDateTimeValid(inHour, inMinute, inSecond, inMicrosecond))
|
|
{
|
|
MySQLTime m_time;
|
|
m_time.year = inYear;
|
|
m_time.month = inMonth;
|
|
m_time.day = inDay;
|
|
m_time.hour = inHour;
|
|
m_time.minute = inMinute;
|
|
m_time.second = inSecond;
|
|
m_time.second_part = inMicrosecond;
|
|
|
|
bool isValid = true;
|
|
int64_t seconds = mySQLTimeToGmtSec(m_time, 0, isValid);
|
|
|
|
if (!isValid)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
TimeStamp timestamp;
|
|
timestamp.second = seconds;
|
|
timestamp.msecond = m_time.second_part;
|
|
|
|
memcpy(&value, ×tamp, 8);
|
|
}
|
|
else
|
|
{
|
|
status = -1;
|
|
}
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert timestamp parquet data to binary timestamp. Used by BulkLoad.
|
|
//------------------------------------------------------------------------------
|
|
int64_t DataConvert::convertArrowColumnTimestampUs(int64_t timeVal, int& status)
|
|
{
|
|
int64_t value = 0;
|
|
int inYear;
|
|
int inMonth;
|
|
int inDay;
|
|
int inHour;
|
|
int inMinute;
|
|
int inSecond;
|
|
int inMicrosecond;
|
|
|
|
std::chrono::microseconds duration(timeVal);
|
|
std::chrono::system_clock::time_point timePoint(duration);
|
|
|
|
std::time_t ttime = std::chrono::system_clock::to_time_t(timePoint);
|
|
std::tm* timeInfo = std::gmtime(&ttime);
|
|
|
|
inYear = timeInfo->tm_year + 1900;
|
|
inMonth = timeInfo->tm_mon + 1;
|
|
inDay = timeInfo->tm_mday;
|
|
inHour = timeInfo->tm_hour;
|
|
inMinute = timeInfo->tm_min;
|
|
inSecond = timeInfo->tm_sec;
|
|
inMicrosecond = static_cast<int>(duration.count() % 1000000);
|
|
|
|
if (isDateValid(inDay, inMonth, inYear) && isDateTimeValid(inHour, inMinute, inSecond, inMicrosecond))
|
|
{
|
|
MySQLTime m_time;
|
|
m_time.year = inYear;
|
|
m_time.month = inMonth;
|
|
m_time.day = inDay;
|
|
m_time.hour = inHour;
|
|
m_time.minute = inMinute;
|
|
m_time.second = inSecond;
|
|
m_time.second_part = inMicrosecond;
|
|
|
|
bool isValid = true;
|
|
int64_t seconds = mySQLTimeToGmtSec(m_time, 0, isValid);
|
|
|
|
if (!isValid)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
TimeStamp timestamp;
|
|
timestamp.second = seconds;
|
|
timestamp.msecond = m_time.second_part;
|
|
|
|
memcpy(&value, ×tamp, 8);
|
|
}
|
|
else
|
|
{
|
|
status = -1;
|
|
}
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert timestamp string to binary timestamp. Used by BulkLoad.
|
|
// Most of this code is taken from DataConvert::convertColumnDatetime
|
|
//------------------------------------------------------------------------------
|
|
int64_t DataConvert::convertColumnTimestamp(const char* dataOrg, CalpontDateTimeFormat datetimeFormat,
|
|
int& status, unsigned int dataOrgLen, long timeZone)
|
|
{
|
|
char tmbuf[64];
|
|
std::string dataOrgTemp = dataOrg;
|
|
status = 0;
|
|
if (dataOrgTemp.substr(0, 19) == "0000-00-00 00:00:00")
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
// this is the default value of the first timestamp field in a table,
|
|
// which is stored in the system catalog
|
|
if (strcmp(dataOrg, "current_timestamp() ON UPDATE current_timestamp()") == 0)
|
|
{
|
|
struct timeval tv;
|
|
gettimeofday(&tv, 0);
|
|
MySQLTime time;
|
|
gmtSecToMySQLTime(tv.tv_sec, time, timeZone);
|
|
sprintf(tmbuf, "%04d-%02d-%02d %02d:%02d:%02d.%06ld", time.year, time.month, time.day, time.hour,
|
|
time.minute, time.second, tv.tv_usec);
|
|
dataOrg = tmbuf;
|
|
dataOrgLen = strlen(tmbuf);
|
|
}
|
|
|
|
const char* p;
|
|
p = dataOrg;
|
|
char fld[10];
|
|
int64_t value = 0;
|
|
|
|
if (datetimeFormat != CALPONTDATETIME_ENUM)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
unsigned int dataLen = dataOrgLen;
|
|
|
|
if ((dataOrgLen > 0) && (dataOrg[0] == ' '))
|
|
{
|
|
unsigned nblanks = 0;
|
|
|
|
for (unsigned nn = 0; nn < dataOrgLen; nn++)
|
|
{
|
|
if (dataOrg[nn] == ' ')
|
|
nblanks++;
|
|
else
|
|
break;
|
|
}
|
|
|
|
p = dataOrg + nblanks;
|
|
dataLen = dataOrgLen - nblanks;
|
|
}
|
|
|
|
if (dataLen < 10)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
int inYear, inMonth, inDay, inHour, inMinute, inSecond, inMicrosecond;
|
|
memcpy(fld, p, 4);
|
|
fld[4] = '\0';
|
|
|
|
inYear = strtol(fld, 0, 10);
|
|
|
|
memcpy(fld, p + 5, 2);
|
|
fld[2] = '\0';
|
|
|
|
inMonth = strtol(fld, 0, 10);
|
|
|
|
memcpy(fld, p + 8, 2);
|
|
fld[2] = '\0';
|
|
|
|
inDay = strtol(fld, 0, 10);
|
|
|
|
inHour = 0;
|
|
inMinute = 0;
|
|
inSecond = 0;
|
|
inMicrosecond = 0;
|
|
|
|
if (dataLen > 12)
|
|
{
|
|
// For backwards compatability we still allow leading blank
|
|
if ((!isdigit(p[11]) && (p[11] != ' ')) || !isdigit(p[12]))
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
memcpy(fld, p + 11, 2);
|
|
fld[2] = '\0';
|
|
|
|
inHour = strtol(fld, 0, 10);
|
|
|
|
if (dataLen > 15)
|
|
{
|
|
if (!isdigit(p[14]) || !isdigit(p[15]))
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
memcpy(fld, p + 14, 2);
|
|
fld[2] = '\0';
|
|
|
|
inMinute = strtol(fld, 0, 10);
|
|
|
|
if (dataLen > 18)
|
|
{
|
|
if (!isdigit(p[17]) || !isdigit(p[18]))
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
memcpy(fld, p + 17, 2);
|
|
fld[2] = '\0';
|
|
|
|
inSecond = strtol(fld, 0, 10);
|
|
|
|
if (dataLen > 20)
|
|
{
|
|
unsigned int microFldLen = dataLen - 20;
|
|
|
|
if (microFldLen > (sizeof(fld) - 1))
|
|
microFldLen = sizeof(fld) - 1;
|
|
|
|
memcpy(fld, p + 20, microFldLen);
|
|
fld[microFldLen] = '\0';
|
|
inMicrosecond = strtol(fld, 0, 10);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
if (isDateValid(inDay, inMonth, inYear) && isDateTimeValid(inHour, inMinute, inSecond, inMicrosecond))
|
|
{
|
|
MySQLTime m_time;
|
|
m_time.year = inYear;
|
|
m_time.month = inMonth;
|
|
m_time.day = inDay;
|
|
m_time.hour = inHour;
|
|
m_time.minute = inMinute;
|
|
m_time.second = inSecond;
|
|
m_time.second_part = inMicrosecond;
|
|
|
|
bool isValid = true;
|
|
int64_t seconds = mySQLTimeToGmtSec(m_time, timeZone, isValid);
|
|
|
|
if (!isValid)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
TimeStamp timestamp;
|
|
timestamp.second = seconds;
|
|
timestamp.msecond = m_time.second_part;
|
|
|
|
memcpy(&value, ×tamp, 8);
|
|
}
|
|
else
|
|
{
|
|
status = -1;
|
|
}
|
|
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert time32 parquet data to binary time. Used by BulkLoad.
|
|
//------------------------------------------------------------------------------
|
|
int64_t DataConvert::convertArrowColumnTime32(int32_t timeVal, int& status)
|
|
{
|
|
int64_t value = 0;
|
|
// convert millisecond to time
|
|
int inHour, inMinute, inSecond, inMicrosecond;
|
|
inHour = inMinute = inSecond = inMicrosecond = 0;
|
|
bool isNeg = false;
|
|
if (timeVal < 0)
|
|
isNeg = true;
|
|
inHour = timeVal / 3600000;
|
|
inMinute = (timeVal - inHour * 3600000) / 60000;
|
|
inSecond = (timeVal - inHour * 3600000 - inMinute * 60000) / 1000;
|
|
inMicrosecond = timeVal - inHour * 3600000 - inMinute * 60000 - inSecond * 1000;
|
|
if (isTimeValid(inHour, inMinute, inSecond, inMicrosecond))
|
|
{
|
|
Time atime;
|
|
atime.hour = inHour;
|
|
atime.minute = inMinute;
|
|
atime.second = inSecond;
|
|
atime.msecond = inMicrosecond;
|
|
atime.is_neg = isNeg;
|
|
|
|
memcpy(&value, &atime, 8);
|
|
}
|
|
else
|
|
{
|
|
// Emulate MariaDB's time saturation
|
|
if (inHour > 838)
|
|
{
|
|
Time atime;
|
|
atime.hour = 838;
|
|
atime.minute = 59;
|
|
atime.second = 59;
|
|
atime.msecond = 999999;
|
|
atime.is_neg = false;
|
|
memcpy(&value, &atime, 8);
|
|
}
|
|
else if (inHour < -838)
|
|
{
|
|
Time atime;
|
|
atime.hour = -838;
|
|
atime.minute = 59;
|
|
atime.second = 59;
|
|
atime.msecond = 999999;
|
|
atime.is_neg = false;
|
|
memcpy(&value, &atime, 8);
|
|
}
|
|
|
|
// If neither of the above match then we return a 0 time
|
|
|
|
status = -1;
|
|
}
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert time64 parquet data to binary time. Used by BulkLoad.
|
|
//------------------------------------------------------------------------------
|
|
int64_t DataConvert::convertArrowColumnTime64(int64_t timeVal, int& status)
|
|
{
|
|
int64_t value = 0;
|
|
// convert macrosecond to time
|
|
int inHour, inMinute, inSecond, inMicrosecond;
|
|
inHour = inMinute = inSecond = inMicrosecond = 0;
|
|
bool isNeg = false;
|
|
if (timeVal < 0)
|
|
isNeg = true;
|
|
inHour = timeVal / 3600000000;
|
|
inMinute = (timeVal - inHour * 3600000000) / 60000000;
|
|
inSecond = (timeVal - inHour * 3600000000 - inMinute * 60000000) / 1000000;
|
|
inMicrosecond = timeVal - inHour * 3600000000 - inMinute * 60000000 - inSecond * 1000000;
|
|
if (isTimeValid(inHour, inMinute, inSecond, inMicrosecond))
|
|
{
|
|
Time atime;
|
|
atime.hour = inHour;
|
|
atime.minute = inMinute;
|
|
atime.second = inSecond;
|
|
atime.msecond = inMicrosecond;
|
|
atime.is_neg = isNeg;
|
|
|
|
memcpy(&value, &atime, 8);
|
|
}
|
|
else
|
|
{
|
|
// Emulate MariaDB's time saturation
|
|
if (inHour > 838)
|
|
{
|
|
Time atime;
|
|
atime.hour = 838;
|
|
atime.minute = 59;
|
|
atime.second = 59;
|
|
atime.msecond = 999999;
|
|
atime.is_neg = false;
|
|
memcpy(&value, &atime, 8);
|
|
}
|
|
else if (inHour < -838)
|
|
{
|
|
Time atime;
|
|
atime.hour = -838;
|
|
atime.minute = 59;
|
|
atime.second = 59;
|
|
atime.msecond = 999999;
|
|
atime.is_neg = false;
|
|
memcpy(&value, &atime, 8);
|
|
}
|
|
|
|
// If neither of the above match then we return a 0 time
|
|
|
|
status = -1;
|
|
}
|
|
return value;
|
|
}
|
|
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Convert time string to binary time. Used by BulkLoad.
|
|
// Most of this is taken from str_to_time in sql-common/my_time.c
|
|
//------------------------------------------------------------------------------
|
|
int64_t DataConvert::convertColumnTime(const char* dataOrg, CalpontDateTimeFormat datetimeFormat, int& status,
|
|
unsigned int dataOrgLen)
|
|
{
|
|
status = 0;
|
|
char* p;
|
|
char* retp = NULL;
|
|
char* savePoint = NULL;
|
|
p = const_cast<char*>(dataOrg);
|
|
int64_t value = 0;
|
|
int inHour, inMinute, inSecond, inMicrosecond;
|
|
inHour = 0;
|
|
inMinute = 0;
|
|
inSecond = 0;
|
|
inMicrosecond = 0;
|
|
bool isNeg = false;
|
|
|
|
if (datetimeFormat != CALPONTTIME_ENUM)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
if (dataOrgLen == 0)
|
|
{
|
|
return value;
|
|
}
|
|
|
|
if (dataOrgLen < 3)
|
|
{
|
|
// Not enough chars to be a time
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
if (p[0] == '-')
|
|
{
|
|
isNeg = true;
|
|
}
|
|
|
|
errno = 0;
|
|
|
|
p = strtok_r(p, ":.", &savePoint);
|
|
inHour = strtol(p, &retp, 10);
|
|
|
|
if (errno || !retp)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
p = strtok_r(NULL, ":.", &savePoint);
|
|
|
|
if (p == NULL)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
inMinute = strtol(p, &retp, 10);
|
|
|
|
if (errno || !retp)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
p = strtok_r(NULL, ":.", &savePoint);
|
|
|
|
if (p == NULL)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
inSecond = strtol(p, &retp, 10);
|
|
|
|
if (errno || !retp)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
|
|
p = strtok_r(NULL, ":.", &savePoint);
|
|
|
|
if (p != NULL)
|
|
{
|
|
inMicrosecond = strtol(p, &retp, 10);
|
|
|
|
if (errno || !retp)
|
|
{
|
|
status = -1;
|
|
return value;
|
|
}
|
|
}
|
|
|
|
if (isTimeValid(inHour, inMinute, inSecond, inMicrosecond))
|
|
{
|
|
Time atime;
|
|
atime.hour = inHour;
|
|
atime.minute = inMinute;
|
|
atime.second = inSecond;
|
|
atime.msecond = inMicrosecond;
|
|
atime.is_neg = isNeg;
|
|
|
|
memcpy(&value, &atime, 8);
|
|
}
|
|
else
|
|
{
|
|
// Emulate MariaDB's time saturation
|
|
if (inHour > 838)
|
|
{
|
|
Time atime;
|
|
atime.hour = 838;
|
|
atime.minute = 59;
|
|
atime.second = 59;
|
|
atime.msecond = 999999;
|
|
atime.is_neg = false;
|
|
memcpy(&value, &atime, 8);
|
|
}
|
|
else if (inHour < -838)
|
|
{
|
|
Time atime;
|
|
atime.hour = -838;
|
|
atime.minute = 59;
|
|
atime.second = 59;
|
|
atime.msecond = 999999;
|
|
atime.is_neg = false;
|
|
memcpy(&value, &atime, 8);
|
|
}
|
|
|
|
// If neither of the above match then we return a 0 time
|
|
|
|
status = -1;
|
|
}
|
|
|
|
return value;
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Verify that specified datetime is valid
|
|
//------------------------------------------------------------------------------
|
|
bool DataConvert::isColumnDateTimeValid(int64_t dateTime)
|
|
{
|
|
DateTime dt;
|
|
void* dtp = static_cast<void*>(&dt);
|
|
memcpy(dtp, &dateTime, sizeof(uint64_t));
|
|
|
|
if (isDateValid(dt.day, dt.month, dt.year))
|
|
return isDateTimeValid(dt.hour, dt.minute, dt.second, dt.msecond);
|
|
|
|
return false;
|
|
}
|
|
|
|
bool DataConvert::isColumnTimeValid(int64_t time)
|
|
{
|
|
Time dt;
|
|
void* dtp = static_cast<void*>(&dt);
|
|
memcpy(dtp, &time, sizeof(uint64_t));
|
|
|
|
return isTimeValid(dt.hour, dt.minute, dt.second, dt.msecond);
|
|
}
|
|
|
|
bool DataConvert::isColumnTimeStampValid(int64_t timeStamp)
|
|
{
|
|
TimeStamp dt;
|
|
void* dtp = static_cast<void*>(&dt);
|
|
memcpy(dtp, &timeStamp, sizeof(uint64_t));
|
|
|
|
return isTimestampValid(dt.second, dt.msecond);
|
|
}
|
|
|
|
std::string DataConvert::dateToString(int datevalue)
|
|
{
|
|
// @bug 4703 abandon multiple ostringstream's for conversion
|
|
Date d(datevalue);
|
|
const int DATETOSTRING_LEN = 12; // YYYY-MM-DD\0
|
|
char buf[DATETOSTRING_LEN];
|
|
|
|
sprintf(buf, "%04d-%02d-%02d", d.year, d.month, d.day);
|
|
return buf;
|
|
}
|
|
|
|
std::string DataConvert::datetimeToString(long long datetimevalue, long decimals)
|
|
{
|
|
// 10 is default which means we don't need microseconds
|
|
if (decimals > 6 || decimals < 0)
|
|
{
|
|
decimals = 0;
|
|
}
|
|
|
|
// @bug 4703 abandon multiple ostringstream's for conversion
|
|
DateTime dt(datetimevalue);
|
|
const int DATETIMETOSTRING_LEN = 28; // YYYY-MM-DD HH:MM:SS.mmmmmm\0
|
|
char buf[DATETIMETOSTRING_LEN];
|
|
|
|
sprintf(buf, "%04d-%02d-%02d %02d:%02d:%02d", dt.year, dt.month, dt.day, dt.hour, dt.minute, dt.second);
|
|
|
|
if (dt.msecond && decimals)
|
|
{
|
|
// Pad start with zeros
|
|
sprintf(buf + strlen(buf), ".%0*d", (int)decimals, dt.msecond);
|
|
}
|
|
|
|
return buf;
|
|
}
|
|
|
|
std::string DataConvert::timestampToString(long long timestampvalue, long timezone, long decimals)
|
|
{
|
|
// 10 is default which means we don't need microseconds
|
|
if (decimals > 6 || decimals < 0)
|
|
{
|
|
decimals = 0;
|
|
}
|
|
|
|
TimeStamp timestamp(timestampvalue);
|
|
int64_t seconds = timestamp.second;
|
|
|
|
MySQLTime time;
|
|
gmtSecToMySQLTime(seconds, time, timezone);
|
|
|
|
const int TIMESTAMPTOSTRING_LEN = 28; // YYYY-MM-DD HH:MM:SS.mmmmmm\0
|
|
char buf[TIMESTAMPTOSTRING_LEN];
|
|
|
|
sprintf(buf, "%04d-%02d-%02d %02d:%02d:%02d", time.year, time.month, time.day, time.hour, time.minute,
|
|
time.second);
|
|
|
|
if (timestamp.msecond && decimals)
|
|
{
|
|
// Pad start with zeros
|
|
sprintf(buf + strlen(buf), ".%0*d", (int)decimals, timestamp.msecond);
|
|
}
|
|
|
|
return buf;
|
|
}
|
|
|
|
std::string DataConvert::timeToString(long long timevalue, long decimals)
|
|
{
|
|
// 10 is default which means we don't need microseconds
|
|
if (decimals > 6 || decimals < 0)
|
|
{
|
|
decimals = 0;
|
|
}
|
|
|
|
// @bug 4703 abandon multiple ostringstream's for conversion
|
|
Time dt(timevalue);
|
|
const int TIMETOSTRING_LEN = 19; // (-H)HH:MM:SS.mmmmmm\0
|
|
char buf[TIMETOSTRING_LEN];
|
|
char* outbuf = buf;
|
|
|
|
if ((dt.hour >= 0) && dt.is_neg)
|
|
{
|
|
outbuf[0] = '-';
|
|
outbuf++;
|
|
}
|
|
|
|
sprintf(outbuf, "%02d:%02d:%02d", dt.hour, dt.minute, dt.second);
|
|
|
|
if (dt.msecond && decimals)
|
|
{
|
|
// Pad start with zeros
|
|
sprintf(buf + strlen(buf), ".%0*d", (int)decimals, dt.msecond);
|
|
}
|
|
|
|
return buf;
|
|
}
|
|
|
|
std::string DataConvert::dateToString1(int datevalue)
|
|
{
|
|
// @bug 4703 abandon multiple ostringstream's for conversion
|
|
Date d(datevalue);
|
|
const int DATETOSTRING1_LEN = 10; // YYYYMMDD\0
|
|
char buf[DATETOSTRING1_LEN];
|
|
|
|
sprintf(buf, "%04d%02d%02d", d.year, d.month, d.day);
|
|
return buf;
|
|
}
|
|
|
|
std::string DataConvert::datetimeToString1(long long datetimevalue)
|
|
{
|
|
// @bug 4703 abandon multiple ostringstream's for conversion
|
|
DateTime dt(datetimevalue);
|
|
// Interesting, gcc 7 says the sprintf below generates between 21 and 23 bytes of output.
|
|
const int DATETIMETOSTRING1_LEN = 23; // YYYYMMDDHHMMSSmmmmmm\0
|
|
char buf[DATETIMETOSTRING1_LEN];
|
|
|
|
sprintf(buf, "%04d%02d%02d%02d%02d%02d%06d", dt.year, dt.month, dt.day, dt.hour, dt.minute, dt.second,
|
|
dt.msecond);
|
|
return buf;
|
|
}
|
|
|
|
std::string DataConvert::timestampToString1(long long timestampvalue, long timezone)
|
|
{
|
|
const int TIMESTAMPTOSTRING1_LEN = 22; // YYYYMMDDHHMMSSmmmmmm\0
|
|
char buf[TIMESTAMPTOSTRING1_LEN];
|
|
|
|
TimeStamp timestamp(timestampvalue);
|
|
int64_t seconds = timestamp.second;
|
|
MySQLTime time;
|
|
gmtSecToMySQLTime(seconds, time, timezone);
|
|
|
|
sprintf(buf, "%04d%02d%02d%02d%02d%02d%06d", time.year, time.month, time.day, time.hour, time.minute,
|
|
time.second, timestamp.msecond);
|
|
return buf;
|
|
}
|
|
|
|
std::string DataConvert::timeToString1(long long timevalue)
|
|
{
|
|
// @bug 4703 abandon multiple ostringstream's for conversion
|
|
Time t(timevalue);
|
|
const int TIMETOSTRING1_LEN = 22; // HHMMSSmmmmmm\0
|
|
char buf[TIMETOSTRING1_LEN];
|
|
|
|
char* outbuf = buf;
|
|
|
|
sprintf(outbuf, "%02d%02d%02d%06d", t.hour, t.minute, t.second, t.msecond);
|
|
return buf;
|
|
}
|
|
|
|
int64_t DataConvert::dateToInt(const string& date)
|
|
{
|
|
return stringToDate(date);
|
|
}
|
|
|
|
// Thin alias: forwards the nullable date text to stringToDate() and returns its result unchanged.
int64_t DataConvert::dateToInt(const utils::NullString& date)
{
  const int64_t packedDate = stringToDate(date);
  return packedDate;
}
|
|
|
|
int64_t DataConvert::datetimeToInt(const string& datetime)
|
|
{
|
|
return stringToDatetime(datetime);
|
|
}
|
|
|
|
// Thin alias: forwards the nullable datetime text to stringToDatetime() and returns its result
// unchanged.
int64_t DataConvert::datetimeToInt(const utils::NullString& datetime)
{
  const int64_t packedDatetime = stringToDatetime(datetime);
  return packedDatetime;
}
|
|
|
|
int64_t DataConvert::timestampToInt(const string& timestamp, long timeZone)
|
|
{
|
|
return stringToTimestamp(timestamp, timeZone);
|
|
}
|
|
|
|
int64_t DataConvert::timeToInt(const string& time)
|
|
{
|
|
return stringToTime(time);
|
|
}
|
|
|
|
int64_t DataConvert::stringToDate(const string& data)
|
|
{
|
|
Date aDay;
|
|
|
|
if (stringToDateStruct(data, aDay))
|
|
{
|
|
uint32_t temp = getUInt32LE((const char*)&aDay);
|
|
return ((temp & 0xFFFFFFC0) | 0x3E);
|
|
}
|
|
else
|
|
return -1;
|
|
}
|
|
// Nullable overload: a NULL string yields -1, anything else is parsed by the std::string overload.
int64_t DataConvert::stringToDate(const utils::NullString& data)
{
  if (!data.isNull())
    return stringToDate(data.unsafeStringRef());

  return -1;
}
|
|
|
|
int64_t DataConvert::stringToDatetime(const string& data, bool* date)
|
|
{
|
|
DateTime dtime;
|
|
|
|
if (stringToDatetimeStruct(data, dtime, date))
|
|
return getUInt64LE((const char*)&dtime);
|
|
else
|
|
return -1;
|
|
}
|
|
|
|
// Nullable overload: a NULL string yields -1 and, when `date` is supplied, clears *date.
// Any other value is parsed by the std::string overload.
int64_t DataConvert::stringToDatetime(const utils::NullString& data, bool* date)
{
  if (!data.isNull())
    return stringToDatetime(data.unsafeStringRef(), date);

  if (date)
    *date = false;

  return -1;
}
|
|
|
|
int64_t DataConvert::stringToTimestamp(const string& data, long timeZone)
|
|
{
|
|
TimeStamp aTimestamp;
|
|
|
|
if (stringToTimestampStruct(data, aTimestamp, timeZone))
|
|
return getUInt64LE((const char*)&aTimestamp);
|
|
else
|
|
return -1;
|
|
}
|
|
|
|
// Nullable overload: a NULL string yields -1, anything else is parsed by the std::string overload.
int64_t DataConvert::stringToTimestamp(const utils::NullString& data, long timeZone)
{
  if (!data.isNull())
    return stringToTimestamp(data.unsafeStringRef(), timeZone);

  return -1;
}
|
|
|
|
/* This is really painful and expensive b/c it seems the input is not normalized or
|
|
sanitized. That should really be done on ingestion. */
|
|
int64_t DataConvert::intToDate(int64_t data)
|
|
{
|
|
char buf[21] = {0};
|
|
Date aday;
|
|
|
|
if (data == 0)
|
|
{
|
|
aday.year = 0;
|
|
aday.month = 0;
|
|
aday.day = 0;
|
|
return getUInt32LE((const char*)&aday);
|
|
}
|
|
|
|
// this snprintf call causes a compiler warning b/c we're potentially copying a 20-digit #
|
|
// into 15 bytes, however, that appears to be intentional.
|
|
#if defined(__GNUC__) && __GNUC__ >= 7
|
|
#pragma GCC diagnostic push
|
|
#pragma GCC diagnostic ignored "-Wformat-truncation="
|
|
snprintf(buf, 15, "%llu", (long long unsigned int)data);
|
|
#pragma GCC diagnostic pop
|
|
#else
|
|
snprintf(buf, 15, "%llu", (long long unsigned int)data);
|
|
#endif
|
|
|
|
string year, month, day, hour, min, sec, msec;
|
|
int64_t y = 0, m = 0, d = 0, h = 0, minute = 0, s = 0, ms = 0;
|
|
|
|
switch (strlen(buf))
|
|
{
|
|
case 14:
|
|
year = string(buf, 4);
|
|
month = string(buf + 4, 2);
|
|
day = string(buf + 6, 2);
|
|
hour = string(buf + 8, 2);
|
|
min = string(buf + 10, 2);
|
|
sec = string(buf + 12, 2);
|
|
msec = string(buf + 14, 6);
|
|
break;
|
|
|
|
case 12:
|
|
year = string(buf, 2);
|
|
month = string(buf + 2, 2);
|
|
day = string(buf + 4, 2);
|
|
hour = string(buf + 6, 2);
|
|
min = string(buf + 8, 2);
|
|
sec = string(buf + 10, 2);
|
|
msec = string(buf + 12, 6);
|
|
break;
|
|
|
|
case 10:
|
|
month = string(buf, 2);
|
|
day = string(buf + 2, 2);
|
|
hour = string(buf + 4, 2);
|
|
min = string(buf + 6, 2);
|
|
sec = string(buf + 8, 2);
|
|
msec = string(buf + 10, 6);
|
|
break;
|
|
|
|
case 9:
|
|
month = string(buf, 1);
|
|
day = string(buf + 1, 2);
|
|
hour = string(buf + 3, 2);
|
|
min = string(buf + 5, 2);
|
|
sec = string(buf + 7, 2);
|
|
msec = string(buf + 9, 6);
|
|
break;
|
|
|
|
case 8:
|
|
year = string(buf, 4);
|
|
month = string(buf + 4, 2);
|
|
day = string(buf + 6, 2);
|
|
break;
|
|
|
|
case 6:
|
|
year = string(buf, 2);
|
|
month = string(buf + 2, 2);
|
|
day = string(buf + 4, 2);
|
|
break;
|
|
|
|
case 4:
|
|
month = string(buf, 2);
|
|
day = string(buf + 2, 2);
|
|
break;
|
|
|
|
case 3:
|
|
month = string(buf, 1);
|
|
day = string(buf + 1, 2);
|
|
break;
|
|
|
|
default: return -1;
|
|
}
|
|
|
|
if (year.empty())
|
|
{
|
|
// MMDD format. assume current year
|
|
time_t calender_time;
|
|
struct tm todays_date;
|
|
calender_time = time(NULL);
|
|
localtime_r(&calender_time, &todays_date);
|
|
y = todays_date.tm_year + 1900;
|
|
}
|
|
else
|
|
{
|
|
y = atoi(year.c_str());
|
|
}
|
|
|
|
m = atoi(month.c_str());
|
|
d = atoi(day.c_str());
|
|
h = atoi(hour.c_str());
|
|
minute = atoi(min.c_str());
|
|
s = atoi(sec.c_str());
|
|
ms = atoi(msec.c_str());
|
|
|
|
// if (!isDateValid(d, m, y))
|
|
// return -1;
|
|
if (!isDateValid(d, m, y) || !isDateTimeValid(h, minute, s, ms))
|
|
return -1;
|
|
|
|
aday.year = y;
|
|
aday.month = m;
|
|
aday.day = d;
|
|
return getUInt32LE((const char*)&aday);
|
|
}
|
|
|
|
/* This is really painful and expensive b/c it seems the input is not normalized or
|
|
sanitized. That should really be done on ingestion. */
|
|
int64_t DataConvert::intToDatetime(int64_t data, bool* date)
|
|
{
|
|
bool isDate = false;
|
|
char buf[21] = {0};
|
|
DateTime adaytime;
|
|
|
|
if (data == 0)
|
|
{
|
|
adaytime.year = 0;
|
|
adaytime.month = 0;
|
|
adaytime.day = 0;
|
|
adaytime.hour = 0;
|
|
adaytime.minute = 0;
|
|
adaytime.second = 0;
|
|
adaytime.msecond = 0;
|
|
|
|
if (date)
|
|
*date = true;
|
|
|
|
return getUInt64LE((const char*)&adaytime);
|
|
}
|
|
|
|
// this snprintf call causes a compiler warning b/c we're potentially copying a 20-digit #
|
|
// into 15 bytes, however, that appears to be intentional.
|
|
#if defined(__GNUC__) && __GNUC__ >= 7
|
|
#pragma GCC diagnostic push
|
|
#pragma GCC diagnostic ignored "-Wformat-truncation="
|
|
snprintf(buf, 15, "%llu", (long long unsigned int)data);
|
|
#pragma GCC diagnostic pop
|
|
#else
|
|
snprintf(buf, 15, "%llu", (long long unsigned int)data);
|
|
#endif
|
|
|
|
// string date = buf;
|
|
string year, month, day, hour, min, sec, msec;
|
|
int64_t y = 0, m = 0, d = 0, h = 0, minute = 0, s = 0, ms = 0;
|
|
|
|
switch (strlen(buf))
|
|
{
|
|
case 14:
|
|
year = string(buf, 4);
|
|
month = string(buf + 4, 2);
|
|
day = string(buf + 6, 2);
|
|
hour = string(buf + 8, 2);
|
|
min = string(buf + 10, 2);
|
|
sec = string(buf + 12, 2);
|
|
break;
|
|
|
|
case 12:
|
|
year = string(buf, 2);
|
|
month = string(buf + 2, 2);
|
|
day = string(buf + 4, 2);
|
|
hour = string(buf + 6, 2);
|
|
min = string(buf + 8, 2);
|
|
sec = string(buf + 10, 2);
|
|
break;
|
|
|
|
case 10:
|
|
month = string(buf, 2);
|
|
day = string(buf + 2, 2);
|
|
hour = string(buf + 4, 2);
|
|
min = string(buf + 6, 2);
|
|
sec = string(buf + 8, 2);
|
|
break;
|
|
|
|
case 9:
|
|
month = string(buf, 1);
|
|
day = string(buf + 1, 2);
|
|
hour = string(buf + 3, 2);
|
|
min = string(buf + 5, 2);
|
|
sec = string(buf + 7, 2);
|
|
break;
|
|
|
|
case 8:
|
|
year = string(buf, 4);
|
|
month = string(buf + 4, 2);
|
|
day = string(buf + 6, 2);
|
|
isDate = true;
|
|
break;
|
|
|
|
case 6:
|
|
year = string(buf, 2);
|
|
month = string(buf + 2, 2);
|
|
day = string(buf + 4, 2);
|
|
isDate = true;
|
|
break;
|
|
|
|
case 4:
|
|
month = string(buf, 2);
|
|
day = string(buf + 2, 2);
|
|
break;
|
|
|
|
case 3:
|
|
month = string(buf, 1);
|
|
day = string(buf + 1, 2);
|
|
isDate = true;
|
|
break;
|
|
|
|
default: return -1;
|
|
}
|
|
|
|
if (year.empty())
|
|
{
|
|
// MMDD format. assume current year
|
|
time_t calender_time;
|
|
struct tm todays_date;
|
|
calender_time = time(NULL);
|
|
localtime_r(&calender_time, &todays_date);
|
|
y = todays_date.tm_year + 1900;
|
|
}
|
|
else
|
|
{
|
|
y = atoi(year.c_str());
|
|
|
|
// special handling for 2-byte year
|
|
if (year.length() == 2)
|
|
{
|
|
y += 2000;
|
|
if (y > 2069)
|
|
y -= 100;
|
|
}
|
|
}
|
|
|
|
m = atoi(month.c_str());
|
|
d = atoi(day.c_str());
|
|
h = atoi(hour.c_str());
|
|
minute = atoi(min.c_str());
|
|
s = atoi(sec.c_str());
|
|
ms = 0;
|
|
|
|
if (!isDateValid(d, m, y) || !isDateTimeValid(h, minute, s, ms))
|
|
return -1;
|
|
|
|
adaytime.year = y;
|
|
adaytime.month = m;
|
|
adaytime.day = d;
|
|
adaytime.hour = h;
|
|
adaytime.minute = minute;
|
|
adaytime.second = s;
|
|
adaytime.msecond = ms;
|
|
|
|
if (date)
|
|
*date = isDate;
|
|
|
|
return getUInt64LE((const char*)&adaytime);
|
|
}
|
|
|
|
/* This is really painful and expensive b/c it seems the input is not normalized or
|
|
sanitized. That should really be done on ingestion. */
|
|
int64_t DataConvert::intToTime(int64_t data, bool fromString)
|
|
{
|
|
char buf[21] = {0};
|
|
char* bufread = buf;
|
|
Time atime;
|
|
bool isNeg = false;
|
|
|
|
if (data == 0)
|
|
{
|
|
atime.hour = 0;
|
|
atime.minute = 0;
|
|
atime.second = 0;
|
|
atime.msecond = 0;
|
|
atime.is_neg = 0;
|
|
|
|
return getSInt64LE((const char*)&atime);
|
|
}
|
|
|
|
// this snprintf call causes a compiler warning b/c we're potentially copying a 20-digit #
|
|
// into 15 bytes, however, that appears to be intentional.
|
|
#if defined(__GNUC__) && __GNUC__ >= 7
|
|
#pragma GCC diagnostic push
|
|
#pragma GCC diagnostic ignored "-Wformat-truncation="
|
|
snprintf(buf, 15, "%lld", (long long int)data);
|
|
#pragma GCC diagnostic pop
|
|
#else
|
|
snprintf(buf, 15, "%lld", (long long int)data);
|
|
#endif
|
|
|
|
// string date = buf;
|
|
string hour, min, sec, msec;
|
|
int64_t h = 0, minute = 0, s = 0, ms = 0;
|
|
|
|
if (bufread[0] == '-')
|
|
{
|
|
isNeg = true;
|
|
bufread++;
|
|
}
|
|
|
|
bool zero = false;
|
|
|
|
switch (strlen(bufread))
|
|
{
|
|
// A full datetime
|
|
case 14:
|
|
hour = string(buf + 8, 2);
|
|
min = string(buf + 10, 2);
|
|
sec = string(buf + 12, 2);
|
|
break;
|
|
|
|
// Date so this is all 0
|
|
case 8: zero = true; break;
|
|
|
|
case 7:
|
|
hour = string(bufread, 3);
|
|
min = string(bufread + 3, 2);
|
|
sec = string(bufread + 5, 2);
|
|
break;
|
|
|
|
case 6:
|
|
hour = string(bufread, 2);
|
|
min = string(bufread + 2, 2);
|
|
sec = string(bufread + 4, 2);
|
|
break;
|
|
|
|
case 5:
|
|
hour = string(bufread, 1);
|
|
min = string(bufread + 1, 2);
|
|
sec = string(bufread + 3, 2);
|
|
break;
|
|
|
|
case 4:
|
|
min = string(bufread, 2);
|
|
sec = string(bufread + 2, 2);
|
|
break;
|
|
|
|
case 3:
|
|
min = string(bufread, 1);
|
|
sec = string(bufread + 1, 2);
|
|
break;
|
|
|
|
case 2: sec = string(bufread, 2); break;
|
|
|
|
case 1: sec = string(bufread, 1); break;
|
|
|
|
default: return -1;
|
|
}
|
|
|
|
if (!zero)
|
|
{
|
|
h = atoi(hour.c_str());
|
|
minute = atoi(min.c_str());
|
|
s = atoi(sec.c_str());
|
|
}
|
|
else if (fromString)
|
|
{
|
|
// Saturate fromString
|
|
h = 838;
|
|
minute = 59;
|
|
s = 59;
|
|
ms = 999999;
|
|
}
|
|
|
|
if (!isTimeValid(h, minute, s, 0))
|
|
return -1;
|
|
|
|
atime.hour = h;
|
|
atime.minute = minute;
|
|
atime.second = s;
|
|
atime.msecond = ms;
|
|
atime.is_neg = isNeg;
|
|
|
|
return getSInt64LE((const char*)&atime);
|
|
}
|
|
|
|
// Nullable overload: obtains the text via safeString("") and parses it with the std::string
// overload.
int64_t DataConvert::stringToTime(const utils::NullString& data)
{
  const string& text = data.safeString("");
  return stringToTime(text);
}
|
|
|
|
int64_t DataConvert::stringToTime(const string& data)
|
|
{
|
|
// MySQL supported time value format 'D HHH:MM:SS.fraction'
|
|
// -34 <= D <= 34
|
|
// -838 <= H <= 838
|
|
uint64_t min = 0, sec = 0, msec = 0;
|
|
int64_t day = -1, hour = 0;
|
|
bool isNeg = false;
|
|
bool hasDate = false;
|
|
string time, hms, ms;
|
|
char* end = NULL;
|
|
|
|
size_t pos = data.find("-");
|
|
|
|
if (pos != string::npos)
|
|
{
|
|
isNeg = true;
|
|
}
|
|
|
|
if (data.substr(pos + 1, data.length() - pos - 1).find("-") != string::npos)
|
|
{
|
|
// A second dash, this has a date
|
|
hasDate = true;
|
|
isNeg = false;
|
|
}
|
|
// Day
|
|
pos = data.find(" ");
|
|
|
|
if (pos != string::npos)
|
|
{
|
|
if (!hasDate)
|
|
{
|
|
std::string tmpDataSegment = data.substr(0, pos);
|
|
day = strtol(tmpDataSegment.c_str(), &end, 10);
|
|
|
|
if (*end != '\0')
|
|
return -1;
|
|
|
|
hour = day * 24;
|
|
day = -1;
|
|
}
|
|
time = data.substr(pos + 1, data.length() - pos - 1);
|
|
}
|
|
else
|
|
{
|
|
time = data;
|
|
}
|
|
|
|
if (time.find(":") == string::npos)
|
|
{
|
|
if (hasDate)
|
|
{
|
|
// Has dashes, no colons. This is just a date!
|
|
// Or the length < 6 (MariaDB returns NULL)
|
|
return -1;
|
|
}
|
|
else
|
|
{
|
|
// This is an int time
|
|
return intToTime(atoll(time.c_str()), true);
|
|
}
|
|
}
|
|
|
|
// Fraction
|
|
pos = time.find(".");
|
|
|
|
if (pos != string::npos)
|
|
{
|
|
msec = strtoll(time.substr(pos + 1, time.length() - pos - 1).c_str(), 0, 10);
|
|
hms = time.substr(0, pos);
|
|
}
|
|
else
|
|
{
|
|
hms = time;
|
|
}
|
|
|
|
// HHH:MM:SS
|
|
pos = hms.find(":");
|
|
|
|
if (pos == string::npos)
|
|
{
|
|
if (hour >= 0)
|
|
hour += atoi(hms.c_str());
|
|
else
|
|
hour -= atoi(hms.c_str());
|
|
}
|
|
else
|
|
{
|
|
if (hour >= 0)
|
|
hour += atoi(hms.substr(0, pos).c_str());
|
|
else
|
|
hour -= atoi(hms.substr(0, pos).c_str());
|
|
|
|
ms = hms.substr(pos + 1, hms.length() - pos - 1);
|
|
}
|
|
|
|
// MM:SS
|
|
pos = ms.find(":");
|
|
|
|
if (pos != string::npos)
|
|
{
|
|
min = atoi(ms.substr(0, pos).c_str());
|
|
sec = atoi(ms.substr(pos + 1, ms.length() - pos - 1).c_str());
|
|
}
|
|
else
|
|
{
|
|
min = atoi(ms.c_str());
|
|
}
|
|
|
|
Time atime;
|
|
atime.day = day;
|
|
atime.hour = hour;
|
|
atime.minute = min;
|
|
atime.second = sec;
|
|
atime.msecond = msec;
|
|
atime.is_neg = isNeg;
|
|
return getSInt64LE((const char*)&atime);
|
|
}
|
|
|
|
/* Fold the type of one more UNION branch into the accumulated result type.

   unionedType  in/out: the result type accumulated so far; widened or converted
                in place so that it can also hold values of `type`.
   type         the column type of the branch being merged.
   rc           set to logging::ERR_UNION_DECIMAL_OVERFLOW when merging two scaled
                numeric types would need more than datatypes::INT128MAXPRECISION
                digits; left untouched otherwise.

   Throws std::runtime_error when VARBINARY is involved and the two types are not
   the same VARBINARY width (no implicit conversion is supported).

   Combinations that are not listed leave unionedType unchanged. A `type` of
   TIME has no branch of its own and therefore never changes unionedType. */
void DataConvert::joinColTypeForUnion(datatypes::TypeHolderStd& unionedType,
                                      const datatypes::TypeHolderStd& type, unsigned int& rc)
{
  // limited support for VARBINARY, no implicit conversion.
  if (type.colDataType == datatypes::SystemCatalog::VARBINARY ||
      unionedType.colDataType == datatypes::SystemCatalog::VARBINARY)
  {
    if (type.colDataType != unionedType.colDataType || type.colWidth != unionedType.colWidth)
      throw runtime_error("VARBINARY in UNION must be the same width.");
  }

  switch (type.colDataType)
  {
    // ---- incoming integer or decimal ----
    case datatypes::SystemCatalog::TINYINT:
    case datatypes::SystemCatalog::SMALLINT:
    case datatypes::SystemCatalog::MEDINT:
    case datatypes::SystemCatalog::INT:
    case datatypes::SystemCatalog::BIGINT:
    case datatypes::SystemCatalog::DECIMAL:
    case datatypes::SystemCatalog::UTINYINT:
    case datatypes::SystemCatalog::USMALLINT:
    case datatypes::SystemCatalog::UMEDINT:
    case datatypes::SystemCatalog::UINT:
    case datatypes::SystemCatalog::UBIGINT:
    case datatypes::SystemCatalog::UDECIMAL:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:

          // Both sides carry a scale: make sure the merged integer and fractional
          // digit counts still fit the widest decimal.
          if (type.scale != 0 && (unionedType.scale != 0 || isDecimal(unionedType.colDataType)))
          {
            const unsigned int digitsBeforeDecimal = type.precision - type.scale;
            const unsigned int digitsBeforeDecimalUnion = unionedType.precision - unionedType.scale;

            if ((std::max(digitsBeforeDecimal, digitsBeforeDecimalUnion) +
                 std::max(type.scale, unionedType.scale)) > datatypes::INT128MAXPRECISION)
            {
              rc = logging::ERR_UNION_DECIMAL_OVERFLOW;
              return;
            }
          }

          // Handle the scenario where the upstream code assigns special values of 9999
          // and -1 as the precision of the unionedType.
          if ((unionedType.precision == 9999 || unionedType.precision == -1) &&
              (type.precision != 9999 && type.precision != -1))
          {
            unionedType.precision = type.precision;
          }
          else
          {
            unionedType.precision = std::max(type.precision, unionedType.precision);
          }

          unionedType.scale = std::max(type.scale, unionedType.scale);

          if (datatypes::Decimal::isWideDecimalTypeByPrecision(unionedType.precision))
          {
            unionedType.colDataType = datatypes::SystemCatalog::DECIMAL;
            unionedType.colWidth = datatypes::MAXDECIMALWIDTH;
            break;
          }

          if (type.colDataType == unionedType.colDataType)
          {
            if (type.colWidth > unionedType.colWidth)
              unionedType.colWidth = type.colWidth;
          }
          else if (sameSignednessInteger(unionedType.colDataType, type.colDataType))
          {
            // Keep the signedness on the larger data type.
            if (type.colWidth > unionedType.colWidth)
            {
              unionedType.colDataType = type.colDataType;
              unionedType.colWidth = type.colWidth;
            }
          }
          else if (differentSignednessInteger(unionedType.colDataType, type.colDataType))
          {
            // unionedType must be signed integer with upcasted size to prevent overflow & underflow.
            if (type.colWidth > unionedType.colWidth)
              unionedType.colDataType = type.colDataType;

            promoteSignedInteger(unionedType);
          }

          if (isDecimal(type.colDataType))
          {
            unionedType.colDataType = datatypes::SystemCatalog::DECIMAL;
          }

          break;

        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.colWidth = 20;
          break;

        case datatypes::SystemCatalog::TIME:
        case datatypes::SystemCatalog::DATETIME:
        case datatypes::SystemCatalog::TIMESTAMP:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 20)
            unionedType.colWidth = 20;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 21)
            unionedType.colWidth = 21;

          break;

        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::LONGDOUBLE:
          // A wide decimal replaces the floating-point result type; narrower numerics
          // leave it as is.
          if (datatypes::isWideDecimalType(type.colDataType, type.colWidth))
            unionedType = type;

          break;

        default: break;
      }

      break;
    }

    // ---- incoming DATE ----
    case datatypes::SystemCatalog::DATE:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::LONGDOUBLE:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 20;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 10)
            unionedType.colWidth = 10;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 11)
            unionedType.colWidth = 11;

          break;

        case datatypes::SystemCatalog::DATE:
        case datatypes::SystemCatalog::DATETIME:
        case datatypes::SystemCatalog::TIMESTAMP:
        case datatypes::SystemCatalog::TIME:
        default: break;
      }

      break;
    }

    // ---- incoming DATETIME ----
    case datatypes::SystemCatalog::DATETIME:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::TIME:
        case datatypes::SystemCatalog::LONGDOUBLE:
        case datatypes::SystemCatalog::TIMESTAMP:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::DATETIME;
          unionedType.colWidth = type.colWidth;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 26)
            unionedType.colWidth = 26;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 27)
            unionedType.colWidth = 27;

          break;

        case datatypes::SystemCatalog::DATETIME:
        default: break;
      }

      break;
    }

    // ---- incoming TIMESTAMP ----
    case datatypes::SystemCatalog::TIMESTAMP:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::TIME:
        // LONGDOUBLE is handled like the other floating-point types, mirroring the
        // DATETIME branch above.
        case datatypes::SystemCatalog::LONGDOUBLE:
        case datatypes::SystemCatalog::DATETIME:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::TIMESTAMP;
          unionedType.colWidth = type.colWidth;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 26)
            unionedType.colWidth = 26;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 27)
            unionedType.colWidth = 27;

          break;

        case datatypes::SystemCatalog::TIMESTAMP:
        default: break;
      }

      break;
    }

    // ---- incoming FLOAT / DOUBLE ----
    case datatypes::SystemCatalog::FLOAT:
    case datatypes::SystemCatalog::DOUBLE:
    case datatypes::SystemCatalog::UFLOAT:
    case datatypes::SystemCatalog::UDOUBLE:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 20;
          break;

        case datatypes::SystemCatalog::DATETIME:
        case datatypes::SystemCatalog::TIMESTAMP:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 20)
            unionedType.colWidth = 20;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 21)
            unionedType.colWidth = 21;

          break;

        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
          unionedType.colDataType = datatypes::SystemCatalog::DOUBLE;
          unionedType.scale = 0;
          unionedType.colWidth = sizeof(double);
          break;

        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::UDECIMAL:
          // A wide decimal result is kept; narrower decimals become DOUBLE.
          if (unionedType.colWidth != datatypes::MAXDECIMALWIDTH)
          {
            unionedType.colDataType = datatypes::SystemCatalog::DOUBLE;
            unionedType.scale = 0;
            unionedType.colWidth = sizeof(double);
          }

          break;

        default: break;
      }

      break;
    }

    // ---- incoming LONGDOUBLE ----
    case datatypes::SystemCatalog::LONGDOUBLE:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 20;
          break;

        case datatypes::SystemCatalog::DATETIME:
        // TIMESTAMP is handled like DATETIME, mirroring the FLOAT/DOUBLE branch above.
        case datatypes::SystemCatalog::TIMESTAMP:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 20)
            unionedType.colWidth = 20;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 21)
            unionedType.colWidth = 21;

          break;

        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::LONGDOUBLE:
          unionedType.colDataType = datatypes::SystemCatalog::LONGDOUBLE;
          unionedType.scale = (type.scale > unionedType.scale) ? type.scale : unionedType.scale;
          unionedType.colWidth = sizeof(long double);
          unionedType.precision = -1;
          break;

        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::UDECIMAL:
          // A wide decimal result is kept; narrower decimals become LONGDOUBLE.
          if (unionedType.colWidth != datatypes::MAXDECIMALWIDTH)
          {
            unionedType.colDataType = datatypes::SystemCatalog::LONGDOUBLE;
            unionedType.scale = (type.scale > unionedType.scale) ? type.scale : unionedType.scale;
            unionedType.colWidth = sizeof(long double);
            unionedType.precision = -1;
          }

          break;

        default: break;
      }

      break;
    }

    // ---- incoming CHAR / VARCHAR ----
    case datatypes::SystemCatalog::CHAR:
    case datatypes::SystemCatalog::VARCHAR:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::LONGDOUBLE:
          unionedType.scale = 0;
          unionedType.colWidth = (type.colWidth > 20) ? type.colWidth : 20;
          break;

        case datatypes::SystemCatalog::DATE:
          unionedType.colWidth = (type.colWidth > 10) ? type.colWidth : 10;
          break;

        case datatypes::SystemCatalog::DATETIME:
        case datatypes::SystemCatalog::TIMESTAMP:
          unionedType.colWidth = (type.colWidth > 26) ? type.colWidth : 26;
          break;

        case datatypes::SystemCatalog::CHAR:
        case datatypes::SystemCatalog::VARCHAR:

          // VARCHAR will fit in CHAR of the same width
          if (unionedType.colWidth < type.colWidth)
            unionedType.colWidth = type.colWidth;

          break;

        default: break;
      }

      // MariaDB bug 651. Setting to CHAR broke union in subquery
      unionedType.colDataType = datatypes::SystemCatalog::VARCHAR;
      break;
    }

    default:
    {
      break;
    }
  }  // switch
}
|
|
|
|
} // namespace dataconvert
|