mariadb-columnstore-engine/utils/dataconvert/dataconvert.cpp

/* Copyright (C) 2014 InfiniDB, Inc.
   Copyright (C) 2019 MariaDB Corporation

   This program is free software; you can redistribute it and/or
   modify it under the terms of the GNU General Public License
   as published by the Free Software Foundation; version 2 of
   the License.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
   Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
   MA 02110-1301, USA. */

/****************************************************************************
 * $Id: dataconvert.cpp 3901 2013-06-17 20:59:13Z rdempsey $
 *
 *
 ****************************************************************************/

#include <string>
#include <cmath>
#include <errno.h>
#include <ctime>
#include <stdlib.h>
#include <string.h>
#include <type_traits>
#include "mcs_decimal.h"
using namespace std;
#include <boost/algorithm/string/case_conv.hpp>
#include <boost/algorithm/string.hpp>
using namespace boost::algorithm;
#include <boost/tokenizer.hpp>
#include "calpontselectexecutionplan.h"
#include "columnresult.h"

#include "basic/string_utils.h"

#include "joblisttypes.h"

#define DATACONVERT_DLLEXPORT
#include "dataconvert.h"
#undef DATACONVERT_DLLEXPORT

using namespace logging;

namespace
{
template <class T>
bool from_string(T& t, const std::string& s, std::ios_base& (*f)(std::ios_base&))
{
  std::istringstream iss(s);
  return !(iss >> f >> t).fail();
}

bool number_value(const string& data)
{
  for (unsigned int i = 0; i < strlen(data.c_str()); i++)
  {
    if (data[i] > '9' || data[i] < '0')
    {
      if (data[i] != '+' && data[i] != '-' && data[i] != '.' && data[i] != ' ' && data[i] != 'E' &&
          data[i] != 'e')
      {
        throw QueryDataExcept("value is not numerical.", formatErr);
      }
    }
  }

  return true;
}

}  // namespace

namespace dataconvert
{
// LE stands for Little Endian
uint32_t getUInt32LE(const char* ptr)
{
  return reinterpret_cast<const uint32_t*>(ptr)[0];
}

int32_t getSInt32LE(const char* ptr)
{
  return reinterpret_cast<const int32_t*>(ptr)[0];
}

uint64_t getUInt64LE(const char* ptr)
{
  return reinterpret_cast<const uint64_t*>(ptr)[0];
}

int64_t getSInt64LE(const char* ptr)
{
  return reinterpret_cast<const int64_t*>(ptr)[0];
}

template <typename T>
void number_int_value(const string& data, cscDataType typeCode,
                      const datatypes::SystemCatalog::TypeAttributesStd& ct, bool& pushwarning,
                      bool noRoundup, T& intVal, bool* saturate)
{
  // copy of the original input
  string valStr(data);

  // in case, the values are in parentheses
  string::size_type x = valStr.find('(');
  string::size_type y = valStr.find(')');

  while (x < string::npos)
  {
    // erase y first
    if (y == string::npos)
      throw QueryDataExcept("'(' is not matched.", formatErr);

    valStr.erase(y, 1);
    valStr.erase(x, 1);
    x = valStr.find('(');
    y = valStr.find(')');
  }

  if (y != string::npos)
    throw QueryDataExcept("')' is not matched.", formatErr);

  if (datatypes::ASCIIStringCaseInsensetiveEquals(valStr, "true"))
  {
    intVal = 1;
    return;
  }
  if (datatypes::ASCIIStringCaseInsensetiveEquals(valStr, "false"))
  {
    intVal = 0;
    return;
  }

  // convert to fixed-point notation if input is in scientific notation
  if (valStr.find('E') < string::npos || valStr.find('e') < string::npos)
  {
    size_t epos = valStr.find('E');

    if (epos == string::npos)
      epos = valStr.find('e');

    // get the coefficient
    string coef = valStr.substr(0, epos);
    // get the exponent
    string exp = valStr.substr(epos + 1);
    bool overflow = false;
    T exponent = dataconvert::string_to_ll<T>(exp, overflow);

    // if the exponent can not be held in 64 or 128 bits, not supported or saturated.
    if (overflow)
      throw QueryDataExcept("value is invalid.", formatErr);

    // find the optional "." point
    size_t dpos = coef.find('.');

    if (dpos != string::npos)
    {
      // move "." to the end by mutiply 10 ** (# of fraction digits)
      coef.erase(dpos, 1);
      exponent -= coef.length() - dpos;
    }

    if (exponent >= 0)
    {
      coef.resize(coef.length() + exponent, '0');
    }
    else
    {
      size_t bpos = coef.find_first_of("0123456789");
      size_t epos = coef.length();
      size_t mpos = -exponent;
      dpos = epos - mpos;
      int64_t padding = (int64_t)mpos - (int64_t)(epos - bpos);

      if (padding > 0)
      {
        coef.insert(bpos, padding, '0');
        dpos = bpos;
      }

      coef.insert(dpos, ".");
    }

    valStr = coef;
  }

  // apply the scale
  if (ct.scale != 0)
  {
    uint64_t scale = (uint64_t)(ct.scale < 0) ? (-ct.scale) : (ct.scale);
    size_t dpos = valStr.find('.');
    string intPart = valStr.substr(0, dpos);
    string leftStr;

    if (ct.scale > 0)
    {
      if (dpos != string::npos)
      {
        // decimal point exist, prepare "#scale" digits in fraction part
        ++dpos;
        string frnStr = valStr.substr(dpos, scale);

        if (frnStr.length() < scale)
          frnStr.resize(scale, '0');  // padding digit 0, not null.

        // effectly shift "#scale" digits to left.
        intPart += frnStr;
        leftStr = valStr.substr(dpos);
        leftStr.erase(0, scale);
      }
      else
      {
        // no decimal point, shift "#scale" digits to left.
        intPart.resize(intPart.length() + scale, '0');  // padding digit 0, not null.
      }
    }
    else  // if (ct.scale < 0) -- in ct.scale != 0 block
    {
      if (dpos != string::npos)
      {
        // decimal point exist, get the fraction part
        ++dpos;
        leftStr = valStr.substr(dpos);
      }
    }

    valStr = intPart;

    if (leftStr.length() > 0)
      valStr += "." + leftStr;
  }

  // now, convert to long long int
  string intStr(valStr);
  string frnStr = "";
  size_t dp = valStr.find('.');
  int roundup = 0;

  if (dp != string::npos)
  {
    // Check if need round up
    int frac1 = dataconvert::string_to_ll<int64_t>(valStr.substr(dp + 1, 1), pushwarning);

    if ((!noRoundup) && frac1 >= 5)
      roundup = 1;

    intStr.erase(dp);
    frnStr = valStr.substr(dp + 1);

    if (intStr.length() == 0)
      intStr = "0";
    else if ((intStr.length() == 1) && ((intStr[0] == '+') || (intStr[0] == '-')))
    {
      intStr.insert(1, 1, '0');
    }
  }

  intVal = dataconvert::string_to_ll<T>(intStr, pushwarning);
  //@Bug 3350 negative value round up.
  intVal += intVal >= 0 ? roundup : -roundup;
  bool dummy = false;
  T frnVal = (frnStr.length() > 0) ? dataconvert::string_to_ll<T>(frnStr, dummy) : 0;

  if (frnVal != 0)
    pushwarning = true;

  switch (typeCode)
  {
    case datatypes::SystemCatalog::TINYINT:
      if (intVal < MIN_TINYINT)
      {
        intVal = MIN_TINYINT;
        pushwarning = true;

        if (saturate)
          *saturate = true;
      }
      else if (intVal > MAX_TINYINT)
      {
        intVal = MAX_TINYINT;
        pushwarning = true;

        if (saturate)
          *saturate = true;
      }

      break;

    case datatypes::SystemCatalog::SMALLINT:
      if (intVal < MIN_SMALLINT)
      {
        intVal = MIN_SMALLINT;
        pushwarning = true;

        if (saturate)
          *saturate = true;
      }
      else if (intVal > MAX_SMALLINT)
      {
        intVal = MAX_SMALLINT;
        pushwarning = true;

        if (saturate)
          *saturate = true;
      }

      break;

    case datatypes::SystemCatalog::MEDINT:
      if (intVal < MIN_MEDINT)
      {
        intVal = MIN_MEDINT;
        pushwarning = true;

        if (saturate)
          *saturate = true;
      }
      else if (intVal > MAX_MEDINT)
      {
        intVal = MAX_MEDINT;
        pushwarning = true;

        if (saturate)
          *saturate = true;
      }

      break;

    case datatypes::SystemCatalog::INT:
      if (intVal < MIN_INT)
      {
        intVal = MIN_INT;
        pushwarning = true;

        if (saturate)
          *saturate = true;
      }
      else if (intVal > MAX_INT)
      {
        intVal = MAX_INT;
        pushwarning = true;

        if (saturate)
          *saturate = true;
      }

      break;

    case datatypes::SystemCatalog::BIGINT:
      if (intVal < MIN_BIGINT)
      {
        intVal = MIN_BIGINT;
        pushwarning = true;

        if (saturate)
          *saturate = true;
      }

      break;

    case datatypes::SystemCatalog::DECIMAL:
    case datatypes::SystemCatalog::UDECIMAL:
      if (LIKELY(ct.colWidth == 16))
      {
        int128_t tmp;
        utils::int128Min(tmp);
        if (intVal < tmp + 2)  // + 2 for NULL and EMPTY values
        {
          intVal = tmp + 2;
          pushwarning = true;

          if (saturate)
            *saturate = true;
        }
      }
      else if (ct.colWidth == 8)
      {
        if (intVal < MIN_BIGINT)
        {
          intVal = MIN_BIGINT;
          pushwarning = true;

          if (saturate)
            *saturate = true;
        }
      }
      else if (ct.colWidth == 4)
      {
        if (intVal < MIN_INT)
        {
          intVal = MIN_INT;
          pushwarning = true;

          if (saturate)
            *saturate = true;
        }
        else if (intVal > MAX_INT)
        {
          intVal = MAX_INT;
          pushwarning = true;

          if (saturate)
            *saturate = true;
        }
      }
      else if (ct.colWidth == 2)
      {
        if (intVal < MIN_SMALLINT)
        {
          intVal = MIN_SMALLINT;
          pushwarning = true;

          if (saturate)
            *saturate = true;
        }
        else if (intVal > MAX_SMALLINT)
        {
          intVal = MAX_SMALLINT;
          pushwarning = true;

          if (saturate)
            *saturate = true;
        }
      }
      else if (ct.colWidth == 1)
      {
        if (intVal < MIN_TINYINT)
        {
          intVal = MIN_TINYINT;
          pushwarning = true;

          if (saturate)
            *saturate = true;
        }
        else if (intVal > MAX_TINYINT)
        {
          intVal = MAX_TINYINT;
          pushwarning = true;

          if (saturate)
            *saturate = true;
        }
      }

      break;

    default: break;
  }

  // @ bug 3285 make sure the value is in precision range for decimal data type
  if ((typeCode == datatypes::SystemCatalog::DECIMAL) || (typeCode == datatypes::SystemCatalog::UDECIMAL) ||
      (ct.scale > 0))
  {
    auto precision =
        ct.precision == rowgroup::MagicPrecisionForCountAgg ? datatypes::INT128MAXPRECISION : ct.precision;
    if (precision > datatypes::INT128MAXPRECISION || precision < 0)
    {
      throw QueryDataExcept("Unsupported precision " + std::to_string(precision) + " converting DECIMAL ",
                            dataTypeErr);
    }

    T rangeUp = dataconvert::decimalRangeUp<T>(precision);
    T rangeLow = -rangeUp;

    if (intVal > rangeUp)
    {
      intVal = rangeUp;
      pushwarning = true;

      if (saturate)
        *saturate = true;
    }
    else if (intVal < rangeLow)
    {
      intVal = rangeLow;
      pushwarning = true;

      if (saturate)
        *saturate = true;
    }
  }
}

// Explicit template instantiation
template void number_int_value<int64_t>(const std::string& data, cscDataType typeCode,
                                        const datatypes::SystemCatalog::TypeAttributesStd& ct,
                                        bool& pushwarning, bool noRoundup, int64_t& intVal, bool* saturate);

template void number_int_value<int128_t>(const std::string& data, cscDataType typeCode,
                                         const datatypes::SystemCatalog::TypeAttributesStd& ct,
                                         bool& pushwarning, bool noRoundup, int128_t& intVal, bool* saturate);

uint64_t number_uint_value(const string& data, cscDataType typeCode,
                           const datatypes::SystemCatalog::TypeAttributesStd& /*ct*/, bool& pushwarning,
                           bool /*noRoundup*/)
{
  // copy of the original input
  string valStr(data);

  // in case, the values are in parentheses
  string::size_type x = valStr.find('(');
  string::size_type y = valStr.find(')');

  while (x < string::npos)
  {
    // erase y first
    if (y == string::npos)
      throw QueryDataExcept("'(' is not matched.", formatErr);

    valStr.erase(y, 1);
    valStr.erase(x, 1);
    x = valStr.find('(');
    y = valStr.find(')');
  }

  if (y != string::npos)
    throw QueryDataExcept("')' is not matched.", formatErr);

  // convert to fixed-point notation if input is in scientific notation
  if (valStr.find('E') < string::npos || valStr.find('e') < string::npos)
  {
    size_t epos = valStr.find('E');

    if (epos == string::npos)
      epos = valStr.find('e');

    // get the coefficient
    string coef = valStr.substr(0, epos);
    // get the exponent
    string exp = valStr.substr(epos + 1);
    bool overflow = false;
    int64_t exponent = dataconvert::string_to_ll<int64_t>(exp, overflow);

    // if the exponent can not be held in 64-bit, not supported or saturated.
    if (overflow)
      throw QueryDataExcept("value is invalid.", formatErr);

    // find the optional "." point
    size_t dpos = coef.find('.');

    if (dpos != string::npos)
    {
      // move "." to the end by mutiply 10 ** (# of fraction digits)
      coef.erase(dpos, 1);
      exponent -= coef.length() - dpos;
    }

    if (exponent >= 0)
    {
      coef.resize(coef.length() + exponent, '0');
    }
    else
    {
      size_t bpos = coef.find_first_of("0123456789");
      size_t epos = coef.length();
      size_t mpos = -exponent;
      dpos = epos - mpos;
      int64_t padding = (int64_t)mpos - (int64_t)(epos - bpos);

      if (padding > 0)
      {
        coef.insert(bpos, padding, '0');
        dpos = bpos;
      }

      coef.insert(dpos, ".");
    }

    valStr = coef;
  }

  // now, convert to uint64_t
  string intStr(valStr);
  string frnStr = "";
  size_t dp = valStr.find('.');

  if (dp != string::npos)
  {
    intStr.erase(dp);
    frnStr = valStr.substr(dp + 1);

    if (intStr.length() == 0)
      intStr = "0";
    else if ((intStr.length() == 1) && ((intStr[0] == '+') || (intStr[0] == '-')))
    {
      intStr.insert(1, 1, '0');
    }
  }

  uint64_t uintVal = dataconvert::string_to_ull(intStr, pushwarning);

  bool dummy = false;
  uint64_t frnVal = (frnStr.length() > 0) ? dataconvert::string_to_ull(frnStr, dummy) : 0;

  if (frnVal != 0)
    pushwarning = true;

  switch (typeCode)
  {
    case datatypes::SystemCatalog::UTINYINT:
      if (uintVal > MAX_UTINYINT)
      {
        uintVal = MAX_UTINYINT;
        pushwarning = true;
      }

      break;

    case datatypes::SystemCatalog::USMALLINT:
      if (uintVal > MAX_USMALLINT)
      {
        uintVal = MAX_USMALLINT;
        pushwarning = true;
      }

      break;

    case datatypes::SystemCatalog::UMEDINT:
      if (uintVal > MAX_UMEDINT)
      {
        uintVal = MAX_UMEDINT;
        pushwarning = true;
      }

      break;

    case datatypes::SystemCatalog::UINT:
      if (uintVal > MAX_UINT)
      {
        uintVal = MAX_UINT;
        pushwarning = true;
      }

      break;

    case datatypes::SystemCatalog::UBIGINT:
      if (uintVal > MAX_UBIGINT)
      {
        uintVal = MAX_UBIGINT;
        pushwarning = true;
      }

      break;

    default: break;
  }

  return uintVal;
}

/**
 * This function reads a decimal value from a string.  It will stop processing
 * in 3 cases:
 *     1) end of input string (null-terminated)
 *     2) non-digit hit
 *     3) max characters read (if max != 0 then at most max characters read)
 *
 * It's up to the caller to figure out whether an error occurred based on
 * their definition of an error and how many characters were read
 */
uint32_t readDecimal(const char*& str, int32_t& value, uint32_t max = 0)
{
  value = 0;
  uint32_t numread = 0;

  while ((!max || numread < max) && *str && isdigit(*str))
  {
    value = value * 10 + ((*str) - '0');
    ++numread;
    ++str;
  }

  return numread;
}

bool mysql_str_to_datetime(const string& input, DateTime& output, bool& isDate)
{
  /**
   *  First we are going to identify the stop/start of the date portion.
   *  The rules are:
   *      - Date portion must come before anything else
   *      - Date portion may only contain numbers and '-'
   *      - Date portion ends with ' ', 'T', or '\0'
   *      - Date portion always starts with Year
   *      - Without date separators ('-'):
   *            YYMMDD
   *            YYYYMMDD
   *      - With date separators there are no specific field length
   *        requirements
   */
  int32_t datesepct = 0;
  uint32_t dtend = 0;

  for (; dtend < input.length(); ++dtend)
  {
    char c = input[dtend];

    if (isdigit(c))
    {
      continue;
    }
    //		else if( dtend != 0 && c == '-' )
    else if (dtend != 0 && ispunct(c))
    {
      ++datesepct;
    }
    else if (c == 'T' || c == ' ')
    {
      break;
    }
    else
    {
      // some other character showed up
      output.reset();
      return false;
    }
  }

  int32_t year = -1;
  int32_t mon = -1;
  int32_t day = -1;
  const char* ptr = input.c_str();

  if (datesepct == 0)
  {
    if (dtend == 6 || dtend == 12)
    {
      readDecimal(ptr, year, 2);
      readDecimal(ptr, mon, 2);
      readDecimal(ptr, day, 2);
      year += 2000;

      if (year > 2069)
        year -= 100;

      if (dtend == 12)
        dtend -= 6;
    }
    else if (dtend == 8 || dtend == 14)
    {
      readDecimal(ptr, year, 4);
      readDecimal(ptr, mon, 2);
      readDecimal(ptr, day, 2);

      if (dtend == 14)
        dtend -= 6;
    }
    else
    {
      output.reset();
      return false;
    }
  }
  else if (datesepct == 2)
  {
    uint32_t numread = readDecimal(ptr, year);

    if (numread == 2)
    {
      // special handling if we read a 2-byte year
      year += 2000;

      if (year > 2069)
        year -= 100;
    }

    ++ptr;  // skip one separator
    readDecimal(ptr, mon);
    ++ptr;                  // skip one separator
    readDecimal(ptr, day);  // skip two separators
  }
  else
  {
    output.reset();
    return false;
  }

  if (!isDateValid(day, mon, year))
  {
    output.reset();
    return false;
  }

  output.year = year;
  output.month = mon;
  output.day = day;

  /**
   *  Now we need to deal with the time portion.
   *  The rules are:
   *      - Time portion may be empty
   *      - Time portion may start with 'T'
   *      - Time portion always ends with '\0'
   *      - Time portion always starts with hour
   *      - Without time separators (':'):
   *            HHMMSS
   *      - All Times can end with option .[microseconds]
   *      - With time separators there are no specific field length
   *        requirements
   */
  while (input[dtend] == ' ' && dtend < input.length())
  {
    ++dtend;
  }

  if (dtend == input.length())
  {
    isDate = true;
    return true;
  }

  uint32_t timesep_ct = 0;
  bool has_usec = false;
  uint32_t len_before_msec = 0;
  uint32_t tmstart = (input[dtend] == ' ' || input[dtend] == 'T') ? dtend + 1 : dtend;
  uint32_t tmend = tmstart;

  for (; tmend < input.length(); ++tmend)
  {
    char c = input[tmend];

    if (isdigit(c))
    {
      // digits always ok
      continue;
    }
    //		else if( c == ':' )
    //		{
    //			timesep_ct++;
    //		}
    //		else if( c == '.' )
    //		{
    //			len_before_msec = ( tmend - tmstart );
    //			has_usec = true;
    //		}
    else if (ispunct(c))
    {
      if (c == '.' && timesep_ct == 2)
      {
        len_before_msec = (tmend - tmstart);
        has_usec = true;
      }
      else
      {
        timesep_ct++;
      }
    }
    else
    {
      // some other character showed up
      output.reset();
      return false;
    }
  }

  if (!len_before_msec)
    len_before_msec = (tmend - tmstart);

  int32_t hour = -1;
  int32_t min = 0;
  int32_t sec = 0;
  int32_t usec = 0;
  const char* tstart = input.c_str() + tmstart;

  if (timesep_ct == 2)
  {
    readDecimal(tstart, hour);
    ++tstart;  // skip one separator
    readDecimal(tstart, min);
    ++tstart;  // skip one separator
    readDecimal(tstart, sec);
  }
  else if (timesep_ct == 1)
  {
    readDecimal(tstart, hour);
    ++tstart;  // skip one separator
    readDecimal(tstart, min);
  }
  else if (timesep_ct == 0 && len_before_msec == 6)
  {
    readDecimal(tstart, hour, 2);
    readDecimal(tstart, min, 2);
    readDecimal(tstart, sec, 2);
  }
  else if (timesep_ct == 0 && len_before_msec == 4)
  {
    readDecimal(tstart, hour, 2);
    readDecimal(tstart, min, 2);
  }
  else if (timesep_ct == 0 && len_before_msec == 2)
  {
    readDecimal(tstart, hour, 2);
  }
  else
  {
    output.reset();
    return false;
  }

  if (has_usec)
  {
    ++tstart;  // skip '.' character.  We could error check if we wanted to
    uint32_t numread = readDecimal(tstart, usec);

    if (numread > 6 || numread < 1)
    {
      // don't allow more than 6 digits when specifying microseconds
      output.reset();
      return false;
    }

    // usec have to be scaled up so that it always represents microseconds
    for (int i = numread; i < 6; i++)
      usec *= 10;
  }

  if (!isDateTimeValid(hour, min, sec, usec))
  {
    output.reset();
    return false;
  }

  output.hour = hour;
  output.minute = min;
  output.second = sec;
  output.msecond = usec;
  isDate = false;
  return true;
}

bool mysql_str_to_time(const string& input, Time& output, long decimals)
{
  uint32_t dtend = 0;
  bool isNeg = false;

  /**
   *  We need to deal with the time portion.
   *  The rules are:
   *      - Time portion always ends with '\0'
   *      - Time portion always starts with hour
   *      - Without time separators (':'):
   *            HHMMSS
   *      - All Times can end with option .[microseconds]
   *      - With time separators there are no specific field length
   *        requirements
   */
  while (input[dtend] == ' ' && dtend < input.length())
  {
    ++dtend;
  }

  if (dtend == input.length())
  {
    return false;
  }

  uint32_t timesep_ct = 0;
  bool has_usec = false;
  uint32_t len_before_msec = 0;
  uint32_t tmstart = dtend;
  uint32_t tmend = tmstart;

  for (; tmend < input.length(); ++tmend)
  {
    char c = input[tmend];

    if (isdigit(c))
    {
      // digits always ok
      continue;
    }
    //		else if( c == ':' )
    //		{
    //			timesep_ct++;
    //		}
    //		else if( c == '.' )
    //		{
    //			len_before_msec = ( tmend - tmstart );
    //			has_usec = true;
    //		}
    else if (ispunct(c))
    {
      if (c == '.' && timesep_ct == 2)
      {
        len_before_msec = (tmend - tmstart);
        has_usec = true;
      }
      else if (c == '-' && (tmend == tmstart))
      {
        isNeg = true;
        ++tmstart;
      }
      else
      {
        timesep_ct++;
      }
    }
    else
    {
      // some other character showed up
      output.reset();
      return false;
    }
  }

  if (!len_before_msec)
    len_before_msec = (tmend - tmstart);

  int32_t hour = -1;
  int32_t min = 0;
  int32_t sec = 0;
  int32_t usec = 0;
  const char* tstart = input.c_str() + tmstart;

  if (timesep_ct == 2)
  {
    readDecimal(tstart, hour);
    ++tstart;  // skip one separator
    readDecimal(tstart, min);
    ++tstart;  // skip one separator
    readDecimal(tstart, sec);
  }
  else if (timesep_ct == 1)
  {
    readDecimal(tstart, hour);
    ++tstart;  // skip one separator
    readDecimal(tstart, min);
  }
  else if (timesep_ct == 0 && len_before_msec == 6)
  {
    readDecimal(tstart, hour, 2);
    readDecimal(tstart, min, 2);
    readDecimal(tstart, sec, 2);
  }
  else if (timesep_ct == 0 && len_before_msec == 4)
  {
    readDecimal(tstart, hour, 2);
    readDecimal(tstart, min, 2);
  }
  else if (timesep_ct == 0 && len_before_msec == 2)
  {
    readDecimal(tstart, hour, 2);
  }
  else
  {
    output.reset();
    return false;
  }

  if (has_usec)
  {
    ++tstart;  // skip '.' character.  We could error check if we wanted to
    uint32_t numread = readDecimal(tstart, usec);

    if (numread > 6 || numread < 1)
    {
      // don't allow more than 6 digits when specifying microseconds
      output.reset();
      return false;
    }

    // usec have to be scaled up so that it always represents microseconds
    for (int i = numread; i < 6; i++)
      usec *= 10;
  }

  if (!isTimeValid(hour, min, sec, usec))
  {
    // Emulate MariaDB's time saturation
    // TODO: msec saturation
    if ((hour > 838) && !isNeg)
    {
      output.hour = 838;
      output.minute = 59;
      output.second = 59;
      output.msecond = exp10(decimals) - 1;
      output.is_neg = 0;
    }
    else if ((hour < -838) || ((hour > 838) && isNeg))
    {
      output.hour = -838;
      output.minute = 59;
      output.second = 59;
      output.msecond = exp10(decimals) - 1;
      output.is_neg = -1;
    }
    // If neither of the above match then we return a 0 time
    else
    {
      output.reset();
    }

    return false;
  }

  output.hour = isNeg ? 0 - hour : hour;
  output.minute = min;
  output.second = sec;
  output.msecond = usec;
  output.is_neg = isNeg;
  return true;
}

bool stringToDateStruct(const string& data, Date& date)
{
  bool isDate;
  DateTime dt;

  if (!mysql_str_to_datetime(data, dt, isDate))
    return false;

  date.year = dt.year;
  date.month = dt.month;
  date.day = dt.day;
  return true;
}

bool stringToDatetimeStruct(const string& data, DateTime& dtime, bool* date)
{
  bool isDate;

  if (!mysql_str_to_datetime(data, dtime, isDate))
    return false;

  if (isDate)
  {
    if (date)
      *date = true;

    dtime.hour = 0;
    dtime.minute = 0;
    dtime.second = 0;
    dtime.msecond = 0;
  }

  return true;
}

bool stringToTimeStruct(const string& data, Time& dtime, long decimals)
{
  if (!mysql_str_to_time(data, dtime, decimals))
    return false;

  return true;
}

bool stringToTimestampStruct(const string& data, TimeStamp& timeStamp, long timeZone)
{
  // special handling for 0000-00-00 00:00:00
  // "0" is sent by the server when checking for default value
  // in the DDL. This is equivalent of 0000-00-00 00:00:00
  if (data.substr(0, 19) == "0000-00-00 00:00:00" || data == "0")
  {
    timeStamp.second = 0;
    timeStamp.msecond = 0;
    return true;
  }

  // for alter table add column <columnname> timestamp,
  // if the table is non-empty, then columnstore will apply
  // default value to populate the new column
  if (data == "current_timestamp() ON UPDATE current_timestamp()")
  {
    struct timeval tv;
    gettimeofday(&tv, 0);
    timeStamp.second = tv.tv_sec;
    timeStamp.msecond = tv.tv_usec;
    return true;
  }

  bool isDate;

  DateTime dtime;

  if (!mysql_str_to_datetime(data, dtime, isDate))
  {
    timeStamp.reset();
    return false;
  }

  if (isDate)
  {
    dtime.hour = 0;
    dtime.minute = 0;
    dtime.second = 0;
    dtime.msecond = 0;
  }

  MySQLTime m_time;
  m_time.year = dtime.year;
  m_time.month = dtime.month;
  m_time.day = dtime.day;
  m_time.hour = dtime.hour;
  m_time.minute = dtime.minute;
  m_time.second = dtime.second;
  m_time.second_part = dtime.msecond;

  bool isValid = true;
  int64_t seconds = mySQLTimeToGmtSec(m_time, timeZone, isValid);

  if (!isValid)
  {
    timeStamp.reset();
    return false;
  }

  timeStamp.second = seconds;
  timeStamp.msecond = m_time.second_part;

  return true;
}

boost::any DataConvert::StringToBit(const datatypes::SystemCatalog::TypeAttributesStd& colType,
                                    const datatypes::ConvertFromStringParam& prm, const std::string& dataOrig,
                                    bool& pushWarning)
{
  std::string data(dataOrig);
  unsigned int x = data.find("(");

  if (x <= data.length())
  {
    data.replace(x, 1, " ");
  }

  x = data.find(")");

  if (x <= data.length())
  {
    data.replace(x, 1, " ");
  }

  int64_t tmp = 0;

  number_int_value(data, datatypes::SystemCatalog::BIT, colType, pushWarning, prm.noRoundup(), tmp);

  if (tmp)
  {
    bool bitvalue;

    if (from_string<bool>(bitvalue, data, std::dec))
    {
      boost::any value = bitvalue;
      return value;
    }
    else
    {
      throw QueryDataExcept("range, valid value or conversion error on BIT type.", formatErr);
    }
  }
  return boost::any();
}

boost::any DataConvert::StringToSDecimal(const datatypes::SystemCatalog::TypeAttributesStd& colType,
                                         const datatypes::ConvertFromStringParam& prm,
                                         const std::string& data, bool& pushWarning)
{
  const cscDataType typeCode = datatypes::SystemCatalog::DECIMAL;
  if (LIKELY(colType.colWidth == 16))
  {
    int128_t val128;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val128);
    boost::any value = (int128_t)val128;
    return value;
  }
  else if (colType.colWidth == 8)
  {
    int64_t val64;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val64);
    boost::any value = (long long)val64;
    return value;
  }
  else if (colType.colWidth == 4)
  {
    int64_t val64;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val64);
    boost::any value = (int)val64;
    return value;
  }
  else if (colType.colWidth == 2)
  {
    int64_t val64;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val64);
    boost::any value = (short)val64;
    return value;
  }
  else if (colType.colWidth == 1)
  {
    int64_t val64;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val64);
    boost::any value = (char)val64;
    return value;
  }
  // else if (colType.colWidth == 32)
  //    value = data;
  return boost::any();
}

boost::any DataConvert::StringToUDecimal(const datatypes::SystemCatalog::TypeAttributesStd& colType,
                                         const datatypes::ConvertFromStringParam& prm,
                                         const std::string& data, bool& pushWarning)
{
  const cscDataType typeCode = datatypes::SystemCatalog::UDECIMAL;

  // UDECIMAL numbers may not be negative
  if (LIKELY(colType.colWidth == 16))
  {
    int128_t val128;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val128);

    if (val128 < 0 && !datatypes::Decimal::isWideDecimalNullValue(val128) &&
        !datatypes::Decimal::isWideDecimalEmptyValue(val128))
    {
      val128 = 0;
      pushWarning = true;
    }

    boost::any value = val128;
    return value;
  }
  else if (colType.colWidth == 8)
  {
    int64_t val64;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val64);
    long long ival = static_cast<long long>(val64);

    if (ival < 0 && ival != static_cast<long long>(joblist::BIGINTEMPTYROW) &&
        ival != static_cast<long long>(joblist::BIGINTNULL))
    {
      ival = 0;
      pushWarning = true;
    }

    boost::any value = ival;
    return value;
  }
  else if (colType.colWidth == 4)
  {
    int64_t val64;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val64);
    int ival = static_cast<int>(val64);

    if (ival < 0 && ival != static_cast<int>(joblist::INTEMPTYROW) &&
        ival != static_cast<int>(joblist::INTNULL))
    {
      ival = 0;
      pushWarning = true;
    }

    boost::any value = ival;
    return value;
  }
  else if (colType.colWidth == 2)
  {
    int64_t val64;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val64);
    short ival = (short)val64;

    if (ival < 0 && ival != static_cast<int16_t>(joblist::SMALLINTEMPTYROW) &&
        ival != static_cast<int16_t>(joblist::SMALLINTNULL))
    {
      ival = 0;
      pushWarning = true;
    }

    boost::any value = ival;
    return value;
  }
  else if (colType.colWidth == 1)
  {
    int64_t val64;
    number_int_value(data, typeCode, colType, pushWarning, prm.noRoundup(), val64);
    signed char ival = (signed char)val64;

    if (ival < 0 && ival != static_cast<int8_t>(joblist::TINYINTEMPTYROW) &&
        ival != static_cast<int8_t>(joblist::TINYINTNULL))
    {
      ival = 0;
      pushWarning = true;
    }

    boost::any value = ival;
    return value;
  }
  return boost::any();
}

boost::any DataConvert::StringToFloat(cscDataType typeCode, const std::string& dataOrig, bool& pushWarning)
{
  boost::any value;
  std::string data(dataOrig);

  string::size_type x = data.find('(');

  if (x < string::npos)
    data.erase(x, 1);

  x = data.find(')');

  if (x < string::npos)
    data.erase(x, 1);

  if (number_value(data))
  {
    float floatvalue;
    errno = 0;
    floatvalue = strtof(data.c_str(), 0);

    if (errno == ERANGE)
    {
      pushWarning = true;
      if (abs(floatvalue) == HUGE_VALF)
      {
        if (floatvalue > 0)
          floatvalue = MAX_FLOAT;
        else
          floatvalue = MIN_FLOAT;
      }
      else
        floatvalue = 0;
    }

    if (floatvalue < 0.0 && typeCode == datatypes::SystemCatalog::UFLOAT &&
        floatvalue != static_cast<float>(joblist::FLOATEMPTYROW) &&
        floatvalue != static_cast<float>(joblist::FLOATNULL))
    {
      value = 0.0;  // QQ: should it assign floatvalue?
      pushWarning = true;
    }

    value = floatvalue;
  }
  else
    throw QueryDataExcept("range, valid value or conversion error on FLOAT type.", formatErr);
  return value;
}

boost::any DataConvert::StringToDouble(cscDataType typeCode, const std::string& dataOrig, bool& pushWarning)
{
  boost::any value;
  std::string data(dataOrig);

  string::size_type x = data.find('(');

  if (x < string::npos)
    data.erase(x, 1);

  x = data.find(')');

  if (x < string::npos)
    data.erase(x, 1);

  if (number_value(data))
  {
    double doublevalue;
    errno = 0;
    doublevalue = strtod(data.c_str(), 0);

    if (errno == ERANGE)
    {
      pushWarning = true;
      if (abs(doublevalue) == HUGE_VALL)
      {
        if (doublevalue > 0)
          value = MAX_DOUBLE;
        else
          value = MIN_DOUBLE;
      }
      else
        value = 0;
    }
    else
      value = doublevalue;

    if (doublevalue < 0.0 && typeCode == datatypes::SystemCatalog::UDOUBLE &&
        doublevalue != static_cast<double>(joblist::DOUBLEEMPTYROW) &&
        doublevalue != static_cast<double>(joblist::DOUBLENULL))
    {
      doublevalue = 0.0;  // QQ: should it assign "value" ?
      pushWarning = true;
    }
  }
  else
  {
    throw QueryDataExcept("range, valid value or conversion error on DOUBLE type.", formatErr);
  }
  return value;
}

boost::any DataConvert::StringToString(const datatypes::SystemCatalog::TypeAttributesStd& colType,
                                       const std::string& dataOrig, bool& pushWarning)

{
  std::string data(dataOrig);
  // check data length
  if (data.length() > (unsigned int)colType.colWidth)
  {
    // TODO: charsetNumber should be moved to TypeStdAttributes ASAP
    const execplan::CalpontSystemCatalog::ColType& colType2 =
        static_cast<const execplan::CalpontSystemCatalog::ColType&>(colType);
    datatypes::Charset cs(colType2.charsetNumber);
    const char* newEnd = data.data() + colType.colWidth;
    const char* origEnd = data.data() + data.length();
    pushWarning = cs.test_if_important_data(newEnd, origEnd);
    data = data.substr(0, colType.colWidth);
    boost::any value = data;
    return value;
  }
  if ((unsigned int)colType.colWidth > data.length())
  {
    // Pad null character to the string
    data.resize(colType.colWidth, 0);
  }
  boost::any value = data;
  return value;
}

boost::any DataConvert::StringToDate(const std::string& data, bool& pushWarning)
{
  Date aDay;

  if (stringToDateStruct(data, aDay))
  {
    boost::any value = getUInt32LE((const char*)&aDay);
    return value;
  }
  boost::any value = (uint32_t)0;
  pushWarning = true;
  return value;
}

boost::any DataConvert::StringToDatetime(const std::string& data, bool& pushWarning)
{
  DateTime aDatetime;

  if (stringToDatetimeStruct(data, aDatetime, 0))  // QQ: why 0?
  {
    boost::any value = getUInt64LE((const char*)&aDatetime);
    return value;
  }
  boost::any value = (uint64_t)0;
  pushWarning = true;
  return value;
}

boost::any DataConvert::StringToTime(const datatypes::SystemCatalog::TypeAttributesStd& colType,
                                     const std::string& data, bool& pushWarning)
{
  Time aTime;

  if (!stringToTimeStruct(data, aTime, colType.precision))
  {
    pushWarning = true;
  }

  boost::any value = getSInt64LE((const char*)&aTime);
  return value;
}

boost::any DataConvert::StringToTimestamp(const datatypes::ConvertFromStringParam& prm,
                                          const std::string& data, bool& pushWarning)
{
  TimeStamp aTimestamp;

  if (!stringToTimestampStruct(data, aTimestamp, prm.timeZone()))
  {
    pushWarning = true;
  }

  boost::any value = getUInt64LE((const char*)&aTimestamp);
  return value;
}

//------------------------------------------------------------------------------
// Convert date string to binary date.  Used by BulkLoad.
//------------------------------------------------------------------------------
int32_t DataConvert::convertColumnDate(const char* dataOrg, CalpontDateTimeFormat dateFormat, int& status,
                                       unsigned int dataOrgLen)
{
  status = 0;
  const char* p;
  p = dataOrg;
  char fld[10];
  int32_t value = 0;

  if (dateFormat != CALPONTDATE_ENUM)
  {
    status = -1;
    return value;
  }

  // @bug 5787: allow for leading blanks
  unsigned int dataLen = dataOrgLen;

  if ((dataOrgLen > 0) && (dataOrg[0] == ' '))
  {
    unsigned nblanks = 0;

    for (unsigned nn = 0; nn < dataOrgLen; nn++)
    {
      if (dataOrg[nn] == ' ')
        nblanks++;
      else
        break;
    }

    p = dataOrg + nblanks;
    dataLen = dataOrgLen - nblanks;
  }

  if (dataLen < 10)
  {
    status = -1;
    return value;
  }

  int inYear, inMonth, inDay;
  memcpy(fld, p, 4);
  fld[4] = '\0';

  inYear = strtol(fld, 0, 10);

  memcpy(fld, p + 5, 2);
  fld[2] = '\0';

  inMonth = strtol(fld, 0, 10);

  memcpy(fld, p + 8, 2);
  fld[2] = '\0';

  inDay = strtol(fld, 0, 10);

  if (isDateValid(inDay, inMonth, inYear))
  {
    Date aDay;
    aDay.year = inYear;
    aDay.month = inMonth;
    aDay.day = inDay;
    memcpy(&value, &aDay, 4);
  }
  else
  {
    status = -1;
  }

  return value;
}

//------------------------------------------------------------------------------
// Verify that specified date is valid
//------------------------------------------------------------------------------
bool DataConvert::isColumnDateValid(int32_t date)
{
  Date d;
  void* dp = static_cast<void*>(&d);
  memcpy(dp, &date, sizeof(int32_t));
  return (isDateValid(d.day, d.month, d.year));
}

//------------------------------------------------------------------------------
// Convert date/time string to binary date/time.  Used by BulkLoad.
//------------------------------------------------------------------------------
int64_t DataConvert::convertColumnDatetime(const char* dataOrg, CalpontDateTimeFormat datetimeFormat,
                                           int& status, unsigned int dataOrgLen)
{
  status = 0;
  const char* p;
  p = dataOrg;
  char fld[10];
  int64_t value = 0;

  if (datetimeFormat != CALPONTDATETIME_ENUM)
  {
    status = -1;
    return value;
  }

  // @bug 5787: allow for leading blanks
  unsigned int dataLen = dataOrgLen;

  if ((dataOrgLen > 0) && (dataOrg[0] == ' '))
  {
    unsigned nblanks = 0;

    for (unsigned nn = 0; nn < dataOrgLen; nn++)
    {
      if (dataOrg[nn] == ' ')
        nblanks++;
      else
        break;
    }

    p = dataOrg + nblanks;
    dataLen = dataOrgLen - nblanks;
  }

  if (dataLen < 10)
  {
    status = -1;
    return value;
  }

  int inYear, inMonth, inDay, inHour, inMinute, inSecond, inMicrosecond;
  memcpy(fld, p, 4);
  fld[4] = '\0';

  inYear = strtol(fld, 0, 10);

  memcpy(fld, p + 5, 2);
  fld[2] = '\0';

  inMonth = strtol(fld, 0, 10);

  memcpy(fld, p + 8, 2);
  fld[2] = '\0';

  inDay = strtol(fld, 0, 10);

  inHour = 0;
  inMinute = 0;
  inSecond = 0;
  inMicrosecond = 0;

  if (dataLen > 12)
  {
    // For backwards compatability we still allow leading blank
    if ((!isdigit(p[11]) && (p[11] != ' ')) || !isdigit(p[12]))
    {
      status = -1;
      return value;
    }

    memcpy(fld, p + 11, 2);
    fld[2] = '\0';

    inHour = strtol(fld, 0, 10);

    if (dataLen > 15)
    {
      if (!isdigit(p[14]) || !isdigit(p[15]))
      {
        status = -1;
        return value;
      }

      memcpy(fld, p + 14, 2);
      fld[2] = '\0';

      inMinute = strtol(fld, 0, 10);

      if (dataLen > 18)
      {
        if (!isdigit(p[17]) || !isdigit(p[18]))
        {
          status = -1;
          return value;
        }

        memcpy(fld, p + 17, 2);
        fld[2] = '\0';

        inSecond = strtol(fld, 0, 10);

        if (dataLen > 20)
        {
          unsigned int microFldLen = dataLen - 20;

          if (microFldLen > (sizeof(fld) - 1))
            microFldLen = sizeof(fld) - 1;

          memcpy(fld, p + 20, microFldLen);
          fld[microFldLen] = '\0';
          inMicrosecond = strtol(fld, 0, 10);
        }
      }
    }
  }

  if (isDateValid(inDay, inMonth, inYear) && isDateTimeValid(inHour, inMinute, inSecond, inMicrosecond))
  {
    DateTime aDatetime;
    aDatetime.year = inYear;
    aDatetime.month = inMonth;
    aDatetime.day = inDay;
    aDatetime.hour = inHour;
    aDatetime.minute = inMinute;
    aDatetime.second = inSecond;
    aDatetime.msecond = inMicrosecond;

    memcpy(&value, &aDatetime, 8);
  }
  else
  {
    status = -1;
  }

  return value;
}

//------------------------------------------------------------------------------
// Convert timestamp string to binary timestamp.  Used by BulkLoad.
// Most of this code is taken from DataConvert::convertColumnDatetime
//------------------------------------------------------------------------------
int64_t DataConvert::convertColumnTimestamp(const char* dataOrg, CalpontDateTimeFormat datetimeFormat,
                                            int& status, unsigned int dataOrgLen, long timeZone)
{
  char tmbuf[64];
  std::string dataOrgTemp = dataOrg;
  status = 0;
  if (dataOrgTemp.substr(0, 19) == "0000-00-00 00:00:00")
  {
    return 0;
  }

  // this is the default value of the first timestamp field in a table,
  // which is stored in the system catalog
  if (strcmp(dataOrg, "current_timestamp() ON UPDATE current_timestamp()") == 0)
  {
    struct timeval tv;
    gettimeofday(&tv, 0);
    MySQLTime time;
    gmtSecToMySQLTime(tv.tv_sec, time, timeZone);
    sprintf(tmbuf, "%04d-%02d-%02d %02d:%02d:%02d.%06ld", time.year, time.month, time.day, time.hour,
            time.minute, time.second, tv.tv_usec);
    dataOrg = tmbuf;
    dataOrgLen = strlen(tmbuf);
  }

  const char* p;
  p = dataOrg;
  char fld[10];
  int64_t value = 0;

  if (datetimeFormat != CALPONTDATETIME_ENUM)
  {
    status = -1;
    return value;
  }

  unsigned int dataLen = dataOrgLen;

  if ((dataOrgLen > 0) && (dataOrg[0] == ' '))
  {
    unsigned nblanks = 0;

    for (unsigned nn = 0; nn < dataOrgLen; nn++)
    {
      if (dataOrg[nn] == ' ')
        nblanks++;
      else
        break;
    }

    p = dataOrg + nblanks;
    dataLen = dataOrgLen - nblanks;
  }

  if (dataLen < 10)
  {
    status = -1;
    return value;
  }

  int inYear, inMonth, inDay, inHour, inMinute, inSecond, inMicrosecond;
  memcpy(fld, p, 4);
  fld[4] = '\0';

  inYear = strtol(fld, 0, 10);

  memcpy(fld, p + 5, 2);
  fld[2] = '\0';

  inMonth = strtol(fld, 0, 10);

  memcpy(fld, p + 8, 2);
  fld[2] = '\0';

  inDay = strtol(fld, 0, 10);

  inHour = 0;
  inMinute = 0;
  inSecond = 0;
  inMicrosecond = 0;

  if (dataLen > 12)
  {
    // For backwards compatability we still allow leading blank
    if ((!isdigit(p[11]) && (p[11] != ' ')) || !isdigit(p[12]))
    {
      status = -1;
      return value;
    }

    memcpy(fld, p + 11, 2);
    fld[2] = '\0';

    inHour = strtol(fld, 0, 10);

    if (dataLen > 15)
    {
      if (!isdigit(p[14]) || !isdigit(p[15]))
      {
        status = -1;
        return value;
      }

      memcpy(fld, p + 14, 2);
      fld[2] = '\0';

      inMinute = strtol(fld, 0, 10);

      if (dataLen > 18)
      {
        if (!isdigit(p[17]) || !isdigit(p[18]))
        {
          status = -1;
          return value;
        }

        memcpy(fld, p + 17, 2);
        fld[2] = '\0';

        inSecond = strtol(fld, 0, 10);

        if (dataLen > 20)
        {
          unsigned int microFldLen = dataLen - 20;

          if (microFldLen > (sizeof(fld) - 1))
            microFldLen = sizeof(fld) - 1;

          memcpy(fld, p + 20, microFldLen);
          fld[microFldLen] = '\0';
          inMicrosecond = strtol(fld, 0, 10);
        }
      }
    }
  }

  if (isDateValid(inDay, inMonth, inYear) && isDateTimeValid(inHour, inMinute, inSecond, inMicrosecond))
  {
    MySQLTime m_time;
    m_time.year = inYear;
    m_time.month = inMonth;
    m_time.day = inDay;
    m_time.hour = inHour;
    m_time.minute = inMinute;
    m_time.second = inSecond;
    m_time.second_part = inMicrosecond;

    bool isValid = true;
    int64_t seconds = mySQLTimeToGmtSec(m_time, timeZone, isValid);

    if (!isValid)
    {
      status = -1;
      return value;
    }

    TimeStamp timestamp;
    timestamp.second = seconds;
    timestamp.msecond = m_time.second_part;

    memcpy(&value, &timestamp, 8);
  }
  else
  {
    status = -1;
  }

  return value;
}

//------------------------------------------------------------------------------
// Convert time string to binary time.  Used by BulkLoad.
// Most of this is taken from str_to_time in sql-common/my_time.c
//------------------------------------------------------------------------------
int64_t DataConvert::convertColumnTime(const char* dataOrg, CalpontDateTimeFormat datetimeFormat, int& status,
                                       unsigned int dataOrgLen)
{
  status = 0;
  char* p;
  char* retp = NULL;
  char* savePoint = NULL;
  p = const_cast<char*>(dataOrg);
  int64_t value = 0;
  int inHour, inMinute, inSecond, inMicrosecond;
  inHour = 0;
  inMinute = 0;
  inSecond = 0;
  inMicrosecond = 0;
  bool isNeg = false;

  if (datetimeFormat != CALPONTTIME_ENUM)
  {
    status = -1;
    return value;
  }

  if (dataOrgLen == 0)
  {
    return value;
  }

  if (dataOrgLen < 3)
  {
    // Not enough chars to be a time
    status = -1;
    return value;
  }

  if (p[0] == '-')
  {
    isNeg = true;
  }

  errno = 0;

  p = strtok_r(p, ":.", &savePoint);
  inHour = strtol(p, &retp, 10);

  if (errno || !retp)
  {
    status = -1;
    return value;
  }

  p = strtok_r(NULL, ":.", &savePoint);

  if (p == NULL)
  {
    status = -1;
    return value;
  }

  inMinute = strtol(p, &retp, 10);

  if (errno || !retp)
  {
    status = -1;
    return value;
  }

  p = strtok_r(NULL, ":.", &savePoint);

  if (p == NULL)
  {
    status = -1;
    return value;
  }

  inSecond = strtol(p, &retp, 10);

  if (errno || !retp)
  {
    status = -1;
    return value;
  }

  p = strtok_r(NULL, ":.", &savePoint);

  if (p != NULL)
  {
    inMicrosecond = strtol(p, &retp, 10);

    if (errno || !retp)
    {
      status = -1;
      return value;
    }
  }

  if (isTimeValid(inHour, inMinute, inSecond, inMicrosecond))
  {
    Time atime;
    atime.hour = inHour;
    atime.minute = inMinute;
    atime.second = inSecond;
    atime.msecond = inMicrosecond;
    atime.is_neg = isNeg;

    memcpy(&value, &atime, 8);
  }
  else
  {
    // Emulate MariaDB's time saturation
    if (inHour > 838)
    {
      Time atime;
      atime.hour = 838;
      atime.minute = 59;
      atime.second = 59;
      atime.msecond = 999999;
      atime.is_neg = false;
      memcpy(&value, &atime, 8);
    }
    else if (inHour < -838)
    {
      Time atime;
      atime.hour = -838;
      atime.minute = 59;
      atime.second = 59;
      atime.msecond = 999999;
      atime.is_neg = false;
      memcpy(&value, &atime, 8);
    }

    // If neither of the above match then we return a 0 time

    status = -1;
  }

  return value;
}

//------------------------------------------------------------------------------
// Verify that specified datetime is valid
//------------------------------------------------------------------------------
bool DataConvert::isColumnDateTimeValid(int64_t dateTime)
{
  DateTime dt;
  void* dtp = static_cast<void*>(&dt);
  memcpy(dtp, &dateTime, sizeof(uint64_t));

  if (isDateValid(dt.day, dt.month, dt.year))
    return isDateTimeValid(dt.hour, dt.minute, dt.second, dt.msecond);

  return false;
}

bool DataConvert::isColumnTimeValid(int64_t time)
{
  Time dt;
  void* dtp = static_cast<void*>(&dt);
  memcpy(dtp, &time, sizeof(uint64_t));

  return isTimeValid(dt.hour, dt.minute, dt.second, dt.msecond);
}

bool DataConvert::isColumnTimeStampValid(int64_t timeStamp)
{
  TimeStamp dt;
  void* dtp = static_cast<void*>(&dt);
  memcpy(dtp, &timeStamp, sizeof(uint64_t));

  return isTimestampValid(dt.second, dt.msecond);
}

std::string DataConvert::dateToString(int datevalue)
{
  // @bug 4703 abandon multiple ostringstream's for conversion
  Date d(datevalue);
  const int DATETOSTRING_LEN = 12;  // YYYY-MM-DD\0
  char buf[DATETOSTRING_LEN];

  sprintf(buf, "%04d-%02d-%02d", d.year, d.month, d.day);
  return buf;
}

std::string DataConvert::datetimeToString(long long datetimevalue, long decimals)
{
  // 10 is default which means we don't need microseconds
  if (decimals > 6 || decimals < 0)
  {
    decimals = 0;
  }

  // @bug 4703 abandon multiple ostringstream's for conversion
  DateTime dt(datetimevalue);
  const int DATETIMETOSTRING_LEN = 28;  // YYYY-MM-DD HH:MM:SS.mmmmmm\0
  char buf[DATETIMETOSTRING_LEN];

  sprintf(buf, "%04d-%02d-%02d %02d:%02d:%02d", dt.year, dt.month, dt.day, dt.hour, dt.minute, dt.second);

  if (dt.msecond && decimals)
  {
    // Pad start with zeros
    sprintf(buf + strlen(buf), ".%0*d", (int)decimals, dt.msecond);
  }

  return buf;
}

std::string DataConvert::timestampToString(long long timestampvalue, long timezone, long decimals)
{
  // 10 is default which means we don't need microseconds
  if (decimals > 6 || decimals < 0)
  {
    decimals = 0;
  }

  TimeStamp timestamp(timestampvalue);
  int64_t seconds = timestamp.second;

  MySQLTime time;
  gmtSecToMySQLTime(seconds, time, timezone);

  const int TIMESTAMPTOSTRING_LEN = 28;  // YYYY-MM-DD HH:MM:SS.mmmmmm\0
  char buf[TIMESTAMPTOSTRING_LEN];

  sprintf(buf, "%04d-%02d-%02d %02d:%02d:%02d", time.year, time.month, time.day, time.hour, time.minute,
          time.second);

  if (timestamp.msecond && decimals)
  {
    // Pad start with zeros
    sprintf(buf + strlen(buf), ".%0*d", (int)decimals, timestamp.msecond);
  }

  return buf;
}

std::string DataConvert::timeToString(long long timevalue, long decimals)
{
  // 10 is default which means we don't need microseconds
  if (decimals > 6 || decimals < 0)
  {
    decimals = 0;
  }

  // @bug 4703 abandon multiple ostringstream's for conversion
  Time dt(timevalue);
  const int TIMETOSTRING_LEN = 19;  // (-H)HH:MM:SS.mmmmmm\0
  char buf[TIMETOSTRING_LEN];
  char* outbuf = buf;

  if ((dt.hour >= 0) && dt.is_neg)
  {
    outbuf[0] = '-';
    outbuf++;
  }

  sprintf(outbuf, "%02d:%02d:%02d", dt.hour, dt.minute, dt.second);

  if (dt.msecond && decimals)
  {
    // Pad start with zeros
    sprintf(buf + strlen(buf), ".%0*d", (int)decimals, dt.msecond);
  }

  return buf;
}

std::string DataConvert::dateToString1(int datevalue)
{
  // @bug 4703 abandon multiple ostringstream's for conversion
  Date d(datevalue);
  const int DATETOSTRING1_LEN = 10;  // YYYYMMDD\0
  char buf[DATETOSTRING1_LEN];

  sprintf(buf, "%04d%02d%02d", d.year, d.month, d.day);
  return buf;
}

std::string DataConvert::datetimeToString1(long long datetimevalue)
{
  // @bug 4703 abandon multiple ostringstream's for conversion
  DateTime dt(datetimevalue);
  // Interesting, gcc 7 says the sprintf below generates between 21 and 23 bytes of output.
  const int DATETIMETOSTRING1_LEN = 23;  // YYYYMMDDHHMMSSmmmmmm\0
  char buf[DATETIMETOSTRING1_LEN];

  sprintf(buf, "%04d%02d%02d%02d%02d%02d%06d", dt.year, dt.month, dt.day, dt.hour, dt.minute, dt.second,
          dt.msecond);
  return buf;
}

std::string DataConvert::timestampToString1(long long timestampvalue, long timezone)
{
  const int TIMESTAMPTOSTRING1_LEN = 22;  // YYYYMMDDHHMMSSmmmmmm\0
  char buf[TIMESTAMPTOSTRING1_LEN];

  TimeStamp timestamp(timestampvalue);
  int64_t seconds = timestamp.second;
  MySQLTime time;
  gmtSecToMySQLTime(seconds, time, timezone);

  sprintf(buf, "%04d%02d%02d%02d%02d%02d%06d", time.year, time.month, time.day, time.hour, time.minute,
          time.second, timestamp.msecond);
  return buf;
}

std::string DataConvert::timeToString1(long long timevalue)
{
  // @bug 4703 abandon multiple ostringstream's for conversion
  Time t(timevalue);
  const int TIMETOSTRING1_LEN = 22;  // HHMMSSmmmmmm\0
  char buf[TIMETOSTRING1_LEN];

  char* outbuf = buf;

  sprintf(outbuf, "%02d%02d%02d%06d", t.hour, t.minute, t.second, t.msecond);
  return buf;
}

int64_t DataConvert::dateToInt(const string& date)
{
  return stringToDate(date);
}

int64_t DataConvert::dateToInt(const utils::NullString& date)
{
  return stringToDate(date);
}

int64_t DataConvert::datetimeToInt(const string& datetime)
{
  return stringToDatetime(datetime);
}

int64_t DataConvert::datetimeToInt(const utils::NullString& datetime)
{
  return stringToDatetime(datetime);
}

int64_t DataConvert::timestampToInt(const string& timestamp, long timeZone)
{
  return stringToTimestamp(timestamp, timeZone);
}

int64_t DataConvert::timeToInt(const string& time)
{
  return stringToTime(time);
}

int64_t DataConvert::stringToDate(const string& data)
{
  Date aDay;

  if (stringToDateStruct(data, aDay))
  {
    uint32_t temp = getUInt32LE((const char*)&aDay);
    return ((temp & 0xFFFFFFC0) | 0x3E);
  }
  else
    return -1;
}
int64_t DataConvert::stringToDate(const utils::NullString& data)
{
  if (data.isNull())
  {
    return -1;
  }

  return stringToDate(data.unsafeStringRef());
}

int64_t DataConvert::stringToDatetime(const string& data, bool* date)
{
  DateTime dtime;

  if (stringToDatetimeStruct(data, dtime, date))
    return getUInt64LE((const char*)&dtime);
  else
    return -1;
}

int64_t DataConvert::stringToDatetime(const utils::NullString& data, bool* date)
{
  if (data.isNull())
  {
    if (date)
    {
      *date = false;
    }
    return -1;
  }

  return stringToDatetime(data.unsafeStringRef(), date);
}

int64_t DataConvert::stringToTimestamp(const string& data, long timeZone)
{
  TimeStamp aTimestamp;

  if (stringToTimestampStruct(data, aTimestamp, timeZone))
    return getUInt64LE((const char*)&aTimestamp);
  else
    return -1;
}

int64_t DataConvert::stringToTimestamp(const utils::NullString& data, long timeZone)
{
  if (data.isNull())
  {
    return -1;
  }
  return stringToTimestamp(data.unsafeStringRef(), timeZone);
}

/* This is really painful and expensive b/c it seems the input is not normalized or
sanitized.  That should really be done on ingestion. */
int64_t DataConvert::intToDate(int64_t data)
{
  char buf[21] = {0};
  Date aday;

  if (data == 0)
  {
    aday.year = 0;
    aday.month = 0;
    aday.day = 0;
    return getUInt32LE((const char*)&aday);
  }

  // this snprintf call causes a compiler warning b/c we're potentially copying a 20-digit #
  // into 15 bytes, however, that appears to be intentional.
#if defined(__GNUC__) && __GNUC__ >= 7
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wformat-truncation="
  snprintf(buf, 15, "%llu", (long long unsigned int)data);
#pragma GCC diagnostic pop
#else
  snprintf(buf, 15, "%llu", (long long unsigned int)data);
#endif

  string year, month, day, hour, min, sec, msec;
  int64_t y = 0, m = 0, d = 0, h = 0, minute = 0, s = 0, ms = 0;

  switch (strlen(buf))
  {
    case 14:
      year = string(buf, 4);
      month = string(buf + 4, 2);
      day = string(buf + 6, 2);
      hour = string(buf + 8, 2);
      min = string(buf + 10, 2);
      sec = string(buf + 12, 2);
      msec = string(buf + 14, 6);
      break;

    case 12:
      year = string(buf, 2);
      month = string(buf + 2, 2);
      day = string(buf + 4, 2);
      hour = string(buf + 6, 2);
      min = string(buf + 8, 2);
      sec = string(buf + 10, 2);
      msec = string(buf + 12, 6);
      break;

    case 10:
      month = string(buf, 2);
      day = string(buf + 2, 2);
      hour = string(buf + 4, 2);
      min = string(buf + 6, 2);
      sec = string(buf + 8, 2);
      msec = string(buf + 10, 6);
      break;

    case 9:
      month = string(buf, 1);
      day = string(buf + 1, 2);
      hour = string(buf + 3, 2);
      min = string(buf + 5, 2);
      sec = string(buf + 7, 2);
      msec = string(buf + 9, 6);
      break;

    case 8:
      year = string(buf, 4);
      month = string(buf + 4, 2);
      day = string(buf + 6, 2);
      break;

    case 6:
      year = string(buf, 2);
      month = string(buf + 2, 2);
      day = string(buf + 4, 2);
      break;

    case 4:
      month = string(buf, 2);
      day = string(buf + 2, 2);
      break;

    case 3:
      month = string(buf, 1);
      day = string(buf + 1, 2);
      break;

    default: return -1;
  }

  if (year.empty())
  {
    // MMDD format. assume current year
    time_t calender_time;
    struct tm todays_date;
    calender_time = time(NULL);
    localtime_r(&calender_time, &todays_date);
    y = todays_date.tm_year + 1900;
  }
  else
  {
    y = atoi(year.c_str());
  }

  m = atoi(month.c_str());
  d = atoi(day.c_str());
  h = atoi(hour.c_str());
  minute = atoi(min.c_str());
  s = atoi(sec.c_str());
  ms = atoi(msec.c_str());

  // if (!isDateValid(d, m, y))
  //	return -1;
  if (!isDateValid(d, m, y) || !isDateTimeValid(h, minute, s, ms))
    return -1;

  aday.year = y;
  aday.month = m;
  aday.day = d;
  return getUInt32LE((const char*)&aday);
}

/* This is really painful and expensive b/c it seems the input is not normalized or
sanitized.  That should really be done on ingestion. */
int64_t DataConvert::intToDatetime(int64_t data, bool* date)
{
  bool isDate = false;
  char buf[21] = {0};
  DateTime adaytime;

  if (data == 0)
  {
    adaytime.year = 0;
    adaytime.month = 0;
    adaytime.day = 0;
    adaytime.hour = 0;
    adaytime.minute = 0;
    adaytime.second = 0;
    adaytime.msecond = 0;

    if (date)
      *date = true;

    return getUInt64LE((const char*)&adaytime);
  }

  // this snprintf call causes a compiler warning b/c we're potentially copying a 20-digit #
  // into 15 bytes, however, that appears to be intentional.
#if defined(__GNUC__) && __GNUC__ >= 7
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wformat-truncation="
  snprintf(buf, 15, "%llu", (long long unsigned int)data);
#pragma GCC diagnostic pop
#else
  snprintf(buf, 15, "%llu", (long long unsigned int)data);
#endif

  // string date = buf;
  string year, month, day, hour, min, sec, msec;
  int64_t y = 0, m = 0, d = 0, h = 0, minute = 0, s = 0, ms = 0;

  switch (strlen(buf))
  {
    case 14:
      year = string(buf, 4);
      month = string(buf + 4, 2);
      day = string(buf + 6, 2);
      hour = string(buf + 8, 2);
      min = string(buf + 10, 2);
      sec = string(buf + 12, 2);
      break;

    case 12:
      year = string(buf, 2);
      month = string(buf + 2, 2);
      day = string(buf + 4, 2);
      hour = string(buf + 6, 2);
      min = string(buf + 8, 2);
      sec = string(buf + 10, 2);
      break;

    case 10:
      month = string(buf, 2);
      day = string(buf + 2, 2);
      hour = string(buf + 4, 2);
      min = string(buf + 6, 2);
      sec = string(buf + 8, 2);
      break;

    case 9:
      month = string(buf, 1);
      day = string(buf + 1, 2);
      hour = string(buf + 3, 2);
      min = string(buf + 5, 2);
      sec = string(buf + 7, 2);
      break;

    case 8:
      year = string(buf, 4);
      month = string(buf + 4, 2);
      day = string(buf + 6, 2);
      isDate = true;
      break;

    case 6:
      year = string(buf, 2);
      month = string(buf + 2, 2);
      day = string(buf + 4, 2);
      isDate = true;
      break;

    case 4:
      month = string(buf, 2);
      day = string(buf + 2, 2);
      break;

    case 3:
      month = string(buf, 1);
      day = string(buf + 1, 2);
      isDate = true;
      break;

    default: return -1;
  }

  if (year.empty())
  {
    // MMDD format. assume current year
    time_t calender_time;
    struct tm todays_date;
    calender_time = time(NULL);
    localtime_r(&calender_time, &todays_date);
    y = todays_date.tm_year + 1900;
  }
  else
  {
    y = atoi(year.c_str());

    // special handling for 2-byte year
    if (year.length() == 2)
    {
      y += 2000;
      if (y > 2069)
        y -= 100;
    }
  }

  m = atoi(month.c_str());
  d = atoi(day.c_str());
  h = atoi(hour.c_str());
  minute = atoi(min.c_str());
  s = atoi(sec.c_str());
  ms = 0;

  if (!isDateValid(d, m, y) || !isDateTimeValid(h, minute, s, ms))
    return -1;

  adaytime.year = y;
  adaytime.month = m;
  adaytime.day = d;
  adaytime.hour = h;
  adaytime.minute = minute;
  adaytime.second = s;
  adaytime.msecond = ms;

  if (date)
    *date = isDate;

  return getUInt64LE((const char*)&adaytime);
}

/* This is really painful and expensive b/c it seems the input is not normalized or
sanitized.  That should really be done on ingestion. */
int64_t DataConvert::intToTime(int64_t data, bool fromString)
{
  char buf[21] = {0};
  char* bufread = buf;
  Time atime;
  bool isNeg = false;

  if (data == 0)
  {
    atime.hour = 0;
    atime.minute = 0;
    atime.second = 0;
    atime.msecond = 0;
    atime.is_neg = 0;

    return getSInt64LE((const char*)&atime);
  }

  // this snprintf call causes a compiler warning b/c we're potentially copying a 20-digit #
  // into 15 bytes, however, that appears to be intentional.
#if defined(__GNUC__) && __GNUC__ >= 7
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wformat-truncation="
  snprintf(buf, 15, "%lld", (long long int)data);
#pragma GCC diagnostic pop
#else
  snprintf(buf, 15, "%lld", (long long int)data);
#endif

  // string date = buf;
  string hour, min, sec, msec;
  int64_t h = 0, minute = 0, s = 0, ms = 0;

  if (bufread[0] == '-')
  {
    isNeg = true;
    bufread++;
  }

  bool zero = false;

  switch (strlen(bufread))
  {
    // A full datetime
    case 14:
      hour = string(buf + 8, 2);
      min = string(buf + 10, 2);
      sec = string(buf + 12, 2);
      break;

    // Date so this is all 0
    case 8: zero = true; break;

    case 7:
      hour = string(bufread, 3);
      min = string(bufread + 3, 2);
      sec = string(bufread + 5, 2);
      break;

    case 6:
      hour = string(bufread, 2);
      min = string(bufread + 2, 2);
      sec = string(bufread + 4, 2);
      break;

    case 5:
      hour = string(bufread, 1);
      min = string(bufread + 1, 2);
      sec = string(bufread + 3, 2);
      break;

    case 4:
      min = string(bufread, 2);
      sec = string(bufread + 2, 2);
      break;

    case 3:
      min = string(bufread, 1);
      sec = string(bufread + 1, 2);
      break;

    case 2: sec = string(bufread, 2); break;

    case 1: sec = string(bufread, 1); break;

    default: return -1;
  }

  if (!zero)
  {
    h = atoi(hour.c_str());
    minute = atoi(min.c_str());
    s = atoi(sec.c_str());
  }
  else if (fromString)
  {
    // Saturate fromString
    h = 838;
    minute = 59;
    s = 59;
    ms = 999999;
  }

  if (!isTimeValid(h, minute, s, 0))
    return -1;

  atime.hour = h;
  atime.minute = minute;
  atime.second = s;
  atime.msecond = ms;
  atime.is_neg = isNeg;

  return getSInt64LE((const char*)&atime);
}

int64_t DataConvert::stringToTime(const utils::NullString& data)
{
  return stringToTime(data.safeString(""));
}

int64_t DataConvert::stringToTime(const string& data)
{
  // MySQL supported time value format 'D HHH:MM:SS.fraction'
  // -34 <= D <= 34
  // -838 <= H <= 838
  uint64_t min = 0, sec = 0, msec = 0;
  int64_t day = -1, hour = 0;
  bool isNeg = false;
  bool hasDate = false;
  string time, hms, ms;
  char* end = NULL;

  size_t pos = data.find("-");

  if (pos != string::npos)
  {
    isNeg = true;
  }

  if (data.substr(pos + 1, data.length() - pos - 1).find("-") != string::npos)
  {
    // A second dash, this has a date
    hasDate = true;
    isNeg = false;
  }
  // Day
  pos = data.find(" ");

  if (pos != string::npos)
  {
    if (!hasDate)
    {
      std::string tmpDataSegment = data.substr(0, pos);
      day = strtol(tmpDataSegment.c_str(), &end, 10);

      if (*end != '\0')
        return -1;

      hour = day * 24;
      day = -1;
    }
    time = data.substr(pos + 1, data.length() - pos - 1);
  }
  else
  {
    time = data;
  }

  if (time.find(":") == string::npos)
  {
    if (hasDate)
    {
      // Has dashes, no colons. This is just a date!
      // Or the length < 6 (MariaDB returns NULL)
      return -1;
    }
    else
    {
      // This is an int time
      return intToTime(atoll(time.c_str()), true);
    }
  }

  // Fraction
  pos = time.find(".");

  if (pos != string::npos)
  {
    msec = strtoll(time.substr(pos + 1, time.length() - pos - 1).c_str(), 0, 10);
    hms = time.substr(0, pos);
  }
  else
  {
    hms = time;
  }

  // HHH:MM:SS
  pos = hms.find(":");

  if (pos == string::npos)
  {
    if (hour >= 0)
      hour += atoi(hms.c_str());
    else
      hour -= atoi(hms.c_str());
  }
  else
  {
    if (hour >= 0)
      hour += atoi(hms.substr(0, pos).c_str());
    else
      hour -= atoi(hms.substr(0, pos).c_str());

    ms = hms.substr(pos + 1, hms.length() - pos - 1);
  }

  // MM:SS
  pos = ms.find(":");

  if (pos != string::npos)
  {
    min = atoi(ms.substr(0, pos).c_str());
    sec = atoi(ms.substr(pos + 1, ms.length() - pos - 1).c_str());
  }
  else
  {
    min = atoi(ms.c_str());
  }

  Time atime;
  atime.day = day;
  atime.hour = hour;
  atime.minute = min;
  atime.second = sec;
  atime.msecond = msec;
  atime.is_neg = isNeg;
  return getSInt64LE((const char*)&atime);
}

void DataConvert::joinColTypeForUnion(datatypes::SystemCatalog::TypeHolderStd& unionedType,
                                      const datatypes::SystemCatalog::TypeHolderStd& type, unsigned int& rc)
{
  // limited support for VARBINARY, no implicit conversion.
  if (type.colDataType == datatypes::SystemCatalog::VARBINARY ||
      unionedType.colDataType == datatypes::SystemCatalog::VARBINARY)
  {
    if (type.colDataType != unionedType.colDataType || type.colWidth != unionedType.colWidth)
      throw runtime_error("VARBINARY in UNION must be the same width.");
  }

  switch (type.colDataType)
  {
    case datatypes::SystemCatalog::TINYINT:
    case datatypes::SystemCatalog::SMALLINT:
    case datatypes::SystemCatalog::MEDINT:
    case datatypes::SystemCatalog::INT:
    case datatypes::SystemCatalog::BIGINT:
    case datatypes::SystemCatalog::DECIMAL:
    case datatypes::SystemCatalog::UTINYINT:
    case datatypes::SystemCatalog::USMALLINT:
    case datatypes::SystemCatalog::UMEDINT:
    case datatypes::SystemCatalog::UINT:
    case datatypes::SystemCatalog::UBIGINT:
    case datatypes::SystemCatalog::UDECIMAL:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:
        {
          if (type.scale != 0 && (unionedType.scale != 0 || isDecimal(unionedType.colDataType)))
          {
            const unsigned int digitsBeforeDecimal = type.precision - type.scale;
            const unsigned int digitsBeforeDecimalUnion = unionedType.precision - unionedType.scale;

            if ((std::max(digitsBeforeDecimal, digitsBeforeDecimalUnion) +
                 std::max(type.scale, unionedType.scale)) > datatypes::INT128MAXPRECISION)
            {
              rc = logging::ERR_UNION_DECIMAL_OVERFLOW;
              return;
            }
          }

          // Handle the scenario where the upstream code assigns special values of 9999
          // and -1 as the precision of the unionedType.
          if ((unionedType.precision == 9999 || unionedType.precision == -1) &&
              (type.precision != 9999 && type.precision != -1))
          {
            unionedType.precision = type.precision;
          }
          else
          {
            unionedType.precision = std::max(type.precision, unionedType.precision);
          }

          unionedType.scale = std::max(type.scale, unionedType.scale);

          if (datatypes::Decimal::isWideDecimalTypeByPrecision(unionedType.precision))
          {
            unionedType.colDataType = datatypes::SystemCatalog::DECIMAL;
            unionedType.colWidth = datatypes::MAXDECIMALWIDTH;
            break;
          }

          if (type.colDataType == unionedType.colDataType)
          {
            if (type.colWidth > unionedType.colWidth)
              unionedType.colWidth = type.colWidth;
          }
          else if (sameSignednessInteger(unionedType.colDataType, type.colDataType))
          {
            // Keep the signedness on the larger data type.
            if (type.colWidth > unionedType.colWidth)
            {
              unionedType.colDataType = type.colDataType;
              unionedType.colWidth = type.colWidth;
            }
          }
          else if (differentSignednessInteger(unionedType.colDataType, type.colDataType))
          {
            // unionedType must be signed integer with upcasted size to prevent overflow & underflow.
            if (type.colWidth > unionedType.colWidth)
              unionedType.colDataType = type.colDataType;
            promoteSignedInteger(unionedType);
          }

          if (isDecimal(type.colDataType))
          {
            unionedType.colDataType = datatypes::SystemCatalog::DECIMAL;
          }

          break;
        }
        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.colWidth = 20;
          break;

        case datatypes::SystemCatalog::TIME:
        case datatypes::SystemCatalog::DATETIME:
        case datatypes::SystemCatalog::TIMESTAMP:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 20)
            unionedType.colWidth = 20;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 21)
            unionedType.colWidth = 21;

          break;

        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::LONGDOUBLE:
        default: break;
      }

      break;
    }

    case datatypes::SystemCatalog::DATE:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::LONGDOUBLE:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 20;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 10)
            unionedType.colWidth = 10;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 11)
            unionedType.colWidth = 11;

          break;

        case datatypes::SystemCatalog::DATE:
        case datatypes::SystemCatalog::DATETIME:
        case datatypes::SystemCatalog::TIMESTAMP:
        case datatypes::SystemCatalog::TIME:
        default: break;
      }

      break;
    }

    case datatypes::SystemCatalog::DATETIME:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::TIME:
        case datatypes::SystemCatalog::LONGDOUBLE:
        case datatypes::SystemCatalog::TIMESTAMP:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::DATETIME;
          unionedType.colWidth = type.colWidth;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 26)
            unionedType.colWidth = 26;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 27)
            unionedType.colWidth = 27;

          break;

        case datatypes::SystemCatalog::DATETIME:
        default: break;
      }

      break;
    }

    case datatypes::SystemCatalog::TIMESTAMP:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::TIME:
        case datatypes::SystemCatalog::DATETIME:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::TIMESTAMP;
          unionedType.colWidth = type.colWidth;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 26)
            unionedType.colWidth = 26;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 27)
            unionedType.colWidth = 27;

          break;

        case datatypes::SystemCatalog::TIMESTAMP:
        default: break;
      }

      break;
    }

    case datatypes::SystemCatalog::FLOAT:
    case datatypes::SystemCatalog::DOUBLE:
    case datatypes::SystemCatalog::UFLOAT:
    case datatypes::SystemCatalog::UDOUBLE:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 20;
          break;

        case datatypes::SystemCatalog::DATETIME:
        case datatypes::SystemCatalog::TIMESTAMP:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 20)
            unionedType.colWidth = 20;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 21)
            unionedType.colWidth = 21;

          break;

        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::UDECIMAL:
          unionedType.colDataType = datatypes::SystemCatalog::DOUBLE;
          unionedType.scale = 0;
          unionedType.colWidth = sizeof(double);
          break;

        default: break;
      }

      break;
    }

    case datatypes::SystemCatalog::LONGDOUBLE:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::DATE:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 20;
          break;

        case datatypes::SystemCatalog::DATETIME:
          unionedType.colDataType = datatypes::SystemCatalog::CHAR;
          unionedType.scale = 0;
          unionedType.colWidth = 26;
          break;

        case datatypes::SystemCatalog::CHAR:
          if (unionedType.colWidth < 20)
            unionedType.colWidth = 20;

          break;

        case datatypes::SystemCatalog::VARCHAR:
          if (unionedType.colWidth < 21)
            unionedType.colWidth = 21;

          break;

        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::LONGDOUBLE:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::UDECIMAL:
          unionedType.colDataType = datatypes::SystemCatalog::LONGDOUBLE;
          unionedType.scale = (type.scale > unionedType.scale) ? type.scale : unionedType.scale;
          unionedType.colWidth = sizeof(long double);
          unionedType.precision = -1;
          break;

        default: break;
      }

      break;
    }

    case datatypes::SystemCatalog::CHAR:
    case datatypes::SystemCatalog::VARCHAR:
    {
      switch (unionedType.colDataType)
      {
        case datatypes::SystemCatalog::TINYINT:
        case datatypes::SystemCatalog::SMALLINT:
        case datatypes::SystemCatalog::MEDINT:
        case datatypes::SystemCatalog::INT:
        case datatypes::SystemCatalog::BIGINT:
        case datatypes::SystemCatalog::DECIMAL:
        case datatypes::SystemCatalog::FLOAT:
        case datatypes::SystemCatalog::DOUBLE:
        case datatypes::SystemCatalog::UTINYINT:
        case datatypes::SystemCatalog::USMALLINT:
        case datatypes::SystemCatalog::UMEDINT:
        case datatypes::SystemCatalog::UINT:
        case datatypes::SystemCatalog::UBIGINT:
        case datatypes::SystemCatalog::UDECIMAL:
        case datatypes::SystemCatalog::UFLOAT:
        case datatypes::SystemCatalog::UDOUBLE:
        case datatypes::SystemCatalog::LONGDOUBLE:
          unionedType.scale = 0;
          unionedType.colWidth = (type.colWidth > 20) ? type.colWidth : 20;
          break;

        case datatypes::SystemCatalog::DATE:
          unionedType.colWidth = (type.colWidth > 10) ? type.colWidth : 10;
          break;

        case datatypes::SystemCatalog::DATETIME:
        case datatypes::SystemCatalog::TIMESTAMP:
          unionedType.colWidth = (type.colWidth > 26) ? type.colWidth : 26;
          break;

        case datatypes::SystemCatalog::CHAR:
        case datatypes::SystemCatalog::VARCHAR:

          // VARCHAR will fit in CHAR of the same width
          if (unionedType.colWidth < type.colWidth)
            unionedType.colWidth = type.colWidth;

          break;

        default: break;
      }

      // MariaDB bug 651. Setting to CHAR broke union in subquery
      unionedType.colDataType = datatypes::SystemCatalog::VARCHAR;
      break;
    }

    default:
    {
      break;
    }
  }  // switch
}

}  // namespace dataconvert