You've already forked mariadb-columnstore-engine
							
							
				mirror of
				https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
				synced 2025-11-03 17:13:17 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			185 lines
		
	
	
		
			5.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			185 lines
		
	
	
		
			5.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
/* Copyright (C) 2014 InfiniDB, Inc.
 | 
						|
 | 
						|
   This program is free software; you can redistribute it and/or
 | 
						|
   modify it under the terms of the GNU General Public License
 | 
						|
   as published by the Free Software Foundation; version 2 of
 | 
						|
   the License.
 | 
						|
 | 
						|
   This program is distributed in the hope that it will be useful,
 | 
						|
   but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
						|
   GNU General Public License for more details.
 | 
						|
 | 
						|
   You should have received a copy of the GNU General Public License
 | 
						|
   along with this program; if not, write to the Free Software
 | 
						|
   Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 | 
						|
   MA 02110-1301, USA. */
 | 
						|
 | 
						|
/****************************************************************************
 | 
						|
 * $Id: func_replace.cpp 3923 2013-06-19 21:43:06Z bwilkinson $
 | 
						|
 *
 | 
						|
 *
 | 
						|
 ****************************************************************************/
 | 
						|
 | 
						|
#include <string>
 | 
						|
using namespace std;
 | 
						|
 | 
						|
#include "functor_str.h"
 | 
						|
#include "functioncolumn.h"
 | 
						|
using namespace execplan;
 | 
						|
 | 
						|
#include "rowgroup.h"
 | 
						|
using namespace rowgroup;
 | 
						|
 | 
						|
#include "joblisttypes.h"
 | 
						|
using namespace joblist;
 | 
						|
 | 
						|
namespace funcexp
 | 
						|
{
 | 
						|
// Reports the operation type for REPLACE(): the result type of the first
// argument. The second parameter (resultType) is ignored.
CalpontSystemCatalog::ColType Func_replace::operationType(FunctionParm& fp,
                                                          CalpontSystemCatalog::ColType& /*resultType*/)
{
  // This functor never consults the operation type itself, so it simply
  // forwards whatever the first parameter's node reports.
  const auto& firstParm = fp[0];
  return firstParm->data()->resultType();
}
 | 
						|
 | 
						|
std::string Func_replace::getStrVal(rowgroup::Row& row, FunctionParm& fp, bool& isNull,
 | 
						|
                                    execplan::CalpontSystemCatalog::ColType& ct)
 | 
						|
{
 | 
						|
  CHARSET_INFO* cs = ct.getCharset();
 | 
						|
 | 
						|
  const auto& nstr = fp[0]->data()->getStrVal(row, isNull);
 | 
						|
  if (nstr.isNull())
 | 
						|
    return "";
 | 
						|
 | 
						|
  const auto& str = nstr.unsafeStringRef();
 | 
						|
  size_t strLen = str.length();
 | 
						|
 | 
						|
  const auto& nfromstr = fp[1]->data()->getStrVal(row, isNull);
 | 
						|
  if (nfromstr.isNull())
 | 
						|
    return "";
 | 
						|
  const auto& fromstr = nfromstr.unsafeStringRef();
 | 
						|
 | 
						|
  if (fromstr.length() == 0)
 | 
						|
    return str;
 | 
						|
  size_t fromLen = fromstr.length();
 | 
						|
 | 
						|
  const auto& ntostr = fp[2]->data()->getStrVal(row, isNull);
 | 
						|
  if (ntostr.isNull())
 | 
						|
    return "";
 | 
						|
  const auto& tostr = ntostr.unsafeStringRef();
 | 
						|
 | 
						|
  size_t toLen = tostr.length();
 | 
						|
 | 
						|
  bool binaryCmp = (cs->state & MY_CS_BINSORT) || !cs->use_mb();
 | 
						|
  string newstr;
 | 
						|
  size_t pos = 0;
 | 
						|
  if (binaryCmp)
 | 
						|
  {
 | 
						|
    // Count the number of fromstr in strend so we can reserve buffer space.
 | 
						|
    size_t count = 0;
 | 
						|
    while (string::npos != (pos = str.find(fromstr, pos)))
 | 
						|
    {
 | 
						|
      ++count;
 | 
						|
      pos += fromLen;
 | 
						|
    }
 | 
						|
 | 
						|
    if (count == 0)
 | 
						|
    {
 | 
						|
      return str;
 | 
						|
    }
 | 
						|
 | 
						|
    newstr.reserve(strLen + (count * (toLen - fromLen)) + 1);
 | 
						|
 | 
						|
    uint32_t i = 0;
 | 
						|
    pos = str.find(fromstr);
 | 
						|
    // Move the stuff into newstr
 | 
						|
    do
 | 
						|
    {
 | 
						|
      if (pos > i)
 | 
						|
        newstr = newstr + str.substr(i, pos - i);
 | 
						|
 | 
						|
      newstr = newstr + tostr;
 | 
						|
      i = pos + fromLen;
 | 
						|
      pos = str.find(fromstr, i);
 | 
						|
    } while (pos != string::npos);
 | 
						|
 | 
						|
    newstr = newstr + str.substr(i, string::npos);
 | 
						|
  }
 | 
						|
  else
 | 
						|
  {
 | 
						|
    // UTF
 | 
						|
    const char* src = str.c_str();
 | 
						|
    const char* srcEnd = src + strLen;
 | 
						|
    const char* srchEnd = srcEnd - fromLen + 1;
 | 
						|
    const char* from = fromstr.c_str();
 | 
						|
    const char* fromEnd = from + fromLen;
 | 
						|
    const char* to = tostr.c_str();
 | 
						|
    const char* ptr = src;
 | 
						|
    char *i, *j;
 | 
						|
    size_t count = 10;  // Some arbitray number to reserve some space to start.
 | 
						|
    int growlen = (int)toLen - (int)fromLen;
 | 
						|
    growlen = growlen < 1 ? 1 : growlen;
 | 
						|
    growlen *= count;
 | 
						|
    newstr.reserve(strLen + (count * growlen) + 1);
 | 
						|
    size_t maxsize = newstr.capacity();
 | 
						|
    uint32_t l;
 | 
						|
 | 
						|
    // We don't know where byte patterns might match so
 | 
						|
    // we start at the beginning of the string and move forward
 | 
						|
    // one character at a time until we find a match. Then we can
 | 
						|
    // move the src bytes and add in the to bytes,then try again.
 | 
						|
    while (ptr < srchEnd)
 | 
						|
    {
 | 
						|
      bool found = false;
 | 
						|
      if (*ptr == *from)  // If the first byte matches, maybe we have a match
 | 
						|
      {
 | 
						|
        // Do a byte by byte compare of src at that spot against from
 | 
						|
        i = const_cast<char*>(ptr) + 1;
 | 
						|
        j = const_cast<char*>(from) + 1;
 | 
						|
        found = true;
 | 
						|
        while (j != fromEnd)
 | 
						|
        {
 | 
						|
          if (*i++ != *j++)
 | 
						|
          {
 | 
						|
            found = false;
 | 
						|
            break;
 | 
						|
          }
 | 
						|
        }
 | 
						|
      }
 | 
						|
      if (found)
 | 
						|
      {
 | 
						|
        if (ptr < i)
 | 
						|
        {
 | 
						|
          int mvsize = ptr - src;
 | 
						|
          if (newstr.length() + mvsize + toLen > maxsize)
 | 
						|
          {
 | 
						|
            // We need a re-alloc
 | 
						|
            newstr.reserve(maxsize + growlen);
 | 
						|
            maxsize = newstr.capacity();
 | 
						|
            growlen *= 2;
 | 
						|
          }
 | 
						|
          newstr.append(src, ptr - src);
 | 
						|
          src += mvsize + fromLen;
 | 
						|
          ptr = src;
 | 
						|
        }
 | 
						|
        newstr.append(to, toLen);
 | 
						|
      }
 | 
						|
      else
 | 
						|
      {
 | 
						|
        // move to the next character
 | 
						|
        if ((l = my_ismbchar(cs, ptr,
 | 
						|
                             srcEnd)))  // returns the number of bytes in the leading char or zero if one byte
 | 
						|
          ptr += l;
 | 
						|
        else
 | 
						|
          ++ptr;
 | 
						|
      }
 | 
						|
    }
 | 
						|
    // Copy in the trailing src chars.
 | 
						|
    newstr.append(src, srcEnd - src);
 | 
						|
  }
 | 
						|
  return newstr;
 | 
						|
}
 | 
						|
 | 
						|
}  // namespace funcexp
 |