You've already forked mariadb-columnstore-engine
							
							
				mirror of
				https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
				synced 2025-11-03 17:13:17 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			6554 lines
		
	
	
		
			232 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			6554 lines
		
	
	
		
			232 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
/* Copyright (C) 2014 InfiniDB, Inc.
 | 
						|
   Copyright (C) 2016 MariaDB Corporation
 | 
						|
 | 
						|
   This program is free software; you can redistribute it and/or
 | 
						|
   modify it under the terms of the GNU General Public License
 | 
						|
   as published by the Free Software Foundation; version 2 of
 | 
						|
   the License.
 | 
						|
 | 
						|
   This program is distributed in the hope that it will be useful,
 | 
						|
   but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
						|
   GNU General Public License for more details.
 | 
						|
 | 
						|
   You should have received a copy of the GNU General Public License
 | 
						|
   along with this program; if not, write to the Free Software
 | 
						|
   Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 | 
						|
   MA 02110-1301, USA. */
 | 
						|
 | 
						|
// $Id: writeengine.cpp 4737 2013-08-14 20:45:46Z bwilkinson $
 | 
						|
 | 
						|
/** @writeengine.cpp
 | 
						|
 *   A wrapper class for the write engine to write information to files
 | 
						|
 */
 | 
						|
#include <cmath>
 | 
						|
#include <cstdlib>
 | 
						|
#include <unistd.h>
 | 
						|
#include <boost/scoped_array.hpp>
 | 
						|
#include <boost/scoped_ptr.hpp>
 | 
						|
using namespace std;
 | 
						|
 | 
						|
#include "joblisttypes.h"
 | 
						|
 | 
						|
#define WRITEENGINEWRAPPER_DLLEXPORT
 | 
						|
#include "writeengine.h"
 | 
						|
#undef WRITEENGINEWRAPPER_DLLEXPORT
 | 
						|
 | 
						|
#include "we_convertor.h"
 | 
						|
#include "we_log.h"
 | 
						|
#include "we_simplesyslog.h"
 | 
						|
#include "we_config.h"
 | 
						|
#include "we_bulkrollbackmgr.h"
 | 
						|
#include "brm.h"
 | 
						|
#include "stopwatch.h"
 | 
						|
#include "we_colop.h"
 | 
						|
#include "we_type.h"
 | 
						|
 | 
						|
#include "we_colopcompress.h"
 | 
						|
#include "we_dctnrycompress.h"
 | 
						|
#include "cacheutils.h"
 | 
						|
#include "calpontsystemcatalog.h"
 | 
						|
#include "we_simplesyslog.h"
 | 
						|
using namespace cacheutils;
 | 
						|
using namespace logging;
 | 
						|
using namespace BRM;
 | 
						|
using namespace execplan;
 | 
						|
#include "IDBDataFile.h"
 | 
						|
#include "IDBPolicy.h"
 | 
						|
#include "MonitorProcMem.h"
 | 
						|
using namespace idbdatafile;
 | 
						|
 | 
						|
#ifdef _MSC_VER
 | 
						|
#define isnan _isnan
 | 
						|
#endif
 | 
						|
 | 
						|
namespace WriteEngine
 | 
						|
//#define PROFILE 1
 | 
						|
 | 
						|
{
 | 
						|
StopWatch timer;
 | 
						|
 | 
						|
/**@brief WriteEngineWrapper Constructor
 | 
						|
*/
 | 
						|
WriteEngineWrapper::WriteEngineWrapper() :  m_opType(NOOP)
 | 
						|
{
 | 
						|
    m_colOp[UN_COMPRESSED_OP] = new ColumnOpCompress0;
 | 
						|
    m_colOp[COMPRESSED_OP]    = new ColumnOpCompress1;
 | 
						|
 | 
						|
    m_dctnry[UN_COMPRESSED_OP] = new DctnryCompress0;
 | 
						|
    m_dctnry[COMPRESSED_OP]    = new DctnryCompress1;
 | 
						|
}
 | 
						|
 | 
						|
WriteEngineWrapper::WriteEngineWrapper(const WriteEngineWrapper& rhs) :  m_opType(rhs.m_opType)
 | 
						|
{
 | 
						|
    m_colOp[UN_COMPRESSED_OP] = new ColumnOpCompress0;
 | 
						|
    m_colOp[COMPRESSED_OP]    = new ColumnOpCompress1;
 | 
						|
 | 
						|
    m_dctnry[UN_COMPRESSED_OP] = new DctnryCompress0;
 | 
						|
    m_dctnry[COMPRESSED_OP]    = new DctnryCompress1;
 | 
						|
}
 | 
						|
 | 
						|
/**@brief WriteEngineWrapper Constructor
 | 
						|
*/
 | 
						|
WriteEngineWrapper::~WriteEngineWrapper()
 | 
						|
{
 | 
						|
    delete m_colOp[UN_COMPRESSED_OP];
 | 
						|
    delete m_colOp[COMPRESSED_OP];
 | 
						|
    delete m_dctnry[UN_COMPRESSED_OP];
 | 
						|
    delete m_dctnry[COMPRESSED_OP];
 | 
						|
}
 | 
						|
 | 
						|
/**@brief Perform upfront initialization
 | 
						|
*/
 | 
						|
/* static */ void WriteEngineWrapper::init(unsigned subSystemID)
 | 
						|
{
 | 
						|
    SimpleSysLog::instance()->setLoggingID(logging::LoggingID(subSystemID));
 | 
						|
    Config::initConfigCache();
 | 
						|
    BRMWrapper::getInstance();
 | 
						|
 | 
						|
    // Bug 5415 Add HDFS MemBuffer vs. FileBuffer decision logic.
 | 
						|
    config::Config* cf = config::Config::makeConfig();
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Memory overload protection. This setting will cause the process to die should
 | 
						|
    // it, by itself, consume maxPct of total memory. Monitored in MonitorProcMem.
 | 
						|
    // Only used at the express direction of Field Support.
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    int maxPct = 0; //disable by default
 | 
						|
    string strMaxPct = cf->getConfig("WriteEngine", "MaxPct");
 | 
						|
 | 
						|
    if ( strMaxPct.length() != 0 )
 | 
						|
        maxPct = cf->uFromText(strMaxPct);
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // MemoryCheckPercent. This controls at what percent of total memory be consumed
 | 
						|
    // by all processes before we switch from HdfsRdwrMemBuffer to HdfsRdwrFileBuffer.
 | 
						|
    // This is only used in Hdfs installations.
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    int checkPct = 95;
 | 
						|
    string strCheckPct = cf->getConfig("SystemConfig", "MemoryCheckPercent");
 | 
						|
 | 
						|
    if ( strCheckPct.length() != 0 )
 | 
						|
        checkPct = cf->uFromText(strCheckPct);
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // If we're either HDFS, or maxPct is turned on, start the monitor thread.
 | 
						|
    // Otherwise, we don't need it, so don't waste the resources.
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    if (maxPct > 0 || IDBPolicy::useHdfs())
 | 
						|
    {
 | 
						|
        new boost::thread(utils::MonitorProcMem(maxPct, checkPct, subSystemID));
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
/*@brief checkValid --Check input parameters are valid
 | 
						|
 */
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Check input parameters are valid
 | 
						|
 * PARAMETERS:
 | 
						|
 *    colStructList - column struct list
 | 
						|
 *    colValueList - column value list
 | 
						|
 *    ridList - rowid list
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if success
 | 
						|
 *    others if something wrong in the checking process
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::checkValid(const TxnID& txnid, const ColStructList& colStructList, const ColValueList& colValueList, const RIDList& ridList) const
 | 
						|
{
 | 
						|
    ColTupleList   curTupleList;
 | 
						|
    ColStructList::size_type structListSize;
 | 
						|
    ColValueList::size_type  valListSize;
 | 
						|
    ColTupleList::size_type  totalRow;
 | 
						|
 | 
						|
    if (colStructList.size() == 0)
 | 
						|
        return ERR_STRUCT_EMPTY;
 | 
						|
 | 
						|
    structListSize = colStructList.size() ;
 | 
						|
    valListSize = colValueList.size();
 | 
						|
 | 
						|
//      if (colStructList.size() !=  colValueList.size())
 | 
						|
    if (structListSize != valListSize)
 | 
						|
        return ERR_STRUCT_VALUE_NOT_MATCH;
 | 
						|
 | 
						|
    for (ColValueList::size_type i = 0; i < valListSize; i++)
 | 
						|
    {
 | 
						|
 | 
						|
        curTupleList = static_cast<ColTupleList>(colValueList[i]);
 | 
						|
        totalRow = curTupleList.size();
 | 
						|
 | 
						|
        if (ridList.size() > 0)
 | 
						|
        {
 | 
						|
            if (totalRow != ridList.size())
 | 
						|
                return ERR_ROWID_VALUE_NOT_MATCH;
 | 
						|
        }
 | 
						|
 | 
						|
    } // end of for (int i = 0;
 | 
						|
 | 
						|
    return NO_ERROR;
 | 
						|
}
 | 
						|
 | 
						|
/*@brief findSmallestColumn --Find the smallest column for this table
 | 
						|
 */
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Find the smallest column for this table
 | 
						|
 * PARAMETERS:
 | 
						|
 *    lowColLen - returns smallest column width
 | 
						|
 *    colId - returns smallest column id
 | 
						|
 *    colStructList - column struct list
 | 
						|
 * RETURN:
 | 
						|
 *  void
 | 
						|
 ***********************************************************/
 | 
						|
void WriteEngineWrapper::findSmallestColumn(uint32_t& colId, ColStructList colStructList)
 | 
						|
// MCOL-1675: find the smallest column width to calculate the RowID from so
 | 
						|
// that all HWMs will be incremented by this operation
 | 
						|
{
 | 
						|
    int32_t lowColLen = 8192;
 | 
						|
    for (uint32_t colIt = 0; colIt < colStructList.size(); colIt++)
 | 
						|
    {        
 | 
						|
        if (colStructList[colIt].colWidth < lowColLen)
 | 
						|
        {
 | 
						|
            colId = colIt;
 | 
						|
            lowColLen = colStructList[colId].colWidth;
 | 
						|
            if ( lowColLen == 1 )
 | 
						|
            {
 | 
						|
                break;
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
/*@convertValArray -  Convert interface values to internal values
 | 
						|
 */
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Convert interface values to internal values
 | 
						|
 * PARAMETERS:
 | 
						|
 *    colStructList - column struct list
 | 
						|
 *    colValueList - column value list
 | 
						|
 * RETURN:
 | 
						|
 *    none
 | 
						|
 *    valArray - output value array
 | 
						|
 *    nullArray - output null flag array
 | 
						|
 ***********************************************************/
 | 
						|
void WriteEngineWrapper::convertValArray(const size_t totalRow, const ColType colType, ColTupleList& curTupleList, void* valArray, bool bFromList)
 | 
						|
{
 | 
						|
    ColTuple    curTuple;
 | 
						|
    ColTupleList::size_type i;
 | 
						|
 | 
						|
    if (bFromList)
 | 
						|
        for (i = 0; i < curTupleList.size(); i++)
 | 
						|
        {
 | 
						|
            curTuple = curTupleList[i];
 | 
						|
            convertValue(colType, valArray, i, curTuple.data);
 | 
						|
        } // end of for (int i = 0
 | 
						|
    else
 | 
						|
        for (i = 0; i < totalRow; i++)
 | 
						|
        {
 | 
						|
            convertValue(colType, valArray, i, curTuple.data, false);
 | 
						|
            curTupleList.push_back(curTuple);
 | 
						|
        }
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * @brief Convert column value to its internal representation
 | 
						|
 */
 | 
						|
void WriteEngineWrapper::convertValue(const ColType colType, void* value, boost::any& data)
 | 
						|
{
 | 
						|
    string curStr;
 | 
						|
    int size;
 | 
						|
 | 
						|
    switch (colType)
 | 
						|
    {
 | 
						|
        case WriteEngine::WR_INT :
 | 
						|
            if (data.type() == typeid(int))
 | 
						|
            {
 | 
						|
                int val = boost::any_cast<int>(data);
 | 
						|
                size = sizeof(int);
 | 
						|
                memcpy(value, &val, size);
 | 
						|
            }
 | 
						|
            else
 | 
						|
            {
 | 
						|
                uint32_t val = boost::any_cast<uint32_t>(data);
 | 
						|
                size = sizeof(uint32_t);
 | 
						|
                memcpy(value, &val, size);
 | 
						|
            }
 | 
						|
 | 
						|
            break;
 | 
						|
 | 
						|
        case WriteEngine::WR_UINT :
 | 
						|
        {
 | 
						|
            uint32_t val = boost::any_cast<uint32_t>(data);
 | 
						|
            size = sizeof(uint32_t);
 | 
						|
            memcpy(value, &val, size);
 | 
						|
        }
 | 
						|
        break;
 | 
						|
 | 
						|
        case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
        case WriteEngine::WR_CHAR :
 | 
						|
        case WriteEngine::WR_BLOB :
 | 
						|
        case WriteEngine::WR_TEXT :
 | 
						|
            curStr = boost::any_cast<string>(data);
 | 
						|
 | 
						|
            if ((int) curStr.length() > MAX_COLUMN_BOUNDARY)
 | 
						|
                curStr = curStr.substr(0, MAX_COLUMN_BOUNDARY);
 | 
						|
 | 
						|
            memcpy(value, curStr.c_str(), curStr.length());
 | 
						|
            break;
 | 
						|
 | 
						|
        case WriteEngine::WR_FLOAT:
 | 
						|
        {
 | 
						|
            float val = boost::any_cast<float>(data);
 | 
						|
 | 
						|
//N.B.There is a bug in boost::any or in gcc where, if you store a nan, you will get back a nan,
 | 
						|
// but not necessarily the same bits that you put in. This only seems to be for float (double seems
 | 
						|
// to work).
 | 
						|
            if (isnan(val))
 | 
						|
            {
 | 
						|
                uint32_t ti = joblist::FLOATNULL;
 | 
						|
                float* tfp = (float*)&ti;
 | 
						|
                val = *tfp;
 | 
						|
            }
 | 
						|
 | 
						|
            size = sizeof(float);
 | 
						|
            memcpy(value, &val, size);
 | 
						|
        }
 | 
						|
        break;
 | 
						|
 | 
						|
        case WriteEngine::WR_DOUBLE:
 | 
						|
        {
 | 
						|
            double val = boost::any_cast<double>(data);
 | 
						|
            size = sizeof(double);
 | 
						|
            memcpy(value, &val, size);
 | 
						|
        }
 | 
						|
        break;
 | 
						|
 | 
						|
        case WriteEngine::WR_SHORT:
 | 
						|
        {
 | 
						|
            short val = boost::any_cast<short>(data);
 | 
						|
            size = sizeof(short);
 | 
						|
            memcpy(value, &val, size);
 | 
						|
        }
 | 
						|
        break;
 | 
						|
 | 
						|
        case WriteEngine::WR_USHORT:
 | 
						|
        {
 | 
						|
            uint16_t val = boost::any_cast<uint16_t>(data);
 | 
						|
            size = sizeof(uint16_t);
 | 
						|
            memcpy(value, &val, size);
 | 
						|
        }
 | 
						|
        break;
 | 
						|
 | 
						|
        case WriteEngine::WR_BYTE:
 | 
						|
        {
 | 
						|
            char val = boost::any_cast<char>(data);
 | 
						|
            size = sizeof(char);
 | 
						|
            memcpy(value, &val, size);
 | 
						|
        }
 | 
						|
        break;
 | 
						|
 | 
						|
        case WriteEngine::WR_UBYTE:
 | 
						|
        {
 | 
						|
            uint8_t val = boost::any_cast<uint8_t>(data);
 | 
						|
            size = sizeof(uint8_t);
 | 
						|
            memcpy(value, &val, size);
 | 
						|
        }
 | 
						|
        break;
 | 
						|
 | 
						|
        case WriteEngine::WR_LONGLONG:
 | 
						|
            if (data.type() == typeid(long long))
 | 
						|
            {
 | 
						|
                long long val = boost::any_cast<long long>(data);
 | 
						|
                size = sizeof(long long);
 | 
						|
                memcpy(value, &val, size);
 | 
						|
            }
 | 
						|
            else
 | 
						|
            {
 | 
						|
                uint64_t val = boost::any_cast<uint64_t>(data);
 | 
						|
                size = sizeof(uint64_t);
 | 
						|
                memcpy(value, &val, size);
 | 
						|
            }
 | 
						|
 | 
						|
            break;
 | 
						|
 | 
						|
        case WriteEngine::WR_ULONGLONG:
 | 
						|
        {
 | 
						|
            uint64_t val = boost::any_cast<uint64_t>(data);
 | 
						|
            size = sizeof(uint64_t);
 | 
						|
            memcpy(value, &val, size);
 | 
						|
        }
 | 
						|
        break;
 | 
						|
 | 
						|
        case WriteEngine::WR_TOKEN:
 | 
						|
        {
 | 
						|
            Token val = boost::any_cast<Token>(data);
 | 
						|
            size = sizeof(Token);
 | 
						|
            memcpy(value, &val, size);
 | 
						|
        }
 | 
						|
        break;
 | 
						|
 | 
						|
    } // end of switch (colType)
 | 
						|
}  /*@convertValue -  The base for converting values */
 | 
						|
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    The base for converting values
 | 
						|
 * PARAMETERS:
 | 
						|
 *    colType - data type
 | 
						|
 *    pos - array position
 | 
						|
 *    data - value
 | 
						|
 * RETURN:
 | 
						|
 *    none
 | 
						|
 ***********************************************************/
 | 
						|
void WriteEngineWrapper::convertValue(const ColType colType, void* valArray, const size_t pos, boost::any& data, bool fromList)
 | 
						|
{
 | 
						|
    string curStr;
 | 
						|
//      ColTuple    curTuple;
 | 
						|
 | 
						|
    if (fromList)
 | 
						|
    {
 | 
						|
        switch (colType)
 | 
						|
        {
 | 
						|
            case WriteEngine::WR_INT :
 | 
						|
                if (data.type() == typeid(long))
 | 
						|
                    ((int*)valArray)[pos] = static_cast<int>(boost::any_cast<long>(data));
 | 
						|
                else if (data.type() == typeid(int))
 | 
						|
                    ((int*)valArray)[pos] = boost::any_cast<int>(data);
 | 
						|
                else
 | 
						|
                    ((int*)valArray)[pos] = boost::any_cast<uint32_t>(data);
 | 
						|
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_UINT :
 | 
						|
                ((uint32_t*)valArray)[pos] = boost::any_cast<uint32_t>(data);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
            case WriteEngine::WR_CHAR :
 | 
						|
            case WriteEngine::WR_BLOB :
 | 
						|
            case WriteEngine::WR_TEXT :
 | 
						|
                curStr = boost::any_cast<string>(data);
 | 
						|
 | 
						|
                if ((int) curStr.length() > MAX_COLUMN_BOUNDARY)
 | 
						|
                    curStr = curStr.substr(0, MAX_COLUMN_BOUNDARY);
 | 
						|
 | 
						|
                memcpy((char*)valArray + pos * MAX_COLUMN_BOUNDARY, curStr.c_str(), curStr.length());
 | 
						|
                break;
 | 
						|
 | 
						|
//            case WriteEngine::WR_LONG :   ((long*)valArray)[pos] = boost::any_cast<long>(curTuple.data);
 | 
						|
//                                          break;
 | 
						|
            case WriteEngine::WR_FLOAT:
 | 
						|
                ((float*)valArray)[pos] = boost::any_cast<float>(data);
 | 
						|
 | 
						|
                if (isnan(((float*)valArray)[pos]))
 | 
						|
                {
 | 
						|
                    uint32_t ti = joblist::FLOATNULL;
 | 
						|
                    float* tfp = (float*)&ti;
 | 
						|
                    ((float*)valArray)[pos] = *tfp;
 | 
						|
                }
 | 
						|
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_DOUBLE:
 | 
						|
                ((double*)valArray)[pos] = boost::any_cast<double>(data);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_SHORT:
 | 
						|
                ((short*)valArray)[pos] = boost::any_cast<short>(data);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_USHORT:
 | 
						|
                ((uint16_t*)valArray)[pos] = boost::any_cast<uint16_t>(data);
 | 
						|
                break;
 | 
						|
 | 
						|
//            case WriteEngine::WR_BIT:     ((bool*)valArray)[pos] = boost::any_cast<bool>(data);
 | 
						|
//                                          break;
 | 
						|
            case WriteEngine::WR_BYTE:
 | 
						|
                ((char*)valArray)[pos] = boost::any_cast<char>(data);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_UBYTE:
 | 
						|
                ((uint8_t*)valArray)[pos] = boost::any_cast<uint8_t>(data);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_LONGLONG:
 | 
						|
                if (data.type() == typeid(long long))
 | 
						|
                    ((long long*)valArray)[pos] = boost::any_cast<long long>(data);
 | 
						|
                else if (data.type() == typeid(long))
 | 
						|
                    ((long long*)valArray)[pos] = (long long)boost::any_cast<long>(data);
 | 
						|
                else
 | 
						|
                    ((long long*)valArray)[pos] = boost::any_cast<uint64_t>(data);
 | 
						|
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_ULONGLONG:
 | 
						|
                ((uint64_t*)valArray)[pos] = boost::any_cast<uint64_t>(data);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_TOKEN:
 | 
						|
                ((Token*)valArray)[pos] = boost::any_cast<Token>(data);
 | 
						|
                break;
 | 
						|
        } // end of switch (colType)
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        switch (colType)
 | 
						|
        {
 | 
						|
            case WriteEngine::WR_INT :
 | 
						|
                data = ((int*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_UINT :
 | 
						|
                data = ((uint64_t*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
            case WriteEngine::WR_CHAR :
 | 
						|
            case WriteEngine::WR_BLOB :
 | 
						|
            case WriteEngine::WR_TEXT :
 | 
						|
                char tmp[10];
 | 
						|
                memcpy(tmp, (char*)valArray + pos * 8, 8);
 | 
						|
                curStr = tmp;
 | 
						|
                data = curStr;
 | 
						|
                break;
 | 
						|
 | 
						|
//            case WriteEngine::WR_LONG :   ((long*)valArray)[pos] = boost::any_cast<long>(curTuple.data);
 | 
						|
//                                          break;
 | 
						|
            case WriteEngine::WR_FLOAT:
 | 
						|
                data = ((float*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_DOUBLE:
 | 
						|
                data = ((double*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_SHORT:
 | 
						|
                data = ((short*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_USHORT:
 | 
						|
                data = ((uint16_t*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
//            case WriteEngine::WR_BIT:     data = ((bool*)valArray)[pos];
 | 
						|
//                                          break;
 | 
						|
            case WriteEngine::WR_BYTE:
 | 
						|
                data = ((char*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_UBYTE:
 | 
						|
                data = ((uint8_t*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_LONGLONG:
 | 
						|
                data = ((long long*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_ULONGLONG:
 | 
						|
                data = ((uint64_t*)valArray)[pos];
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_TOKEN:
 | 
						|
                data = ((Token*)valArray)[pos];
 | 
						|
                break;
 | 
						|
        } // end of switch (colType)
 | 
						|
    } // end of if
 | 
						|
}
 | 
						|
 | 
						|
/*@createColumn -  Create column files, including data and bitmap files
 | 
						|
 */
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Create column files, including data and bitmap files
 | 
						|
 * PARAMETERS:
 | 
						|
 *    dataOid - column data file id
 | 
						|
 *    bitmapOid - column bitmap file id
 | 
						|
 *    colWidth - column width
 | 
						|
 *    dbRoot   - DBRoot where file is to be located
 | 
						|
 *    partition - Starting partition number for segment file path
 | 
						|
 *     compressionType - compression type
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if success
 | 
						|
 *    ERR_FILE_EXIST if file exists
 | 
						|
 *    ERR_FILE_CREATE if something wrong in creating the file
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::createColumn(
 | 
						|
    const TxnID& txnid,
 | 
						|
    const OID& dataOid,
 | 
						|
    const CalpontSystemCatalog::ColDataType dataType,
 | 
						|
    int dataWidth,
 | 
						|
    uint16_t dbRoot,
 | 
						|
    uint32_t partition,
 | 
						|
    int compressionType)
 | 
						|
{
 | 
						|
    int      rc;
 | 
						|
    Column   curCol;
 | 
						|
 | 
						|
    int compress_op = op(compressionType);
 | 
						|
    m_colOp[compress_op]->initColumn(curCol);
 | 
						|
    rc = m_colOp[compress_op]->createColumn(curCol, 0, dataWidth, dataType,
 | 
						|
                                            WriteEngine::WR_CHAR, (FID)dataOid, dbRoot, partition);
 | 
						|
 | 
						|
    // This is optional, however, it's recommended to do so to free heap
 | 
						|
    // memory if assigned in the future
 | 
						|
    m_colOp[compress_op]->clearColumn(curCol);
 | 
						|
    std::map<FID, FID> oids;
 | 
						|
 | 
						|
    if (rc == NO_ERROR)
 | 
						|
        rc = flushDataFiles(NO_ERROR, txnid, oids);
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
    {
 | 
						|
        return rc;
 | 
						|
    }
 | 
						|
 | 
						|
    RETURN_ON_ERROR(BRMWrapper::getInstance()->setLocalHWM(dataOid, partition, 0, 0));
 | 
						|
    // @bug 281 : fix for bug 281 - Add flush VM cache to clear all write buffer
 | 
						|
    //flushVMCache();
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
//BUG931
 | 
						|
/**
 | 
						|
 * @brief Fill column with default values
 | 
						|
 */
 | 
						|
int WriteEngineWrapper::fillColumn(const TxnID& txnid, const OID& dataOid,
 | 
						|
                                   const CalpontSystemCatalog::ColDataType dataType, int dataWidth,
 | 
						|
                                   ColTuple defaultVal, const OID& refColOID,
 | 
						|
                                   const CalpontSystemCatalog::ColDataType refColDataType,
 | 
						|
                                   int refColWidth, int refCompressionType,
 | 
						|
                                   bool isNULL, int compressionType,
 | 
						|
                                   const string& defaultValStr,
 | 
						|
                                   const OID& dictOid, bool autoincrement)
 | 
						|
{
 | 
						|
    int      rc = NO_ERROR;
 | 
						|
    Column   newCol;
 | 
						|
    Column   refCol;
 | 
						|
    ColType  newColType;
 | 
						|
    ColType  refColType;
 | 
						|
    boost::scoped_array<char> defVal(new char[MAX_COLUMN_BOUNDARY]);
 | 
						|
    ColumnOp* colOpNewCol = m_colOp[op(compressionType)];
 | 
						|
    ColumnOp* refColOp = m_colOp[op(refCompressionType)];
 | 
						|
    Dctnry*   dctnry  = m_dctnry[op(compressionType)];
 | 
						|
    colOpNewCol->initColumn(newCol);
 | 
						|
    refColOp->initColumn(refCol);
 | 
						|
    //boost::shared_ptr<Dctnry> dctnry;
 | 
						|
    // boost::shared_ptr<ColumnOp> refColOp;
 | 
						|
    // refColOp.reset(colOpRefCol);
 | 
						|
    // dctnry.reset(dctOp);
 | 
						|
    uint16_t dbRoot = 1;	//not to be used
 | 
						|
    //Convert HWM of the reference column for the new column
 | 
						|
    //Bug 1703,1705
 | 
						|
    bool isToken = false;
 | 
						|
 | 
						|
    if (((dataType == CalpontSystemCatalog::VARCHAR) && (dataWidth > 7)) ||
 | 
						|
            ((dataType == CalpontSystemCatalog::CHAR) && (dataWidth > 8)) ||
 | 
						|
            (dataType == CalpontSystemCatalog::VARBINARY) ||
 | 
						|
            (dataType == CalpontSystemCatalog::BLOB) ||
 | 
						|
            (dataType == CalpontSystemCatalog::TEXT))
 | 
						|
    {
 | 
						|
        isToken = true;
 | 
						|
    }
 | 
						|
 | 
						|
    Convertor::convertColType(dataType, newColType, isToken);
 | 
						|
 | 
						|
    if (((refColDataType == CalpontSystemCatalog::VARCHAR) && (refColWidth > 7)) ||
 | 
						|
            ((refColDataType == CalpontSystemCatalog::CHAR) && (refColWidth > 8)) ||
 | 
						|
            (refColDataType == CalpontSystemCatalog::VARBINARY) ||
 | 
						|
            (dataType == CalpontSystemCatalog::BLOB) ||
 | 
						|
            (dataType == CalpontSystemCatalog::TEXT))
 | 
						|
    {
 | 
						|
        isToken = true;
 | 
						|
    }
 | 
						|
 | 
						|
    Convertor::convertColType(refColDataType, refColType, isToken);
 | 
						|
    refColOp->setColParam(refCol, 0, refColOp->getCorrectRowWidth(refColDataType, refColWidth),
 | 
						|
                          refColDataType, refColType, (FID)refColOID, refCompressionType, dbRoot);
 | 
						|
    colOpNewCol->setColParam(newCol, 0, colOpNewCol->getCorrectRowWidth(dataType, dataWidth),
 | 
						|
                             dataType, newColType, (FID)dataOid, compressionType, dbRoot);
 | 
						|
 | 
						|
    int size = sizeof(Token);
 | 
						|
 | 
						|
    if (newColType == WriteEngine::WR_TOKEN)
 | 
						|
    {
 | 
						|
        if (isNULL)
 | 
						|
        {
 | 
						|
            Token nullToken;
 | 
						|
            memcpy(defVal.get(), &nullToken, size);
 | 
						|
        }
 | 
						|
 | 
						|
        //Tokenization is done when we create dictionary file
 | 
						|
    }
 | 
						|
    else
 | 
						|
        convertValue(newColType, defVal.get(), defaultVal.data);
 | 
						|
 | 
						|
    if (rc == NO_ERROR)
 | 
						|
        rc = colOpNewCol->fillColumn(txnid, newCol, refCol, defVal.get(), dctnry, refColOp, dictOid, dataWidth, defaultValStr, autoincrement);
 | 
						|
 | 
						|
//   colOpNewCol->clearColumn(newCol);
 | 
						|
//   colOpRefCol->clearColumn(refCol);
 | 
						|
 | 
						|
//   free(defVal);
 | 
						|
 | 
						|
// flushing files is in colOp->fillColumn()
 | 
						|
// if (rc == NO_ERROR)
 | 
						|
// rc = flushDataFiles();
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::deleteRow(const TxnID& txnid, vector<ColStructList>& colExtentsStruct, vector<void*>& colOldValueList,
 | 
						|
                                  vector<RIDList>& ridLists, const int32_t tableOid)
 | 
						|
{
 | 
						|
    ColTuple         curTuple;
 | 
						|
    ColStruct        curColStruct;
 | 
						|
    DctnryStruct     dctnryStruct;
 | 
						|
    ColValueList     colValueList;
 | 
						|
    ColTupleList     curTupleList;
 | 
						|
    DctnryStructList dctnryStructList;
 | 
						|
    DctnryValueList  dctnryValueList;
 | 
						|
    ColStructList    colStructList;
 | 
						|
    uint64_t         emptyVal;
 | 
						|
    int              rc;
 | 
						|
    string           tmpStr("");
 | 
						|
    vector<DctnryStructList> dctnryExtentsStruct;
 | 
						|
 | 
						|
    if (colExtentsStruct.size() == 0 || ridLists.size() == 0)
 | 
						|
        return ERR_STRUCT_EMPTY;
 | 
						|
 | 
						|
    // set transaction id
 | 
						|
    setTransId(txnid);
 | 
						|
    unsigned numExtents = colExtentsStruct.size();
 | 
						|
 | 
						|
    for (unsigned extent = 0; extent < numExtents; extent++)
 | 
						|
    {
 | 
						|
        colStructList = colExtentsStruct[extent];
 | 
						|
 | 
						|
        for (ColStructList::size_type i = 0; i < colStructList.size(); i++)
 | 
						|
        {
 | 
						|
            curTupleList.clear();
 | 
						|
            curColStruct = colStructList[i];
 | 
						|
            emptyVal = m_colOp[op(curColStruct.fCompressionType)]->
 | 
						|
                       getEmptyRowValue(curColStruct.colDataType, curColStruct.colWidth);
 | 
						|
 | 
						|
            curTuple.data = emptyVal;
 | 
						|
            //for (RIDList::size_type j = 0; j < ridLists[extent].size(); j++)
 | 
						|
            //    curTupleList.push_back(curTuple);
 | 
						|
            curTupleList.push_back(curTuple);
 | 
						|
            colValueList.push_back(curTupleList);
 | 
						|
 | 
						|
            dctnryStruct.dctnryOid = 0;
 | 
						|
            dctnryStruct.fColPartition = curColStruct.fColPartition;
 | 
						|
            dctnryStruct.fColSegment = curColStruct.fColSegment;
 | 
						|
            dctnryStruct.fColDbRoot = curColStruct.fColDbRoot;
 | 
						|
            dctnryStruct.columnOid = colStructList[i].dataOid;
 | 
						|
            dctnryStructList.push_back(dctnryStruct);
 | 
						|
 | 
						|
            DctnryTuple dctnryTuple;
 | 
						|
            DctColTupleList dctColTuples;
 | 
						|
            dctnryTuple.sigValue = (unsigned char*)tmpStr.c_str();
 | 
						|
            dctnryTuple.sigSize = tmpStr.length();
 | 
						|
            dctnryTuple.isNull = true;
 | 
						|
            dctColTuples.push_back (dctnryTuple);
 | 
						|
            dctnryValueList.push_back (dctColTuples);
 | 
						|
        }
 | 
						|
 | 
						|
        dctnryExtentsStruct.push_back(dctnryStructList);
 | 
						|
    }
 | 
						|
 | 
						|
    // unfortunately I don't have a better way to instruct without passing too many parameters
 | 
						|
    m_opType = DELETE;
 | 
						|
    rc = updateColumnRec(txnid, colExtentsStruct, colValueList, colOldValueList, ridLists, dctnryExtentsStruct, dctnryValueList, tableOid);
 | 
						|
    m_opType = NOOP;
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::deleteBadRows(const TxnID& txnid, ColStructList& colStructs,
 | 
						|
                                      RIDList& ridList, DctnryStructList& dctnryStructList)
 | 
						|
{
 | 
						|
    /*  Need to scan all files including dictionary store files to check whether there is any bad chunks
 | 
						|
     *
 | 
						|
     */
 | 
						|
    int rc = 0;
 | 
						|
    Column         curCol;
 | 
						|
    void*          valArray = NULL;
 | 
						|
 | 
						|
    for (unsigned i = 0; i < colStructs.size(); i++)
 | 
						|
    {
 | 
						|
        ColumnOp* colOp = m_colOp[op(colStructs[i].fCompressionType)];
 | 
						|
        unsigned needFixFiles = colStructs[i].tokenFlag ? 2 : 1;
 | 
						|
        colOp->initColumn(curCol);
 | 
						|
 | 
						|
        for (unsigned j = 0; j < needFixFiles; j++)
 | 
						|
        {
 | 
						|
            if (j == 0)
 | 
						|
            {
 | 
						|
                colOp->setColParam(curCol, 0, colStructs[i].colWidth,
 | 
						|
                                   colStructs[i].colDataType, colStructs[i].colType, colStructs[i].dataOid,
 | 
						|
                                   colStructs[i].fCompressionType, colStructs[i].fColDbRoot,
 | 
						|
                                   colStructs[i].fColPartition, colStructs[i].fColSegment);
 | 
						|
 | 
						|
                string segFile;
 | 
						|
                rc = colOp->openColumnFile(curCol, segFile, true, IO_BUFF_SIZE); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
                if (rc != NO_ERROR) //If openFile fails, disk error or header error is assumed.
 | 
						|
                {
 | 
						|
                    //report error and return.
 | 
						|
                    std::ostringstream oss;
 | 
						|
                    WErrorCodes ec;
 | 
						|
                    string err = ec.errorString(rc);
 | 
						|
                    oss << "Error opening file oid:dbroot:partition:segment = " << colStructs[i].dataOid << ":" << colStructs[i].fColDbRoot
 | 
						|
                        << ":" << colStructs[i].fColPartition << ":" << colStructs[i].fColSegment << " and error code is " << rc << " with message " << err;
 | 
						|
                    throw std::runtime_error(oss.str());
 | 
						|
                }
 | 
						|
 | 
						|
                switch (colStructs[i].colType)
 | 
						|
                {
 | 
						|
                    case WriteEngine::WR_INT:
 | 
						|
                        valArray = (int*) calloc(sizeof(int), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_UINT:
 | 
						|
                        valArray = (uint32_t*) calloc(sizeof(uint32_t), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
                    case WriteEngine::WR_CHAR:
 | 
						|
                    case WriteEngine::WR_BLOB:
 | 
						|
                    case WriteEngine::WR_TEXT:
 | 
						|
                        valArray = (char*) calloc(sizeof(char), 1 * MAX_COLUMN_BOUNDARY);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_FLOAT:
 | 
						|
                        valArray = (float*) calloc(sizeof(float), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_DOUBLE:
 | 
						|
                        valArray = (double*) calloc(sizeof(double), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_BYTE:
 | 
						|
                        valArray = (char*) calloc(sizeof(char), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_UBYTE:
 | 
						|
                        valArray = (uint8_t*) calloc(sizeof(uint8_t), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_SHORT:
 | 
						|
                        valArray = (short*) calloc(sizeof(short), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_USHORT:
 | 
						|
                        valArray = (uint16_t*) calloc(sizeof(uint16_t), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_LONGLONG:
 | 
						|
                        valArray = (long long*) calloc(sizeof(long long), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_ULONGLONG:
 | 
						|
                        valArray = (uint64_t*) calloc(sizeof(uint64_t), 1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_TOKEN:
 | 
						|
                        valArray = (Token*) calloc(sizeof(Token), 1);
 | 
						|
                        break;
 | 
						|
                }
 | 
						|
 | 
						|
                rc = colOp->writeRows(curCol, ridList.size(), ridList, valArray, 0, true);
 | 
						|
 | 
						|
                if ( rc != NO_ERROR)
 | 
						|
                {
 | 
						|
                    //read error is fixed in place
 | 
						|
                    if (rc == ERR_COMP_COMPRESS) //write error
 | 
						|
                    {
 | 
						|
 | 
						|
                    }
 | 
						|
 | 
						|
                }
 | 
						|
 | 
						|
                //flush files will be done in the end of fix.
 | 
						|
                colOp->clearColumn(curCol);
 | 
						|
 | 
						|
                if (valArray != NULL)
 | 
						|
                    free(valArray);
 | 
						|
            }
 | 
						|
            else //dictionary file. How to fix
 | 
						|
            {
 | 
						|
                //read headers out, uncompress the last chunk, if error, replace it with empty chunk.
 | 
						|
                Dctnry* dctnry = m_dctnry[op(dctnryStructList[i].fCompressionType)];
 | 
						|
                rc = dctnry->openDctnry(dctnryStructList[i].dctnryOid,
 | 
						|
                                        dctnryStructList[i].fColDbRoot, dctnryStructList[i].fColPartition,
 | 
						|
                                        dctnryStructList[i].fColSegment,
 | 
						|
                                        false);
 | 
						|
 | 
						|
                rc =  dctnry->checkFixLastDictChunk();
 | 
						|
                rc = dctnry->closeDctnry(true);
 | 
						|
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
/*@flushVMCache - Flush VM cache
 | 
						|
*/
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Flush sytem VM cache
 | 
						|
 * PARAMETERS:
 | 
						|
 *    none
 | 
						|
 * RETURN:
 | 
						|
 *    none
 | 
						|
 ***********************************************************/
 | 
						|
void WriteEngineWrapper::flushVMCache() const
 | 
						|
{
 | 
						|
//      int fd = open("/proc/sys/vm/drop_caches", O_WRONLY);
 | 
						|
//      write(fd, "3", 1);
 | 
						|
//      close(fd);
 | 
						|
 | 
						|
}
 | 
						|
 | 
						|
/*@insertColumnRecs -  Insert value(s) into a column
 | 
						|
*/
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Insert values into  columns (batchinsert)
 | 
						|
 * PARAMETERS:
 | 
						|
 *    colStructList - column struct list
 | 
						|
 *    colValueList - column value list
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if success
 | 
						|
 *    others if something wrong in inserting the value
 | 
						|
 ***********************************************************/
 | 
						|
 | 
						|
int WriteEngineWrapper::insertColumnRecs(const TxnID& txnid,
 | 
						|
        ColStructList& colStructList,
 | 
						|
        ColValueList& colValueList,
 | 
						|
        DctnryStructList& dctnryStructList,
 | 
						|
        DictStrList& dictStrList,
 | 
						|
        std::vector<boost::shared_ptr<DBRootExtentTracker> >& dbRootExtentTrackers,
 | 
						|
        RBMetaWriter* fRBMetaWriter,
 | 
						|
        bool bFirstExtentOnThisPM,
 | 
						|
        bool insertSelect,
 | 
						|
        bool isAutoCommitOn,
 | 
						|
        OID tableOid,
 | 
						|
        bool isFirstBatchPm)
 | 
						|
{
 | 
						|
    int            rc;
 | 
						|
    RID*           rowIdArray = NULL;
 | 
						|
    ColTupleList   curTupleList;
 | 
						|
    Column         curCol;
 | 
						|
    ColStruct      curColStruct;
 | 
						|
    ColValueList   colOldValueList;
 | 
						|
    ColValueList   colNewValueList;
 | 
						|
    ColStructList  newColStructList;
 | 
						|
    DctnryStructList newDctnryStructList;
 | 
						|
    HWM            hwm = 0;
 | 
						|
    HWM            oldHwm = 0;
 | 
						|
    HWM    		  newHwm = 0;
 | 
						|
    ColTupleList::size_type totalRow;
 | 
						|
    ColStructList::size_type totalColumns;
 | 
						|
    uint64_t rowsLeft = 0;
 | 
						|
    bool newExtent = false;
 | 
						|
    RIDList ridList;
 | 
						|
    ColumnOp* colOp = NULL;
 | 
						|
 | 
						|
    // Set tmp file suffix to modify HDFS db file
 | 
						|
    bool           useTmpSuffix = false;
 | 
						|
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
    {
 | 
						|
        if (!bFirstExtentOnThisPM)
 | 
						|
            useTmpSuffix = true;
 | 
						|
    }
 | 
						|
 | 
						|
    unsigned i = 0;
 | 
						|
#ifdef PROFILE
 | 
						|
    StopWatch timer;
 | 
						|
#endif
 | 
						|
 | 
						|
    // debug information for testing
 | 
						|
    if (isDebug(DEBUG_2))
 | 
						|
    {
 | 
						|
        printf("\nIn wrapper insert\n");
 | 
						|
        printInputValue(colStructList, colValueList, ridList);
 | 
						|
    }
 | 
						|
 | 
						|
    // end
 | 
						|
 | 
						|
    //Convert data type and column width to write engine specific
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
        Convertor::convertColType(&colStructList[i]);
 | 
						|
 | 
						|
    uint32_t colId = 0;
 | 
						|
    // MCOL-1675: find the smallest column width to calculate the RowID from so
 | 
						|
    // that all HWMs will be incremented by this operation
 | 
						|
    findSmallestColumn(colId, colStructList);
 | 
						|
 | 
						|
    // rc = checkValid(txnid, colStructList, colValueList, ridList);
 | 
						|
    // if (rc != NO_ERROR)
 | 
						|
    //   return rc;
 | 
						|
 | 
						|
    setTransId(txnid);
 | 
						|
    uint16_t  dbRoot, segmentNum;
 | 
						|
    uint32_t partitionNum;
 | 
						|
    string    segFile;
 | 
						|
    bool newFile;
 | 
						|
    TableMetaData* tableMetaData = TableMetaData::makeTableMetaData(tableOid);
 | 
						|
    //populate colStructList with file information
 | 
						|
    IDBDataFile* pFile = NULL;
 | 
						|
    std::vector<DBRootExtentInfo> extentInfo;
 | 
						|
    int currentDBrootIdx = 0;
 | 
						|
    std::vector<BRM::CreateStripeColumnExtentsArgOut> extents;
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // For first batch on this PM:
 | 
						|
    //   o get starting extent from ExtentTracker, and allocate extent if needed
 | 
						|
    //   o construct colStructList and dctnryStructList accordingly
 | 
						|
    //   o save extent information in tableMetaData for future use
 | 
						|
    // If not first batch on this PM:
 | 
						|
    //   o construct colStructList and dctnryStructList from tableMetaData
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    if (isFirstBatchPm)
 | 
						|
    {
 | 
						|
		currentDBrootIdx = dbRootExtentTrackers[colId]->getCurrentDBRootIdx();
 | 
						|
		extentInfo = dbRootExtentTrackers[colId]->getDBRootExtentList();
 | 
						|
        dbRoot = extentInfo[currentDBrootIdx].fDbRoot;
 | 
						|
        partitionNum = extentInfo[currentDBrootIdx].fPartition;
 | 
						|
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        // check whether this extent is the first on this PM
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        if (bFirstExtentOnThisPM)
 | 
						|
        {
 | 
						|
            //cout << "bFirstExtentOnThisPM is " << bFirstExtentOnThisPM << endl;
 | 
						|
            std::vector<BRM::CreateStripeColumnExtentsArgIn> cols;
 | 
						|
            BRM::CreateStripeColumnExtentsArgIn createStripeColumnExtentsArgIn;
 | 
						|
 | 
						|
            for (i = 0; i < colStructList.size(); i++)
 | 
						|
            {
 | 
						|
                createStripeColumnExtentsArgIn.oid = colStructList[i].dataOid;
 | 
						|
                createStripeColumnExtentsArgIn.width = colStructList[i].colWidth;
 | 
						|
                createStripeColumnExtentsArgIn.colDataType = colStructList[i].colDataType;
 | 
						|
                cols.push_back(createStripeColumnExtentsArgIn);
 | 
						|
            }
 | 
						|
 | 
						|
            rc = BRMWrapper::getInstance()->allocateStripeColExtents(cols, dbRoot, partitionNum, segmentNum, extents);
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                return rc;
 | 
						|
 | 
						|
            //Create column files
 | 
						|
            BRM::CPInfoList_t cpinfoList;
 | 
						|
            BRM::CPInfo cpInfo;
 | 
						|
 | 
						|
            if (isUnsigned(colStructList[i].colDataType))
 | 
						|
            {
 | 
						|
                cpInfo.max = 0;
 | 
						|
                cpInfo.min = static_cast<int64_t>(numeric_limits<uint64_t>::max());
 | 
						|
            }
 | 
						|
            else
 | 
						|
            {
 | 
						|
                cpInfo.max = numeric_limits<int64_t>::min();
 | 
						|
                cpInfo.min = numeric_limits<int64_t>::max();
 | 
						|
            }
 | 
						|
 | 
						|
            cpInfo.seqNum = -1;
 | 
						|
 | 
						|
            for ( i = 0; i < extents.size(); i++)
 | 
						|
            {
 | 
						|
                colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
                colOp->initColumn(curCol);
 | 
						|
				colOp->setColParam(curCol, colId, colStructList[i].colWidth, colStructList[i].colDataType,
 | 
						|
                                   colStructList[i].colType, colStructList[i].dataOid, colStructList[i].fCompressionType,
 | 
						|
                                   dbRoot, partitionNum, segmentNum);
 | 
						|
                rc = colOp->extendColumn(curCol, false, extents[i].startBlkOffset, extents[i].startLbid, extents[i].allocSize, dbRoot,
 | 
						|
                                         partitionNum, segmentNum, segFile, pFile, newFile);
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
 | 
						|
                //mark the extents to invalid
 | 
						|
                cpInfo.firstLbid = extents[i].startLbid;
 | 
						|
                cpinfoList.push_back(cpInfo);
 | 
						|
                colStructList[i].fColPartition = partitionNum;
 | 
						|
                colStructList[i].fColSegment = segmentNum;
 | 
						|
                colStructList[i].fColDbRoot = dbRoot;
 | 
						|
                dctnryStructList[i].fColPartition = partitionNum;
 | 
						|
                dctnryStructList[i].fColSegment = segmentNum;
 | 
						|
                dctnryStructList[i].fColDbRoot = dbRoot;
 | 
						|
            }
 | 
						|
 | 
						|
            //mark the extents to invalid
 | 
						|
            rc = BRMWrapper::getInstance()->setExtentsMaxMin(cpinfoList);
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                return rc;
 | 
						|
 | 
						|
            //create corresponding dictionary files
 | 
						|
            for (i = 0; i < dctnryStructList.size(); i++)
 | 
						|
            {
 | 
						|
                if (dctnryStructList[i].dctnryOid > 0)
 | 
						|
                {
 | 
						|
                    rc = createDctnry(txnid, dctnryStructList[i].dctnryOid, dctnryStructList[i].colWidth, dbRoot, partitionNum,
 | 
						|
                                      segmentNum, dctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                    if ( rc != NO_ERROR)
 | 
						|
                        return rc;
 | 
						|
                }
 | 
						|
            }
 | 
						|
        }    // if ( bFirstExtentOnThisPM)
 | 
						|
        else // if (!bFirstExtentOnThisPM)
 | 
						|
        {
 | 
						|
            std::vector<DBRootExtentInfo> tmpExtentInfo;
 | 
						|
 | 
						|
            for (i = 0; i < dbRootExtentTrackers.size(); i++)
 | 
						|
            {
 | 
						|
                tmpExtentInfo = dbRootExtentTrackers[i]->getDBRootExtentList();
 | 
						|
                colStructList[i].fColPartition =  tmpExtentInfo[currentDBrootIdx].fPartition;
 | 
						|
                colStructList[i].fColSegment = tmpExtentInfo[currentDBrootIdx].fSegment;
 | 
						|
                colStructList[i].fColDbRoot = tmpExtentInfo[currentDBrootIdx].fDbRoot;
 | 
						|
                //cout << "Load from dbrootExtenttracker oid:dbroot:part:seg = " <<colStructList[i].dataOid<<":"
 | 
						|
                //<<colStructList[i].fColDbRoot<<":"<<colStructList[i].fColPartition<<":"<<colStructList[i].fColSegment<<endl;
 | 
						|
                dctnryStructList[i].fColPartition = tmpExtentInfo[currentDBrootIdx].fPartition;
 | 
						|
                dctnryStructList[i].fColSegment = tmpExtentInfo[currentDBrootIdx].fSegment;
 | 
						|
                dctnryStructList[i].fColDbRoot = tmpExtentInfo[currentDBrootIdx].fDbRoot;
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        // Save the extents info in tableMetaData
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        for (i = 0; i < colStructList.size(); i++)
 | 
						|
        {
 | 
						|
            ColExtsInfo aColExtsInfo = tableMetaData->getColExtsInfo(colStructList[i].dataOid);
 | 
						|
            ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            while (it != aColExtsInfo.end())
 | 
						|
            {
 | 
						|
                if ((it->dbRoot == colStructList[i].fColDbRoot) && (it->partNum == colStructList[i].fColPartition) && (it->segNum == colStructList[i].fColSegment))
 | 
						|
                    break;
 | 
						|
 | 
						|
                it++;
 | 
						|
            }
 | 
						|
 | 
						|
            if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
            {
 | 
						|
                ColExtInfo aExt;
 | 
						|
                aExt.dbRoot = colStructList[i].fColDbRoot;
 | 
						|
                aExt.partNum = colStructList[i].fColPartition;
 | 
						|
                aExt.segNum = colStructList[i].fColSegment;
 | 
						|
                aExt.compType = colStructList[i].fCompressionType;
 | 
						|
                aExt.isDict = false;
 | 
						|
 | 
						|
                if (bFirstExtentOnThisPM)
 | 
						|
                {
 | 
						|
                    aExt.hwm = extents[i].startBlkOffset;
 | 
						|
                    aExt.isNewExt = true;
 | 
						|
                    //cout << "adding a ext to metadata" << endl;
 | 
						|
                }
 | 
						|
                else
 | 
						|
                {
 | 
						|
                    std::vector<DBRootExtentInfo> tmpExtentInfo;
 | 
						|
                    tmpExtentInfo = dbRootExtentTrackers[i]->getDBRootExtentList();
 | 
						|
                    aExt.isNewExt = false;
 | 
						|
                    aExt.hwm = tmpExtentInfo[currentDBrootIdx].fLocalHwm;
 | 
						|
                    //cout << "oid " << colStructList[i].dataOid << " gets hwm " << aExt.hwm << endl;
 | 
						|
                }
 | 
						|
 | 
						|
                aExt.current = true;
 | 
						|
                aColExtsInfo.push_back(aExt);
 | 
						|
                //cout << "get from extentinfo oid:hwm = " << colStructList[i].dataOid << ":" << aExt.hwm << endl;
 | 
						|
            }
 | 
						|
 | 
						|
            tableMetaData->setColExtsInfo(colStructList[i].dataOid, aColExtsInfo);
 | 
						|
        }
 | 
						|
 | 
						|
        for (i = 0; i < dctnryStructList.size(); i++)
 | 
						|
        {
 | 
						|
            if (dctnryStructList[i].dctnryOid > 0)
 | 
						|
            {
 | 
						|
                ColExtsInfo aColExtsInfo = tableMetaData->getColExtsInfo(dctnryStructList[i].dctnryOid);
 | 
						|
                ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
                while (it != aColExtsInfo.end())
 | 
						|
                {
 | 
						|
                    if ((it->dbRoot == dctnryStructList[i].fColDbRoot) && (it->partNum == dctnryStructList[i].fColPartition) && (it->segNum == dctnryStructList[i].fColSegment))
 | 
						|
                        break;
 | 
						|
 | 
						|
                    it++;
 | 
						|
                }
 | 
						|
 | 
						|
                if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
                {
 | 
						|
                    ColExtInfo aExt;
 | 
						|
                    aExt.dbRoot = dctnryStructList[i].fColDbRoot;
 | 
						|
                    aExt.partNum = dctnryStructList[i].fColPartition;
 | 
						|
                    aExt.segNum = dctnryStructList[i].fColSegment;
 | 
						|
                    aExt.compType = dctnryStructList[i].fCompressionType;
 | 
						|
                    aExt.isDict = true;
 | 
						|
                    aColExtsInfo.push_back(aExt);
 | 
						|
                }
 | 
						|
 | 
						|
                tableMetaData->setColExtsInfo(dctnryStructList[i].dctnryOid, aColExtsInfo);
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
    } // if (isFirstBatchPm)
 | 
						|
    else //get the extent info from tableMetaData
 | 
						|
    {
 | 
						|
        ColExtsInfo aColExtsInfo = tableMetaData->getColExtsInfo(colStructList[colId].dataOid);
 | 
						|
        ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
        while (it != aColExtsInfo.end())
 | 
						|
        {
 | 
						|
            if (it->current)
 | 
						|
                break;
 | 
						|
 | 
						|
            it++;
 | 
						|
        }
 | 
						|
 | 
						|
        if (it == aColExtsInfo.end())
 | 
						|
            return 1;
 | 
						|
 | 
						|
        for (i = 0; i < colStructList.size(); i++)
 | 
						|
        {
 | 
						|
            colStructList[i].fColPartition = it->partNum;
 | 
						|
            colStructList[i].fColSegment = it->segNum;
 | 
						|
            colStructList[i].fColDbRoot = it->dbRoot;
 | 
						|
            dctnryStructList[i].fColPartition = it->partNum;
 | 
						|
            dctnryStructList[i].fColSegment = it->segNum;
 | 
						|
            dctnryStructList[i].fColDbRoot = it->dbRoot;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    curTupleList = static_cast<ColTupleList>(colValueList[0]);
 | 
						|
    totalRow = curTupleList.size();
 | 
						|
    totalColumns = colStructList.size();
 | 
						|
    rowIdArray = new RID[totalRow];
 | 
						|
    // use scoped_array to ensure ptr deletion regardless of where we return
 | 
						|
    boost::scoped_array<RID> rowIdArrayPtr(rowIdArray);
 | 
						|
    memset(rowIdArray, 0, (sizeof(RID)*totalRow));
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // allocate row id(s)
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
   curColStruct = colStructList[colId];
 | 
						|
    colOp = m_colOp[op(curColStruct.fCompressionType)];
 | 
						|
 | 
						|
    colOp->initColumn(curCol);
 | 
						|
 | 
						|
    //Get the correct segment, partition, column file
 | 
						|
    vector<ExtentInfo> colExtentInfo; //Save those empty extents in case of failure to rollback
 | 
						|
    vector<ExtentInfo> dictExtentInfo; //Save those empty extents in case of failure to rollback
 | 
						|
    vector<ExtentInfo> fileInfo;
 | 
						|
    dbRoot = curColStruct.fColDbRoot;
 | 
						|
    //use the first column to calculate row id
 | 
						|
   ColExtsInfo aColExtsInfo = tableMetaData->getColExtsInfo(colStructList[colId].dataOid);
 | 
						|
    ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
    while (it != aColExtsInfo.end())
 | 
						|
    {
 | 
						|
		if ((it->dbRoot == colStructList[colId].fColDbRoot) && 
 | 
						|
            (it->partNum == colStructList[colId].fColPartition) && 
 | 
						|
            (it->segNum == colStructList[colId].fColSegment) && it->current )
 | 
						|
        {
 | 
						|
            break;
 | 
						|
        }
 | 
						|
        it++;
 | 
						|
    }
 | 
						|
 | 
						|
    if (it != aColExtsInfo.end())
 | 
						|
    {
 | 
						|
        hwm = it->hwm;
 | 
						|
		//cout << "Got from colextinfo hwm for oid " << colStructList[colId].dataOid << " is " << hwm << " and seg is " << colStructList[0].fColSegment << endl;
 | 
						|
    }
 | 
						|
 | 
						|
    oldHwm = hwm; //Save this info for rollback
 | 
						|
    //need to pass real dbRoot, partition, and segment to setColParam
 | 
						|
   colOp->setColParam(curCol, colId, curColStruct.colWidth, curColStruct.colDataType,
 | 
						|
                       curColStruct.colType, curColStruct.dataOid, curColStruct.fCompressionType,
 | 
						|
                       curColStruct.fColDbRoot, curColStruct.fColPartition, curColStruct.fColSegment);
 | 
						|
    rc = colOp->openColumnFile(curCol, segFile, useTmpSuffix); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
    {
 | 
						|
        return rc;
 | 
						|
    }
 | 
						|
 | 
						|
    //get hwm first
 | 
						|
    // @bug 286 : fix for bug 286 - correct the typo in getHWM
 | 
						|
    //RETURN_ON_ERROR(BRMWrapper::getInstance()->getHWM(curColStruct.dataOid, hwm));
 | 
						|
 | 
						|
    Column newCol;
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.start("allocRowId");
 | 
						|
#endif
 | 
						|
    newColStructList = colStructList;
 | 
						|
    newDctnryStructList = dctnryStructList;
 | 
						|
    bool bUseStartExtent = true;
 | 
						|
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
        insertSelect = true;
 | 
						|
 | 
						|
    rc = colOp->allocRowId(txnid, bUseStartExtent,
 | 
						|
                           curCol, (uint64_t)totalRow, rowIdArray, hwm, newExtent, rowsLeft, newHwm, newFile,
 | 
						|
                           newColStructList, newDctnryStructList, dbRootExtentTrackers, insertSelect, true, tableOid, isFirstBatchPm);
 | 
						|
 | 
						|
    //cout << "after allocrowid, total row = " <<totalRow << " newExtent is " << newExtent << endl; 
 | 
						|
    //cout << "column oid " << curColStruct.dataOid << " has hwm:newHwm = " << hwm <<":" << newHwm<< endl;
 | 
						|
    if (rc != NO_ERROR) //Clean up is already done
 | 
						|
        return rc;
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.stop("allocRowId");
 | 
						|
#endif
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Expand initial abbreviated extent if any RID in 1st extent is > 256K.
 | 
						|
    // if totalRow == rowsLeft, then not adding rows to 1st extent, so skip it.
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // DMC-SHARED_NOTHING_NOTE: Is it safe to assume only part0 seg0 is abbreviated?
 | 
						|
    if ((curCol.dataFile.fPartition == 0) &&
 | 
						|
            (curCol.dataFile.fSegment   == 0) &&
 | 
						|
            ((totalRow - rowsLeft) > 0) &&
 | 
						|
            (rowIdArray[totalRow - rowsLeft - 1] >= (RID)INITIAL_EXTENT_ROWS_TO_DISK))
 | 
						|
    {
 | 
						|
       for (unsigned k=0; k<colStructList.size(); k++)
 | 
						|
        {
 | 
						|
           // Skip the selected column
 | 
						|
           if (k == colId)
 | 
						|
               continue;
 | 
						|
            Column expandCol;
 | 
						|
            colOp = m_colOp[op(colStructList[k].fCompressionType)];
 | 
						|
            colOp->setColParam(expandCol, 0,
 | 
						|
                               colStructList[k].colWidth,
 | 
						|
                               colStructList[k].colDataType,
 | 
						|
                               colStructList[k].colType,
 | 
						|
                               colStructList[k].dataOid,
 | 
						|
                               colStructList[k].fCompressionType,
 | 
						|
                               colStructList[k].fColDbRoot,
 | 
						|
                               colStructList[k].fColPartition,
 | 
						|
                               colStructList[k].fColSegment);
 | 
						|
            rc = colOp->openColumnFile(expandCol, segFile, true); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc == NO_ERROR)
 | 
						|
            {
 | 
						|
                if (colOp->abbreviatedExtent(expandCol.dataFile.pFile, colStructList[k].colWidth))
 | 
						|
                {
 | 
						|
                    rc = colOp->expandAbbrevExtent(expandCol);
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
            {
 | 
						|
                return rc;
 | 
						|
            }
 | 
						|
 | 
						|
            colOp->clearColumn(expandCol); // closes the file (if uncompressed)
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Tokenize data if needed
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    if (insertSelect && isAutoCommitOn)
 | 
						|
        BRMWrapper::setUseVb( false );
 | 
						|
    else
 | 
						|
        BRMWrapper::setUseVb( true );
 | 
						|
 | 
						|
    dictStr::iterator dctStr_iter;
 | 
						|
    ColTupleList::iterator col_iter;
 | 
						|
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
    {
 | 
						|
        if (colStructList[i].tokenFlag)
 | 
						|
        {
 | 
						|
            dctStr_iter = dictStrList[i].begin();
 | 
						|
            col_iter = colValueList[i].begin();
 | 
						|
            Dctnry* dctnry = m_dctnry[op(dctnryStructList[i].fCompressionType)];
 | 
						|
            rc = dctnry->openDctnry(dctnryStructList[i].dctnryOid,
 | 
						|
                                    dctnryStructList[i].fColDbRoot, dctnryStructList[i].fColPartition,
 | 
						|
                                    dctnryStructList[i].fColSegment,
 | 
						|
                                    useTmpSuffix); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
            {
 | 
						|
                cout << "Error opening dctnry file " << dctnryStructList[i].dctnryOid << endl;
 | 
						|
                return rc;
 | 
						|
            }
 | 
						|
 | 
						|
            for (uint32_t     rows = 0; rows < (totalRow - rowsLeft); rows++)
 | 
						|
            {
 | 
						|
                if (dctStr_iter->length() == 0)
 | 
						|
                {
 | 
						|
                    Token nullToken;
 | 
						|
                    col_iter->data = nullToken;
 | 
						|
                }
 | 
						|
                else
 | 
						|
                {
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.start("tokenize");
 | 
						|
#endif
 | 
						|
                    DctnryTuple dctTuple;
 | 
						|
                    dctTuple.sigValue = (unsigned char*)dctStr_iter->c_str();
 | 
						|
                    dctTuple.sigSize = dctStr_iter->length();
 | 
						|
                    dctTuple.isNull = false;
 | 
						|
                    rc = tokenize(txnid, dctTuple, dctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                    if (rc != NO_ERROR)
 | 
						|
                    {
 | 
						|
                        dctnry->closeDctnry();
 | 
						|
                        return rc;
 | 
						|
                    }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.stop("tokenize");
 | 
						|
#endif
 | 
						|
                    col_iter->data = dctTuple.token;
 | 
						|
                }
 | 
						|
 | 
						|
                dctStr_iter++;
 | 
						|
                col_iter++;
 | 
						|
 | 
						|
            }
 | 
						|
 | 
						|
            //close dictionary files
 | 
						|
            rc = dctnry->closeDctnry(false);
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                return rc;
 | 
						|
 | 
						|
            if (newExtent)
 | 
						|
            {
 | 
						|
                //@Bug 4854 back up hwm chunk for the file to be modified
 | 
						|
                if (fRBMetaWriter)
 | 
						|
                    fRBMetaWriter->backupDctnryHWMChunk(newDctnryStructList[i].dctnryOid, newDctnryStructList[i].fColDbRoot, newDctnryStructList[i].fColPartition, newDctnryStructList[i].fColSegment);
 | 
						|
 | 
						|
                rc = dctnry->openDctnry(newDctnryStructList[i].dctnryOid,
 | 
						|
                                        newDctnryStructList[i].fColDbRoot, newDctnryStructList[i].fColPartition,
 | 
						|
                                        newDctnryStructList[i].fColSegment,
 | 
						|
                                        false); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
 | 
						|
                for (uint32_t     rows = 0; rows < rowsLeft; rows++)
 | 
						|
                {
 | 
						|
                    if (dctStr_iter->length() == 0)
 | 
						|
                    {
 | 
						|
                        Token nullToken;
 | 
						|
                        col_iter->data = nullToken;
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.start("tokenize");
 | 
						|
#endif
 | 
						|
                        DctnryTuple dctTuple;
 | 
						|
                        dctTuple.sigValue = (unsigned char*)dctStr_iter->c_str();
 | 
						|
                        dctTuple.sigSize = dctStr_iter->length();
 | 
						|
                        dctTuple.isNull = false;
 | 
						|
                        rc = tokenize(txnid, dctTuple, newDctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                        if (rc != NO_ERROR)
 | 
						|
                        {
 | 
						|
                            dctnry->closeDctnry();
 | 
						|
                            return rc;
 | 
						|
                        }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.stop("tokenize");
 | 
						|
#endif
 | 
						|
                        col_iter->data = dctTuple.token;
 | 
						|
                    }
 | 
						|
 | 
						|
                    dctStr_iter++;
 | 
						|
                    col_iter++;
 | 
						|
                }
 | 
						|
 | 
						|
                //close dictionary files
 | 
						|
                rc = dctnry->closeDctnry(false);
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    if (insertSelect && isAutoCommitOn)
 | 
						|
        BRMWrapper::setUseVb( false );
 | 
						|
    else
 | 
						|
        BRMWrapper::setUseVb( true );
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Update column info structure @Bug 1862 set hwm, and
 | 
						|
    // Prepare ValueList for new extent (if applicable)
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    //@Bug 2205 Check whether all rows go to the new extent
 | 
						|
    RID lastRid = 0;
 | 
						|
    RID lastRidNew = 0;
 | 
						|
 | 
						|
    if (totalRow - rowsLeft > 0)
 | 
						|
    {
 | 
						|
        lastRid = rowIdArray[totalRow - rowsLeft - 1];
 | 
						|
        lastRidNew = rowIdArray[totalRow - 1];
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        lastRid = 0;
 | 
						|
        lastRidNew = rowIdArray[totalRow - 1];
 | 
						|
    }
 | 
						|
 | 
						|
    //cout << "rowid allocated is "  << lastRid << endl;
 | 
						|
    //if a new extent is created, all the columns in this table should have their own new extent
 | 
						|
    //First column already processed
 | 
						|
 | 
						|
    //@Bug 1701. Close the file (if uncompressed)
 | 
						|
    m_colOp[op(curCol.compressionType)]->clearColumn(curCol);
 | 
						|
    //cout << "Saving hwm info for new ext batch" << endl;
 | 
						|
    //Update hwm to set them in the end
 | 
						|
    bool succFlag = false;
 | 
						|
    unsigned colWidth = 0;
 | 
						|
    int      curFbo = 0, curBio;
 | 
						|
 | 
						|
    for (i = 0; i < totalColumns; i++)
 | 
						|
    {
 | 
						|
        //shoud be obtained from saved hwm
 | 
						|
        aColExtsInfo = tableMetaData->getColExtsInfo(colStructList[i].dataOid);
 | 
						|
        it = aColExtsInfo.begin();
 | 
						|
 | 
						|
        while (it != aColExtsInfo.end())
 | 
						|
        {
 | 
						|
            if ((it->dbRoot == colStructList[i].fColDbRoot) && (it->partNum == colStructList[i].fColPartition)
 | 
						|
                    && (it->segNum == colStructList[i].fColSegment) && it->current)
 | 
						|
                break;
 | 
						|
 | 
						|
            it++;
 | 
						|
        }
 | 
						|
 | 
						|
        if (it != aColExtsInfo.end()) //update hwm info
 | 
						|
        {
 | 
						|
            oldHwm = it->hwm;
 | 
						|
        }
 | 
						|
 | 
						|
        // save hwm for the old extent
 | 
						|
        colWidth = colStructList[i].colWidth;
 | 
						|
        succFlag = colOp->calculateRowId(lastRid, BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
        //cout << "insertcolumnrec   oid:rid:fbo:oldhwm = " << colStructList[i].dataOid << ":" << lastRid << ":" << curFbo << ":" << oldHwm << endl;
 | 
						|
        if (succFlag)
 | 
						|
        {
 | 
						|
            if ((HWM)curFbo >= oldHwm)
 | 
						|
            {
 | 
						|
                it->hwm = (HWM)curFbo;
 | 
						|
            }
 | 
						|
 | 
						|
            //@Bug 4947. set current to false for old extent.
 | 
						|
            if (newExtent)
 | 
						|
            {
 | 
						|
                it->current = false;
 | 
						|
            }
 | 
						|
 | 
						|
            //cout << "updated old ext info for oid " << colStructList[i].dataOid << " dbroot:part:seg:hwm:current = "
 | 
						|
            //<< it->dbRoot<<":"<<it->partNum<<":"<<it->segNum<<":"<<it->hwm<<":"<< it->current<< " and newExtent is " << newExtent << endl;
 | 
						|
        }
 | 
						|
        else
 | 
						|
            return ERR_INVALID_PARAM;
 | 
						|
 | 
						|
        //update hwm for the new extent
 | 
						|
        if (newExtent)
 | 
						|
        {
 | 
						|
            it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            while (it != aColExtsInfo.end())
 | 
						|
            {
 | 
						|
                if ((it->dbRoot == newColStructList[i].fColDbRoot) && (it->partNum == newColStructList[i].fColPartition)
 | 
						|
                        && (it->segNum == newColStructList[i].fColSegment) && it->current)
 | 
						|
                    break;
 | 
						|
 | 
						|
                it++;
 | 
						|
            }
 | 
						|
 | 
						|
            succFlag = colOp->calculateRowId(lastRidNew, BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            if (succFlag)
 | 
						|
            {
 | 
						|
                if (it != aColExtsInfo.end())
 | 
						|
                {
 | 
						|
                    it->hwm = (HWM)curFbo;
 | 
						|
                    //cout << "setting hwm to " << (int)curFbo <<" for seg " <<it->segNum << endl;
 | 
						|
                    it->current = true;
 | 
						|
                }
 | 
						|
            }
 | 
						|
            else
 | 
						|
                return ERR_INVALID_PARAM;
 | 
						|
        }
 | 
						|
 | 
						|
        tableMetaData->setColExtsInfo(colStructList[i].dataOid, aColExtsInfo);
 | 
						|
    }
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    //Prepare the valuelist for the new extent
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    ColTupleList colTupleList;
 | 
						|
    ColTupleList newColTupleList;
 | 
						|
    ColTupleList firstPartTupleList;
 | 
						|
 | 
						|
    for (unsigned i = 0; i < totalColumns; i++)
 | 
						|
    {
 | 
						|
        colTupleList = static_cast<ColTupleList>(colValueList[i]);
 | 
						|
 | 
						|
        for (uint64_t j = rowsLeft; j > 0; j--)
 | 
						|
        {
 | 
						|
            newColTupleList.push_back(colTupleList[totalRow - j]);
 | 
						|
        }
 | 
						|
 | 
						|
        colNewValueList.push_back(newColTupleList);
 | 
						|
        newColTupleList.clear();
 | 
						|
 | 
						|
        //upate the oldvalue list for the old extent
 | 
						|
        for (uint64_t j = 0; j < (totalRow - rowsLeft); j++)
 | 
						|
        {
 | 
						|
            firstPartTupleList.push_back(colTupleList[j]);
 | 
						|
        }
 | 
						|
 | 
						|
        colOldValueList.push_back(firstPartTupleList);
 | 
						|
        firstPartTupleList.clear();
 | 
						|
    }
 | 
						|
 | 
						|
    // end of allocate row id
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.start("writeColumnRec");
 | 
						|
#endif
 | 
						|
//cout << "Writing column record" << endl;
 | 
						|
 | 
						|
    if (rc == NO_ERROR)
 | 
						|
    {
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        //Mark extents invalid
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        vector<BRM::LBID_t> lbids;
 | 
						|
        vector<CalpontSystemCatalog::ColDataType> colDataTypes;
 | 
						|
        bool successFlag = true;
 | 
						|
        unsigned width = 0;
 | 
						|
        int         curFbo = 0, curBio, lastFbo = -1;
 | 
						|
 | 
						|
        if (isFirstBatchPm && (totalRow == rowsLeft))
 | 
						|
        {}
 | 
						|
        else
 | 
						|
        {
 | 
						|
            for (unsigned i = 0; i < colStructList.size(); i++)
 | 
						|
            {
 | 
						|
                colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
                width = colStructList[i].colWidth;
 | 
						|
                successFlag = colOp->calculateRowId(lastRid, BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
                if (successFlag)
 | 
						|
                {
 | 
						|
                    if (curFbo != lastFbo)
 | 
						|
                    {
 | 
						|
                        RETURN_ON_ERROR(AddLBIDtoList(txnid,
 | 
						|
                                                      lbids,
 | 
						|
                                                      colDataTypes,
 | 
						|
                                                      colStructList[i],
 | 
						|
                                                      curFbo));
 | 
						|
                    }
 | 
						|
                }
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        if (lbids.size() > 0)
 | 
						|
            rc = BRMWrapper::getInstance()->markExtentsInvalid(lbids, colDataTypes);
 | 
						|
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        // Write row(s) to database file(s)
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        rc = writeColumnRec(txnid, colStructList, colOldValueList, rowIdArray, newColStructList, colNewValueList, tableOid, useTmpSuffix); // @bug 5572 HDFS tmp file
 | 
						|
    }
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::insertColumnRecsBinary(const TxnID& txnid,
 | 
						|
        ColStructList& colStructList,
 | 
						|
        std::vector<uint64_t>& colValueList,
 | 
						|
        DctnryStructList& dctnryStructList,
 | 
						|
        DictStrList& dictStrList,
 | 
						|
        std::vector<boost::shared_ptr<DBRootExtentTracker> >& dbRootExtentTrackers,
 | 
						|
        RBMetaWriter* fRBMetaWriter,
 | 
						|
        bool bFirstExtentOnThisPM,
 | 
						|
        bool insertSelect,
 | 
						|
        bool isAutoCommitOn,
 | 
						|
        OID tableOid,
 | 
						|
        bool isFirstBatchPm)
 | 
						|
{
 | 
						|
    int            rc;
 | 
						|
    RID*           rowIdArray = NULL;
 | 
						|
    Column         curCol;
 | 
						|
    ColStruct      curColStruct;
 | 
						|
    ColStructList  newColStructList;
 | 
						|
    std::vector<uint64_t> colNewValueList;
 | 
						|
    DctnryStructList newDctnryStructList;
 | 
						|
    HWM            hwm = 0;
 | 
						|
    HWM            oldHwm = 0;
 | 
						|
    HWM    		  newHwm = 0;
 | 
						|
    size_t totalRow;
 | 
						|
    ColStructList::size_type totalColumns;
 | 
						|
    uint64_t rowsLeft = 0;
 | 
						|
    bool newExtent = false;
 | 
						|
    RIDList ridList;
 | 
						|
    ColumnOp* colOp = NULL;
 | 
						|
    std::vector<BRM::LBID_t> dictLbids;
 | 
						|
 | 
						|
    // Set tmp file suffix to modify HDFS db file
 | 
						|
    bool           useTmpSuffix = false;
 | 
						|
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
    {
 | 
						|
        if (!bFirstExtentOnThisPM)
 | 
						|
            useTmpSuffix = true;
 | 
						|
    }
 | 
						|
 | 
						|
    unsigned i = 0;
 | 
						|
#ifdef PROFILE
 | 
						|
    StopWatch timer;
 | 
						|
#endif
 | 
						|
 | 
						|
    //Convert data type and column width to write engine specific
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
        Convertor::convertColType(&colStructList[i]);
 | 
						|
 | 
						|
    uint32_t colId = 0;
 | 
						|
    // MCOL-1675: find the smallest column width to calculate the RowID from so
 | 
						|
    // that all HWMs will be incremented by this operation
 | 
						|
    findSmallestColumn(colId, colStructList);
 | 
						|
 | 
						|
 | 
						|
    // rc = checkValid(txnid, colStructList, colValueList, ridList);
 | 
						|
    // if (rc != NO_ERROR)
 | 
						|
    //   return rc;
 | 
						|
 | 
						|
    setTransId(txnid);
 | 
						|
    uint16_t  dbRoot, segmentNum;
 | 
						|
    uint32_t partitionNum;
 | 
						|
    string    segFile;
 | 
						|
    bool newFile;
 | 
						|
    TableMetaData* tableMetaData = TableMetaData::makeTableMetaData(tableOid);
 | 
						|
    //populate colStructList with file information
 | 
						|
    IDBDataFile* pFile = NULL;
 | 
						|
    std::vector<DBRootExtentInfo> extentInfo;
 | 
						|
    int currentDBrootIdx = 0;
 | 
						|
    std::vector<BRM::CreateStripeColumnExtentsArgOut> extents;
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // For first batch on this PM:
 | 
						|
    //   o get starting extent from ExtentTracker, and allocate extent if needed
 | 
						|
    //   o construct colStructList and dctnryStructList accordingly
 | 
						|
    //   o save extent information in tableMetaData for future use
 | 
						|
    // If not first batch on this PM:
 | 
						|
    //   o construct colStructList and dctnryStructList from tableMetaData
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    if (isFirstBatchPm)
 | 
						|
    {
 | 
						|
        currentDBrootIdx = dbRootExtentTrackers[colId]->getCurrentDBRootIdx();
 | 
						|
        extentInfo = dbRootExtentTrackers[colId]->getDBRootExtentList();
 | 
						|
        dbRoot = extentInfo[currentDBrootIdx].fDbRoot;
 | 
						|
        partitionNum = extentInfo[currentDBrootIdx].fPartition;
 | 
						|
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        // check whether this extent is the first on this PM
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        if (bFirstExtentOnThisPM)
 | 
						|
        {
 | 
						|
            //cout << "bFirstExtentOnThisPM is " << bFirstExtentOnThisPM << endl;
 | 
						|
            std::vector<BRM::CreateStripeColumnExtentsArgIn> cols;
 | 
						|
            BRM::CreateStripeColumnExtentsArgIn createStripeColumnExtentsArgIn;
 | 
						|
 | 
						|
            for (i = 0; i < colStructList.size(); i++)
 | 
						|
            {
 | 
						|
                createStripeColumnExtentsArgIn.oid = colStructList[i].dataOid;
 | 
						|
                createStripeColumnExtentsArgIn.width = colStructList[i].colWidth;
 | 
						|
                createStripeColumnExtentsArgIn.colDataType = colStructList[i].colDataType;
 | 
						|
                cols.push_back(createStripeColumnExtentsArgIn);
 | 
						|
            }
 | 
						|
 | 
						|
            rc = BRMWrapper::getInstance()->allocateStripeColExtents(cols, dbRoot, partitionNum, segmentNum, extents);
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                return rc;
 | 
						|
 | 
						|
            //Create column files
 | 
						|
            BRM::CPInfoList_t cpinfoList;
 | 
						|
            BRM::CPInfo cpInfo;
 | 
						|
 | 
						|
            if (isUnsigned(colStructList[i].colDataType))
 | 
						|
            {
 | 
						|
                cpInfo.max = 0;
 | 
						|
                cpInfo.min = static_cast<int64_t>(numeric_limits<uint64_t>::max());
 | 
						|
            }
 | 
						|
            else
 | 
						|
            {
 | 
						|
                cpInfo.max = numeric_limits<int64_t>::min();
 | 
						|
                cpInfo.min = numeric_limits<int64_t>::max();
 | 
						|
            }
 | 
						|
 | 
						|
            cpInfo.seqNum = -1;
 | 
						|
 | 
						|
            for ( i = 0; i < extents.size(); i++)
 | 
						|
            {
 | 
						|
                colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
                colOp->initColumn(curCol);
 | 
						|
                colOp->setColParam(curCol, 0, colStructList[i].colWidth, colStructList[i].colDataType,
 | 
						|
                                   colStructList[i].colType, colStructList[i].dataOid, colStructList[i].fCompressionType,
 | 
						|
                                   dbRoot, partitionNum, segmentNum);
 | 
						|
                rc = colOp->extendColumn(curCol, false, extents[i].startBlkOffset, extents[i].startLbid, extents[i].allocSize, dbRoot,
 | 
						|
                                         partitionNum, segmentNum, segFile, pFile, newFile);
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
 | 
						|
                //mark the extents to invalid
 | 
						|
                cpInfo.firstLbid = extents[i].startLbid;
 | 
						|
                cpinfoList.push_back(cpInfo);
 | 
						|
                colStructList[i].fColPartition = partitionNum;
 | 
						|
                colStructList[i].fColSegment = segmentNum;
 | 
						|
                colStructList[i].fColDbRoot = dbRoot;
 | 
						|
                dctnryStructList[i].fColPartition = partitionNum;
 | 
						|
                dctnryStructList[i].fColSegment = segmentNum;
 | 
						|
                dctnryStructList[i].fColDbRoot = dbRoot;
 | 
						|
            }
 | 
						|
 | 
						|
            //mark the extents to invalid
 | 
						|
            rc = BRMWrapper::getInstance()->setExtentsMaxMin(cpinfoList);
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                return rc;
 | 
						|
 | 
						|
            //create corresponding dictionary files
 | 
						|
            for (i = 0; i < dctnryStructList.size(); i++)
 | 
						|
            {
 | 
						|
                if (dctnryStructList[i].dctnryOid > 0)
 | 
						|
                {
 | 
						|
                    rc = createDctnry(txnid, dctnryStructList[i].dctnryOid, dctnryStructList[i].colWidth, dbRoot, partitionNum,
 | 
						|
                                      segmentNum, dctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                    if ( rc != NO_ERROR)
 | 
						|
                        return rc;
 | 
						|
                }
 | 
						|
            }
 | 
						|
        }    // if ( bFirstExtentOnThisPM)
 | 
						|
        else // if (!bFirstExtentOnThisPM)
 | 
						|
        {
 | 
						|
            std::vector<DBRootExtentInfo> tmpExtentInfo;
 | 
						|
 | 
						|
            for (i = 0; i < dbRootExtentTrackers.size(); i++)
 | 
						|
            {
 | 
						|
                tmpExtentInfo = dbRootExtentTrackers[i]->getDBRootExtentList();
 | 
						|
                colStructList[i].fColPartition =  tmpExtentInfo[currentDBrootIdx].fPartition;
 | 
						|
                colStructList[i].fColSegment = tmpExtentInfo[currentDBrootIdx].fSegment;
 | 
						|
                colStructList[i].fColDbRoot = tmpExtentInfo[currentDBrootIdx].fDbRoot;
 | 
						|
                //cout << "Load from dbrootExtenttracker oid:dbroot:part:seg = " <<colStructList[i].dataOid<<":"
 | 
						|
                //<<colStructList[i].fColDbRoot<<":"<<colStructList[i].fColPartition<<":"<<colStructList[i].fColSegment<<endl;
 | 
						|
                dctnryStructList[i].fColPartition = tmpExtentInfo[currentDBrootIdx].fPartition;
 | 
						|
                dctnryStructList[i].fColSegment = tmpExtentInfo[currentDBrootIdx].fSegment;
 | 
						|
                dctnryStructList[i].fColDbRoot = tmpExtentInfo[currentDBrootIdx].fDbRoot;
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        // Save the extents info in tableMetaData
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        for (i = 0; i < colStructList.size(); i++)
 | 
						|
        {
 | 
						|
            ColExtsInfo aColExtsInfo = tableMetaData->getColExtsInfo(colStructList[i].dataOid);
 | 
						|
            ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            while (it != aColExtsInfo.end())
 | 
						|
            {
 | 
						|
                if ((it->dbRoot == colStructList[i].fColDbRoot) && (it->partNum == colStructList[i].fColPartition) && (it->segNum == colStructList[i].fColSegment))
 | 
						|
                    break;
 | 
						|
 | 
						|
                it++;
 | 
						|
            }
 | 
						|
 | 
						|
            if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
            {
 | 
						|
                ColExtInfo aExt;
 | 
						|
                aExt.dbRoot = colStructList[i].fColDbRoot;
 | 
						|
                aExt.partNum = colStructList[i].fColPartition;
 | 
						|
                aExt.segNum = colStructList[i].fColSegment;
 | 
						|
                aExt.compType = colStructList[i].fCompressionType;
 | 
						|
                aExt.isDict = false;
 | 
						|
 | 
						|
                if (bFirstExtentOnThisPM)
 | 
						|
                {
 | 
						|
                    aExt.hwm = extents[i].startBlkOffset;
 | 
						|
                    aExt.isNewExt = true;
 | 
						|
                    //cout << "adding a ext to metadata" << endl;
 | 
						|
                }
 | 
						|
                else
 | 
						|
                {
 | 
						|
                    std::vector<DBRootExtentInfo> tmpExtentInfo;
 | 
						|
                    tmpExtentInfo = dbRootExtentTrackers[i]->getDBRootExtentList();
 | 
						|
                    aExt.isNewExt = false;
 | 
						|
                    aExt.hwm = tmpExtentInfo[currentDBrootIdx].fLocalHwm;
 | 
						|
                    //cout << "oid " << colStructList[i].dataOid << " gets hwm " << aExt.hwm << endl;
 | 
						|
                }
 | 
						|
 | 
						|
                aExt.current = true;
 | 
						|
                aColExtsInfo.push_back(aExt);
 | 
						|
                //cout << "get from extentinfo oid:hwm = " << colStructList[i].dataOid << ":" << aExt.hwm << endl;
 | 
						|
            }
 | 
						|
 | 
						|
            tableMetaData->setColExtsInfo(colStructList[i].dataOid, aColExtsInfo);
 | 
						|
        }
 | 
						|
 | 
						|
        for (i = 0; i < dctnryStructList.size(); i++)
 | 
						|
        {
 | 
						|
            if (dctnryStructList[i].dctnryOid > 0)
 | 
						|
            {
 | 
						|
                ColExtsInfo aColExtsInfo = tableMetaData->getColExtsInfo(dctnryStructList[i].dctnryOid);
 | 
						|
                ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
                while (it != aColExtsInfo.end())
 | 
						|
                {
 | 
						|
                    if ((it->dbRoot == dctnryStructList[i].fColDbRoot) && (it->partNum == dctnryStructList[i].fColPartition) && (it->segNum == dctnryStructList[i].fColSegment))
 | 
						|
                        break;
 | 
						|
 | 
						|
                    it++;
 | 
						|
                }
 | 
						|
 | 
						|
                if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
                {
 | 
						|
                    ColExtInfo aExt;
 | 
						|
                    aExt.dbRoot = dctnryStructList[i].fColDbRoot;
 | 
						|
                    aExt.partNum = dctnryStructList[i].fColPartition;
 | 
						|
                    aExt.segNum = dctnryStructList[i].fColSegment;
 | 
						|
                    aExt.compType = dctnryStructList[i].fCompressionType;
 | 
						|
                    aExt.isDict = true;
 | 
						|
                    aColExtsInfo.push_back(aExt);
 | 
						|
                }
 | 
						|
 | 
						|
                tableMetaData->setColExtsInfo(dctnryStructList[i].dctnryOid, aColExtsInfo);
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
    } // if (isFirstBatchPm)
 | 
						|
    else //get the extent info from tableMetaData
 | 
						|
    {
 | 
						|
        ColExtsInfo aColExtsInfo = tableMetaData->getColExtsInfo(colStructList[colId].dataOid);
 | 
						|
        ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
        while (it != aColExtsInfo.end())
 | 
						|
        {
 | 
						|
            if (it->current)
 | 
						|
                break;
 | 
						|
 | 
						|
            it++;
 | 
						|
        }
 | 
						|
 | 
						|
        if (it == aColExtsInfo.end())
 | 
						|
            return 1;
 | 
						|
 | 
						|
        for (i = 0; i < colStructList.size(); i++)
 | 
						|
        {
 | 
						|
            colStructList[i].fColPartition = it->partNum;
 | 
						|
            colStructList[i].fColSegment = it->segNum;
 | 
						|
            colStructList[i].fColDbRoot = it->dbRoot;
 | 
						|
            dctnryStructList[i].fColPartition = it->partNum;
 | 
						|
            dctnryStructList[i].fColSegment = it->segNum;
 | 
						|
            dctnryStructList[i].fColDbRoot = it->dbRoot;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    totalColumns = colStructList.size();
 | 
						|
    totalRow = colValueList.size() / totalColumns;
 | 
						|
    rowIdArray = new RID[totalRow];
 | 
						|
    // use scoped_array to ensure ptr deletion regardless of where we return
 | 
						|
    boost::scoped_array<RID> rowIdArrayPtr(rowIdArray);
 | 
						|
    memset(rowIdArray, 0, (sizeof(RID)*totalRow));
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // allocate row id(s)
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
 | 
						|
    curColStruct = colStructList[colId];
 | 
						|
 | 
						|
    colOp = m_colOp[op(curColStruct.fCompressionType)];
 | 
						|
 | 
						|
    colOp->initColumn(curCol);
 | 
						|
 | 
						|
    //Get the correct segment, partition, column file
 | 
						|
    vector<ExtentInfo> colExtentInfo; //Save those empty extents in case of failure to rollback
 | 
						|
    vector<ExtentInfo> dictExtentInfo; //Save those empty extents in case of failure to rollback
 | 
						|
    vector<ExtentInfo> fileInfo;
 | 
						|
    dbRoot = curColStruct.fColDbRoot;
 | 
						|
    //use the smallest column to calculate row id
 | 
						|
    ColExtsInfo aColExtsInfo = tableMetaData->getColExtsInfo(colStructList[colId].dataOid);
 | 
						|
    ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
    while (it != aColExtsInfo.end())
 | 
						|
    {
 | 
						|
        if ((it->dbRoot == colStructList[colId].fColDbRoot) && (it->partNum == colStructList[colId].fColPartition) && (it->segNum == colStructList[colId].fColSegment) && it->current )
 | 
						|
            break;
 | 
						|
 | 
						|
        it++;
 | 
						|
    }
 | 
						|
 | 
						|
    if (it != aColExtsInfo.end())
 | 
						|
    {
 | 
						|
        hwm = it->hwm;
 | 
						|
        //cout << "Got from colextinfo hwm for oid " << colStructList[colId].dataOid << " is " << hwm << " and seg is " << colStructList[colId].fColSegment << endl;
 | 
						|
    }
 | 
						|
 | 
						|
    oldHwm = hwm; //Save this info for rollback
 | 
						|
    //need to pass real dbRoot, partition, and segment to setColParam
 | 
						|
    colOp->setColParam(curCol, colId, curColStruct.colWidth, curColStruct.colDataType,
 | 
						|
                       curColStruct.colType, curColStruct.dataOid, curColStruct.fCompressionType,
 | 
						|
                       curColStruct.fColDbRoot, curColStruct.fColPartition, curColStruct.fColSegment);
 | 
						|
    rc = colOp->openColumnFile(curCol, segFile, useTmpSuffix); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
    {
 | 
						|
        return rc;
 | 
						|
    }
 | 
						|
 | 
						|
    //get hwm first
 | 
						|
    // @bug 286 : fix for bug 286 - correct the typo in getHWM
 | 
						|
    //RETURN_ON_ERROR(BRMWrapper::getInstance()->getHWM(curColStruct.dataOid, hwm));
 | 
						|
 | 
						|
    Column newCol;
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.start("allocRowId");
 | 
						|
#endif
 | 
						|
    newColStructList = colStructList;
 | 
						|
    newDctnryStructList = dctnryStructList;
 | 
						|
    bool bUseStartExtent = true;
 | 
						|
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
        insertSelect = true;
 | 
						|
 | 
						|
    rc = colOp->allocRowId(txnid, bUseStartExtent,
 | 
						|
                           curCol, (uint64_t)totalRow, rowIdArray, hwm, newExtent, rowsLeft, newHwm, newFile,
 | 
						|
                           newColStructList, newDctnryStructList, dbRootExtentTrackers, insertSelect, true, tableOid, isFirstBatchPm);
 | 
						|
 | 
						|
    //cout << "after allocrowid, total row = " <<totalRow << " newExtent is " << newExtent << endl;
 | 
						|
    // cout << "column oid " << curColStruct.dataOid << " has hwm:newHwm = " << hwm <<":" << newHwm<< endl;
 | 
						|
    if (rc != NO_ERROR) //Clean up is already done
 | 
						|
        return rc;
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.stop("allocRowId");
 | 
						|
#endif
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Expand initial abbreviated extent if any RID in 1st extent is > 256K.
 | 
						|
    // if totalRow == rowsLeft, then not adding rows to 1st extent, so skip it.
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // DMC-SHARED_NOTHING_NOTE: Is it safe to assume only part0 seg0 is abbreviated?
 | 
						|
    if ((curCol.dataFile.fPartition == 0) &&
 | 
						|
            (curCol.dataFile.fSegment   == 0) &&
 | 
						|
            ((totalRow - rowsLeft) > 0) &&
 | 
						|
            (rowIdArray[totalRow - rowsLeft - 1] >= (RID)INITIAL_EXTENT_ROWS_TO_DISK))
 | 
						|
    {
 | 
						|
        for (size_t k = 0; k < colStructList.size(); k++)
 | 
						|
        {
 | 
						|
            // Skip the selected column
 | 
						|
            if (k == (size_t)colId)
 | 
						|
                continue;
 | 
						|
 | 
						|
            Column expandCol;
 | 
						|
           colOp = m_colOp[op(colStructList[k].fCompressionType)]; 
 | 
						|
           // Shouldn't we change 0 to colId here?
 | 
						|
            colOp->setColParam(expandCol, 0,
 | 
						|
                               colStructList[k].colWidth,
 | 
						|
                               colStructList[k].colDataType,
 | 
						|
                               colStructList[k].colType,
 | 
						|
                               colStructList[k].dataOid,
 | 
						|
                               colStructList[k].fCompressionType,
 | 
						|
                               colStructList[k].fColDbRoot,
 | 
						|
                               colStructList[k].fColPartition,
 | 
						|
                               colStructList[k].fColSegment);
 | 
						|
            rc = colOp->openColumnFile(expandCol, segFile, true); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc == NO_ERROR)
 | 
						|
            {
 | 
						|
                if (colOp->abbreviatedExtent(expandCol.dataFile.pFile, colStructList[k].colWidth))
 | 
						|
                {
 | 
						|
                    rc = colOp->expandAbbrevExtent(expandCol);
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
            {
 | 
						|
                return rc;
 | 
						|
            }
 | 
						|
 | 
						|
            colOp->closeColumnFile(expandCol);
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Tokenize data if needed
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    if (insertSelect && isAutoCommitOn)
 | 
						|
        BRMWrapper::setUseVb( false );
 | 
						|
    else
 | 
						|
        BRMWrapper::setUseVb( true );
 | 
						|
 | 
						|
    dictStr::iterator dctStr_iter;
 | 
						|
    uint64_t* colValPtr;
 | 
						|
    size_t rowsPerColumn = colValueList.size() / colStructList.size();
 | 
						|
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
    {
 | 
						|
        if (colStructList[i].tokenFlag)
 | 
						|
        {
 | 
						|
            dctStr_iter = dictStrList[i].begin();
 | 
						|
            Dctnry* dctnry = m_dctnry[op(dctnryStructList[i].fCompressionType)];
 | 
						|
            rc = dctnry->openDctnry(dctnryStructList[i].dctnryOid,
 | 
						|
                                    dctnryStructList[i].fColDbRoot, dctnryStructList[i].fColPartition,
 | 
						|
                                    dctnryStructList[i].fColSegment,
 | 
						|
                                    useTmpSuffix); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
            {
 | 
						|
                cout << "Error opening dctnry file " << dctnryStructList[i].dctnryOid << endl;
 | 
						|
                return rc;
 | 
						|
            }
 | 
						|
 | 
						|
            for (uint32_t     rows = 0; rows < (totalRow - rowsLeft); rows++)
 | 
						|
            {
 | 
						|
                colValPtr = &colValueList[(i * rowsPerColumn) + rows];
 | 
						|
 | 
						|
                if (dctStr_iter->length() == 0)
 | 
						|
                {
 | 
						|
                    Token nullToken;
 | 
						|
                    memcpy(colValPtr, &nullToken, 8);
 | 
						|
                }
 | 
						|
                else
 | 
						|
                {
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.start("tokenize");
 | 
						|
#endif
 | 
						|
                    DctnryTuple dctTuple;
 | 
						|
                    dctTuple.sigValue = (unsigned char*)dctStr_iter->c_str();
 | 
						|
                    dctTuple.sigSize = dctStr_iter->length();
 | 
						|
                    dctTuple.isNull = false;
 | 
						|
                    rc = tokenize(txnid, dctTuple, dctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                    if (rc != NO_ERROR)
 | 
						|
                    {
 | 
						|
                        dctnry->closeDctnry();
 | 
						|
                        return rc;
 | 
						|
                    }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.stop("tokenize");
 | 
						|
#endif
 | 
						|
                    memcpy(colValPtr, &dctTuple.token, 8);
 | 
						|
                    dictLbids.push_back(dctTuple.token.fbo);
 | 
						|
                }
 | 
						|
 | 
						|
                dctStr_iter++;
 | 
						|
 | 
						|
            }
 | 
						|
 | 
						|
            //close dictionary files
 | 
						|
            rc = dctnry->closeDctnry(false);
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                return rc;
 | 
						|
 | 
						|
            if (newExtent)
 | 
						|
            {
 | 
						|
                //@Bug 4854 back up hwm chunk for the file to be modified
 | 
						|
                if (fRBMetaWriter)
 | 
						|
                    fRBMetaWriter->backupDctnryHWMChunk(newDctnryStructList[i].dctnryOid, newDctnryStructList[i].fColDbRoot, newDctnryStructList[i].fColPartition, newDctnryStructList[i].fColSegment);
 | 
						|
 | 
						|
                rc = dctnry->openDctnry(newDctnryStructList[i].dctnryOid,
 | 
						|
                                        newDctnryStructList[i].fColDbRoot, newDctnryStructList[i].fColPartition,
 | 
						|
                                        newDctnryStructList[i].fColSegment,
 | 
						|
                                        false); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
 | 
						|
                for (uint32_t     rows = 0; rows < rowsLeft; rows++)
 | 
						|
                {
 | 
						|
                    colValPtr = &colValueList[(i * rowsPerColumn) + rows];
 | 
						|
 | 
						|
                    if (dctStr_iter->length() == 0)
 | 
						|
                    {
 | 
						|
                        Token nullToken;
 | 
						|
                        memcpy(colValPtr, &nullToken, 8);
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.start("tokenize");
 | 
						|
#endif
 | 
						|
                        DctnryTuple dctTuple;
 | 
						|
                        dctTuple.sigValue = (unsigned char*)dctStr_iter->c_str();
 | 
						|
                        dctTuple.sigSize = dctStr_iter->length();
 | 
						|
                        dctTuple.isNull = false;
 | 
						|
                        rc = tokenize(txnid, dctTuple, newDctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                        if (rc != NO_ERROR)
 | 
						|
                        {
 | 
						|
                            dctnry->closeDctnry();
 | 
						|
                            return rc;
 | 
						|
                        }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.stop("tokenize");
 | 
						|
#endif
 | 
						|
                        memcpy(colValPtr, &dctTuple.token, 8);
 | 
						|
                        dictLbids.push_back(dctTuple.token.fbo);
 | 
						|
                    }
 | 
						|
 | 
						|
                    dctStr_iter++;
 | 
						|
                }
 | 
						|
 | 
						|
                //close dictionary files
 | 
						|
                rc = dctnry->closeDctnry(false);
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    if (insertSelect && isAutoCommitOn)
 | 
						|
        BRMWrapper::setUseVb( false );
 | 
						|
    else
 | 
						|
        BRMWrapper::setUseVb( true );
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Update column info structure @Bug 1862 set hwm, and
 | 
						|
    // Prepare ValueList for new extent (if applicable)
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    //@Bug 2205 Check whether all rows go to the new extent
 | 
						|
    RID lastRid = 0;
 | 
						|
    RID lastRidNew = 0;
 | 
						|
 | 
						|
    if (totalRow - rowsLeft > 0)
 | 
						|
    {
 | 
						|
        lastRid = rowIdArray[totalRow - rowsLeft - 1];
 | 
						|
        lastRidNew = rowIdArray[totalRow - 1];
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        lastRid = 0;
 | 
						|
        lastRidNew = rowIdArray[totalRow - 1];
 | 
						|
    }
 | 
						|
 | 
						|
    //cout << "rowid allocated is "  << lastRid << endl;
 | 
						|
    //if a new extent is created, all the columns in this table should have their own new extent
 | 
						|
    //First column already processed
 | 
						|
 | 
						|
    //@Bug 1701. Close the file (if uncompressed)
 | 
						|
    m_colOp[op(curCol.compressionType)]->closeColumnFile(curCol);
 | 
						|
    //cout << "Saving hwm info for new ext batch" << endl;
 | 
						|
    //Update hwm to set them in the end
 | 
						|
    bool succFlag = false;
 | 
						|
    unsigned colWidth = 0;
 | 
						|
    int      curFbo = 0, curBio;
 | 
						|
 | 
						|
    for (i = 0; i < totalColumns; i++)
 | 
						|
    {
 | 
						|
        //shoud be obtained from saved hwm
 | 
						|
        aColExtsInfo = tableMetaData->getColExtsInfo(colStructList[i].dataOid);
 | 
						|
        it = aColExtsInfo.begin();
 | 
						|
 | 
						|
        while (it != aColExtsInfo.end())
 | 
						|
        {
 | 
						|
            if ((it->dbRoot == colStructList[i].fColDbRoot) && (it->partNum == colStructList[i].fColPartition)
 | 
						|
                    && (it->segNum == colStructList[i].fColSegment) && it->current)
 | 
						|
                break;
 | 
						|
 | 
						|
            it++;
 | 
						|
        }
 | 
						|
 | 
						|
        if (it != aColExtsInfo.end()) //update hwm info
 | 
						|
        {
 | 
						|
            oldHwm = it->hwm;
 | 
						|
 | 
						|
            // save hwm for the old extent
 | 
						|
            colWidth = colStructList[i].colWidth;
 | 
						|
            succFlag = colOp->calculateRowId(lastRid, BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            //cout << "insertcolumnrec   oid:rid:fbo:oldhwm = " << colStructList[i].dataOid << ":" << lastRid << ":" << curFbo << ":" << oldHwm << endl;
 | 
						|
            if (succFlag)
 | 
						|
            {
 | 
						|
                if ((HWM)curFbo >= oldHwm)
 | 
						|
                {
 | 
						|
                    it->hwm = (HWM)curFbo;
 | 
						|
                }
 | 
						|
 | 
						|
                //@Bug 4947. set current to false for old extent.
 | 
						|
                if (newExtent)
 | 
						|
                {
 | 
						|
                    it->current = false;
 | 
						|
                }
 | 
						|
 | 
						|
                //cout << "updated old ext info for oid " << colStructList[i].dataOid << " dbroot:part:seg:hwm:current = "
 | 
						|
                //<< it->dbRoot<<":"<<it->partNum<<":"<<it->segNum<<":"<<it->hwm<<":"<< it->current<< " and newExtent is " << newExtent << endl;
 | 
						|
            }
 | 
						|
            else
 | 
						|
                return ERR_INVALID_PARAM;
 | 
						|
 | 
						|
        }
 | 
						|
 | 
						|
        //update hwm for the new extent
 | 
						|
        if (newExtent)
 | 
						|
        {
 | 
						|
            it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            while (it != aColExtsInfo.end())
 | 
						|
            {
 | 
						|
                if ((it->dbRoot == newColStructList[i].fColDbRoot) && (it->partNum == newColStructList[i].fColPartition)
 | 
						|
                        && (it->segNum == newColStructList[i].fColSegment) && it->current)
 | 
						|
                    break;
 | 
						|
 | 
						|
                it++;
 | 
						|
            }
 | 
						|
 | 
						|
            colWidth = newColStructList[i].colWidth;
 | 
						|
            succFlag = colOp->calculateRowId(lastRidNew, BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            if (succFlag)
 | 
						|
            {
 | 
						|
                if (it != aColExtsInfo.end())
 | 
						|
                {
 | 
						|
                    it->hwm = (HWM)curFbo;
 | 
						|
                    //cout << "setting hwm to " << (int)curFbo <<" for seg " <<it->segNum << endl;
 | 
						|
                    it->current = true;
 | 
						|
                }
 | 
						|
            }
 | 
						|
            else
 | 
						|
                return ERR_INVALID_PARAM;
 | 
						|
        }
 | 
						|
 | 
						|
        tableMetaData->setColExtsInfo(colStructList[i].dataOid, aColExtsInfo);
 | 
						|
    }
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    //Prepare the valuelist for the new extent
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
 | 
						|
    for (unsigned i = 1; i <= totalColumns; i++)
 | 
						|
    {
 | 
						|
        // Copy values to second value list
 | 
						|
        for (uint64_t j = rowsLeft; j > 0; j--)
 | 
						|
        {
 | 
						|
            colNewValueList.push_back(colValueList[(totalRow * i) - j]);
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    // end of allocate row id
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.start("writeColumnRec");
 | 
						|
#endif
 | 
						|
//cout << "Writing column record" << endl;
 | 
						|
 | 
						|
    if (rc == NO_ERROR)
 | 
						|
    {
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        //Mark extents invalid
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        vector<BRM::LBID_t> lbids;
 | 
						|
        vector<CalpontSystemCatalog::ColDataType> colDataTypes;
 | 
						|
        bool successFlag = true;
 | 
						|
        unsigned width = 0;
 | 
						|
        int         curFbo = 0, curBio, lastFbo = -1;
 | 
						|
 | 
						|
        if (isFirstBatchPm && (totalRow == rowsLeft))
 | 
						|
        {}
 | 
						|
        else
 | 
						|
        {
 | 
						|
            for (unsigned i = 0; i < colStructList.size(); i++)
 | 
						|
            {
 | 
						|
                colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
                width = colStructList[i].colWidth;
 | 
						|
                successFlag = colOp->calculateRowId(lastRid, BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
                if (successFlag)
 | 
						|
                {
 | 
						|
                    if (curFbo != lastFbo)
 | 
						|
                    {
 | 
						|
                        RETURN_ON_ERROR(AddLBIDtoList(txnid,
 | 
						|
                                                      lbids,
 | 
						|
                                                      colDataTypes,
 | 
						|
                                                      colStructList[i],
 | 
						|
                                                      curFbo));
 | 
						|
                    }
 | 
						|
                }
 | 
						|
                else
 | 
						|
                    return ERR_INVALID_PARAM;
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        // If we create a new extent for this batch
 | 
						|
        for (unsigned i = 0; i < newColStructList.size(); i++)
 | 
						|
        {
 | 
						|
            colOp = m_colOp[op(newColStructList[i].fCompressionType)];
 | 
						|
            width = newColStructList[i].colWidth;
 | 
						|
            successFlag = colOp->calculateRowId(lastRidNew, BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
            if (successFlag)
 | 
						|
            {
 | 
						|
                if (curFbo != lastFbo)
 | 
						|
                {
 | 
						|
                    RETURN_ON_ERROR(AddLBIDtoList(txnid,
 | 
						|
                                                  lbids,
 | 
						|
                                                  colDataTypes,
 | 
						|
                                                  newColStructList[i],
 | 
						|
                                                  curFbo));
 | 
						|
                }
 | 
						|
            }
 | 
						|
            else
 | 
						|
                return ERR_INVALID_PARAM;
 | 
						|
        }
 | 
						|
 | 
						|
        if (lbids.size() > 0)
 | 
						|
            rc = BRMWrapper::getInstance()->markExtentsInvalid(lbids, colDataTypes);
 | 
						|
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        // Write row(s) to database file(s)
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        bool versioning = !(isAutoCommitOn && insertSelect);
 | 
						|
        AddDictToList(txnid, dictLbids);
 | 
						|
        rc = writeColumnRecBinary(txnid, colStructList, colValueList, rowIdArray, newColStructList, colNewValueList, tableOid, useTmpSuffix, versioning); // @bug 5572 HDFS tmp file
 | 
						|
    }
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
int WriteEngineWrapper::insertColumnRec_SYS(const TxnID& txnid,
 | 
						|
        ColStructList& colStructList,
 | 
						|
        ColValueList& colValueList,
 | 
						|
        DctnryStructList& dctnryStructList,
 | 
						|
        DictStrList& dictStrList,
 | 
						|
        const int32_t tableOid)
 | 
						|
{
 | 
						|
    int            rc;
 | 
						|
    RID*           rowIdArray = NULL;
 | 
						|
    ColTupleList   curTupleList;
 | 
						|
    Column         curCol;
 | 
						|
    ColStruct      curColStruct;
 | 
						|
    ColValueList   colOldValueList;
 | 
						|
    ColValueList   colNewValueList;
 | 
						|
    ColStructList  newColStructList;
 | 
						|
    DctnryStructList newDctnryStructList;
 | 
						|
    HWM            hwm = 0;
 | 
						|
    HWM            newHwm = 0;
 | 
						|
    HWM            oldHwm = 0;
 | 
						|
    ColTupleList::size_type totalRow;
 | 
						|
    ColStructList::size_type totalColumns;
 | 
						|
    uint64_t rowsLeft = 0;
 | 
						|
    bool newExtent = false;
 | 
						|
    RIDList ridList;
 | 
						|
    ColumnOp* colOp = NULL;
 | 
						|
    uint32_t i = 0;
 | 
						|
#ifdef PROFILE
 | 
						|
    StopWatch timer;
 | 
						|
#endif
 | 
						|
 | 
						|
    // debug information for testing
 | 
						|
    if (isDebug(DEBUG_2))
 | 
						|
    {
 | 
						|
        printf("\nIn wrapper insert\n");
 | 
						|
        printInputValue(colStructList, colValueList, ridList);
 | 
						|
    }
 | 
						|
 | 
						|
    // end
 | 
						|
 | 
						|
    //Convert data type and column width to write engine specific
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
        Convertor::convertColType(&colStructList[i]);
 | 
						|
 | 
						|
    rc = checkValid(txnid, colStructList, colValueList, ridList);
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
        return rc;
 | 
						|
 | 
						|
    setTransId(txnid);
 | 
						|
 | 
						|
    curTupleList = static_cast<ColTupleList>(colValueList[0]);
 | 
						|
    totalRow = curTupleList.size();
 | 
						|
    totalColumns = colStructList.size();
 | 
						|
    rowIdArray = new RID[totalRow];
 | 
						|
    // use scoped_array to ensure ptr deletion regardless of where we return
 | 
						|
    boost::scoped_array<RID> rowIdArrayPtr(rowIdArray);
 | 
						|
    memset(rowIdArray, 0, (sizeof(RID)*totalRow));
 | 
						|
 | 
						|
    // allocate row id(s)
 | 
						|
    curColStruct = colStructList[0];
 | 
						|
    colOp = m_colOp[op(curColStruct.fCompressionType)];
 | 
						|
 | 
						|
    colOp->initColumn(curCol);
 | 
						|
 | 
						|
    //Get the correct segment, partition, column file
 | 
						|
    uint16_t dbRoot, segmentNum;
 | 
						|
    uint32_t partitionNum;
 | 
						|
    vector<ExtentInfo> colExtentInfo; //Save those empty extents in case of failure to rollback
 | 
						|
    vector<ExtentInfo> dictExtentInfo; //Save those empty extents in case of failure to rollback
 | 
						|
    vector<ExtentInfo> fileInfo;
 | 
						|
    ExtentInfo info;
 | 
						|
    //Don't search for empty space, always append to the end. May need to revisit this part
 | 
						|
    dbRoot = curColStruct.fColDbRoot;
 | 
						|
    int  extState;
 | 
						|
    bool extFound;
 | 
						|
    RETURN_ON_ERROR(BRMWrapper::getInstance()->getLastHWM_DBroot(
 | 
						|
                        curColStruct.dataOid, dbRoot, partitionNum, segmentNum, hwm,
 | 
						|
                        extState, extFound));
 | 
						|
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
    {
 | 
						|
        colStructList[i].fColPartition = partitionNum;
 | 
						|
        colStructList[i].fColSegment = segmentNum;
 | 
						|
        colStructList[i].fColDbRoot = dbRoot;
 | 
						|
    }
 | 
						|
 | 
						|
    oldHwm = hwm; //Save this info for rollback
 | 
						|
    //need to pass real dbRoot, partition, and segment to setColParam
 | 
						|
    colOp->setColParam(curCol, 0, curColStruct.colWidth, curColStruct.colDataType,
 | 
						|
                       curColStruct.colType, curColStruct.dataOid, curColStruct.fCompressionType,
 | 
						|
                       dbRoot, partitionNum, segmentNum);
 | 
						|
 | 
						|
    string segFile;
 | 
						|
    rc = colOp->openColumnFile(curCol, segFile, false); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
    {
 | 
						|
        return rc;
 | 
						|
    }
 | 
						|
 | 
						|
    //get hwm first
 | 
						|
    // @bug 286 : fix for bug 286 - correct the typo in getHWM
 | 
						|
    //RETURN_ON_ERROR(BRMWrapper::getInstance()->getHWM(curColStruct.dataOid, hwm));
 | 
						|
 | 
						|
    //...Note that we are casting totalRow to int to be in sync with
 | 
						|
    //...allocRowId().  So we are assuming that totalRow
 | 
						|
    //...(curTupleList.size()) will fit into an int.  We arleady made
 | 
						|
    //...that assumption earlier in this method when we used totalRow
 | 
						|
    //...in the call to calloc() to allocate rowIdArray.
 | 
						|
    Column newCol;
 | 
						|
    bool newFile;
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.start("allocRowId");
 | 
						|
#endif
 | 
						|
 | 
						|
    newColStructList = colStructList;
 | 
						|
    newDctnryStructList = dctnryStructList;
 | 
						|
    std::vector<boost::shared_ptr<DBRootExtentTracker> >   dbRootExtentTrackers;
 | 
						|
    bool bUseStartExtent = true;
 | 
						|
    rc = colOp->allocRowId(txnid, bUseStartExtent,
 | 
						|
                           curCol, (uint64_t)totalRow, rowIdArray, hwm, newExtent, rowsLeft, newHwm, newFile, newColStructList, newDctnryStructList,
 | 
						|
                           dbRootExtentTrackers, false, false, 0);
 | 
						|
 | 
						|
    if ((rc == ERR_FILE_DISK_SPACE) && newExtent)
 | 
						|
    {
 | 
						|
        for (i = 0; i < newColStructList.size(); i++)
 | 
						|
        {
 | 
						|
            info.oid = newColStructList[i].dataOid;
 | 
						|
            info.partitionNum = newColStructList[i].fColPartition;
 | 
						|
            info.segmentNum = newColStructList[i].fColSegment;
 | 
						|
            info.dbRoot = newColStructList[i].fColDbRoot;
 | 
						|
 | 
						|
            if (newFile)
 | 
						|
                fileInfo.push_back (info);
 | 
						|
 | 
						|
            colExtentInfo.push_back (info);
 | 
						|
        }
 | 
						|
 | 
						|
        int rc1 = BRMWrapper::getInstance()->deleteEmptyColExtents(colExtentInfo);
 | 
						|
 | 
						|
        if ((rc1 == 0) &&  newFile)
 | 
						|
        {
 | 
						|
            rc1 = colOp->deleteFile(fileInfo[0].oid, fileInfo[0].dbRoot, fileInfo[0].partitionNum, fileInfo[0].segmentNum);
 | 
						|
 | 
						|
            if ( rc1 != NO_ERROR)
 | 
						|
                return rc;
 | 
						|
 | 
						|
            FileOp fileOp;
 | 
						|
 | 
						|
            for (i = 0; i < newDctnryStructList.size(); i++)
 | 
						|
            {
 | 
						|
                if (newDctnryStructList[i].dctnryOid > 0)
 | 
						|
                {
 | 
						|
                    info.oid = newDctnryStructList[i].dctnryOid;
 | 
						|
                    info.partitionNum = newDctnryStructList[i].fColPartition;
 | 
						|
                    info.segmentNum = newDctnryStructList[i].fColSegment;
 | 
						|
                    info.dbRoot = newDctnryStructList[i].fColDbRoot;
 | 
						|
                    info.newFile = true;
 | 
						|
                    fileInfo.push_back (info);
 | 
						|
                    dictExtentInfo.push_back (info);
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            if (dictExtentInfo.size() > 0)
 | 
						|
            {
 | 
						|
                rc1 = BRMWrapper::getInstance()->deleteEmptyDictStoreExtents(dictExtentInfo);
 | 
						|
 | 
						|
                if ( rc1 != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
 | 
						|
                for (unsigned j = 0; j < fileInfo.size(); j++)
 | 
						|
                {
 | 
						|
                    rc1 = fileOp.deleteFile(fileInfo[j].oid, fileInfo[j].dbRoot,
 | 
						|
                                            fileInfo[j].partitionNum, fileInfo[j].segmentNum);
 | 
						|
                }
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    TableMetaData* aTableMetaData = TableMetaData::makeTableMetaData(tableOid);
 | 
						|
 | 
						|
    //..Expand initial abbreviated extent if any RID in 1st extent is > 256K
 | 
						|
// DMC-SHARED_NOTHING_NOTE: Is it safe to assume only part0 seg0 is abbreviated?
 | 
						|
    if ((partitionNum == 0) &&
 | 
						|
            (segmentNum   == 0) &&
 | 
						|
            ((totalRow - rowsLeft) > 0) &&
 | 
						|
            (rowIdArray[totalRow - rowsLeft - 1] >= (RID)INITIAL_EXTENT_ROWS_TO_DISK))
 | 
						|
    {
 | 
						|
        for (size_t k = 1; k < colStructList.size(); k++)
 | 
						|
        {
 | 
						|
            Column expandCol;
 | 
						|
            colOp = m_colOp[op(colStructList[k].fCompressionType)];
 | 
						|
            colOp->setColParam(expandCol, 0,
 | 
						|
                               colStructList[k].colWidth,
 | 
						|
                               colStructList[k].colDataType,
 | 
						|
                               colStructList[k].colType,
 | 
						|
                               colStructList[k].dataOid,
 | 
						|
                               colStructList[k].fCompressionType,
 | 
						|
                               dbRoot,
 | 
						|
                               partitionNum,
 | 
						|
                               segmentNum);
 | 
						|
            rc = colOp->openColumnFile(expandCol, segFile, false); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc == NO_ERROR)
 | 
						|
            {
 | 
						|
                if (colOp->abbreviatedExtent(expandCol.dataFile.pFile, colStructList[k].colWidth))
 | 
						|
                {
 | 
						|
                    rc = colOp->expandAbbrevExtent(expandCol);
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
            {
 | 
						|
                if (newExtent)
 | 
						|
                {
 | 
						|
                    //Remove the empty extent added to the first column
 | 
						|
                    int rc1 = BRMWrapper::getInstance()->
 | 
						|
                              deleteEmptyColExtents(colExtentInfo);
 | 
						|
 | 
						|
                    if ((rc1 == 0) && newFile)
 | 
						|
                    {
 | 
						|
                        rc1 = colOp->deleteFile(fileInfo[0].oid,
 | 
						|
                                                fileInfo[0].dbRoot,
 | 
						|
                                                fileInfo[0].partitionNum,
 | 
						|
                                                fileInfo[0].segmentNum);
 | 
						|
                    }
 | 
						|
                }
 | 
						|
 | 
						|
                colOp->clearColumn(expandCol); // closes the file
 | 
						|
                return rc;
 | 
						|
            }
 | 
						|
 | 
						|
            colOp->clearColumn(expandCol); // closes the file
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    BRMWrapper::setUseVb(true);
 | 
						|
    //Tokenize data if needed
 | 
						|
    dictStr::iterator dctStr_iter;
 | 
						|
    ColTupleList::iterator col_iter;
 | 
						|
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
    {
 | 
						|
        if (colStructList[i].tokenFlag)
 | 
						|
        {
 | 
						|
            dctStr_iter = dictStrList[i].begin();
 | 
						|
            col_iter = colValueList[i].begin();
 | 
						|
            Dctnry* dctnry = m_dctnry[op(dctnryStructList[i].fCompressionType)];
 | 
						|
 | 
						|
            dctnryStructList[i].fColPartition = partitionNum;
 | 
						|
            dctnryStructList[i].fColSegment = segmentNum;
 | 
						|
            dctnryStructList[i].fColDbRoot = dbRoot;
 | 
						|
            rc = dctnry->openDctnry(dctnryStructList[i].dctnryOid,
 | 
						|
                                    dctnryStructList[i].fColDbRoot, dctnryStructList[i].fColPartition,
 | 
						|
                                    dctnryStructList[i].fColSegment,
 | 
						|
                                    false); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                return rc;
 | 
						|
 | 
						|
            ColExtsInfo aColExtsInfo = aTableMetaData->getColExtsInfo(dctnryStructList[i].dctnryOid);
 | 
						|
            ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            while (it != aColExtsInfo.end())
 | 
						|
            {
 | 
						|
                if ((it->dbRoot == dctnryStructList[i].fColDbRoot) && (it->partNum == dctnryStructList[i].fColPartition) && (it->segNum == dctnryStructList[i].fColSegment))
 | 
						|
                    break;
 | 
						|
 | 
						|
                it++;
 | 
						|
            }
 | 
						|
 | 
						|
            if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
            {
 | 
						|
                ColExtInfo aExt;
 | 
						|
                aExt.dbRoot = dctnryStructList[i].fColDbRoot;
 | 
						|
                aExt.partNum = dctnryStructList[i].fColPartition;
 | 
						|
                aExt.segNum = dctnryStructList[i].fColSegment;
 | 
						|
                aExt.compType = dctnryStructList[i].fCompressionType;
 | 
						|
                aExt.isDict = true;
 | 
						|
                aColExtsInfo.push_back(aExt);
 | 
						|
                aTableMetaData->setColExtsInfo(dctnryStructList[i].dctnryOid, aColExtsInfo);
 | 
						|
            }
 | 
						|
 | 
						|
            for (uint32_t     rows = 0; rows < (totalRow - rowsLeft); rows++)
 | 
						|
            {
 | 
						|
                if (dctStr_iter->length() == 0)
 | 
						|
                {
 | 
						|
                    Token nullToken;
 | 
						|
                    col_iter->data = nullToken;
 | 
						|
                }
 | 
						|
                else
 | 
						|
                {
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.start("tokenize");
 | 
						|
#endif
 | 
						|
                    DctnryTuple dctTuple;
 | 
						|
                    dctTuple.sigValue = (unsigned char*)dctStr_iter->c_str();
 | 
						|
                    dctTuple.sigSize = dctStr_iter->length();
 | 
						|
                    dctTuple.isNull = false;
 | 
						|
                    rc = tokenize(txnid, dctTuple, dctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                    if (rc != NO_ERROR)
 | 
						|
                    {
 | 
						|
                        dctnry->closeDctnry();
 | 
						|
                        return rc;
 | 
						|
                    }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.stop("tokenize");
 | 
						|
#endif
 | 
						|
                    col_iter->data = dctTuple.token;
 | 
						|
                }
 | 
						|
 | 
						|
                dctStr_iter++;
 | 
						|
                col_iter++;
 | 
						|
 | 
						|
            }
 | 
						|
 | 
						|
            //close dictionary files
 | 
						|
            rc = dctnry->closeDctnry();
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                return rc;
 | 
						|
 | 
						|
            if (newExtent)
 | 
						|
            {
 | 
						|
                rc = dctnry->openDctnry(newDctnryStructList[i].dctnryOid,
 | 
						|
                                        newDctnryStructList[i].fColDbRoot, newDctnryStructList[i].fColPartition,
 | 
						|
                                        newDctnryStructList[i].fColSegment,
 | 
						|
                                        false); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
 | 
						|
                aColExtsInfo = aTableMetaData->getColExtsInfo(newDctnryStructList[i].dctnryOid);
 | 
						|
                it = aColExtsInfo.begin();
 | 
						|
 | 
						|
                while (it != aColExtsInfo.end())
 | 
						|
                {
 | 
						|
                    if ((it->dbRoot == newDctnryStructList[i].fColDbRoot) && (it->partNum == newDctnryStructList[i].fColPartition) && (it->segNum == newDctnryStructList[i].fColSegment))
 | 
						|
                        break;
 | 
						|
 | 
						|
                    it++;
 | 
						|
                }
 | 
						|
 | 
						|
                if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
                {
 | 
						|
                    ColExtInfo aExt;
 | 
						|
                    aExt.dbRoot = newDctnryStructList[i].fColDbRoot;
 | 
						|
                    aExt.partNum = newDctnryStructList[i].fColPartition;
 | 
						|
                    aExt.segNum = newDctnryStructList[i].fColSegment;
 | 
						|
                    aExt.compType = newDctnryStructList[i].fCompressionType;
 | 
						|
                    aExt.isDict = true;
 | 
						|
                    aColExtsInfo.push_back(aExt);
 | 
						|
                    aTableMetaData->setColExtsInfo(newDctnryStructList[i].dctnryOid, aColExtsInfo);
 | 
						|
                }
 | 
						|
 | 
						|
                for (uint32_t     rows = 0; rows < rowsLeft; rows++)
 | 
						|
                {
 | 
						|
                    if (dctStr_iter->length() == 0)
 | 
						|
                    {
 | 
						|
                        Token nullToken;
 | 
						|
                        col_iter->data = nullToken;
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.start("tokenize");
 | 
						|
#endif
 | 
						|
                        DctnryTuple dctTuple;
 | 
						|
                        dctTuple.sigValue = (unsigned char*)dctStr_iter->c_str();
 | 
						|
                        dctTuple.sigSize = dctStr_iter->length();
 | 
						|
                        dctTuple.isNull = false;
 | 
						|
                        rc = tokenize(txnid, dctTuple, newDctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                        if (rc != NO_ERROR)
 | 
						|
                        {
 | 
						|
                            dctnry->closeDctnry();
 | 
						|
                            return rc;
 | 
						|
                        }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.stop("tokenize");
 | 
						|
#endif
 | 
						|
                        col_iter->data = dctTuple.token;
 | 
						|
                    }
 | 
						|
 | 
						|
                    dctStr_iter++;
 | 
						|
                    col_iter++;
 | 
						|
                }
 | 
						|
 | 
						|
                //close dictionary files
 | 
						|
                rc = dctnry->closeDctnry();
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
 | 
						|
    //Update column info structure @Bug 1862 set hwm
 | 
						|
    //@Bug 2205 Check whether all rows go to the new extent
 | 
						|
    RID lastRid = 0;
 | 
						|
    RID lastRidNew = 0;
 | 
						|
 | 
						|
    if (totalRow - rowsLeft > 0)
 | 
						|
    {
 | 
						|
        lastRid = rowIdArray[totalRow - rowsLeft - 1];
 | 
						|
        lastRidNew = rowIdArray[totalRow - 1];
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        lastRid = 0;
 | 
						|
        lastRidNew = rowIdArray[totalRow - 1];
 | 
						|
    }
 | 
						|
 | 
						|
    //cout << "rowid allocated is "  << lastRid << endl;
 | 
						|
    //if a new extent is created, all the columns in this table should have their own new extent
 | 
						|
 | 
						|
    //@Bug 1701. Close the file
 | 
						|
    m_colOp[op(curCol.compressionType)]->clearColumn(curCol);
 | 
						|
    std::vector<BulkSetHWMArg> hwmVecNewext;
 | 
						|
    std::vector<BulkSetHWMArg> hwmVecOldext;
 | 
						|
 | 
						|
    if (newExtent) //Save all hwms to set them later.
 | 
						|
    {
 | 
						|
        BulkSetHWMArg aHwmEntryNew;
 | 
						|
        BulkSetHWMArg aHwmEntryOld;
 | 
						|
        bool succFlag = false;
 | 
						|
        unsigned colWidth = 0;
 | 
						|
        int  extState;
 | 
						|
        bool extFound;
 | 
						|
        int      curFbo = 0, curBio;
 | 
						|
 | 
						|
        for (i = 0; i < totalColumns; i++)
 | 
						|
        {
 | 
						|
            Column         curColLocal;
 | 
						|
            colOp->initColumn(curColLocal);
 | 
						|
 | 
						|
            colOp = m_colOp[op(newColStructList[i].fCompressionType)];
 | 
						|
            colOp->setColParam(curColLocal, 0,
 | 
						|
                               newColStructList[i].colWidth, newColStructList[i].colDataType,
 | 
						|
                               newColStructList[i].colType, newColStructList[i].dataOid,
 | 
						|
                               newColStructList[i].fCompressionType, dbRoot, partitionNum, segmentNum);
 | 
						|
 | 
						|
            rc = BRMWrapper::getInstance()->getLastHWM_DBroot(
 | 
						|
                     curColLocal.dataFile.fid, dbRoot, partitionNum, segmentNum, oldHwm,
 | 
						|
                     extState, extFound);
 | 
						|
 | 
						|
            info.oid = curColLocal.dataFile.fid;
 | 
						|
            info.partitionNum = partitionNum;
 | 
						|
            info.segmentNum = segmentNum;
 | 
						|
            info.dbRoot = dbRoot;
 | 
						|
            info.hwm = oldHwm;
 | 
						|
            colExtentInfo.push_back(info);
 | 
						|
            // @Bug 2714 need to set hwm for the old extent
 | 
						|
            colWidth = colStructList[i].colWidth;
 | 
						|
            succFlag = colOp->calculateRowId(lastRid, BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            //cout << "insertcolumnrec   oid:rid:fbo:hwm = " << colStructList[i].dataOid << ":" << lastRid << ":" << curFbo << ":" << hwm << endl;
 | 
						|
            if (succFlag)
 | 
						|
            {
 | 
						|
                if ((HWM)curFbo > oldHwm)
 | 
						|
                {
 | 
						|
                    aHwmEntryOld.oid = colStructList[i].dataOid;
 | 
						|
                    aHwmEntryOld.partNum = partitionNum;
 | 
						|
                    aHwmEntryOld.segNum = segmentNum;
 | 
						|
                    aHwmEntryOld.hwm = curFbo;
 | 
						|
                    hwmVecOldext.push_back(aHwmEntryOld);
 | 
						|
                }
 | 
						|
            }
 | 
						|
            else
 | 
						|
                return ERR_INVALID_PARAM;
 | 
						|
 | 
						|
            colWidth = newColStructList[i].colWidth;
 | 
						|
            succFlag = colOp->calculateRowId(lastRidNew, BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            if (succFlag)
 | 
						|
            {
 | 
						|
                aHwmEntryNew.oid = newColStructList[i].dataOid;
 | 
						|
                aHwmEntryNew.partNum = newColStructList[i].fColPartition;
 | 
						|
                aHwmEntryNew.segNum = newColStructList[i].fColSegment;
 | 
						|
                aHwmEntryNew.hwm = curFbo;
 | 
						|
                hwmVecNewext.push_back(aHwmEntryNew);
 | 
						|
            }
 | 
						|
 | 
						|
            m_colOp[op(curColLocal.compressionType)]->clearColumn(curColLocal);
 | 
						|
        }
 | 
						|
 | 
						|
        //Prepare the valuelist for the new extent
 | 
						|
        ColTupleList colTupleList;
 | 
						|
        ColTupleList newColTupleList;
 | 
						|
        ColTupleList firstPartTupleList;
 | 
						|
 | 
						|
        for (unsigned i = 0; i < totalColumns; i++)
 | 
						|
        {
 | 
						|
            colTupleList = static_cast<ColTupleList>(colValueList[i]);
 | 
						|
 | 
						|
            for (uint64_t j = rowsLeft; j > 0; j--)
 | 
						|
            {
 | 
						|
                newColTupleList.push_back(colTupleList[totalRow - j]);
 | 
						|
            }
 | 
						|
 | 
						|
            colNewValueList.push_back(newColTupleList);
 | 
						|
            newColTupleList.clear();
 | 
						|
 | 
						|
            //upate the oldvalue list for the old extent
 | 
						|
            for (uint64_t j = 0; j < (totalRow - rowsLeft); j++)
 | 
						|
            {
 | 
						|
                firstPartTupleList.push_back(colTupleList[j]);
 | 
						|
            }
 | 
						|
 | 
						|
            colOldValueList.push_back(firstPartTupleList);
 | 
						|
            firstPartTupleList.clear();
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
//Mark extents invalid
 | 
						|
    vector<BRM::LBID_t> lbids;
 | 
						|
    vector<CalpontSystemCatalog::ColDataType> colDataTypes;
 | 
						|
    bool successFlag = true;
 | 
						|
    unsigned width = 0;
 | 
						|
    BRM::LBID_t lbid;
 | 
						|
    int         curFbo = 0, curBio, lastFbo = -1;
 | 
						|
 | 
						|
    if (totalRow - rowsLeft > 0)
 | 
						|
    {
 | 
						|
        for (unsigned i = 0; i < colStructList.size(); i++)
 | 
						|
        {
 | 
						|
            colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
            width = colStructList[i].colWidth;
 | 
						|
            successFlag = colOp->calculateRowId(lastRid, BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
            if (successFlag)
 | 
						|
            {
 | 
						|
                if (curFbo != lastFbo)
 | 
						|
                {
 | 
						|
                    RETURN_ON_ERROR(BRMWrapper::getInstance()->getBrmInfo(
 | 
						|
                                        colStructList[i].dataOid, colStructList[i].fColPartition,
 | 
						|
                                        colStructList[i].fColSegment, curFbo, lbid));
 | 
						|
                    lbids.push_back((BRM::LBID_t)lbid);
 | 
						|
                    colDataTypes.push_back(colStructList[i].colDataType);
 | 
						|
                }
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    lastRid = rowIdArray[totalRow - 1];
 | 
						|
 | 
						|
    for (unsigned i = 0; i < newColStructList.size(); i++)
 | 
						|
    {
 | 
						|
        colOp = m_colOp[op(newColStructList[i].fCompressionType)];
 | 
						|
        width = newColStructList[i].colWidth;
 | 
						|
        successFlag = colOp->calculateRowId(lastRid, BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
        if (successFlag)
 | 
						|
        {
 | 
						|
            if (curFbo != lastFbo)
 | 
						|
            {
 | 
						|
                RETURN_ON_ERROR(AddLBIDtoList(txnid,
 | 
						|
                                              lbids,
 | 
						|
                                              colDataTypes,
 | 
						|
                                              newColStructList[i],
 | 
						|
                                              curFbo));
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    //cout << "lbids size = " << lbids.size()<< endl;
 | 
						|
    if (lbids.size() > 0)
 | 
						|
        rc = BRMWrapper::getInstance()->markExtentsInvalid(lbids, colDataTypes);
 | 
						|
 | 
						|
    if (rc == NO_ERROR)
 | 
						|
    {
 | 
						|
        // MCOL-66 The DBRM can't handle concurrent transactions to sys tables
 | 
						|
        static boost::mutex dbrmMutex;
 | 
						|
        boost::mutex::scoped_lock lk(dbrmMutex);
 | 
						|
 | 
						|
        if (newExtent)
 | 
						|
        {
 | 
						|
            rc = writeColumnRec(txnid, colStructList, colOldValueList, rowIdArray, newColStructList, colNewValueList, tableOid, false); // @bug 5572 HDFS tmp file
 | 
						|
        }
 | 
						|
        else
 | 
						|
        {
 | 
						|
            rc = writeColumnRec(txnid, colStructList, colValueList, rowIdArray, newColStructList, colNewValueList, tableOid, false); // @bug 5572 HDFS tmp file
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.stop("writeColumnRec");
 | 
						|
#endif
 | 
						|
//   for (ColTupleList::size_type  i = 0; i < totalRow; i++)
 | 
						|
//      ridList.push_back((RID) rowIdArray[i]);
 | 
						|
 | 
						|
    // if (rc == NO_ERROR)
 | 
						|
    //   rc = flushDataFiles(NO_ERROR);
 | 
						|
 | 
						|
    if ( !newExtent )
 | 
						|
    {
 | 
						|
        //flushVMCache();
 | 
						|
        bool succFlag = false;
 | 
						|
        unsigned colWidth = 0;
 | 
						|
        int  extState;
 | 
						|
        bool extFound;
 | 
						|
        int curFbo = 0, curBio;
 | 
						|
        std::vector<BulkSetHWMArg> hwmVec;
 | 
						|
 | 
						|
        for (unsigned i = 0; i < totalColumns; i++)
 | 
						|
        {
 | 
						|
            //colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
            //Set all columns hwm together
 | 
						|
            BulkSetHWMArg aHwmEntry;
 | 
						|
            RETURN_ON_ERROR(BRMWrapper::getInstance()->getLastHWM_DBroot(colStructList[i].dataOid, dbRoot, partitionNum, segmentNum, hwm,
 | 
						|
                            extState, extFound));
 | 
						|
            colWidth = colStructList[i].colWidth;
 | 
						|
            succFlag = colOp->calculateRowId(lastRid, BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            //cout << "insertcolumnrec   oid:rid:fbo:hwm = " << colStructList[i].dataOid << ":" << lastRid << ":" << curFbo << ":" << hwm << endl;
 | 
						|
            if (succFlag)
 | 
						|
            {
 | 
						|
                if ((HWM)curFbo > hwm)
 | 
						|
                {
 | 
						|
                    aHwmEntry.oid = colStructList[i].dataOid;
 | 
						|
                    aHwmEntry.partNum = partitionNum;
 | 
						|
                    aHwmEntry.segNum = segmentNum;
 | 
						|
                    aHwmEntry.hwm = curFbo;
 | 
						|
                    hwmVec.push_back(aHwmEntry);
 | 
						|
                }
 | 
						|
            }
 | 
						|
            else
 | 
						|
                return ERR_INVALID_PARAM;
 | 
						|
        }
 | 
						|
 | 
						|
        if (hwmVec.size() > 0 )
 | 
						|
        {
 | 
						|
            std::vector<BRM::CPInfoMerge> mergeCPDataArgs;
 | 
						|
            RETURN_ON_ERROR(BRMWrapper::getInstance()->bulkSetHWMAndCP( hwmVec, mergeCPDataArgs));
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    if (newExtent)
 | 
						|
    {
 | 
						|
#ifdef PROFILE
 | 
						|
        timer.start("flushVMCache");
 | 
						|
#endif
 | 
						|
        std::vector<BRM::CPInfoMerge> mergeCPDataArgs;
 | 
						|
        RETURN_ON_ERROR(BRMWrapper::getInstance()->bulkSetHWMAndCP( hwmVecNewext, mergeCPDataArgs));
 | 
						|
        RETURN_ON_ERROR(BRMWrapper::getInstance()->bulkSetHWMAndCP( hwmVecOldext, mergeCPDataArgs));
 | 
						|
        //flushVMCache();
 | 
						|
#ifdef PROFILE
 | 
						|
        timer.stop("flushVMCache");
 | 
						|
#endif
 | 
						|
    }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.finish();
 | 
						|
#endif
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::insertColumnRec_Single(const TxnID& txnid,
 | 
						|
        ColStructList& colStructList,
 | 
						|
        ColValueList& colValueList,
 | 
						|
        DctnryStructList& dctnryStructList,
 | 
						|
        DictStrList& dictStrList,
 | 
						|
        const int32_t tableOid)
 | 
						|
{
 | 
						|
    int            rc;
 | 
						|
    RID*           rowIdArray = NULL;
 | 
						|
    ColTupleList   curTupleList;
 | 
						|
    Column         curCol;
 | 
						|
    ColStruct      curColStruct;
 | 
						|
    ColValueList   colOldValueList;
 | 
						|
    ColValueList   colNewValueList;
 | 
						|
    ColStructList  newColStructList;
 | 
						|
    DctnryStructList newDctnryStructList;
 | 
						|
    HWM            hwm = 0;
 | 
						|
    HWM            newHwm = 0;
 | 
						|
    HWM            oldHwm = 0;
 | 
						|
    ColTupleList::size_type totalRow;
 | 
						|
    ColStructList::size_type totalColumns;
 | 
						|
    uint64_t rowsLeft = 0;
 | 
						|
    bool newExtent = false;
 | 
						|
    RIDList ridList;
 | 
						|
    ColumnOp* colOp = NULL;
 | 
						|
    uint32_t i = 0;
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    StopWatch timer;
 | 
						|
#endif
 | 
						|
 | 
						|
    // debug information for testing
 | 
						|
    if (isDebug(DEBUG_2))
 | 
						|
    {
 | 
						|
        printf("\nIn wrapper insert\n");
 | 
						|
        printInputValue(colStructList, colValueList, ridList);
 | 
						|
    }
 | 
						|
 | 
						|
    // end
 | 
						|
 | 
						|
    //Convert data type and column width to write engine specific
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
        Convertor::convertColType(&colStructList[i]);
 | 
						|
 | 
						|
    uint32_t colId = 0;
 | 
						|
    // MCOL-1675: find the smallest column width to calculate the RowID from so
 | 
						|
    // that all HWMs will be incremented by this operation
 | 
						|
    findSmallestColumn(colId, colStructList);
 | 
						|
 | 
						|
    rc = checkValid(txnid, colStructList, colValueList, ridList);
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
        return rc;
 | 
						|
 | 
						|
    setTransId(txnid);
 | 
						|
 | 
						|
    curTupleList = static_cast<ColTupleList>(colValueList[0]);
 | 
						|
    totalRow = curTupleList.size();
 | 
						|
    totalColumns = colStructList.size();
 | 
						|
    rowIdArray = new RID[totalRow];
 | 
						|
    // use scoped_array to ensure ptr deletion regardless of where we return
 | 
						|
    boost::scoped_array<RID> rowIdArrayPtr(rowIdArray);
 | 
						|
    memset(rowIdArray, 0, (sizeof(RID)*totalRow));
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // allocate row id(s)
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
	curColStruct = colStructList[colId];
 | 
						|
    colOp = m_colOp[op(curColStruct.fCompressionType)];
 | 
						|
 | 
						|
    colOp->initColumn(curCol);
 | 
						|
 | 
						|
    //Get the correct segment, partition, column file
 | 
						|
    uint16_t dbRoot;
 | 
						|
    uint16_t segmentNum   = 0;
 | 
						|
    uint32_t partitionNum = 0;
 | 
						|
    //Don't search for empty space, always append to the end. May revisit later
 | 
						|
    dbRoot = curColStruct.fColDbRoot;
 | 
						|
    int  extState;
 | 
						|
    bool bStartExtFound;
 | 
						|
    bool bUseStartExtent = false;
 | 
						|
    RETURN_ON_ERROR(BRMWrapper::getInstance()->getLastHWM_DBroot(
 | 
						|
                        curColStruct.dataOid, dbRoot, partitionNum, segmentNum, hwm,
 | 
						|
                        extState, bStartExtFound));
 | 
						|
 | 
						|
    if ((bStartExtFound) && (extState == BRM::EXTENTAVAILABLE))
 | 
						|
        bUseStartExtent = true;
 | 
						|
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
    {
 | 
						|
        colStructList[i].fColPartition = partitionNum;
 | 
						|
        colStructList[i].fColSegment   = segmentNum;
 | 
						|
        colStructList[i].fColDbRoot    = dbRoot;
 | 
						|
    }
 | 
						|
 | 
						|
    for (i = 0; i < dctnryStructList.size(); i++)
 | 
						|
    {
 | 
						|
        dctnryStructList[i].fColPartition = partitionNum;
 | 
						|
        dctnryStructList[i].fColSegment   = segmentNum;
 | 
						|
        dctnryStructList[i].fColDbRoot    = dbRoot;
 | 
						|
    }
 | 
						|
 | 
						|
    oldHwm = hwm; //Save this info for rollback
 | 
						|
    //need to pass real dbRoot, partition, and segment to setColParam
 | 
						|
	colOp->setColParam(curCol, colId, curColStruct.colWidth, curColStruct.colDataType,
 | 
						|
                       curColStruct.colType, curColStruct.dataOid, curColStruct.fCompressionType,
 | 
						|
                       dbRoot, partitionNum, segmentNum);
 | 
						|
 | 
						|
    string segFile;
 | 
						|
 | 
						|
    if (bUseStartExtent)
 | 
						|
    {
 | 
						|
        rc = colOp->openColumnFile(curCol, segFile, true); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
        if (rc != NO_ERROR)
 | 
						|
        {
 | 
						|
            return rc;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    bool newFile;
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.start("allocRowId");
 | 
						|
#endif
 | 
						|
    newColStructList = colStructList;
 | 
						|
    newDctnryStructList = dctnryStructList;
 | 
						|
    std::vector<boost::shared_ptr<DBRootExtentTracker> >  dbRootExtentTrackers;
 | 
						|
    rc = colOp->allocRowId(txnid, bUseStartExtent,
 | 
						|
                           curCol, (uint64_t)totalRow, rowIdArray, hwm, newExtent,
 | 
						|
                           rowsLeft, newHwm, newFile, newColStructList, newDctnryStructList,
 | 
						|
                           dbRootExtentTrackers, false, false, 0);
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Handle case where we ran out of disk space allocating a new extent.
 | 
						|
    // Rollback extentmap and delete any db files that were created.
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
    {
 | 
						|
        if ((rc == ERR_FILE_DISK_SPACE) && newExtent)
 | 
						|
        {
 | 
						|
            vector<ExtentInfo> colExtentInfo;
 | 
						|
            vector<ExtentInfo> dictExtentInfo;
 | 
						|
            vector<ExtentInfo> fileInfo;
 | 
						|
            ExtentInfo info;
 | 
						|
 | 
						|
            for (i = 0; i < newColStructList.size(); i++)
 | 
						|
            {
 | 
						|
                info.oid          = newColStructList[i].dataOid;
 | 
						|
                info.partitionNum = newColStructList[i].fColPartition;
 | 
						|
                info.segmentNum   = newColStructList[i].fColSegment;
 | 
						|
                info.dbRoot       = newColStructList[i].fColDbRoot;
 | 
						|
 | 
						|
                if (newFile)
 | 
						|
                    fileInfo.push_back (info);
 | 
						|
 | 
						|
                colExtentInfo.push_back (info);
 | 
						|
            }
 | 
						|
 | 
						|
            int rc1 = BRMWrapper::getInstance()->deleteEmptyColExtents(colExtentInfo);
 | 
						|
 | 
						|
            // Only rollback dictionary extents "if" store file is new
 | 
						|
            if ((rc1 == 0) && newFile)
 | 
						|
            {
 | 
						|
                for (unsigned int j = 0; j < fileInfo.size(); j++)
 | 
						|
                {
 | 
						|
                    // ignore return code and delete what we can
 | 
						|
                    rc1 = colOp->deleteFile(fileInfo[j].oid,
 | 
						|
                                            fileInfo[j].dbRoot,
 | 
						|
                                            fileInfo[j].partitionNum,
 | 
						|
                                            fileInfo[j].segmentNum);
 | 
						|
                }
 | 
						|
 | 
						|
                fileInfo.clear();
 | 
						|
 | 
						|
                for (i = 0; i < newDctnryStructList.size(); i++)
 | 
						|
                {
 | 
						|
                    if (newDctnryStructList[i].dctnryOid > 0)
 | 
						|
                    {
 | 
						|
                        info.oid          = newDctnryStructList[i].dctnryOid;
 | 
						|
                        info.partitionNum = newDctnryStructList[i].fColPartition;
 | 
						|
                        info.segmentNum   = newDctnryStructList[i].fColSegment;
 | 
						|
                        info.dbRoot       = newDctnryStructList[i].fColDbRoot;
 | 
						|
                        info.newFile      = true;
 | 
						|
                        fileInfo.push_back (info);
 | 
						|
                        dictExtentInfo.push_back (info);
 | 
						|
                    }
 | 
						|
                }
 | 
						|
 | 
						|
                if (dictExtentInfo.size() > 0)
 | 
						|
                {
 | 
						|
                    FileOp fileOp;
 | 
						|
                    rc1 = BRMWrapper::getInstance()->deleteEmptyDictStoreExtents(dictExtentInfo);
 | 
						|
 | 
						|
                    if ( rc1 != NO_ERROR)
 | 
						|
                        return rc;
 | 
						|
 | 
						|
                    for (unsigned j = 0; j < fileInfo.size(); j++)
 | 
						|
                    {
 | 
						|
                        rc1 = fileOp.deleteFile(fileInfo[j].oid,
 | 
						|
                                                fileInfo[j].dbRoot,
 | 
						|
                                                fileInfo[j].partitionNum,
 | 
						|
                                                fileInfo[j].segmentNum);
 | 
						|
                    }
 | 
						|
                }
 | 
						|
            }
 | 
						|
        } // disk space error allocating new extent
 | 
						|
 | 
						|
        return rc;
 | 
						|
    }     // rc != NO_ERROR from call to allocRowID()
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.stop("allocRowId");
 | 
						|
#endif
 | 
						|
 | 
						|
    TableMetaData* aTableMetaData = TableMetaData::makeTableMetaData(tableOid);
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Expand initial abbreviated extent if any RID in 1st extent is > 256K.
 | 
						|
    // if totalRow == rowsLeft, then not adding rows to 1st extent, so skip it.
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
// DMC-SHARED_NOTHING_NOTE: Is it safe to assume only part0 seg0 is abbreviated?
 | 
						|
	if ((colStructList[colId].fColPartition == 0) &&
 | 
						|
		(colStructList[colId].fColSegment   == 0) &&
 | 
						|
            ((totalRow - rowsLeft) > 0) &&
 | 
						|
            (rowIdArray[totalRow - rowsLeft - 1] >= (RID)INITIAL_EXTENT_ROWS_TO_DISK))
 | 
						|
    {
 | 
						|
		for (unsigned k=0; k<colStructList.size(); k++)
 | 
						|
        {
 | 
						|
            if (k == colId)
 | 
						|
               continue;
 | 
						|
            Column expandCol;
 | 
						|
            colOp = m_colOp[op(colStructList[k].fCompressionType)];
 | 
						|
            colOp->setColParam(expandCol, 0,
 | 
						|
                               colStructList[k].colWidth,
 | 
						|
                               colStructList[k].colDataType,
 | 
						|
                               colStructList[k].colType,
 | 
						|
                               colStructList[k].dataOid,
 | 
						|
                               colStructList[k].fCompressionType,
 | 
						|
                               colStructList[k].fColDbRoot,
 | 
						|
                               colStructList[k].fColPartition,
 | 
						|
                               colStructList[k].fColSegment);
 | 
						|
            rc = colOp->openColumnFile(expandCol, segFile, true); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc == NO_ERROR)
 | 
						|
            {
 | 
						|
                if (colOp->abbreviatedExtent(
 | 
						|
                            expandCol.dataFile.pFile, colStructList[k].colWidth))
 | 
						|
                {
 | 
						|
                    rc = colOp->expandAbbrevExtent(expandCol);
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            colOp->clearColumn(expandCol); // closes the file
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
            {
 | 
						|
                return rc;
 | 
						|
            }
 | 
						|
        } // loop through columns
 | 
						|
    }     // if starting extent needs to be expanded
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Tokenize data if needed
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    dictStr::iterator dctStr_iter;
 | 
						|
    ColTupleList::iterator col_iter;
 | 
						|
 | 
						|
    for (unsigned i = 0; i < colStructList.size(); i++)
 | 
						|
    {
 | 
						|
        if (colStructList[i].tokenFlag)
 | 
						|
        {
 | 
						|
            dctStr_iter = dictStrList[i].begin();
 | 
						|
            col_iter = colValueList[i].begin();
 | 
						|
            Dctnry* dctnry = m_dctnry[op(dctnryStructList[i].fCompressionType)];
 | 
						|
 | 
						|
            ColExtsInfo aColExtsInfo = aTableMetaData->getColExtsInfo(dctnryStructList[i].dctnryOid);
 | 
						|
            ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            if (bUseStartExtent)
 | 
						|
            {
 | 
						|
                rc = dctnry->openDctnry(dctnryStructList[i].dctnryOid,
 | 
						|
                                        dctnryStructList[i].fColDbRoot,
 | 
						|
                                        dctnryStructList[i].fColPartition,
 | 
						|
                                        dctnryStructList[i].fColSegment,
 | 
						|
                                        true); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
 | 
						|
                while (it != aColExtsInfo.end())
 | 
						|
                {
 | 
						|
                    if ((it->dbRoot == dctnryStructList[i].fColDbRoot) && (it->partNum == dctnryStructList[i].fColPartition) && (it->segNum == dctnryStructList[i].fColSegment))
 | 
						|
                        break;
 | 
						|
 | 
						|
                    it++;
 | 
						|
                }
 | 
						|
 | 
						|
                if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
                {
 | 
						|
                    ColExtInfo aExt;
 | 
						|
                    aExt.dbRoot = dctnryStructList[i].fColDbRoot;
 | 
						|
                    aExt.partNum = dctnryStructList[i].fColPartition;
 | 
						|
                    aExt.segNum = dctnryStructList[i].fColSegment;
 | 
						|
                    aExt.compType = dctnryStructList[i].fCompressionType;
 | 
						|
                    aExt.isDict = true;
 | 
						|
                    aColExtsInfo.push_back(aExt);
 | 
						|
                    aTableMetaData->setColExtsInfo(dctnryStructList[i].dctnryOid, aColExtsInfo);
 | 
						|
                }
 | 
						|
 | 
						|
 | 
						|
                for (uint32_t rows = 0; rows < (totalRow - rowsLeft); rows++)
 | 
						|
                {
 | 
						|
                    if (dctStr_iter->length() == 0)
 | 
						|
                    {
 | 
						|
                        Token nullToken;
 | 
						|
                        col_iter->data = nullToken;
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.start("tokenize");
 | 
						|
#endif
 | 
						|
                        DctnryTuple dctTuple;
 | 
						|
                        dctTuple.sigValue = (unsigned char*)dctStr_iter->c_str();
 | 
						|
                        dctTuple.sigSize = dctStr_iter->length();
 | 
						|
                        dctTuple.isNull = false;
 | 
						|
                        rc = tokenize(txnid,
 | 
						|
                                      dctTuple,
 | 
						|
                                      dctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                        if (rc != NO_ERROR)
 | 
						|
                        {
 | 
						|
                            dctnry->closeDctnry();
 | 
						|
                            return rc;
 | 
						|
                        }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.stop("tokenize");
 | 
						|
#endif
 | 
						|
                        col_iter->data = dctTuple.token;
 | 
						|
                    }
 | 
						|
 | 
						|
                    dctStr_iter++;
 | 
						|
                    col_iter++;
 | 
						|
                }
 | 
						|
 | 
						|
                //close dictionary files
 | 
						|
                rc = dctnry->closeDctnry();
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
            } // tokenize dictionary rows in 1st extent
 | 
						|
 | 
						|
            if (newExtent)
 | 
						|
            {
 | 
						|
                rc = dctnry->openDctnry(newDctnryStructList[i].dctnryOid,
 | 
						|
                                        newDctnryStructList[i].fColDbRoot,
 | 
						|
                                        newDctnryStructList[i].fColPartition,
 | 
						|
                                        newDctnryStructList[i].fColSegment,
 | 
						|
                                        false); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
 | 
						|
                aColExtsInfo = aTableMetaData->getColExtsInfo(newDctnryStructList[i].dctnryOid);
 | 
						|
                it = aColExtsInfo.begin();
 | 
						|
 | 
						|
                while (it != aColExtsInfo.end())
 | 
						|
                {
 | 
						|
                    if ((it->dbRoot == newDctnryStructList[i].fColDbRoot) && (it->partNum == newDctnryStructList[i].fColPartition) && (it->segNum == newDctnryStructList[i].fColSegment))
 | 
						|
                        break;
 | 
						|
 | 
						|
                    it++;
 | 
						|
                }
 | 
						|
 | 
						|
                if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
                {
 | 
						|
                    ColExtInfo aExt;
 | 
						|
                    aExt.dbRoot = newDctnryStructList[i].fColDbRoot;
 | 
						|
                    aExt.partNum = newDctnryStructList[i].fColPartition;
 | 
						|
                    aExt.segNum = newDctnryStructList[i].fColSegment;
 | 
						|
                    aExt.compType = newDctnryStructList[i].fCompressionType;
 | 
						|
                    aExt.isDict = true;
 | 
						|
                    aColExtsInfo.push_back(aExt);
 | 
						|
                    aTableMetaData->setColExtsInfo(newDctnryStructList[i].dctnryOid, aColExtsInfo);
 | 
						|
                }
 | 
						|
 | 
						|
                for (uint32_t rows = 0; rows < rowsLeft; rows++)
 | 
						|
                {
 | 
						|
                    if (dctStr_iter->length() == 0)
 | 
						|
                    {
 | 
						|
                        Token nullToken;
 | 
						|
                        col_iter->data = nullToken;
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.start("tokenize");
 | 
						|
#endif
 | 
						|
                        DctnryTuple dctTuple;
 | 
						|
                        dctTuple.sigValue = (unsigned char*)dctStr_iter->c_str();
 | 
						|
                        dctTuple.sigSize = dctStr_iter->length();
 | 
						|
                        dctTuple.isNull = false;
 | 
						|
                        rc = tokenize(txnid,
 | 
						|
                                      dctTuple,
 | 
						|
                                      newDctnryStructList[i].fCompressionType);
 | 
						|
 | 
						|
                        if (rc != NO_ERROR)
 | 
						|
                        {
 | 
						|
                            dctnry->closeDctnry();
 | 
						|
                            return rc;
 | 
						|
                        }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                        timer.stop("tokenize");
 | 
						|
#endif
 | 
						|
                        col_iter->data = dctTuple.token;
 | 
						|
                    }
 | 
						|
 | 
						|
                    dctStr_iter++;
 | 
						|
                    col_iter++;
 | 
						|
                }
 | 
						|
 | 
						|
                //close dictionary files
 | 
						|
                rc = dctnry->closeDctnry();
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    return rc;
 | 
						|
            } // tokenize dictionary rows in second extent
 | 
						|
        }     // tokenize dictionary columns
 | 
						|
    }         // loop through columns to see which ones need tokenizing
 | 
						|
 | 
						|
    //----------------------------------------------------------------------
 | 
						|
    // Update column info structure @Bug 1862 set hwm, and
 | 
						|
    // Prepare ValueList for new extent (if applicable)
 | 
						|
    //----------------------------------------------------------------------
 | 
						|
    //@Bug 2205 Check whether all rows go to the new extent
 | 
						|
    RID lastRid = 0;
 | 
						|
    RID lastRidNew = 0;
 | 
						|
 | 
						|
    if (totalRow - rowsLeft > 0)
 | 
						|
    {
 | 
						|
        lastRid = rowIdArray[totalRow - rowsLeft - 1];
 | 
						|
        lastRidNew = rowIdArray[totalRow - 1];
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        lastRid = 0;
 | 
						|
        lastRidNew = rowIdArray[totalRow - 1];
 | 
						|
    }
 | 
						|
 | 
						|
    //cout << "rowid allocated is "  << lastRid << endl;
 | 
						|
    //if a new extent is created, all the columns in this table should
 | 
						|
    //have their own new extent
 | 
						|
 | 
						|
    //@Bug 1701. Close the file
 | 
						|
    if (bUseStartExtent)
 | 
						|
    {
 | 
						|
        m_colOp[op(curCol.compressionType)]->clearColumn(curCol);
 | 
						|
    }
 | 
						|
 | 
						|
    std::vector<BulkSetHWMArg> hwmVecNewext;
 | 
						|
    std::vector<BulkSetHWMArg> hwmVecOldext;
 | 
						|
 | 
						|
    if (newExtent) //Save all hwms to set them later.
 | 
						|
    {
 | 
						|
        BulkSetHWMArg aHwmEntryNew;
 | 
						|
        BulkSetHWMArg aHwmEntryOld;
 | 
						|
 | 
						|
        bool succFlag = false;
 | 
						|
        unsigned colWidth = 0;
 | 
						|
        int curFbo = 0, curBio;
 | 
						|
 | 
						|
        for (i = 0; i < totalColumns; i++)
 | 
						|
        {
 | 
						|
            colOp = m_colOp[op(newColStructList[i].fCompressionType)];
 | 
						|
 | 
						|
            // @Bug 2714 need to set hwm for the old extent
 | 
						|
            colWidth = colStructList[i].colWidth;
 | 
						|
            succFlag = colOp->calculateRowId(lastRid,
 | 
						|
                                             BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            //cout << "insertcolumnrec   oid:rid:fbo:hwm = " <<
 | 
						|
            //colStructList[i].dataOid << ":" << lastRid << ":" <<
 | 
						|
            //curFbo << ":" << hwm << endl;
 | 
						|
            if (succFlag)
 | 
						|
            {
 | 
						|
                if ((HWM)curFbo > oldHwm)
 | 
						|
                {
 | 
						|
                    aHwmEntryOld.oid     = colStructList[i].dataOid;
 | 
						|
                    aHwmEntryOld.partNum = colStructList[i].fColPartition;
 | 
						|
                    aHwmEntryOld.segNum  = colStructList[i].fColSegment;
 | 
						|
                    aHwmEntryOld.hwm     = curFbo;
 | 
						|
                    hwmVecOldext.push_back(aHwmEntryOld);
 | 
						|
                }
 | 
						|
            }
 | 
						|
            else
 | 
						|
                return ERR_INVALID_PARAM;
 | 
						|
 | 
						|
            colWidth = newColStructList[i].colWidth;
 | 
						|
            succFlag = colOp->calculateRowId(lastRidNew,
 | 
						|
                                             BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            if (succFlag)
 | 
						|
            {
 | 
						|
                aHwmEntryNew.oid     = newColStructList[i].dataOid;
 | 
						|
                aHwmEntryNew.partNum = newColStructList[i].fColPartition;
 | 
						|
                aHwmEntryNew.segNum  = newColStructList[i].fColSegment;
 | 
						|
                aHwmEntryNew.hwm     = curFbo;
 | 
						|
                hwmVecNewext.push_back(aHwmEntryNew);
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        // Prepare the valuelist for the new extent
 | 
						|
        //----------------------------------------------------------------------
 | 
						|
        ColTupleList colTupleList;
 | 
						|
        ColTupleList newColTupleList;
 | 
						|
        ColTupleList firstPartTupleList;
 | 
						|
 | 
						|
        for (unsigned i = 0; i < totalColumns; i++)
 | 
						|
        {
 | 
						|
            colTupleList = static_cast<ColTupleList>(colValueList[i]);
 | 
						|
 | 
						|
            for (uint64_t j = rowsLeft; j > 0; j--)
 | 
						|
            {
 | 
						|
                newColTupleList.push_back(colTupleList[totalRow - j]);
 | 
						|
            }
 | 
						|
 | 
						|
            colNewValueList.push_back(newColTupleList);
 | 
						|
 | 
						|
            newColTupleList.clear();
 | 
						|
 | 
						|
            //upate the oldvalue list for the old extent
 | 
						|
            for (uint64_t j = 0; j < (totalRow - rowsLeft); j++)
 | 
						|
            {
 | 
						|
                firstPartTupleList.push_back(colTupleList[j]);
 | 
						|
            }
 | 
						|
 | 
						|
            colOldValueList.push_back(firstPartTupleList);
 | 
						|
            firstPartTupleList.clear();
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    //Mark extents invalid
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    vector<BRM::LBID_t> lbids;
 | 
						|
    vector<CalpontSystemCatalog::ColDataType> colDataTypes;
 | 
						|
    bool successFlag = true;
 | 
						|
    unsigned width = 0;
 | 
						|
    //BRM::LBID_t lbid;
 | 
						|
    int curFbo = 0, curBio, lastFbo = -1;
 | 
						|
    /*	if (totalRow-rowsLeft > 0)
 | 
						|
    	{
 | 
						|
    		for (unsigned i = 0; i < colStructList.size(); i++)
 | 
						|
    		{
 | 
						|
    			colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
    			width = colStructList[i].colWidth;
 | 
						|
    			successFlag = colOp->calculateRowId(lastRid ,
 | 
						|
    				BYTE_PER_BLOCK/width, width, curFbo, curBio);
 | 
						|
    			if (successFlag) {
 | 
						|
    				if (curFbo != lastFbo) {
 | 
						|
    					RETURN_ON_ERROR(BRMWrapper::getInstance()->getBrmInfo(
 | 
						|
    						colStructList[i].dataOid,
 | 
						|
    						colStructList[i].fColPartition,
 | 
						|
    						colStructList[i].fColSegment, curFbo, lbid));
 | 
						|
    					lbids.push_back((BRM::LBID_t)lbid);
 | 
						|
    					colDataTypes.push_back(colStructList[i].colDataType);
 | 
						|
    				}
 | 
						|
    			}
 | 
						|
    		}
 | 
						|
    	}
 | 
						|
    */
 | 
						|
    lastRid = rowIdArray[totalRow - 1];
 | 
						|
 | 
						|
    for (unsigned i = 0; i < colStructList.size(); i++)
 | 
						|
    {
 | 
						|
        colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
        width = colStructList[i].colWidth;
 | 
						|
        successFlag = colOp->calculateRowId(lastRid,
 | 
						|
                                            BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
        if (successFlag)
 | 
						|
        {
 | 
						|
            if (curFbo != lastFbo)
 | 
						|
            {
 | 
						|
                colDataTypes.push_back(colStructList[i].colDataType);
 | 
						|
                RETURN_ON_ERROR(AddLBIDtoList(txnid,
 | 
						|
                                              lbids,
 | 
						|
                                              colDataTypes,
 | 
						|
                                              colStructList[i],
 | 
						|
                                              curFbo));
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    //cout << "lbids size = " << lbids.size()<< endl;
 | 
						|
    if (lbids.size() > 0)
 | 
						|
        rc = BRMWrapper::getInstance()->markExtentsInvalid(lbids, colDataTypes);
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Write row(s) to database file(s)
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.start("writeColumnRec");
 | 
						|
#endif
 | 
						|
 | 
						|
    if (rc == NO_ERROR)
 | 
						|
    {
 | 
						|
        if (newExtent)
 | 
						|
        {
 | 
						|
            rc = writeColumnRec(txnid, colStructList, colOldValueList,
 | 
						|
                                rowIdArray, newColStructList, colNewValueList, tableOid,
 | 
						|
                                false); // @bug 5572 HDFS tmp file
 | 
						|
        }
 | 
						|
        else
 | 
						|
        {
 | 
						|
            rc = writeColumnRec(txnid, colStructList, colValueList,
 | 
						|
                                rowIdArray, newColStructList, colNewValueList, tableOid,
 | 
						|
                                true); // @bug 5572 HDFS tmp file
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.stop("writeColumnRec");
 | 
						|
#endif
 | 
						|
//  for (ColTupleList::size_type  i = 0; i < totalRow; i++)
 | 
						|
//      ridList.push_back((RID) rowIdArray[i]);
 | 
						|
 | 
						|
//  if (rc == NO_ERROR)
 | 
						|
//  rc = flushDataFiles(NO_ERROR);
 | 
						|
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    // Update BRM
 | 
						|
    //--------------------------------------------------------------------------
 | 
						|
    if ( !newExtent )
 | 
						|
    {
 | 
						|
        //flushVMCache();
 | 
						|
        bool succFlag = false;
 | 
						|
        unsigned colWidth = 0;
 | 
						|
        int  extState;
 | 
						|
        bool extFound;
 | 
						|
        int curFbo = 0, curBio;
 | 
						|
        std::vector<BulkSetHWMArg> hwmVec;
 | 
						|
 | 
						|
        for (unsigned i = 0; i < totalColumns; i++)
 | 
						|
        {
 | 
						|
            //colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
            //Set all columns hwm together
 | 
						|
            BulkSetHWMArg aHwmEntry;
 | 
						|
            RETURN_ON_ERROR(BRMWrapper::getInstance()->getLastHWM_DBroot(
 | 
						|
                                colStructList[i].dataOid,
 | 
						|
                                colStructList[i].fColDbRoot,
 | 
						|
                                colStructList[i].fColPartition,
 | 
						|
                                colStructList[i].fColSegment,
 | 
						|
                                hwm,
 | 
						|
                                extState, extFound));
 | 
						|
            colWidth = colStructList[i].colWidth;
 | 
						|
            succFlag = colOp->calculateRowId(lastRid,
 | 
						|
                                             BYTE_PER_BLOCK / colWidth, colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            //cout << "insertcolumnrec   oid:rid:fbo:hwm = " <<
 | 
						|
            //colStructList[i].dataOid << ":" << lastRid << ":" <<
 | 
						|
            //curFbo << ":" << hwm << endl;
 | 
						|
            if (succFlag)
 | 
						|
            {
 | 
						|
                if ((HWM)curFbo > hwm)
 | 
						|
                {
 | 
						|
                    aHwmEntry.oid     = colStructList[i].dataOid;
 | 
						|
                    aHwmEntry.partNum = colStructList[i].fColPartition;
 | 
						|
                    aHwmEntry.segNum  = colStructList[i].fColSegment;
 | 
						|
                    aHwmEntry.hwm     = curFbo;
 | 
						|
                    hwmVec.push_back(aHwmEntry);
 | 
						|
                }
 | 
						|
            }
 | 
						|
            else
 | 
						|
                return ERR_INVALID_PARAM;
 | 
						|
        }
 | 
						|
 | 
						|
        std::vector<BRM::CPInfoMerge> mergeCPDataArgs;
 | 
						|
        RETURN_ON_ERROR(BRMWrapper::getInstance()->bulkSetHWMAndCP(
 | 
						|
                            hwmVec, mergeCPDataArgs));
 | 
						|
    }
 | 
						|
    else // if (newExtent)
 | 
						|
    {
 | 
						|
#ifdef PROFILE
 | 
						|
        timer.start("flushVMCache");
 | 
						|
#endif
 | 
						|
        std::vector<BRM::CPInfoMerge> mergeCPDataArgs;
 | 
						|
 | 
						|
        if (hwmVecNewext.size() > 0)
 | 
						|
            RETURN_ON_ERROR(BRMWrapper::getInstance()->bulkSetHWMAndCP(
 | 
						|
                                hwmVecNewext, mergeCPDataArgs));
 | 
						|
 | 
						|
        if (hwmVecOldext.size() > 0)
 | 
						|
            RETURN_ON_ERROR(BRMWrapper::getInstance()->bulkSetHWMAndCP(
 | 
						|
                                hwmVecOldext, mergeCPDataArgs));
 | 
						|
 | 
						|
        //flushVMCache();
 | 
						|
#ifdef PROFILE
 | 
						|
        timer.stop("flushVMCache");
 | 
						|
#endif
 | 
						|
    }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.finish();
 | 
						|
#endif
 | 
						|
    //flush PrimProc FD cache moved to we_dmlcommandproc.cpp
 | 
						|
    /*	ColsExtsInfoMap colsExtsInfoMap = aTableMetaData->getColsExtsInfoMap();
 | 
						|
    	ColsExtsInfoMap::iterator it = colsExtsInfoMap.begin();
 | 
						|
    	ColExtsInfo::iterator aIt;
 | 
						|
    	std::vector<BRM::FileInfo> files;
 | 
						|
    	BRM::FileInfo aFile;
 | 
						|
    	while (it != colsExtsInfoMap.end())
 | 
						|
    	{
 | 
						|
    		aIt = (it->second).begin();
 | 
						|
    		aFile.oid = it->first;
 | 
						|
    		//cout << "OID:" << aArg.oid;
 | 
						|
    		while (aIt != (it->second).end())
 | 
						|
    		{
 | 
						|
    			aFile.partitionNum = aIt->partNum;
 | 
						|
    			aFile.dbRoot =aIt->dbRoot;
 | 
						|
    			aFile.segmentNum = aIt->segNum;
 | 
						|
    			aFile.compType = aIt->compType;
 | 
						|
    			files.push_back(aFile);
 | 
						|
    			//cout <<"Added to files oid:dbroot:part:seg:compType = " << aFile.oid<<":"<<aFile.dbRoot<<":"<<aFile.partitionNum<<":"<<aFile.segmentNum
 | 
						|
    			//<<":"<<aFile.compType <<endl;
 | 
						|
    			aIt++;
 | 
						|
    		}
 | 
						|
    		it++;
 | 
						|
    	}
 | 
						|
    	if ((idbdatafile::IDBPolicy::useHdfs()) && (files.size() > 0))
 | 
						|
    		cacheutils::purgePrimProcFdCache(files, Config::getLocalModuleID());
 | 
						|
    	TableMetaData::removeTableMetaData(tableOid);	*/
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
/*@brief printInputValue - Print input value
 | 
						|
*/
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Print input value
 | 
						|
 * PARAMETERS:
 | 
						|
 *    tableOid - table object id
 | 
						|
 *    colStructList - column struct list
 | 
						|
 *    colValueList - column value list
 | 
						|
 *    ridList - RID list
 | 
						|
 * RETURN:
 | 
						|
 *    none
 | 
						|
 ***********************************************************/
 | 
						|
void WriteEngineWrapper::printInputValue(const ColStructList& colStructList,
 | 
						|
        const ColValueList& colValueList,
 | 
						|
        const RIDList& ridList) const
 | 
						|
{
 | 
						|
    ColTupleList   curTupleList;
 | 
						|
    ColStruct      curColStruct;
 | 
						|
    ColTuple       curTuple;
 | 
						|
    string         curStr;
 | 
						|
    ColStructList::size_type i;
 | 
						|
    ColTupleList::size_type  j;
 | 
						|
 | 
						|
    printf("\n=========================\n");
 | 
						|
//      printf("\nTable OID : %d \n", tableOid);
 | 
						|
 | 
						|
    printf("\nTotal RIDs: %zu\n", ridList.size());
 | 
						|
 | 
						|
    for (i = 0; i < ridList.size(); i++)
 | 
						|
        cout << "RID[" << i << "] : " << ridList[i] << "\n";
 | 
						|
 | 
						|
    printf("\nTotal Columns: %zu\n", colStructList.size());
 | 
						|
 | 
						|
 | 
						|
    for (i = 0; i < colStructList.size(); i++)
 | 
						|
    {
 | 
						|
        curColStruct = colStructList[i];
 | 
						|
        curTupleList = colValueList[i];
 | 
						|
 | 
						|
        printf("\nColumn[%zu]", i);
 | 
						|
        printf("\nData file OID : %d \t", curColStruct.dataOid);
 | 
						|
        printf("\tWidth : %d \t Type: %d", curColStruct.colWidth, curColStruct.colDataType);
 | 
						|
        printf("\nTotal values : %zu \n", curTupleList.size());
 | 
						|
 | 
						|
        for (j = 0; j < curTupleList.size(); j++)
 | 
						|
        {
 | 
						|
            curTuple = curTupleList[j];
 | 
						|
 | 
						|
            try
 | 
						|
            {
 | 
						|
                if (curTuple.data.type() == typeid(int))
 | 
						|
                    curStr = boost::lexical_cast<string>(boost::any_cast<int>(curTuple.data));
 | 
						|
                else if (curTuple.data.type() == typeid(float))
 | 
						|
                    curStr = boost::lexical_cast<string>(boost::any_cast<float>(curTuple.data));
 | 
						|
                else if (curTuple.data.type() == typeid(long long))
 | 
						|
                    curStr = boost::lexical_cast<string>(boost::any_cast<long long>(curTuple.data));
 | 
						|
                else if (curTuple.data.type() == typeid(double))
 | 
						|
                    curStr = boost::lexical_cast<string>(boost::any_cast<double>(curTuple.data));
 | 
						|
//               else
 | 
						|
//               if (curTuple.data.type() == typeid(bool))
 | 
						|
//                  curStr = boost::lexical_cast<string>(boost::any_cast<bool>(curTuple.data));
 | 
						|
                else if (curTuple.data.type() == typeid(short))
 | 
						|
                    curStr = boost::lexical_cast<string>(boost::any_cast<short>(curTuple.data));
 | 
						|
                else if (curTuple.data.type() == typeid(char))
 | 
						|
                    curStr = boost::lexical_cast<string>(boost::any_cast<char>(curTuple.data));
 | 
						|
                else
 | 
						|
                    curStr = boost::any_cast<string>(curTuple.data);
 | 
						|
            }
 | 
						|
            catch (...)
 | 
						|
            {
 | 
						|
            }
 | 
						|
 | 
						|
            if (isDebug(DEBUG_3))
 | 
						|
                printf("Value[%zu] : %s\n", j, curStr.c_str());
 | 
						|
        }
 | 
						|
 | 
						|
    }
 | 
						|
 | 
						|
    printf("\n=========================\n");
 | 
						|
}
 | 
						|
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Process version buffer before any write operation
 | 
						|
 * PARAMETERS:
 | 
						|
 *    txnid - transaction id
 | 
						|
 *    oid - column oid
 | 
						|
 *    totalRow - total number of rows
 | 
						|
 *    rowIdArray - rowid array
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if success
 | 
						|
 *    others if something wrong in inserting the value
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::processVersionBuffer(IDBDataFile* pFile, const TxnID& txnid,
 | 
						|
        const ColStruct& colStruct, int width,
 | 
						|
        int totalRow, const RID* rowIdArray, vector<LBIDRange>&   rangeList)
 | 
						|
{
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
        return 0;
 | 
						|
 | 
						|
    RID         curRowId;
 | 
						|
    int         rc = NO_ERROR;
 | 
						|
    int         curFbo = 0, curBio, lastFbo = -1;
 | 
						|
    bool        successFlag;
 | 
						|
    BRM::LBID_t lbid;
 | 
						|
    BRM::VER_t  verId = (BRM::VER_t) txnid;
 | 
						|
    vector<uint32_t> fboList;
 | 
						|
    LBIDRange   range;
 | 
						|
    ColumnOp* colOp = m_colOp[op(colStruct.fCompressionType)];
 | 
						|
 | 
						|
    for (int i = 0; i < totalRow; i++)
 | 
						|
    {
 | 
						|
        curRowId = rowIdArray[i];
 | 
						|
        //cout << "processVersionBuffer got rid " << curRowId << endl;
 | 
						|
        successFlag = colOp->calculateRowId(curRowId, BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
        if (successFlag)
 | 
						|
        {
 | 
						|
            if (curFbo != lastFbo)
 | 
						|
            {
 | 
						|
                //cout << "processVersionBuffer is processing lbid  " << lbid << endl;
 | 
						|
                RETURN_ON_ERROR(BRMWrapper::getInstance()->getBrmInfo(
 | 
						|
                                    colStruct.dataOid, colStruct.fColPartition, colStruct.fColSegment, curFbo, lbid));
 | 
						|
                //cout << "processVersionBuffer is processing lbid  " << lbid << endl;
 | 
						|
                fboList.push_back((uint32_t)curFbo);
 | 
						|
                range.start = lbid;
 | 
						|
                range.size = 1;
 | 
						|
                rangeList.push_back(range);
 | 
						|
            }
 | 
						|
 | 
						|
            lastFbo = curFbo;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    std::vector<VBRange> freeList;
 | 
						|
    rc = BRMWrapper::getInstance()->
 | 
						|
         writeVB(pFile, verId, colStruct.dataOid, fboList, rangeList, colOp, freeList, colStruct.fColDbRoot);
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::processVersionBuffers(IDBDataFile* pFile, const TxnID& txnid,
 | 
						|
        const ColStruct& colStruct, int width,
 | 
						|
        int totalRow, const RIDList& ridList,
 | 
						|
        vector<LBIDRange>&    rangeList)
 | 
						|
{
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
        return 0;
 | 
						|
 | 
						|
    RID         curRowId;
 | 
						|
    int         rc = NO_ERROR;
 | 
						|
    int         curFbo = 0, curBio, lastFbo = -1;
 | 
						|
    bool        successFlag;
 | 
						|
    BRM::LBID_t lbid;
 | 
						|
    BRM::VER_t  verId = (BRM::VER_t) txnid;
 | 
						|
    LBIDRange   range;
 | 
						|
    vector<uint32_t> fboList;
 | 
						|
    //vector<LBIDRange>   rangeList;
 | 
						|
    ColumnOp* colOp = m_colOp[op(colStruct.fCompressionType)];
 | 
						|
 | 
						|
    for (int i = 0; i < totalRow; i++)
 | 
						|
    {
 | 
						|
        curRowId = ridList[i];
 | 
						|
        //cout << "processVersionBuffer got rid " << curRowId << endl;
 | 
						|
        successFlag = colOp->calculateRowId(curRowId, BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
        if (successFlag)
 | 
						|
        {
 | 
						|
            if (curFbo != lastFbo)
 | 
						|
            {
 | 
						|
                //cout << "processVersionBuffer is processing lbid  " << lbid << endl;
 | 
						|
                RETURN_ON_ERROR(BRMWrapper::getInstance()->getBrmInfo(
 | 
						|
                                    colStruct.dataOid, colStruct.fColPartition, colStruct.fColSegment, curFbo, lbid));
 | 
						|
                //cout << "processVersionBuffer is processing lbid  " << lbid << endl;
 | 
						|
                fboList.push_back((uint32_t)curFbo);
 | 
						|
                range.start = lbid;
 | 
						|
                range.size = 1;
 | 
						|
                rangeList.push_back(range);
 | 
						|
            }
 | 
						|
 | 
						|
            lastFbo = curFbo;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
//cout << "calling writeVB with blocks " << rangeList.size() << endl;
 | 
						|
    std::vector<VBRange> freeList;
 | 
						|
    rc = BRMWrapper::getInstance()->
 | 
						|
         writeVB(pFile, verId, colStruct.dataOid, fboList, rangeList, colOp, freeList, colStruct.fColDbRoot);
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::processBeginVBCopy(const TxnID& txnid, const vector<ColStruct>& colStructList, const RIDList& ridList,
 | 
						|
        std::vector<VBRange>& freeList, vector<vector<uint32_t> >& fboLists, vector<vector<LBIDRange> >& rangeLists,
 | 
						|
        vector<LBIDRange>&   rangeListTot)
 | 
						|
{
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
        return 0;
 | 
						|
 | 
						|
    RID         curRowId;
 | 
						|
    int         rc = NO_ERROR;
 | 
						|
    int         curFbo = 0, curBio, lastFbo = -1;
 | 
						|
    bool        successFlag;
 | 
						|
    BRM::LBID_t lbid;
 | 
						|
    LBIDRange   range;
 | 
						|
 | 
						|
//StopWatch timer;
 | 
						|
// timer.start("calculation");
 | 
						|
    for (uint32_t j = 0; j < colStructList.size(); j++)
 | 
						|
    {
 | 
						|
        vector<uint32_t> fboList;
 | 
						|
        vector<LBIDRange>    rangeList;
 | 
						|
        lastFbo = -1;
 | 
						|
        ColumnOp* colOp = m_colOp[op(colStructList[j].fCompressionType)];
 | 
						|
 | 
						|
        ColStruct curColStruct = colStructList[j];
 | 
						|
        Convertor::convertColType(&curColStruct);
 | 
						|
 | 
						|
        for (uint32_t i = 0; i < ridList.size(); i++)
 | 
						|
        {
 | 
						|
            curRowId = ridList[i];
 | 
						|
            //cout << "processVersionBuffer got rid " << curRowId << endl;
 | 
						|
            successFlag = colOp->calculateRowId(curRowId, BYTE_PER_BLOCK / curColStruct.colWidth, curColStruct.colWidth, curFbo, curBio);
 | 
						|
 | 
						|
            if (successFlag)
 | 
						|
            {
 | 
						|
                if (curFbo != lastFbo)
 | 
						|
                {
 | 
						|
                    //cout << "processVersionBuffer is processing curFbo  " << curFbo << endl;
 | 
						|
                    RETURN_ON_ERROR(BRMWrapper::getInstance()->getBrmInfo(
 | 
						|
                                        colStructList[j].dataOid, colStructList[j].fColPartition, colStructList[j].fColSegment, curFbo, lbid));
 | 
						|
                    //cout << "beginVBCopy is processing lbid:transaction  " << lbid <<":"<<txnid<< endl;
 | 
						|
                    fboList.push_back((uint32_t)curFbo);
 | 
						|
                    range.start = lbid;
 | 
						|
                    range.size = 1;
 | 
						|
                    rangeList.push_back(range);
 | 
						|
                }
 | 
						|
 | 
						|
                lastFbo = curFbo;
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        BRMWrapper::getInstance()->pruneLBIDList(txnid, &rangeList, &fboList);
 | 
						|
        rangeLists.push_back(rangeList);
 | 
						|
 | 
						|
        fboLists.push_back(fboList);
 | 
						|
        rangeListTot.insert(rangeListTot.end(), rangeList.begin(), rangeList.end());
 | 
						|
    }
 | 
						|
 | 
						|
    if (rangeListTot.size() > 0)
 | 
						|
        rc = BRMWrapper::getInstance()->getDbrmObject()->beginVBCopy(txnid, colStructList[0].fColDbRoot, rangeListTot, freeList);
 | 
						|
 | 
						|
//timer.stop("beginVBCopy");
 | 
						|
//timer.finish();
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
/**
 | 
						|
* @brief Process versioning for batch insert - only version the hwm block.
 | 
						|
*/
 | 
						|
#if 0
 | 
						|
int WriteEngineWrapper::processBatchVersions(const TxnID& txnid, std::vector<Column> columns, std::vector<BRM::LBIDRange>&   rangeList)
 | 
						|
{
 | 
						|
    int rc = 0;
 | 
						|
    std::vector<DbFileOp*> fileOps;
 | 
						|
 | 
						|
    //open the column files
 | 
						|
    for ( unsigned i = 0; i < columns.size(); i++)
 | 
						|
    {
 | 
						|
        ColumnOp* colOp = m_colOp[op(columns[i].compressionType)];
 | 
						|
        Column curCol;
 | 
						|
        // set params
 | 
						|
        colOp->initColumn(curCol);
 | 
						|
        ColType colType;
 | 
						|
        Convertor::convertColType(columns[i].colDataType, colType);
 | 
						|
        colOp->setColParam(curCol, 0, columns[i].colWidth,
 | 
						|
                           columns[i].colDataType, colType, columns[i].dataFile.oid,
 | 
						|
                           columns[i].compressionType,
 | 
						|
                           columns[i].dataFile.fDbRoot, columns[i].dataFile.fPartition, columns[i].dataFile.fSegment);
 | 
						|
        string segFile;
 | 
						|
        rc = colOp->openColumnFile(curCol, segFile, IO_BUFF_SIZE);
 | 
						|
 | 
						|
        if (rc != NO_ERROR)
 | 
						|
            break;
 | 
						|
 | 
						|
        columns[i].dataFile.pFile = curCol.dataFile.pFile;
 | 
						|
        fileOps.push_back(colOp);
 | 
						|
    }
 | 
						|
 | 
						|
    if ( rc == 0)
 | 
						|
    {
 | 
						|
        BRM::VER_t  verId = (BRM::VER_t) txnid;
 | 
						|
        rc = BRMWrapper::getInstance()->writeBatchVBs(verId, columns, rangeList, fileOps);
 | 
						|
    }
 | 
						|
 | 
						|
    //close files
 | 
						|
    for ( unsigned i = 0; i < columns.size(); i++)
 | 
						|
    {
 | 
						|
        ColumnOp* colOp = dynamic_cast<ColumnOp*> (fileOps[i]);
 | 
						|
        Column curCol;
 | 
						|
        // set params
 | 
						|
        colOp->initColumn(curCol);
 | 
						|
        ColType colType;
 | 
						|
        Convertor::convertColType(columns[i].colDataType, colType);
 | 
						|
        colOp->setColParam(curCol, 0, columns[i].colWidth,
 | 
						|
                           columns[i].colDataType, colType, columns[i].dataFile.oid,
 | 
						|
                           columns[i].compressionType,
 | 
						|
                           columns[i].dataFile.fDbRoot, columns[i].dataFile.fPartition, columns[i].dataFile.fSegment);
 | 
						|
        curCol.dataFile.pFile = columns[i].dataFile.pFile;
 | 
						|
        colOp->clearColumn(curCol);
 | 
						|
    }
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
#endif
 | 
						|
void WriteEngineWrapper::writeVBEnd(const TxnID& txnid, std::vector<BRM::LBIDRange>&   rangeList)
 | 
						|
{
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
        return;
 | 
						|
 | 
						|
    BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::updateColumnRec(const TxnID& txnid,
 | 
						|
                                        vector<ColStructList>& colExtentsStruct,
 | 
						|
                                        ColValueList& colValueList,
 | 
						|
                                        vector<void*>& colOldValueList,
 | 
						|
                                        vector<RIDList>& ridLists,
 | 
						|
                                        vector<DctnryStructList>& dctnryExtentsStruct,
 | 
						|
                                        DctnryValueList& dctnryValueList,
 | 
						|
                                        const int32_t tableOid)
 | 
						|
{
 | 
						|
    int            rc = 0;
 | 
						|
    //RID*           rowIdArray = NULL;
 | 
						|
    //RIDList::size_type i;
 | 
						|
    unsigned numExtents = colExtentsStruct.size();
 | 
						|
    // ColValueList tmpColValueList;
 | 
						|
    RIDList::const_iterator ridsIter;
 | 
						|
    ColStructList colStructList;
 | 
						|
    DctnryStructList dctnryStructList;
 | 
						|
    ColumnOp* colOp = NULL;
 | 
						|
 | 
						|
    for (unsigned extent = 0; extent < numExtents; extent++)
 | 
						|
    {
 | 
						|
        ridsIter = ridLists[extent].begin();
 | 
						|
 | 
						|
        //rowIdArray = (RID*)calloc(sizeof(RID), ridLists[extent].size());
 | 
						|
 | 
						|
        colStructList = colExtentsStruct[extent];
 | 
						|
        dctnryStructList = dctnryExtentsStruct[extent];
 | 
						|
 | 
						|
        if (m_opType != DELETE)
 | 
						|
        {
 | 
						|
 | 
						|
            /*            ColTuple colTuple;
 | 
						|
                     ColTupleList colTupleList;
 | 
						|
                     for (i=0; i < colValueList.size(); i++)
 | 
						|
                     {
 | 
						|
                         colTupleList = colValueList[i];
 | 
						|
                         colTuple = colTupleList[0];
 | 
						|
                         for (unsigned i = 1; i < ridLists[extent].size(); i++)
 | 
						|
                         {
 | 
						|
                             colTupleList.push_back(colTuple);
 | 
						|
                         }
 | 
						|
                         tmpColValueList.push_back(colTupleList);
 | 
						|
                     }
 | 
						|
            */
 | 
						|
            //Tokenize data if needed
 | 
						|
            vector<Token> tokenList;
 | 
						|
 | 
						|
            DctColTupleList::iterator dctCol_iter;
 | 
						|
            ColTupleList::iterator col_iter;
 | 
						|
 | 
						|
            for (unsigned i = 0; i < colStructList.size(); i++)
 | 
						|
            {
 | 
						|
                if (colStructList[i].tokenFlag)
 | 
						|
                {
 | 
						|
                    // only need to tokenize once
 | 
						|
                    dctCol_iter = dctnryValueList[i].begin();
 | 
						|
                    //col_iter = colValueList[i].begin();
 | 
						|
                    Token token;
 | 
						|
 | 
						|
                    if (!dctCol_iter->isNull)
 | 
						|
                    {
 | 
						|
                        RETURN_ON_ERROR(tokenize(
 | 
						|
                                            txnid, dctnryStructList[i], *dctCol_iter, true)); // @bug 5572 HDFS tmp file
 | 
						|
                        token = dctCol_iter->token;
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
//timer.stop("tokenize");
 | 
						|
#endif
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
                        //if (dctnryStructList[i].dctnryOid == 2001)
 | 
						|
                        //	std::cout << " got null token for string " << dctCol_iter->sigValue <<std::endl;
 | 
						|
                    }
 | 
						|
 | 
						|
                    //if (dctnryStructList[i].dctnryOid == 2001)
 | 
						|
                    //std::cout << " got token for string " << dctCol_iter->sigValue << " op:fbo = " << token.op <<":"<<token.fbo << std::endl;
 | 
						|
                    tokenList.push_back(token);
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            int dicPos = 0;
 | 
						|
 | 
						|
            for (unsigned i = 0; i < colStructList.size(); i++)
 | 
						|
            {
 | 
						|
                if (colStructList[i].tokenFlag)
 | 
						|
                {
 | 
						|
                    // only need to tokenize once
 | 
						|
                    col_iter = colValueList[i].begin();
 | 
						|
 | 
						|
                    while (col_iter != colValueList[i].end())
 | 
						|
                    {
 | 
						|
                        col_iter->data = tokenList[dicPos];
 | 
						|
                        col_iter++;
 | 
						|
                    }
 | 
						|
 | 
						|
                    dicPos++;
 | 
						|
                }
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        RIDList::iterator rid_iter;
 | 
						|
        /*    i = 0;
 | 
						|
              while (rid_iter != ridLists[extent].end())
 | 
						|
              {
 | 
						|
                 rowIdArray[i] = *rid_iter;
 | 
						|
                 rid_iter++;
 | 
						|
                 i++;
 | 
						|
              }
 | 
						|
        */
 | 
						|
        //Mark extents invalid
 | 
						|
        //if (colStructList[0].dataOid < 3000) {
 | 
						|
        vector<BRM::LBID_t> lbids;
 | 
						|
        vector<CalpontSystemCatalog::ColDataType> colDataTypes;
 | 
						|
        bool successFlag = true;
 | 
						|
        unsigned width = 0;
 | 
						|
        int      curFbo = 0, curBio, lastFbo = -1;
 | 
						|
        rid_iter = ridLists[extent].begin();
 | 
						|
        RID aRid = *rid_iter;
 | 
						|
 | 
						|
        for (unsigned j = 0; j < colStructList.size(); j++)
 | 
						|
        {
 | 
						|
            colOp = m_colOp[op(colStructList[j].fCompressionType)];
 | 
						|
 | 
						|
            if (colStructList[j].tokenFlag)
 | 
						|
                continue;
 | 
						|
 | 
						|
            width = colOp->getCorrectRowWidth(colStructList[j].colDataType, colStructList[j].colWidth);
 | 
						|
            successFlag = colOp->calculateRowId(aRid, BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
            if (successFlag)
 | 
						|
            {
 | 
						|
                if (curFbo != lastFbo)
 | 
						|
                {
 | 
						|
                    RETURN_ON_ERROR(AddLBIDtoList(txnid,
 | 
						|
                                                  lbids,
 | 
						|
                                                  colDataTypes,
 | 
						|
                                                  colStructList[j],
 | 
						|
                                                  curFbo));
 | 
						|
                }
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        //cout << "lbids size = " << lbids.size()<< endl;
 | 
						|
//#ifdef PROFILE
 | 
						|
//timer.start("markExtentsInvalid");
 | 
						|
//#endif
 | 
						|
        if (lbids.size() > 0)
 | 
						|
            rc = BRMWrapper::getInstance()->markExtentsInvalid(lbids, colDataTypes);
 | 
						|
 | 
						|
        //}
 | 
						|
 | 
						|
        if ( m_opType != DELETE)
 | 
						|
            m_opType = UPDATE;
 | 
						|
 | 
						|
        rc = writeColumnRec(txnid, colStructList, colValueList, colOldValueList,
 | 
						|
                            ridLists[extent], tableOid, true, ridLists[extent].size());
 | 
						|
 | 
						|
//    if (rowIdArray)
 | 
						|
//       free(rowIdArray);
 | 
						|
 | 
						|
        m_opType = NOOP;
 | 
						|
 | 
						|
        if (rc != NO_ERROR)
 | 
						|
            break;
 | 
						|
    }
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::updateColumnRecs(const TxnID& txnid,
 | 
						|
        vector<ColStruct>& colExtentsStruct,
 | 
						|
        ColValueList& colValueList,
 | 
						|
        const RIDList& ridLists,
 | 
						|
        const int32_t tableOid)
 | 
						|
{
 | 
						|
    //Mark extents invalid
 | 
						|
    //int rc = 0;
 | 
						|
    //if (colExtentsStruct[0].dataOid < 3000)
 | 
						|
    //{
 | 
						|
    vector<BRM::LBID_t> lbids;
 | 
						|
    vector<CalpontSystemCatalog::ColDataType> colDataTypes;
 | 
						|
    ColumnOp* colOp = NULL;
 | 
						|
    bool successFlag = true;
 | 
						|
    unsigned width = 0;
 | 
						|
    \
 | 
						|
    int curFbo = 0, curBio, lastFbo = -1;
 | 
						|
    RID aRid = ridLists[0];
 | 
						|
    int rc = 0;
 | 
						|
 | 
						|
    for (unsigned j = 0; j < colExtentsStruct.size(); j++)
 | 
						|
    {
 | 
						|
        colOp = m_colOp[op(colExtentsStruct[j].fCompressionType)];
 | 
						|
 | 
						|
        if (colExtentsStruct[j].tokenFlag)
 | 
						|
            continue;
 | 
						|
 | 
						|
        width = colOp->getCorrectRowWidth(colExtentsStruct[j].colDataType, colExtentsStruct[j].colWidth);
 | 
						|
        successFlag = colOp->calculateRowId(aRid, BYTE_PER_BLOCK / width, width, curFbo, curBio);
 | 
						|
 | 
						|
        if (successFlag)
 | 
						|
        {
 | 
						|
            if (curFbo != lastFbo)
 | 
						|
            {
 | 
						|
                RETURN_ON_ERROR(AddLBIDtoList(txnid,
 | 
						|
                                              lbids,
 | 
						|
                                              colDataTypes,
 | 
						|
                                              colExtentsStruct[j],
 | 
						|
                                              curFbo));
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    if (lbids.size() > 0)
 | 
						|
    {
 | 
						|
//        cout << "BRMWrapper::getInstance()->markExtentsInvalid(lbids); " << lbids.size() << " lbids" << endl;
 | 
						|
        rc = BRMWrapper::getInstance()->markExtentsInvalid(lbids, colDataTypes);
 | 
						|
    }
 | 
						|
 | 
						|
    //}
 | 
						|
    if ( m_opType != DELETE)
 | 
						|
        m_opType = UPDATE;
 | 
						|
 | 
						|
    rc = writeColumnRecords (txnid, colExtentsStruct, colValueList, ridLists, tableOid);
 | 
						|
    m_opType = NOOP;
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::writeColumnRecords(const TxnID& txnid,
 | 
						|
        vector<ColStruct>& colStructList,
 | 
						|
        ColValueList& colValueList,
 | 
						|
        const RIDList& ridLists, const int32_t tableOid, bool versioning)
 | 
						|
{
 | 
						|
    bool           bExcp;
 | 
						|
    int            rc = 0;
 | 
						|
    void*          valArray = NULL;
 | 
						|
    Column         curCol;
 | 
						|
    ColStruct      curColStruct;
 | 
						|
    ColTupleList   curTupleList;
 | 
						|
    ColStructList::size_type  totalColumn;
 | 
						|
    ColStructList::size_type  i;
 | 
						|
    ColTupleList::size_type   totalRow;
 | 
						|
    setTransId(txnid);
 | 
						|
    totalColumn = colStructList.size();
 | 
						|
    totalRow = ridLists.size();
 | 
						|
 | 
						|
    TableMetaData* aTbaleMetaData = TableMetaData::makeTableMetaData(tableOid);
 | 
						|
 | 
						|
    for (i = 0; i < totalColumn; i++)
 | 
						|
    {
 | 
						|
        valArray = NULL;
 | 
						|
        curColStruct = colStructList[i];
 | 
						|
        curTupleList = colValueList[i];
 | 
						|
        ColumnOp* colOp = m_colOp[op(curColStruct.fCompressionType)];
 | 
						|
 | 
						|
        Convertor::convertColType(&curColStruct);
 | 
						|
 | 
						|
        // set params
 | 
						|
        colOp->initColumn(curCol);
 | 
						|
 | 
						|
        colOp->setColParam(curCol, 0, curColStruct.colWidth,
 | 
						|
                           curColStruct.colDataType, curColStruct.colType, curColStruct.dataOid,
 | 
						|
                           curColStruct.fCompressionType,
 | 
						|
                           curColStruct.fColDbRoot, curColStruct.fColPartition, curColStruct.fColSegment);
 | 
						|
 | 
						|
        ColExtsInfo aColExtsInfo = aTbaleMetaData->getColExtsInfo(curColStruct.dataOid);
 | 
						|
        ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
        while (it != aColExtsInfo.end())
 | 
						|
        {
 | 
						|
            if ((it->dbRoot == curColStruct.fColDbRoot) && (it->partNum == curColStruct.fColPartition) && (it->segNum == curColStruct.fColSegment))
 | 
						|
                break;
 | 
						|
 | 
						|
            it++;
 | 
						|
        }
 | 
						|
 | 
						|
        if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
        {
 | 
						|
            ColExtInfo aExt;
 | 
						|
            aExt.dbRoot = curColStruct.fColDbRoot;
 | 
						|
            aExt.partNum = curColStruct.fColPartition;
 | 
						|
            aExt.segNum = curColStruct.fColSegment;
 | 
						|
            aExt.compType = curColStruct.fCompressionType;
 | 
						|
            aExt.isDict = false;
 | 
						|
            aColExtsInfo.push_back(aExt);
 | 
						|
            aTbaleMetaData->setColExtsInfo(colStructList[i].dataOid, aColExtsInfo);
 | 
						|
        }
 | 
						|
 | 
						|
        string segFile;
 | 
						|
        rc = colOp->openColumnFile(curCol, segFile, true); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
        if (rc != NO_ERROR)
 | 
						|
            break;
 | 
						|
 | 
						|
        vector<LBIDRange>   rangeList;
 | 
						|
 | 
						|
        if (versioning)
 | 
						|
        {
 | 
						|
            rc = processVersionBuffers(curCol.dataFile.pFile, txnid, curColStruct,
 | 
						|
                                       curColStruct.colWidth, totalRow, ridLists, rangeList);
 | 
						|
        }
 | 
						|
 | 
						|
        if (rc != NO_ERROR)
 | 
						|
        {
 | 
						|
            if (curColStruct.fCompressionType == 0)
 | 
						|
            {
 | 
						|
                curCol.dataFile.pFile->flush();
 | 
						|
            }
 | 
						|
 | 
						|
            BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
            break;
 | 
						|
        }
 | 
						|
 | 
						|
        switch (curColStruct.colType)
 | 
						|
        {
 | 
						|
            case WriteEngine::WR_INT:
 | 
						|
                valArray = (int*) calloc(sizeof(int), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_UINT:
 | 
						|
                valArray = (uint32_t*) calloc(sizeof(uint32_t), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
            case WriteEngine::WR_CHAR:
 | 
						|
            case WriteEngine::WR_BLOB:
 | 
						|
            case WriteEngine::WR_TEXT:
 | 
						|
                valArray = (char*) calloc(sizeof(char), totalRow * MAX_COLUMN_BOUNDARY);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_FLOAT:
 | 
						|
                valArray = (float*) calloc(sizeof(float), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_DOUBLE:
 | 
						|
                valArray = (double*) calloc(sizeof(double), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_BYTE:
 | 
						|
                valArray = (char*) calloc(sizeof(char), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_UBYTE:
 | 
						|
                valArray = (uint8_t*) calloc(sizeof(uint8_t), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_SHORT:
 | 
						|
                valArray = (short*) calloc(sizeof(short), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_USHORT:
 | 
						|
                valArray = (uint16_t*) calloc(sizeof(uint16_t), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_LONGLONG:
 | 
						|
                valArray = (long long*) calloc(sizeof(long long), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_ULONGLONG:
 | 
						|
                valArray = (uint64_t*) calloc(sizeof(uint64_t), totalRow);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_TOKEN:
 | 
						|
                valArray = (Token*) calloc(sizeof(Token), totalRow);
 | 
						|
                break;
 | 
						|
        }
 | 
						|
 | 
						|
        // convert values to valArray
 | 
						|
        bExcp = false;
 | 
						|
 | 
						|
        try
 | 
						|
        {
 | 
						|
            convertValArray(totalRow, curColStruct.colType, curTupleList, valArray);
 | 
						|
        }
 | 
						|
        catch (...)
 | 
						|
        {
 | 
						|
            bExcp = true;
 | 
						|
        }
 | 
						|
 | 
						|
        if (bExcp)
 | 
						|
        {
 | 
						|
            BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
            return ERR_PARSING;
 | 
						|
        }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
        timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
        rc = colOp->writeRowsValues(curCol, totalRow, ridLists, valArray);
 | 
						|
#ifdef PROFILE
 | 
						|
        timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
        colOp->clearColumn(curCol);
 | 
						|
 | 
						|
        if (curColStruct.fCompressionType == 0)
 | 
						|
        {
 | 
						|
            std::vector<BRM::FileInfo> files;
 | 
						|
            BRM::FileInfo aFile;
 | 
						|
            aFile.partitionNum = curColStruct.fColPartition;
 | 
						|
            aFile.dbRoot = curColStruct.fColDbRoot;;
 | 
						|
            aFile.segmentNum = curColStruct.fColSegment;
 | 
						|
            aFile.compType = curColStruct.fCompressionType;
 | 
						|
            files.push_back(aFile);
 | 
						|
 | 
						|
            if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
                cacheutils::purgePrimProcFdCache(files, Config::getLocalModuleID());
 | 
						|
        }
 | 
						|
 | 
						|
        BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
 | 
						|
        if (valArray != NULL)
 | 
						|
            free(valArray);
 | 
						|
 | 
						|
        // check error
 | 
						|
        if (rc != NO_ERROR)
 | 
						|
            break;
 | 
						|
    }
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
/*@brief writeColumnRec - Write values to a column
 | 
						|
*/
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Write values to a column
 | 
						|
 * PARAMETERS:
 | 
						|
 *    tableOid - table object id
 | 
						|
 *    colStructList - column struct list
 | 
						|
 *    colValueList - column value list
 | 
						|
 *    colNewStructList - the new extent struct list
 | 
						|
 *    colNewValueList - column value list for the new extent
 | 
						|
 *    rowIdArray -  row id list
 | 
						|
 *    useTmpSuffix - use temp suffix for db output file
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if success
 | 
						|
 *    others if something wrong in inserting the value
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::writeColumnRec(const TxnID& txnid,
 | 
						|
                                       const ColStructList& colStructList,
 | 
						|
                                       ColValueList& colValueList,
 | 
						|
                                       RID* rowIdArray,
 | 
						|
                                       const ColStructList& newColStructList,
 | 
						|
                                       ColValueList& newColValueList,
 | 
						|
                                       const int32_t tableOid,
 | 
						|
                                       bool useTmpSuffix,
 | 
						|
                                       bool versioning)
 | 
						|
{
 | 
						|
    bool           bExcp;
 | 
						|
    int            rc = 0;
 | 
						|
    void*          valArray;
 | 
						|
    string         segFile;
 | 
						|
    Column         curCol;
 | 
						|
    ColTupleList   oldTupleList;
 | 
						|
    ColStructList::size_type  totalColumn;
 | 
						|
    ColStructList::size_type  i;
 | 
						|
    ColTupleList::size_type   totalRow1, totalRow2;
 | 
						|
 | 
						|
    setTransId(txnid);
 | 
						|
 | 
						|
    totalColumn = colStructList.size();
 | 
						|
#ifdef PROFILE
 | 
						|
    StopWatch timer;
 | 
						|
#endif
 | 
						|
 | 
						|
    if (newColValueList.size() > 0)
 | 
						|
    {
 | 
						|
        totalRow1 = colValueList[0].size();
 | 
						|
        totalRow2 = newColValueList[0].size();
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        totalRow1 = colValueList[0].size();
 | 
						|
        totalRow2 = 0;
 | 
						|
    }
 | 
						|
 | 
						|
    TableMetaData* aTbaleMetaData = TableMetaData::makeTableMetaData(tableOid);
 | 
						|
 | 
						|
    for (i = 0; i < totalColumn; i++)
 | 
						|
    {
 | 
						|
        if (totalRow2 > 0)
 | 
						|
        {
 | 
						|
            RID* secondPart = rowIdArray + totalRow1;
 | 
						|
 | 
						|
            //@Bug 2205 Check if all rows go to the new extent
 | 
						|
            if (totalRow1 > 0)
 | 
						|
            {
 | 
						|
                //Write the first batch
 | 
						|
                valArray = NULL;
 | 
						|
                RID* firstPart = rowIdArray;
 | 
						|
                ColumnOp* colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
 | 
						|
                // set params
 | 
						|
                colOp->initColumn(curCol);
 | 
						|
                // need to pass real dbRoot, partition, and segment to setColParam
 | 
						|
                colOp->setColParam(curCol, 0, colStructList[i].colWidth,
 | 
						|
                                   colStructList[i].colDataType, colStructList[i].colType, colStructList[i].dataOid,
 | 
						|
                                   colStructList[i].fCompressionType, colStructList[i].fColDbRoot,
 | 
						|
                                   colStructList[i].fColPartition, colStructList[i].fColSegment);
 | 
						|
 | 
						|
                ColExtsInfo aColExtsInfo = aTbaleMetaData->getColExtsInfo(colStructList[i].dataOid);
 | 
						|
                ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
                while (it != aColExtsInfo.end())
 | 
						|
                {
 | 
						|
                    if ((it->dbRoot == colStructList[i].fColDbRoot) && (it->partNum == colStructList[i].fColPartition) && (it->segNum == colStructList[i].fColSegment))
 | 
						|
                        break;
 | 
						|
 | 
						|
                    it++;
 | 
						|
                }
 | 
						|
 | 
						|
                if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
                {
 | 
						|
                    ColExtInfo aExt;
 | 
						|
                    aExt.dbRoot = colStructList[i].fColDbRoot;
 | 
						|
                    aExt.partNum = colStructList[i].fColPartition;
 | 
						|
                    aExt.segNum = colStructList[i].fColSegment;
 | 
						|
                    aExt.compType = colStructList[i].fCompressionType;
 | 
						|
                    aColExtsInfo.push_back(aExt);
 | 
						|
                    aTbaleMetaData->setColExtsInfo(colStructList[i].dataOid, aColExtsInfo);
 | 
						|
                }
 | 
						|
 | 
						|
                rc = colOp->openColumnFile(curCol, segFile, useTmpSuffix, IO_BUFF_SIZE); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    break;
 | 
						|
 | 
						|
                // handling versioning
 | 
						|
                vector<LBIDRange>   rangeList;
 | 
						|
 | 
						|
                if (versioning)
 | 
						|
                {
 | 
						|
                    rc = processVersionBuffer(curCol.dataFile.pFile, txnid, colStructList[i],
 | 
						|
                                              colStructList[i].colWidth, totalRow1, firstPart, rangeList);
 | 
						|
 | 
						|
                    if (rc != NO_ERROR)
 | 
						|
                    {
 | 
						|
                        if (colStructList[i].fCompressionType == 0)
 | 
						|
                        {
 | 
						|
                            curCol.dataFile.pFile->flush();
 | 
						|
                        }
 | 
						|
 | 
						|
                        BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
                        break;
 | 
						|
                    }
 | 
						|
                }
 | 
						|
 | 
						|
                //totalRow1 -= totalRow2;
 | 
						|
                // have to init the size here
 | 
						|
                // nullArray = (bool*) malloc(sizeof(bool) * totalRow);
 | 
						|
                switch (colStructList[i].colType)
 | 
						|
                {
 | 
						|
                    case WriteEngine::WR_INT:
 | 
						|
                        valArray = (int*) calloc(sizeof(int), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_UINT:
 | 
						|
                        valArray = (uint32_t*) calloc(sizeof(uint32_t), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
                    case WriteEngine::WR_CHAR:
 | 
						|
                    case WriteEngine::WR_BLOB:
 | 
						|
                    case WriteEngine::WR_TEXT:
 | 
						|
                        valArray = (char*) calloc(sizeof(char), totalRow1 * MAX_COLUMN_BOUNDARY);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_FLOAT:
 | 
						|
                        valArray = (float*) calloc(sizeof(float), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_DOUBLE:
 | 
						|
                        valArray = (double*) calloc(sizeof(double), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_BYTE:
 | 
						|
                        valArray = (char*) calloc(sizeof(char), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_UBYTE:
 | 
						|
                        valArray = (uint8_t*) calloc(sizeof(uint8_t), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_SHORT:
 | 
						|
                        valArray = (short*) calloc(sizeof(short), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_USHORT:
 | 
						|
                        valArray = (uint16_t*) calloc(sizeof(uint16_t), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_LONGLONG:
 | 
						|
                        valArray = (long long*) calloc(sizeof(long long), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_ULONGLONG:
 | 
						|
                        valArray = (uint64_t*) calloc(sizeof(uint64_t), totalRow1);
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_TOKEN:
 | 
						|
                        valArray = (Token*) calloc(sizeof(Token), totalRow1);
 | 
						|
                        break;
 | 
						|
                }
 | 
						|
 | 
						|
                // convert values to valArray
 | 
						|
                if (m_opType != DELETE)
 | 
						|
                {
 | 
						|
                    bExcp = false;
 | 
						|
 | 
						|
                    try
 | 
						|
                    {
 | 
						|
                        convertValArray(totalRow1, colStructList[i].colType, colValueList[i], valArray);
 | 
						|
                    }
 | 
						|
                    catch (...)
 | 
						|
                    {
 | 
						|
                        bExcp = true;
 | 
						|
                    }
 | 
						|
 | 
						|
                    if (bExcp)
 | 
						|
                    {
 | 
						|
                        if (versioning)
 | 
						|
                            BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
 | 
						|
                        return ERR_PARSING;
 | 
						|
                    }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
                    rc = colOp->writeRow(curCol, totalRow1, firstPart, valArray);
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
                }
 | 
						|
                else
 | 
						|
                {
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
                    rc = colOp->writeRow(curCol, totalRow1, rowIdArray, valArray, true);
 | 
						|
#ifdef PROFILE
 | 
						|
                    timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
                }
 | 
						|
 | 
						|
                colOp->clearColumn(curCol);
 | 
						|
 | 
						|
                if (versioning)
 | 
						|
                    BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
 | 
						|
                if (valArray != NULL)
 | 
						|
                    free(valArray);
 | 
						|
 | 
						|
                // check error
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                    break;
 | 
						|
            }
 | 
						|
 | 
						|
            //Process the second batch
 | 
						|
            valArray = NULL;
 | 
						|
 | 
						|
            ColumnOp* colOp = m_colOp[op(newColStructList[i].fCompressionType)];
 | 
						|
 | 
						|
            // set params
 | 
						|
            colOp->initColumn(curCol);
 | 
						|
            colOp->setColParam(curCol, 0, newColStructList[i].colWidth,
 | 
						|
                               newColStructList[i].colDataType, newColStructList[i].colType, newColStructList[i].dataOid,
 | 
						|
                               newColStructList[i].fCompressionType, newColStructList[i].fColDbRoot,
 | 
						|
                               newColStructList[i].fColPartition, newColStructList[i].fColSegment);
 | 
						|
 | 
						|
            ColExtsInfo aColExtsInfo = aTbaleMetaData->getColExtsInfo(newColStructList[i].dataOid);
 | 
						|
            ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            while (it != aColExtsInfo.end())
 | 
						|
            {
 | 
						|
                if ((it->dbRoot == newColStructList[i].fColDbRoot) && (it->partNum == newColStructList[i].fColPartition) && (it->segNum == newColStructList[i].fColSegment))
 | 
						|
                    break;
 | 
						|
 | 
						|
                it++;
 | 
						|
            }
 | 
						|
 | 
						|
            if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
            {
 | 
						|
                ColExtInfo aExt;
 | 
						|
                aExt.dbRoot = newColStructList[i].fColDbRoot;
 | 
						|
                aExt.partNum = newColStructList[i].fColPartition;
 | 
						|
                aExt.segNum = newColStructList[i].fColSegment;
 | 
						|
                aExt.compType = newColStructList[i].fCompressionType;
 | 
						|
                aColExtsInfo.push_back(aExt);
 | 
						|
                aTbaleMetaData->setColExtsInfo(newColStructList[i].dataOid, aColExtsInfo);
 | 
						|
            }
 | 
						|
 | 
						|
            // Pass "false" for hdfs tmp file flag.  Since we only allow 1
 | 
						|
            // extent per segment file (with HDFS), we can assume a second
 | 
						|
            // extent is going to a new file (and won't need tmp file).
 | 
						|
            rc = colOp->openColumnFile(curCol, segFile, false, IO_BUFF_SIZE); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                break;
 | 
						|
 | 
						|
            // handling versioning
 | 
						|
            vector<LBIDRange>   rangeList;
 | 
						|
 | 
						|
            if (versioning)
 | 
						|
            {
 | 
						|
                rc = processVersionBuffer(curCol.dataFile.pFile, txnid, newColStructList[i],
 | 
						|
                                          newColStructList[i].colWidth, totalRow2, secondPart, rangeList);
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                {
 | 
						|
                    if (newColStructList[i].fCompressionType == 0)
 | 
						|
                    {
 | 
						|
                        curCol.dataFile.pFile->flush();
 | 
						|
                    }
 | 
						|
 | 
						|
                    BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
                    break;
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            //totalRow1 -= totalRow2;
 | 
						|
            // have to init the size here
 | 
						|
//       nullArray = (bool*) malloc(sizeof(bool) * totalRow);
 | 
						|
            switch (newColStructList[i].colType)
 | 
						|
            {
 | 
						|
                case WriteEngine::WR_INT:
 | 
						|
                    valArray = (int*) calloc(sizeof(int), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_UINT:
 | 
						|
                    valArray = (uint32_t*) calloc(sizeof(uint32_t), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
                case WriteEngine::WR_CHAR:
 | 
						|
                case WriteEngine::WR_BLOB:
 | 
						|
                case WriteEngine::WR_TEXT:
 | 
						|
                    valArray = (char*) calloc(sizeof(char), totalRow2 * MAX_COLUMN_BOUNDARY);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_FLOAT:
 | 
						|
                    valArray = (float*) calloc(sizeof(float), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_DOUBLE:
 | 
						|
                    valArray = (double*) calloc(sizeof(double), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_BYTE:
 | 
						|
                    valArray = (char*) calloc(sizeof(char), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_UBYTE:
 | 
						|
                    valArray = (uint8_t*) calloc(sizeof(uint8_t), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_SHORT:
 | 
						|
                    valArray = (short*) calloc(sizeof(short), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_USHORT:
 | 
						|
                    valArray = (uint16_t*) calloc(sizeof(uint16_t), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_LONGLONG:
 | 
						|
                    valArray = (long long*) calloc(sizeof(long long), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_ULONGLONG:
 | 
						|
                    valArray = (uint64_t*) calloc(sizeof(uint64_t), totalRow2);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_TOKEN:
 | 
						|
                    valArray = (Token*) calloc(sizeof(Token), totalRow2);
 | 
						|
                    break;
 | 
						|
            }
 | 
						|
 | 
						|
            // convert values to valArray
 | 
						|
            if (m_opType != DELETE)
 | 
						|
            {
 | 
						|
                bExcp = false;
 | 
						|
 | 
						|
                try
 | 
						|
                {
 | 
						|
                    convertValArray(totalRow2, newColStructList[i].colType, newColValueList[i], valArray);
 | 
						|
                }
 | 
						|
                catch (...)
 | 
						|
                {
 | 
						|
                    bExcp = true;
 | 
						|
                }
 | 
						|
 | 
						|
                if (bExcp)
 | 
						|
                {
 | 
						|
                    if (versioning)
 | 
						|
                        BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
 | 
						|
                    return ERR_PARSING;
 | 
						|
                }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
                rc = colOp->writeRow(curCol, totalRow2, secondPart, valArray);
 | 
						|
#ifdef PROFILE
 | 
						|
                timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
            }
 | 
						|
            else
 | 
						|
            {
 | 
						|
#ifdef PROFILE
 | 
						|
                timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
                rc = colOp->writeRow(curCol, totalRow2, rowIdArray, valArray, true);
 | 
						|
#ifdef PROFILE
 | 
						|
                timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
            }
 | 
						|
 | 
						|
 | 
						|
            colOp->clearColumn(curCol);
 | 
						|
 | 
						|
            if (versioning)
 | 
						|
                BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
 | 
						|
            if (valArray != NULL)
 | 
						|
                free(valArray);
 | 
						|
 | 
						|
            // check error
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                break;
 | 
						|
        }
 | 
						|
        else
 | 
						|
        {
 | 
						|
            valArray = NULL;
 | 
						|
 | 
						|
            ColumnOp* colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
 | 
						|
            // set params
 | 
						|
            colOp->initColumn(curCol);
 | 
						|
            colOp->setColParam(curCol, 0, colStructList[i].colWidth,
 | 
						|
                               colStructList[i].colDataType, colStructList[i].colType, colStructList[i].dataOid,
 | 
						|
                               colStructList[i].fCompressionType, colStructList[i].fColDbRoot,
 | 
						|
                               colStructList[i].fColPartition, colStructList[i].fColSegment);
 | 
						|
 | 
						|
            rc = colOp->openColumnFile(curCol, segFile, useTmpSuffix, IO_BUFF_SIZE); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            //cout << " Opened file oid " << curCol.dataFile.pFile << endl;
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                break;
 | 
						|
 | 
						|
            ColExtsInfo aColExtsInfo = aTbaleMetaData->getColExtsInfo(colStructList[i].dataOid);
 | 
						|
            ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            while (it != aColExtsInfo.end())
 | 
						|
            {
 | 
						|
                if ((it->dbRoot == colStructList[i].fColDbRoot) && (it->partNum == colStructList[i].fColPartition) && (it->segNum == colStructList[i].fColSegment))
 | 
						|
                    break;
 | 
						|
 | 
						|
                it++;
 | 
						|
            }
 | 
						|
 | 
						|
            if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
            {
 | 
						|
                ColExtInfo aExt;
 | 
						|
                aExt.dbRoot = colStructList[i].fColDbRoot;
 | 
						|
                aExt.partNum = colStructList[i].fColPartition;
 | 
						|
                aExt.segNum = colStructList[i].fColSegment;
 | 
						|
                aExt.compType = colStructList[i].fCompressionType;
 | 
						|
                aColExtsInfo.push_back(aExt);
 | 
						|
                aTbaleMetaData->setColExtsInfo(colStructList[i].dataOid, aColExtsInfo);
 | 
						|
            }
 | 
						|
 | 
						|
            // handling versioning
 | 
						|
            vector<LBIDRange>   rangeList;
 | 
						|
 | 
						|
            if (versioning)
 | 
						|
            {
 | 
						|
                rc = processVersionBuffer(curCol.dataFile.pFile, txnid, colStructList[i],
 | 
						|
                                          colStructList[i].colWidth, totalRow1, rowIdArray, rangeList);
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                {
 | 
						|
                    if (colStructList[i].fCompressionType == 0)
 | 
						|
                    {
 | 
						|
                        curCol.dataFile.pFile->flush();
 | 
						|
                    }
 | 
						|
 | 
						|
                    BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
                    break;
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            // have to init the size here
 | 
						|
//       nullArray = (bool*) malloc(sizeof(bool) * totalRow);
 | 
						|
            switch (colStructList[i].colType)
 | 
						|
            {
 | 
						|
                case WriteEngine::WR_INT:
 | 
						|
                    valArray = (int*) calloc(sizeof(int), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_UINT:
 | 
						|
                    valArray = (uint32_t*) calloc(sizeof(uint32_t), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
                case WriteEngine::WR_CHAR:
 | 
						|
                case WriteEngine::WR_BLOB:
 | 
						|
                case WriteEngine::WR_TEXT:
 | 
						|
                    valArray = (char*) calloc(sizeof(char), totalRow1 * MAX_COLUMN_BOUNDARY);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_FLOAT:
 | 
						|
                    valArray = (float*) calloc(sizeof(float), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_DOUBLE:
 | 
						|
                    valArray = (double*) calloc(sizeof(double), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_BYTE:
 | 
						|
                    valArray = (char*) calloc(sizeof(char), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_UBYTE:
 | 
						|
                    valArray = (uint8_t*) calloc(sizeof(uint8_t), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_SHORT:
 | 
						|
                    valArray = (short*) calloc(sizeof(short), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_USHORT:
 | 
						|
                    valArray = (uint16_t*) calloc(sizeof(uint16_t), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_LONGLONG:
 | 
						|
                    valArray = (long long*) calloc(sizeof(long long), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_ULONGLONG:
 | 
						|
                    valArray = (uint64_t*) calloc(sizeof(uint64_t), totalRow1);
 | 
						|
                    break;
 | 
						|
 | 
						|
                case WriteEngine::WR_TOKEN:
 | 
						|
                    valArray = (Token*) calloc(sizeof(Token), totalRow1);
 | 
						|
                    break;
 | 
						|
            }
 | 
						|
 | 
						|
            // convert values to valArray
 | 
						|
            if (m_opType != DELETE)
 | 
						|
            {
 | 
						|
                bExcp = false;
 | 
						|
 | 
						|
                try
 | 
						|
                {
 | 
						|
                    convertValArray(totalRow1, colStructList[i].colType, colValueList[i], valArray);
 | 
						|
                }
 | 
						|
                catch (...)
 | 
						|
                {
 | 
						|
                    bExcp = true;
 | 
						|
                }
 | 
						|
 | 
						|
                if (bExcp)
 | 
						|
                {
 | 
						|
                    if (versioning)
 | 
						|
                        BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
 | 
						|
                    return ERR_PARSING;
 | 
						|
                }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
                timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
                rc = colOp->writeRow(curCol, totalRow1, rowIdArray, valArray);
 | 
						|
#ifdef PROFILE
 | 
						|
                timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
            }
 | 
						|
            else
 | 
						|
            {
 | 
						|
#ifdef PROFILE
 | 
						|
                timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
                rc = colOp->writeRow(curCol, totalRow1, rowIdArray, valArray, true);
 | 
						|
#ifdef PROFILE
 | 
						|
                timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
            }
 | 
						|
 | 
						|
            colOp->clearColumn(curCol);
 | 
						|
 | 
						|
            if (versioning)
 | 
						|
                BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
 | 
						|
            if (valArray != NULL)
 | 
						|
                free(valArray);
 | 
						|
 | 
						|
            // check error
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                break;
 | 
						|
        }
 | 
						|
    } // end of for (i = 0
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.finish();
 | 
						|
#endif
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::writeColumnRecBinary(const TxnID& txnid,
 | 
						|
        const ColStructList& colStructList,
 | 
						|
        std::vector<uint64_t>& colValueList,
 | 
						|
        RID* rowIdArray,
 | 
						|
        const ColStructList& newColStructList,
 | 
						|
        std::vector<uint64_t>& newColValueList,
 | 
						|
        const int32_t tableOid,
 | 
						|
        bool useTmpSuffix,
 | 
						|
        bool versioning)
 | 
						|
{
 | 
						|
    int            rc = 0;
 | 
						|
    void*          valArray = NULL;
 | 
						|
    string         segFile;
 | 
						|
    Column         curCol;
 | 
						|
    ColStructList::size_type  totalColumn;
 | 
						|
    ColStructList::size_type  i;
 | 
						|
    size_t   totalRow1, totalRow2;
 | 
						|
 | 
						|
    setTransId(txnid);
 | 
						|
 | 
						|
    totalColumn = colStructList.size();
 | 
						|
#ifdef PROFILE
 | 
						|
    StopWatch timer;
 | 
						|
#endif
 | 
						|
 | 
						|
    totalRow1 = colValueList.size() / totalColumn;
 | 
						|
 | 
						|
    if (newColValueList.size() > 0)
 | 
						|
    {
 | 
						|
        totalRow2 = newColValueList.size() / newColStructList.size();
 | 
						|
        totalRow1 -= totalRow2;
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        totalRow2 = 0;
 | 
						|
    }
 | 
						|
 | 
						|
    // It is possible totalRow1 is zero but totalRow2 has values
 | 
						|
    if ((totalRow1 == 0) && (totalRow2 == 0))
 | 
						|
        return rc;
 | 
						|
 | 
						|
    TableMetaData* aTbaleMetaData = TableMetaData::makeTableMetaData(tableOid);
 | 
						|
 | 
						|
    if (totalRow1)
 | 
						|
    {
 | 
						|
        valArray = malloc(sizeof(uint64_t) * totalRow1);
 | 
						|
 | 
						|
        for (i = 0; i < totalColumn; i++)
 | 
						|
        {
 | 
						|
            //@Bug 2205 Check if all rows go to the new extent
 | 
						|
            //Write the first batch
 | 
						|
            RID* firstPart = rowIdArray;
 | 
						|
            ColumnOp* colOp = m_colOp[op(colStructList[i].fCompressionType)];
 | 
						|
 | 
						|
            // set params
 | 
						|
            colOp->initColumn(curCol);
 | 
						|
            // need to pass real dbRoot, partition, and segment to setColParam
 | 
						|
            colOp->setColParam(curCol, 0, colStructList[i].colWidth,
 | 
						|
                               colStructList[i].colDataType, colStructList[i].colType, colStructList[i].dataOid,
 | 
						|
                               colStructList[i].fCompressionType, colStructList[i].fColDbRoot,
 | 
						|
                               colStructList[i].fColPartition, colStructList[i].fColSegment);
 | 
						|
 | 
						|
            ColExtsInfo aColExtsInfo = aTbaleMetaData->getColExtsInfo(colStructList[i].dataOid);
 | 
						|
            ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            while (it != aColExtsInfo.end())
 | 
						|
            {
 | 
						|
                if ((it->dbRoot == colStructList[i].fColDbRoot) && (it->partNum == colStructList[i].fColPartition) && (it->segNum == colStructList[i].fColSegment))
 | 
						|
                    break;
 | 
						|
 | 
						|
                it++;
 | 
						|
            }
 | 
						|
 | 
						|
            if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
            {
 | 
						|
                ColExtInfo aExt;
 | 
						|
                aExt.dbRoot = colStructList[i].fColDbRoot;
 | 
						|
                aExt.partNum = colStructList[i].fColPartition;
 | 
						|
                aExt.segNum = colStructList[i].fColSegment;
 | 
						|
                aExt.compType = colStructList[i].fCompressionType;
 | 
						|
                aColExtsInfo.push_back(aExt);
 | 
						|
                aTbaleMetaData->setColExtsInfo(colStructList[i].dataOid, aColExtsInfo);
 | 
						|
            }
 | 
						|
 | 
						|
            rc = colOp->openColumnFile(curCol, segFile, useTmpSuffix, IO_BUFF_SIZE); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                break;
 | 
						|
 | 
						|
            // handling versioning
 | 
						|
            vector<LBIDRange>   rangeList;
 | 
						|
 | 
						|
            if (versioning)
 | 
						|
            {
 | 
						|
                rc = processVersionBuffer(curCol.dataFile.pFile, txnid, colStructList[i],
 | 
						|
                                          colStructList[i].colWidth, totalRow1, firstPart, rangeList);
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                {
 | 
						|
                    if (colStructList[i].fCompressionType == 0)
 | 
						|
                    {
 | 
						|
                        curCol.dataFile.pFile->flush();
 | 
						|
                    }
 | 
						|
 | 
						|
                    BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
                    break;
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            //totalRow1 -= totalRow2;
 | 
						|
            // have to init the size here
 | 
						|
            // nullArray = (bool*) malloc(sizeof(bool) * totalRow);
 | 
						|
            uint8_t tmp8;
 | 
						|
            uint16_t tmp16;
 | 
						|
            uint32_t tmp32;
 | 
						|
 | 
						|
            for (size_t j = 0; j < totalRow1; j++)
 | 
						|
            {
 | 
						|
                uint64_t curValue = colValueList[((totalRow1 + totalRow2) * i) + j];
 | 
						|
 | 
						|
                switch (colStructList[i].colType)
 | 
						|
                {
 | 
						|
                    case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
                    case WriteEngine::WR_CHAR:
 | 
						|
                    case WriteEngine::WR_BLOB:
 | 
						|
                    case WriteEngine::WR_TEXT:
 | 
						|
                        ((uint64_t*)valArray)[j] = curValue;
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_INT:
 | 
						|
                    case WriteEngine::WR_UINT:
 | 
						|
                    case WriteEngine::WR_FLOAT:
 | 
						|
                        tmp32 = curValue;
 | 
						|
                        ((uint32_t*)valArray)[j] = tmp32;
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_ULONGLONG:
 | 
						|
                    case WriteEngine::WR_LONGLONG:
 | 
						|
                    case WriteEngine::WR_DOUBLE:
 | 
						|
                    case WriteEngine::WR_TOKEN:
 | 
						|
                        ((uint64_t*)valArray)[j] = curValue;
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_BYTE:
 | 
						|
                    case WriteEngine::WR_UBYTE:
 | 
						|
                        tmp8 = curValue;
 | 
						|
                        ((uint8_t*)valArray)[j] = tmp8;
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_SHORT:
 | 
						|
                    case WriteEngine::WR_USHORT:
 | 
						|
                        tmp16 = curValue;
 | 
						|
                        ((uint16_t*)valArray)[j] = tmp16;
 | 
						|
                        break;
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
            timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
            rc = colOp->writeRow(curCol, totalRow1, firstPart, valArray);
 | 
						|
#ifdef PROFILE
 | 
						|
            timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
            colOp->closeColumnFile(curCol);
 | 
						|
 | 
						|
            if (versioning)
 | 
						|
                BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
 | 
						|
            // check error
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                break;
 | 
						|
 | 
						|
        } // end of for (i = 0
 | 
						|
 | 
						|
        if (valArray != NULL)
 | 
						|
        {
 | 
						|
            free(valArray);
 | 
						|
            valArray = NULL;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    // MCOL-1176 - Write second extent
 | 
						|
    if (totalRow2)
 | 
						|
    {
 | 
						|
        valArray = malloc(sizeof(uint64_t) * totalRow2);
 | 
						|
 | 
						|
        for (i = 0; i < newColStructList.size(); i++)
 | 
						|
        {
 | 
						|
            //@Bug 2205 Check if all rows go to the new extent
 | 
						|
            //Write the first batch
 | 
						|
            RID* secondPart = rowIdArray + totalRow1;
 | 
						|
            ColumnOp* colOp = m_colOp[op(newColStructList[i].fCompressionType)];
 | 
						|
 | 
						|
            // set params
 | 
						|
            colOp->initColumn(curCol);
 | 
						|
            // need to pass real dbRoot, partition, and segment to setColParam
 | 
						|
            colOp->setColParam(curCol, 0, newColStructList[i].colWidth,
 | 
						|
                               newColStructList[i].colDataType, newColStructList[i].colType, newColStructList[i].dataOid,
 | 
						|
                               newColStructList[i].fCompressionType, newColStructList[i].fColDbRoot,
 | 
						|
                               newColStructList[i].fColPartition, newColStructList[i].fColSegment);
 | 
						|
 | 
						|
            ColExtsInfo aColExtsInfo = aTbaleMetaData->getColExtsInfo(newColStructList[i].dataOid);
 | 
						|
            ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
            while (it != aColExtsInfo.end())
 | 
						|
            {
 | 
						|
                if ((it->dbRoot == newColStructList[i].fColDbRoot) && (it->partNum == newColStructList[i].fColPartition) && (it->segNum == colStructList[i].fColSegment))
 | 
						|
                    break;
 | 
						|
 | 
						|
                it++;
 | 
						|
            }
 | 
						|
 | 
						|
            if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
            {
 | 
						|
                ColExtInfo aExt;
 | 
						|
                aExt.dbRoot = newColStructList[i].fColDbRoot;
 | 
						|
                aExt.partNum = newColStructList[i].fColPartition;
 | 
						|
                aExt.segNum = newColStructList[i].fColSegment;
 | 
						|
                aExt.compType = newColStructList[i].fCompressionType;
 | 
						|
                aColExtsInfo.push_back(aExt);
 | 
						|
                aTbaleMetaData->setColExtsInfo(newColStructList[i].dataOid, aColExtsInfo);
 | 
						|
            }
 | 
						|
 | 
						|
            rc = colOp->openColumnFile(curCol, segFile, useTmpSuffix, IO_BUFF_SIZE); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                break;
 | 
						|
 | 
						|
            // handling versioning
 | 
						|
            vector<LBIDRange>   rangeList;
 | 
						|
 | 
						|
            if (versioning)
 | 
						|
            {
 | 
						|
                rc = processVersionBuffer(curCol.dataFile.pFile, txnid, newColStructList[i],
 | 
						|
                                          newColStructList[i].colWidth, totalRow2, secondPart, rangeList);
 | 
						|
 | 
						|
                if (rc != NO_ERROR)
 | 
						|
                {
 | 
						|
                    if (newColStructList[i].fCompressionType == 0)
 | 
						|
                    {
 | 
						|
                        curCol.dataFile.pFile->flush();
 | 
						|
                    }
 | 
						|
 | 
						|
                    BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
                    break;
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
            //totalRow1 -= totalRow2;
 | 
						|
            // have to init the size here
 | 
						|
            // nullArray = (bool*) malloc(sizeof(bool) * totalRow);
 | 
						|
            uint8_t tmp8;
 | 
						|
            uint16_t tmp16;
 | 
						|
            uint32_t tmp32;
 | 
						|
 | 
						|
            for (size_t j = 0; j < totalRow2; j++)
 | 
						|
            {
 | 
						|
                uint64_t curValue = newColValueList[(totalRow2 * i) + j];
 | 
						|
 | 
						|
                switch (newColStructList[i].colType)
 | 
						|
                {
 | 
						|
                    case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
                    case WriteEngine::WR_CHAR:
 | 
						|
                    case WriteEngine::WR_BLOB:
 | 
						|
                    case WriteEngine::WR_TEXT:
 | 
						|
                        ((uint64_t*)valArray)[j] = curValue;
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_INT:
 | 
						|
                    case WriteEngine::WR_UINT:
 | 
						|
                    case WriteEngine::WR_FLOAT:
 | 
						|
                        tmp32 = curValue;
 | 
						|
                        ((uint32_t*)valArray)[j] = tmp32;
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_ULONGLONG:
 | 
						|
                    case WriteEngine::WR_LONGLONG:
 | 
						|
                    case WriteEngine::WR_DOUBLE:
 | 
						|
                    case WriteEngine::WR_TOKEN:
 | 
						|
                        ((uint64_t*)valArray)[j] = curValue;
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_BYTE:
 | 
						|
                    case WriteEngine::WR_UBYTE:
 | 
						|
                        tmp8 = curValue;
 | 
						|
                        ((uint8_t*)valArray)[j] = tmp8;
 | 
						|
                        break;
 | 
						|
 | 
						|
                    case WriteEngine::WR_SHORT:
 | 
						|
                    case WriteEngine::WR_USHORT:
 | 
						|
                        tmp16 = curValue;
 | 
						|
                        ((uint16_t*)valArray)[j] = tmp16;
 | 
						|
                        break;
 | 
						|
                }
 | 
						|
            }
 | 
						|
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
            timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
            rc = colOp->writeRow(curCol, totalRow2, secondPart, valArray);
 | 
						|
#ifdef PROFILE
 | 
						|
            timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
            colOp->closeColumnFile(curCol);
 | 
						|
 | 
						|
            if (versioning)
 | 
						|
                BRMWrapper::getInstance()->writeVBEnd(txnid, rangeList);
 | 
						|
 | 
						|
            // check error
 | 
						|
            if (rc != NO_ERROR)
 | 
						|
                break;
 | 
						|
 | 
						|
        } // end of for (i = 0
 | 
						|
    }
 | 
						|
 | 
						|
    if (valArray != NULL)
 | 
						|
        free(valArray);
 | 
						|
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    timer.finish();
 | 
						|
#endif
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
int WriteEngineWrapper::writeColumnRec(const TxnID& txnid,
 | 
						|
                                       const ColStructList& colStructList,
 | 
						|
                                       const ColValueList& colValueList,
 | 
						|
                                       vector<void*>& colOldValueList,
 | 
						|
                                       const RIDList& ridList,
 | 
						|
                                       const int32_t tableOid,
 | 
						|
                                       bool convertStructFlag,
 | 
						|
                                       ColTupleList::size_type nRows)
 | 
						|
{
 | 
						|
    bool           bExcp;
 | 
						|
    int            rc = 0;
 | 
						|
    void*          valArray = NULL;
 | 
						|
    Column         curCol;
 | 
						|
    ColStruct      curColStruct;
 | 
						|
    ColTupleList   curTupleList, oldTupleList;
 | 
						|
    ColStructList::size_type  totalColumn;
 | 
						|
    ColStructList::size_type  i;
 | 
						|
    ColTupleList::size_type   totalRow;
 | 
						|
 | 
						|
    setTransId(txnid);
 | 
						|
    colOldValueList.clear();
 | 
						|
    totalColumn = colStructList.size();
 | 
						|
    totalRow = nRows;
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
    StopWatch timer;
 | 
						|
#endif
 | 
						|
 | 
						|
    vector<LBIDRange>   rangeListTot;
 | 
						|
    std::vector<VBRange> freeList;
 | 
						|
    vector<vector<uint32_t> > fboLists;
 | 
						|
    vector<vector<LBIDRange> > rangeLists;
 | 
						|
    rc = processBeginVBCopy(txnid, colStructList, ridList, freeList, fboLists, rangeLists, rangeListTot);
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
    {
 | 
						|
        if (rangeListTot.size() > 0)
 | 
						|
            BRMWrapper::getInstance()->writeVBEnd(txnid, rangeListTot);
 | 
						|
 | 
						|
        switch (rc)
 | 
						|
        {
 | 
						|
            case BRM::ERR_DEADLOCK:
 | 
						|
                return ERR_BRM_DEAD_LOCK;
 | 
						|
 | 
						|
            case BRM::ERR_VBBM_OVERFLOW:
 | 
						|
                return ERR_BRM_VB_OVERFLOW;
 | 
						|
 | 
						|
            case BRM::ERR_NETWORK:
 | 
						|
                return ERR_BRM_NETWORK;
 | 
						|
 | 
						|
            case BRM::ERR_READONLY:
 | 
						|
                return ERR_BRM_READONLY;
 | 
						|
 | 
						|
            default:
 | 
						|
                return ERR_BRM_BEGIN_COPY;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    VBRange aRange;
 | 
						|
    uint32_t blocksProcessedThisOid = 0;
 | 
						|
    uint32_t blocksProcessed = 0;
 | 
						|
    std::vector<BRM::FileInfo> files;
 | 
						|
    TableMetaData* aTbaleMetaData = TableMetaData::makeTableMetaData(tableOid);
 | 
						|
 | 
						|
    for (i = 0; i < totalColumn; i++)
 | 
						|
    {
 | 
						|
        valArray = NULL;
 | 
						|
        curColStruct = colStructList[i];
 | 
						|
        curTupleList = colValueList[i]; //same value for all rows
 | 
						|
        ColumnOp* colOp = m_colOp[op(curColStruct.fCompressionType)];
 | 
						|
 | 
						|
        // convert column data type
 | 
						|
        if (convertStructFlag)
 | 
						|
            Convertor::convertColType(&curColStruct);
 | 
						|
 | 
						|
        // set params
 | 
						|
        colOp->initColumn(curCol);
 | 
						|
        colOp->setColParam(curCol, 0, curColStruct.colWidth,
 | 
						|
                           curColStruct.colDataType, curColStruct.colType, curColStruct.dataOid,
 | 
						|
                           curColStruct.fCompressionType, curColStruct.fColDbRoot,
 | 
						|
                           curColStruct.fColPartition, curColStruct.fColSegment);
 | 
						|
 | 
						|
 | 
						|
        ColExtsInfo aColExtsInfo = aTbaleMetaData->getColExtsInfo(curColStruct.dataOid);
 | 
						|
        ColExtsInfo::iterator it = aColExtsInfo.begin();
 | 
						|
 | 
						|
        while (it != aColExtsInfo.end())
 | 
						|
        {
 | 
						|
            if ((it->dbRoot == curColStruct.fColDbRoot) && (it->partNum == curColStruct.fColPartition) && (it->segNum == curColStruct.fColSegment))
 | 
						|
                break;
 | 
						|
 | 
						|
            it++;
 | 
						|
        }
 | 
						|
 | 
						|
        if (it == aColExtsInfo.end()) //add this one to the list
 | 
						|
        {
 | 
						|
            ColExtInfo aExt;
 | 
						|
            aExt.dbRoot = curColStruct.fColDbRoot;
 | 
						|
            aExt.partNum = curColStruct.fColPartition;
 | 
						|
            aExt.segNum = curColStruct.fColSegment;
 | 
						|
            aExt.compType = curColStruct.fCompressionType;
 | 
						|
            aColExtsInfo.push_back(aExt);
 | 
						|
            aTbaleMetaData->setColExtsInfo(colStructList[i].dataOid, aColExtsInfo);
 | 
						|
        }
 | 
						|
 | 
						|
        string segFile;
 | 
						|
        rc = colOp->openColumnFile(curCol, segFile, true, IO_BUFF_SIZE); // @bug 5572 HDFS tmp file
 | 
						|
 | 
						|
        if (rc != NO_ERROR)
 | 
						|
            break;
 | 
						|
 | 
						|
        if (curColStruct.fCompressionType == 0)
 | 
						|
        {
 | 
						|
            BRM::FileInfo aFile;
 | 
						|
            aFile.oid = curColStruct.dataOid;
 | 
						|
            aFile.partitionNum = curColStruct.fColPartition;
 | 
						|
            aFile.dbRoot = curColStruct.fColDbRoot;;
 | 
						|
            aFile.segmentNum = curColStruct.fColSegment;
 | 
						|
            aFile.compType = curColStruct.fCompressionType;
 | 
						|
            files.push_back(aFile);
 | 
						|
        }
 | 
						|
 | 
						|
        // handling versioning
 | 
						|
        //cout << " pass to processVersionBuffer rid " << rowIdArray[0] << endl;
 | 
						|
        //cout << "dataOid:fColPartition = " << curColStruct.dataOid << ":" << curColStruct.fColPartition << endl;
 | 
						|
//timer.start("processVersionBuffers");
 | 
						|
        //vector<LBIDRange>   rangeList;
 | 
						|
        // rc = processVersionBuffers(curCol.dataFile.pFile, txnid, curColStruct, curColStruct.colWidth, totalRow, ridList, rangeList);
 | 
						|
        std::vector<VBRange> curFreeList;
 | 
						|
        uint32_t blockUsed = 0;
 | 
						|
 | 
						|
        if (!idbdatafile::IDBPolicy::useHdfs())
 | 
						|
        {
 | 
						|
            if (rangeListTot.size() > 0)
 | 
						|
            {
 | 
						|
                if (freeList[0].size >= (blocksProcessed + rangeLists[i].size()))
 | 
						|
                {
 | 
						|
                    aRange.vbOID = freeList[0].vbOID;
 | 
						|
                    aRange.vbFBO = freeList[0].vbFBO + blocksProcessed;
 | 
						|
                    aRange.size = rangeLists[i].size();
 | 
						|
                    curFreeList.push_back(aRange);
 | 
						|
                    //cout << "range size = " << aRange.size <<" and blocksProcessed = " << blocksProcessed<< endl;
 | 
						|
                }
 | 
						|
                else
 | 
						|
                {
 | 
						|
                    aRange.vbOID = freeList[0].vbOID;
 | 
						|
                    aRange.vbFBO = freeList[0].vbFBO + blocksProcessed;
 | 
						|
                    aRange.size = freeList[0].size - blocksProcessed;
 | 
						|
                    blockUsed = aRange.size;
 | 
						|
                    curFreeList.push_back(aRange);
 | 
						|
 | 
						|
                    if (freeList.size() > 1)
 | 
						|
                    {
 | 
						|
                        aRange.vbOID = freeList[1].vbOID;
 | 
						|
                        aRange.vbFBO = freeList[1].vbFBO + blocksProcessedThisOid;
 | 
						|
                        aRange.size = rangeLists[i].size() - blockUsed;
 | 
						|
                        curFreeList.push_back(aRange);
 | 
						|
                        blocksProcessedThisOid += aRange.size;
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
                        rc = 1;
 | 
						|
                        break;
 | 
						|
                    }
 | 
						|
 | 
						|
                    //cout << "curFreeList size = " << curFreeList.size() << endl;
 | 
						|
 | 
						|
                }
 | 
						|
 | 
						|
                blocksProcessed += rangeLists[i].size();
 | 
						|
 | 
						|
                //timer.start("Delete:writeVB");
 | 
						|
                rc = BRMWrapper::getInstance()->
 | 
						|
                     writeVB(curCol.dataFile.pFile, (BRM::VER_t)txnid,
 | 
						|
                             curColStruct.dataOid, fboLists[i], rangeLists[i],
 | 
						|
                             colOp, curFreeList, curColStruct.fColDbRoot, true);
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        //timer.stop("Delete:writeVB");
 | 
						|
//timer.stop("processVersionBuffers");
 | 
						|
        // cout << " rc for processVersionBuffer is " << rc << endl;
 | 
						|
        if (rc != NO_ERROR)
 | 
						|
        {
 | 
						|
            if (curColStruct.fCompressionType == 0)
 | 
						|
            {
 | 
						|
                curCol.dataFile.pFile->flush();
 | 
						|
            }
 | 
						|
 | 
						|
            if (rangeListTot.size() > 0)
 | 
						|
                BRMWrapper::getInstance()->writeVBEnd(txnid, rangeListTot);
 | 
						|
 | 
						|
            break;
 | 
						|
        }
 | 
						|
 | 
						|
        switch (curColStruct.colType)
 | 
						|
        {
 | 
						|
            case WriteEngine::WR_INT:
 | 
						|
                valArray = (int*) calloc(sizeof(int), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_UINT:
 | 
						|
                valArray = (uint32_t*) calloc(sizeof(uint32_t), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_VARBINARY : // treat same as char for now
 | 
						|
            case WriteEngine::WR_CHAR:
 | 
						|
            case WriteEngine::WR_BLOB:
 | 
						|
            case WriteEngine::WR_TEXT:
 | 
						|
                valArray = (char*) calloc(sizeof(char), 1 * MAX_COLUMN_BOUNDARY);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_FLOAT:
 | 
						|
                valArray = (float*) calloc(sizeof(float), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_DOUBLE:
 | 
						|
                valArray = (double*) calloc(sizeof(double), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_BYTE:
 | 
						|
                valArray = (char*) calloc(sizeof(char), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_UBYTE:
 | 
						|
                valArray = (uint8_t*) calloc(sizeof(uint8_t), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_SHORT:
 | 
						|
                valArray = (short*) calloc(sizeof(short), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_USHORT:
 | 
						|
                valArray = (uint16_t*) calloc(sizeof(uint16_t), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_LONGLONG:
 | 
						|
                valArray = (long long*) calloc(sizeof(long long), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_ULONGLONG:
 | 
						|
                valArray = (uint64_t*) calloc(sizeof(uint64_t), 1);
 | 
						|
                break;
 | 
						|
 | 
						|
            case WriteEngine::WR_TOKEN:
 | 
						|
                valArray = (Token*) calloc(sizeof(Token), 1);
 | 
						|
                break;
 | 
						|
        }
 | 
						|
 | 
						|
        // convert values to valArray
 | 
						|
        if (m_opType != DELETE)
 | 
						|
        {
 | 
						|
            bExcp = false;
 | 
						|
            ColTuple    curTuple;
 | 
						|
            curTuple = curTupleList[0];
 | 
						|
 | 
						|
            try
 | 
						|
            {
 | 
						|
                convertValue(curColStruct.colType, valArray, curTuple.data);
 | 
						|
            }
 | 
						|
            catch (...)
 | 
						|
            {
 | 
						|
                bExcp = true;
 | 
						|
            }
 | 
						|
 | 
						|
            if (bExcp)
 | 
						|
            {
 | 
						|
                if (rangeListTot.size() > 0)
 | 
						|
                    BRMWrapper::getInstance()->writeVBEnd(txnid, rangeListTot);
 | 
						|
 | 
						|
                return ERR_PARSING;
 | 
						|
            }
 | 
						|
 | 
						|
#ifdef PROFILE
 | 
						|
            timer.start("writeRow ");
 | 
						|
#endif
 | 
						|
            rc = colOp->writeRows(curCol, totalRow, ridList, valArray);
 | 
						|
#ifdef PROFILE
 | 
						|
            timer.stop("writeRow ");
 | 
						|
#endif
 | 
						|
        }
 | 
						|
        else
 | 
						|
        {
 | 
						|
#ifdef PROFILE
 | 
						|
            timer.start("writeRows ");
 | 
						|
#endif
 | 
						|
            rc = colOp->writeRows(curCol, totalRow, ridList, valArray, 0, true);
 | 
						|
#ifdef PROFILE
 | 
						|
            timer.stop("writeRows ");
 | 
						|
#endif
 | 
						|
        }
 | 
						|
 | 
						|
//     colOldValueList.push_back(oldValArray);
 | 
						|
//timer.start("Delete:closefile");
 | 
						|
        colOp->clearColumn(curCol);
 | 
						|
 | 
						|
//timer.stop("Delete:closefile");
 | 
						|
        if (valArray != NULL)
 | 
						|
            free(valArray);
 | 
						|
 | 
						|
        // check error
 | 
						|
        if (rc != NO_ERROR)
 | 
						|
            break;
 | 
						|
 | 
						|
    } // end of for (i = 0)
 | 
						|
 | 
						|
// timer.start("Delete:purgePrimProcFdCache");
 | 
						|
    if ((idbdatafile::IDBPolicy::useHdfs()) && (files.size() > 0))
 | 
						|
        cacheutils::purgePrimProcFdCache(files, Config::getLocalModuleID());
 | 
						|
 | 
						|
//if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
//			cacheutils::dropPrimProcFdCache();
 | 
						|
//timer.stop("Delete:purgePrimProcFdCache");
 | 
						|
    if (rangeListTot.size() > 0)
 | 
						|
        BRMWrapper::getInstance()->writeVBEnd(txnid, rangeListTot);
 | 
						|
 | 
						|
//timer.stop("Delete:writecolrec");
 | 
						|
//#ifdef PROFILE
 | 
						|
//timer.finish();
 | 
						|
//#endif
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
/*@brief tokenize - return a token for a given signature and size
 | 
						|
*/
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *  return a token for a given signature and size
 | 
						|
 *  If it is not in the dictionary, the signature
 | 
						|
 *  will be added to the dictionary and the index tree
 | 
						|
 *  If it is already in the dictionary, then
 | 
						|
 *  the token will be returned
 | 
						|
 *  This function does not open and close files.
 | 
						|
 *  users need to use openDctnry and CloseDctnry
 | 
						|
 * PARAMETERS:
 | 
						|
 *  DctnryTuple& dctnryTuple - holds the sigValue, sigSize and token
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if success
 | 
						|
 *    others if something wrong in inserting the value
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::tokenize(const TxnID& txnid, DctnryTuple& dctnryTuple, int ct)
 | 
						|
{
 | 
						|
    int cop = op(ct);
 | 
						|
    m_dctnry[cop]->setTransId(txnid);
 | 
						|
    //cout << "Tokenizing dctnryTuple.sigValue " << dctnryTuple.sigValue << endl;
 | 
						|
    return m_dctnry[cop]->updateDctnry(dctnryTuple.sigValue, dctnryTuple.sigSize, dctnryTuple.token);
 | 
						|
}
 | 
						|
 | 
						|
/*@brief tokenize - return a token for a given signature and size
 | 
						|
 *                          accept OIDs as input
 | 
						|
*/
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *  Token for a given signature and size
 | 
						|
 *  If it is not in the dictionary, the signature
 | 
						|
 *  will be added to the dictionary and the index tree
 | 
						|
 *  If it is already in the dictionary, then
 | 
						|
 *  the token will be returned
 | 
						|
 * PARAMETERS:
 | 
						|
 *  DctnryTuple& dctnryTuple - holds the sigValue, sigSize and token
 | 
						|
 *  DctnryStruct dctnryStruct- contain the 3 OID for dictionary,
 | 
						|
 *                             tree and list.
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if success
 | 
						|
 *    others if something wrong in inserting the value
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::tokenize(const TxnID& txnid,
 | 
						|
                                 DctnryStruct& dctnryStruct,
 | 
						|
                                 DctnryTuple& dctnryTuple,
 | 
						|
                                 bool useTmpSuffix) // @bug 5572 HDFS tmp file
 | 
						|
{
 | 
						|
    //find the corresponding column segment file the token is going to be inserted.
 | 
						|
 | 
						|
    Dctnry* dctnry = m_dctnry[op(dctnryStruct.fCompressionType)];
 | 
						|
    int rc = dctnry->openDctnry(dctnryStruct.dctnryOid,
 | 
						|
                                dctnryStruct.fColDbRoot, dctnryStruct.fColPartition,
 | 
						|
                                dctnryStruct.fColSegment,
 | 
						|
                                useTmpSuffix); // @bug 5572 TBD
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
        return rc;
 | 
						|
 | 
						|
    rc = tokenize(txnid, dctnryTuple, dctnryStruct.fCompressionType);
 | 
						|
 | 
						|
    int rc2 = dctnry->closeDctnry(true); // close file, even if tokenize() fails
 | 
						|
 | 
						|
    if ((rc == NO_ERROR) && (rc2 != NO_ERROR))
 | 
						|
        rc = rc2;
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Create column files, including data and bitmap files
 | 
						|
 * PARAMETERS:
 | 
						|
 *    dataOid - column data file id
 | 
						|
 *    bitmapOid - column bitmap file id
 | 
						|
 *    colWidth - column width
 | 
						|
 *    dbRoot   - DBRoot where file is to be located
 | 
						|
 *    partition - Starting partition number for segment file path
 | 
						|
 *     segment - segment number
 | 
						|
 *     compressionType - compression type
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if success
 | 
						|
 *    ERR_FILE_EXIST if file exists
 | 
						|
 *    ERR_FILE_CREATE if something wrong in creating the file
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::createDctnry(const TxnID& txnid,
 | 
						|
                                     const OID& dctnryOid,
 | 
						|
                                     int colWidth,
 | 
						|
                                     uint16_t dbRoot,
 | 
						|
                                     uint32_t partiotion,
 | 
						|
                                     uint16_t segment,
 | 
						|
                                     int compressionType)
 | 
						|
{
 | 
						|
    BRM::LBID_t startLbid;
 | 
						|
    return m_dctnry[op(compressionType)]->
 | 
						|
           createDctnry( dctnryOid, colWidth, dbRoot, partiotion, segment, startLbid);
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::convertRidToColumn (RID& rid, uint16_t& dbRoot, uint32_t& partition,
 | 
						|
        uint16_t& segment, RID filesPerColumnPartition,
 | 
						|
        RID  extentsPerSegmentFile, RID extentRows,
 | 
						|
        uint16_t startDBRoot, unsigned dbrootCnt)
 | 
						|
{
 | 
						|
    int rc = 0;
 | 
						|
    partition = rid / (filesPerColumnPartition * extentsPerSegmentFile * extentRows);
 | 
						|
 | 
						|
    segment = (((rid % (filesPerColumnPartition * extentsPerSegmentFile * extentRows)) / extentRows)) % filesPerColumnPartition;
 | 
						|
 | 
						|
    dbRoot = ((startDBRoot - 1 + segment) % dbrootCnt) + 1;
 | 
						|
 | 
						|
    //Calculate the relative rid for this segment file
 | 
						|
    RID relRidInPartition = rid - ((RID)partition * (RID)filesPerColumnPartition * (RID)extentsPerSegmentFile * (RID)extentRows);
 | 
						|
    assert (relRidInPartition <= (RID)filesPerColumnPartition * (RID)extentsPerSegmentFile * (RID)extentRows);
 | 
						|
    uint32_t numExtentsInThisPart = relRidInPartition / extentRows;
 | 
						|
    unsigned numExtentsInThisSegPart = numExtentsInThisPart / filesPerColumnPartition;
 | 
						|
    RID relRidInThisExtent = relRidInPartition - numExtentsInThisPart * extentRows;
 | 
						|
    rid = relRidInThisExtent +  numExtentsInThisSegPart * extentRows;
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Clears table lock for the specified table lock ID.
 | 
						|
 * PARAMETERS:
 | 
						|
 *    lockID - table lock to be released
 | 
						|
 *    errMsg - if error occurs, this is the return error message
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if operation is successful
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::clearTableLockOnly(
 | 
						|
    uint64_t     lockID,
 | 
						|
    std::string& errMsg)
 | 
						|
{
 | 
						|
    bool bReleased;
 | 
						|
 | 
						|
    int rc = BRMWrapper::getInstance()->releaseTableLock( lockID,
 | 
						|
             bReleased, errMsg);
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Rolls back the state of the extentmap and database files for the
 | 
						|
 *    specified table OID, using the metadata previously saved to disk.
 | 
						|
 *    Also clears the table lock for the specified table OID.
 | 
						|
 * PARAMETERS:
 | 
						|
 *    tableOid - table OID to be rolled back
 | 
						|
 *    lockID   - table lock corresponding to tableOid
 | 
						|
 *    tableName - table name associated with tableOid
 | 
						|
 *    applName - application that is driving this bulk rollback
 | 
						|
 *    debugConsole - enable debug logging to the console
 | 
						|
 *    errorMsg - error message explaining any rollback failure
 | 
						|
 * RETURN:
 | 
						|
 *    NO_ERROR if rollback completed succesfully
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::bulkRollback(OID   tableOid,
 | 
						|
                                     uint64_t lockID,
 | 
						|
                                     const std::string& tableName,
 | 
						|
                                     const std::string& applName,
 | 
						|
                                     bool debugConsole, string& errorMsg)
 | 
						|
{
 | 
						|
    errorMsg.clear();
 | 
						|
 | 
						|
    BulkRollbackMgr rollbackMgr(tableOid, lockID, tableName, applName);
 | 
						|
 | 
						|
    if (debugConsole)
 | 
						|
        rollbackMgr.setDebugConsole(true);
 | 
						|
 | 
						|
    // We used to pass "false" to not keep (delete) the metafiles at the end of
 | 
						|
    // the rollback.  But after the transition to sharedNothing, we pass "true"
 | 
						|
    // to initially keep these files.  The metafiles are deleted later, only
 | 
						|
    // after all the distributed bulk rollbacks are successfully completed.
 | 
						|
    int rc = rollbackMgr.rollback( true );
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
        errorMsg = rollbackMgr.getErrorMsg();
 | 
						|
 | 
						|
    // Ignore the return code for now; more important to base rc on the
 | 
						|
    // success or failure of the previous work
 | 
						|
    BRMWrapper::getInstance()->takeSnapshot();
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::rollbackCommon(const TxnID& txnid, int sessionId)
 | 
						|
{
 | 
						|
    //Remove the unwanted tmp files and recover compressed chunks.
 | 
						|
    string prefix;
 | 
						|
 | 
						|
    // BUG 4312
 | 
						|
    RemoveTxnFromLBIDMap(txnid);
 | 
						|
    RemoveTxnFromDictMap(txnid);
 | 
						|
 | 
						|
    config::Config* config = config::Config::makeConfig();
 | 
						|
    prefix = config->getConfig("SystemConfig", "DBRMRoot");
 | 
						|
 | 
						|
    if (prefix.length() == 0)
 | 
						|
    {
 | 
						|
        cerr << "Need a valid DBRMRoot entry in Calpont configuation file";
 | 
						|
        return -1;
 | 
						|
    }
 | 
						|
 | 
						|
    uint64_t pos =  prefix.find_last_of ("/") ;
 | 
						|
    std::string aDMLLogFileName;
 | 
						|
 | 
						|
    if (pos != string::npos)
 | 
						|
    {
 | 
						|
        aDMLLogFileName = prefix.substr(0, pos + 1); //Get the file path
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        logging::Message::Args args;
 | 
						|
        args.add("RollbackTran cannot find the dbrm directory for the DML log file");
 | 
						|
        SimpleSysLog::instance()->logMsg(args, logging::LOG_TYPE_CRITICAL, logging::M0007);
 | 
						|
        return -1;
 | 
						|
 | 
						|
    }
 | 
						|
 | 
						|
    std::ostringstream oss;
 | 
						|
    oss << txnid << "_" << Config::getLocalModuleID();
 | 
						|
    aDMLLogFileName += "DMLLog_" + oss.str();
 | 
						|
 | 
						|
    if (IDBPolicy::exists(aDMLLogFileName.c_str()))
 | 
						|
    {
 | 
						|
        // TODO-for now the DML log file will always be in a local
 | 
						|
        // filesystem since IDBDataFile doesn't have any support for
 | 
						|
        // a cpp iostream interface.  need to decide if this is ok.
 | 
						|
        boost::scoped_ptr<IDBDataFile> aDMLLogFile(IDBDataFile::open(
 | 
						|
                    IDBPolicy::getType(aDMLLogFileName.c_str(),
 | 
						|
                                       IDBPolicy::WRITEENG),
 | 
						|
                    aDMLLogFileName.c_str(), "r", 0));
 | 
						|
 | 
						|
        if (aDMLLogFile) //need recover
 | 
						|
        {
 | 
						|
            ssize_t fileSize = aDMLLogFile->size();
 | 
						|
            boost::scoped_array<char> buf(new char[fileSize]);
 | 
						|
 | 
						|
            if (aDMLLogFile->read(buf.get(), fileSize) != fileSize)
 | 
						|
                return ERR_FILE_READ;
 | 
						|
 | 
						|
            std::istringstream strstream(string(buf.get(), fileSize));
 | 
						|
            std::string backUpFileType;
 | 
						|
            std::string filename;
 | 
						|
            int64_t size;
 | 
						|
            int64_t offset;
 | 
						|
 | 
						|
            while (strstream >> backUpFileType >> filename >> size >> offset)
 | 
						|
            {
 | 
						|
                //cout << "Found: " <<  backUpFileType << " name " << filename << "size: " << size << " offset: " << offset << endl;
 | 
						|
                std::ostringstream oss;
 | 
						|
                oss << "RollbackTran found " <<  backUpFileType << " name " << filename << " size: " << size << " offset: " << offset;
 | 
						|
                logging::Message::Args args;
 | 
						|
                args.add(oss.str());
 | 
						|
                SimpleSysLog::instance()->logMsg(args, logging::LOG_TYPE_INFO, logging::M0007);
 | 
						|
 | 
						|
                if (backUpFileType.compare("rlc") == 0)
 | 
						|
                {
 | 
						|
                    //remove the rlc file
 | 
						|
                    filename += ".rlc";
 | 
						|
                    //cout << " File removed: " << filename << endl;
 | 
						|
                    IDBPolicy::remove(filename.c_str());
 | 
						|
                    logging::Message::Args args1;
 | 
						|
                    args1.add(filename);
 | 
						|
                    args1.add(" is removed.");
 | 
						|
                    SimpleSysLog::instance()->logMsg(args1, logging::LOG_TYPE_INFO, logging::M0007);
 | 
						|
                }
 | 
						|
                else if (backUpFileType.compare("tmp") == 0)
 | 
						|
                {
 | 
						|
                    int rc = NO_ERROR;
 | 
						|
                    string orig(filename + ".orig");
 | 
						|
 | 
						|
                    // restore the orig file
 | 
						|
                    if (IDBPolicy::exists(orig.c_str()))
 | 
						|
                    {
 | 
						|
                        // not likely both cdf and tmp exist
 | 
						|
                        if (IDBPolicy::exists(filename.c_str()) &&
 | 
						|
                                IDBPolicy::remove(filename.c_str()) != 0)
 | 
						|
                            rc = ERR_COMP_REMOVE_FILE;
 | 
						|
 | 
						|
                        if (rc == NO_ERROR && IDBPolicy::rename(orig.c_str(), filename.c_str()) != 0)
 | 
						|
                            rc = ERR_COMP_RENAME_FILE;
 | 
						|
                    }
 | 
						|
 | 
						|
                    // remove the tmp file
 | 
						|
                    string tmp(filename + ".tmp");
 | 
						|
 | 
						|
                    if (rc == NO_ERROR && IDBPolicy::exists(tmp.c_str()) &&
 | 
						|
                            IDBPolicy::remove(tmp.c_str()) != 0)
 | 
						|
                        rc = ERR_COMP_REMOVE_FILE;
 | 
						|
 | 
						|
                    // remove the chunk shifting helper
 | 
						|
                    string rlc(filename + ".rlc");
 | 
						|
 | 
						|
                    if (rc == NO_ERROR && IDBPolicy::exists(rlc.c_str()) &&
 | 
						|
                            IDBPolicy::remove(rlc.c_str()) != 0)
 | 
						|
                        rc = ERR_COMP_REMOVE_FILE;
 | 
						|
 | 
						|
                    logging::Message::Args args1;
 | 
						|
                    args1.add(filename);
 | 
						|
 | 
						|
                    if (rc == NO_ERROR)
 | 
						|
                    {
 | 
						|
                        args1.add(" is restored.");
 | 
						|
                        SimpleSysLog::instance()->logMsg(args1,
 | 
						|
                                                         logging::LOG_TYPE_INFO, logging::M0007);
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
                        args1.add(" may not restored: ");
 | 
						|
                        args1.add(rc);
 | 
						|
                        SimpleSysLog::instance()->logMsg(args1,
 | 
						|
                                                         logging::LOG_TYPE_CRITICAL, logging::M0007);
 | 
						|
 | 
						|
                        return rc;
 | 
						|
                    }
 | 
						|
                }
 | 
						|
                else
 | 
						|
                {
 | 
						|
                    //copy back to the data file
 | 
						|
                    std::string backFileName(filename);
 | 
						|
 | 
						|
                    if (backUpFileType.compare("chk") == 0 )
 | 
						|
                        backFileName += ".chk";
 | 
						|
                    else
 | 
						|
                        backFileName += ".hdr";
 | 
						|
 | 
						|
                    //cout << "Rollback found file " << backFileName << endl;
 | 
						|
                    IDBDataFile* sourceFile = IDBDataFile::open(
 | 
						|
                                                  IDBPolicy::getType(backFileName.c_str(), IDBPolicy::WRITEENG),
 | 
						|
                                                  backFileName.c_str(), "r", 0);
 | 
						|
                    IDBDataFile* targetFile = IDBDataFile::open(
 | 
						|
                                                  IDBPolicy::getType(filename.c_str(), IDBPolicy::WRITEENG),
 | 
						|
                                                  filename.c_str(), "r+", 0);
 | 
						|
 | 
						|
                    size_t byteRead;
 | 
						|
                    unsigned char* readBuf = new unsigned char[size];
 | 
						|
                    boost::scoped_array<unsigned char> readBufPtr( readBuf );
 | 
						|
 | 
						|
                    if ( sourceFile != NULL )
 | 
						|
                    {
 | 
						|
                        int rc = sourceFile->seek( 0, 0 );
 | 
						|
 | 
						|
                        if (rc)
 | 
						|
                            return ERR_FILE_SEEK;
 | 
						|
 | 
						|
                        byteRead = sourceFile->read( readBuf, size );
 | 
						|
 | 
						|
                        if ( (int) byteRead != size )
 | 
						|
                        {
 | 
						|
                            logging::Message::Args args6;
 | 
						|
                            args6.add("Rollback cannot read backup file ");
 | 
						|
                            args6.add(backFileName);
 | 
						|
                            SimpleSysLog::instance()->logMsg(args6, logging::LOG_TYPE_ERROR, logging::M0007);
 | 
						|
                            return ERR_FILE_READ;
 | 
						|
                        }
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
                        logging::Message::Args args5;
 | 
						|
                        args5.add("Rollback cannot open backup file ");
 | 
						|
                        args5.add(backFileName);
 | 
						|
                        SimpleSysLog::instance()->logMsg(args5, logging::LOG_TYPE_ERROR, logging::M0007);
 | 
						|
                        return ERR_FILE_NULL;
 | 
						|
                    }
 | 
						|
 | 
						|
                    size_t byteWrite;
 | 
						|
 | 
						|
                    if ( targetFile != NULL )
 | 
						|
                    {
 | 
						|
                        int rc = targetFile->seek( offset, 0 );
 | 
						|
 | 
						|
                        if (rc)
 | 
						|
                            return ERR_FILE_SEEK;
 | 
						|
 | 
						|
                        byteWrite = targetFile->write( readBuf, size );
 | 
						|
 | 
						|
                        if ( (int) byteWrite != size )
 | 
						|
                        {
 | 
						|
                            logging::Message::Args args3;
 | 
						|
                            args3.add("Rollback cannot copy to file ");
 | 
						|
                            args3.add(filename);
 | 
						|
                            args3.add( "from file ");
 | 
						|
                            args3.add(backFileName);
 | 
						|
                            SimpleSysLog::instance()->logMsg(args3, logging::LOG_TYPE_ERROR, logging::M0007);
 | 
						|
 | 
						|
                            return ERR_FILE_WRITE;
 | 
						|
                        }
 | 
						|
                    }
 | 
						|
                    else
 | 
						|
                    {
 | 
						|
                        logging::Message::Args args4;
 | 
						|
                        args4.add("Rollback cannot open target file ");
 | 
						|
                        args4.add(filename);
 | 
						|
                        SimpleSysLog::instance()->logMsg(args4, logging::LOG_TYPE_ERROR, logging::M0007);
 | 
						|
                        return ERR_FILE_NULL;
 | 
						|
                    }
 | 
						|
 | 
						|
                    //cout << "Rollback copied to file " << filename << " from file " << backFileName << endl;
 | 
						|
 | 
						|
                    delete targetFile;
 | 
						|
                    delete sourceFile;
 | 
						|
                    IDBPolicy::remove( backFileName.c_str() );
 | 
						|
                    logging::Message::Args arg1;
 | 
						|
                    arg1.add("Rollback copied to file ");
 | 
						|
                    arg1.add(filename);
 | 
						|
                    arg1.add( "from file ");
 | 
						|
                    arg1.add(backFileName);
 | 
						|
                    SimpleSysLog::instance()->logMsg(arg1, logging::LOG_TYPE_INFO, logging::M0007);
 | 
						|
                }
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        IDBPolicy::remove(aDMLLogFileName.c_str());
 | 
						|
    }
 | 
						|
 | 
						|
    return 0;
 | 
						|
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::rollbackTran(const TxnID& txnid, int sessionId)
 | 
						|
{
 | 
						|
    if ( rollbackCommon( txnid, sessionId ) != 0 )
 | 
						|
        return -1;
 | 
						|
 | 
						|
    return BRMWrapper::getInstance()->rollBack(txnid, sessionId);
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::rollbackBlocks(const TxnID& txnid, int sessionId)
 | 
						|
{
 | 
						|
    if ( rollbackCommon( txnid, sessionId ) != 0 )
 | 
						|
        return -1;
 | 
						|
 | 
						|
    return BRMWrapper::getInstance()->rollBackBlocks(txnid, sessionId);
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::rollbackVersion(const TxnID& txnid, int sessionId)
 | 
						|
{
 | 
						|
    // BUG 4312
 | 
						|
    RemoveTxnFromLBIDMap(txnid);
 | 
						|
    RemoveTxnFromDictMap(txnid);
 | 
						|
 | 
						|
    return BRMWrapper::getInstance()->rollBackVersion(txnid, sessionId);
 | 
						|
}
 | 
						|
 | 
						|
int WriteEngineWrapper::updateNextValue(const TxnID txnId, const OID& columnoid, const uint64_t nextVal, const uint32_t sessionID, const uint16_t dbRoot)
 | 
						|
{
 | 
						|
    int rc = NO_ERROR;
 | 
						|
    boost::shared_ptr<CalpontSystemCatalog> systemCatalogPtr;
 | 
						|
    RIDList ridList;
 | 
						|
    ColValueList colValueList;
 | 
						|
    WriteEngine::ColTupleList colTuples;
 | 
						|
    ColStructList colStructList;
 | 
						|
    WriteEngine::ColStruct colStruct;
 | 
						|
    colStruct.dataOid = OID_SYSCOLUMN_NEXTVALUE;
 | 
						|
    colStruct.colWidth = 8;
 | 
						|
    colStruct.tokenFlag = false;
 | 
						|
    colStruct.colDataType =  CalpontSystemCatalog::UBIGINT;
 | 
						|
    colStruct.fColDbRoot = dbRoot;
 | 
						|
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
        colStruct.fCompressionType = 2;
 | 
						|
 | 
						|
    colStructList.push_back(colStruct);
 | 
						|
    ColTuple colTuple;
 | 
						|
    systemCatalogPtr = CalpontSystemCatalog::makeCalpontSystemCatalog(sessionID);
 | 
						|
    systemCatalogPtr->identity(CalpontSystemCatalog::EC);
 | 
						|
    CalpontSystemCatalog::ROPair ropair;
 | 
						|
 | 
						|
    try
 | 
						|
    {
 | 
						|
        ropair = systemCatalogPtr->nextAutoIncrRid(columnoid);
 | 
						|
    }
 | 
						|
    catch (...)
 | 
						|
    {
 | 
						|
        rc = ERR_AUTOINC_RID;
 | 
						|
    }
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
        return rc;
 | 
						|
 | 
						|
    ridList.push_back(ropair.rid);
 | 
						|
    colTuple.data = nextVal;
 | 
						|
    colTuples.push_back(colTuple);
 | 
						|
    colValueList.push_back(colTuples);
 | 
						|
    //TxnID txnid;
 | 
						|
    rc = writeColumnRecords(txnId, colStructList, colValueList, ridList, SYSCOLUMN_BASE, false);
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
        return rc;
 | 
						|
 | 
						|
    //flush PrimProc cache
 | 
						|
    vector<LBID_t> blockList;
 | 
						|
    BRM::LBIDRange_v lbidRanges;
 | 
						|
    rc = BRMWrapper::getInstance()->lookupLbidRanges(OID_SYSCOLUMN_NEXTVALUE,
 | 
						|
            lbidRanges);
 | 
						|
 | 
						|
    if (rc != NO_ERROR)
 | 
						|
        return rc;
 | 
						|
 | 
						|
    LBIDRange_v::iterator it;
 | 
						|
 | 
						|
    for (it = lbidRanges.begin(); it != lbidRanges.end(); it++)
 | 
						|
    {
 | 
						|
        for (LBID_t  lbid = it->start; lbid < (it->start + it->size); lbid++)
 | 
						|
        {
 | 
						|
            blockList.push_back(lbid);
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    //Bug 5459 Flush FD cache
 | 
						|
    std::vector<BRM::FileInfo> files;
 | 
						|
    BRM::FileInfo aFile;
 | 
						|
    aFile.oid = colStruct.dataOid;
 | 
						|
    aFile.partitionNum = colStruct.fColPartition;
 | 
						|
    aFile.dbRoot = colStruct.fColDbRoot;;
 | 
						|
    aFile.segmentNum = colStruct.fColSegment;
 | 
						|
    aFile.compType = colStruct.fCompressionType;
 | 
						|
    files.push_back(aFile);
 | 
						|
 | 
						|
    if (idbdatafile::IDBPolicy::useHdfs())
 | 
						|
        cacheutils::purgePrimProcFdCache(files, Config::getLocalModuleID());
 | 
						|
 | 
						|
    rc = cacheutils::flushPrimProcAllverBlocks (blockList);
 | 
						|
 | 
						|
    if (rc != 0)
 | 
						|
        rc = ERR_BLKCACHE_FLUSH_LIST; // translate to WE error
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Flush compressed files in chunk manager
 | 
						|
 * PARAMETERS:
 | 
						|
 *    none
 | 
						|
 * RETURN:
 | 
						|
 *    none
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::flushDataFiles(int rc, const TxnID txnId, std::map<FID, FID>& columnOids)
 | 
						|
{
 | 
						|
    RemoveTxnFromLBIDMap(txnId);
 | 
						|
    RemoveTxnFromDictMap(txnId);
 | 
						|
 | 
						|
    for (int i = 0; i < TOTAL_COMPRESS_OP; i++)
 | 
						|
    {
 | 
						|
        int rc1 = m_colOp[i]->flushFile(rc, columnOids);
 | 
						|
        int rc2 = m_dctnry[i]->flushFile(rc, columnOids);
 | 
						|
 | 
						|
        if (rc == NO_ERROR)
 | 
						|
        {
 | 
						|
            rc = (rc1 != NO_ERROR) ? rc1 : rc2;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    return rc;
 | 
						|
}
 | 
						|
 | 
						|
void WriteEngineWrapper::AddDictToList(const TxnID txnid,
 | 
						|
                                       std::vector<BRM::LBID_t>& lbids)
 | 
						|
{
 | 
						|
    std::tr1::unordered_map<TxnID, dictLBIDRec_t>::iterator mapIter;
 | 
						|
 | 
						|
    mapIter = m_dictLBIDMap.find(txnid);
 | 
						|
 | 
						|
    if (mapIter == m_dictLBIDMap.end())
 | 
						|
    {
 | 
						|
        dictLBIDRec_t tempRecord;
 | 
						|
        tempRecord.insert(lbids.begin(), lbids.end());
 | 
						|
        m_dictLBIDMap[txnid] = tempRecord;
 | 
						|
        return;
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        dictLBIDRec_t& txnRecord = mapIter->second;
 | 
						|
        txnRecord.insert(lbids.begin(), lbids.end());
 | 
						|
    }
 | 
						|
 | 
						|
}
 | 
						|
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Add an lbid to a list of lbids for sending to markExtentsInvalid.
 | 
						|
 *    However, rather than storing each lbid, store only unique first
 | 
						|
 *    lbids. This is an optimization to prevent invalidating the same
 | 
						|
 *    extents over and over.
 | 
						|
 * PARAMETERS:
 | 
						|
 *    txnid - the lbid list is per txn. We use this to keep transactions
 | 
						|
 *            seperated.
 | 
						|
 *    lbids - the current list of lbids. We add to this list
 | 
						|
 *            if the discovered lbid is in a new extent.
 | 
						|
 *   These next are needed for dbrm to get the lbid
 | 
						|
 *    oid       -the table oid.
 | 
						|
 *    colPartition - the table column partition
 | 
						|
 *    segment   - table segment
 | 
						|
 *    fbo       - file block offset
 | 
						|
 * RETURN: 0 => OK. -1 => error
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::AddLBIDtoList(const TxnID     txnid,
 | 
						|
                                      std::vector<BRM::LBID_t>& lbids,
 | 
						|
                                      std::vector<CalpontSystemCatalog::ColDataType>& colDataTypes,
 | 
						|
                                      const ColStruct& colStruct,
 | 
						|
                                      const int       fbo)
 | 
						|
{
 | 
						|
    int rtn = 0;
 | 
						|
 | 
						|
    BRM::LBID_t     startingLBID;
 | 
						|
    SP_TxnLBIDRec_t spTxnLBIDRec;
 | 
						|
    std::tr1::unordered_map<TxnID, SP_TxnLBIDRec_t>::iterator mapIter;
 | 
						|
 | 
						|
    // Find the set of extent starting LBIDs for this transaction. If not found, then create it.
 | 
						|
    mapIter = m_txnLBIDMap.find(txnid);
 | 
						|
 | 
						|
    if (mapIter == m_txnLBIDMap.end())
 | 
						|
    {
 | 
						|
        // This is a new transaction.
 | 
						|
        SP_TxnLBIDRec_t  sptemp(new TxnLBIDRec);
 | 
						|
        spTxnLBIDRec = sptemp;
 | 
						|
        m_txnLBIDMap[txnid] = spTxnLBIDRec;
 | 
						|
//        cout << "New transaction entry " << txnid << " transaction count " << m_txnLBIDMap.size() << endl;
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        spTxnLBIDRec = (*mapIter).second;
 | 
						|
    }
 | 
						|
 | 
						|
    // Get the extent starting lbid given all these values (startingLBID is an out parameter).
 | 
						|
    rtn = BRMWrapper::getInstance()->getStartLbid(colStruct.dataOid, colStruct.fColPartition,
 | 
						|
            colStruct.fColSegment, fbo, startingLBID);
 | 
						|
 | 
						|
    if (rtn != 0)
 | 
						|
        return -1;
 | 
						|
 | 
						|
    if (spTxnLBIDRec->m_LBIDMap.find(startingLBID) == spTxnLBIDRec->m_LBIDMap.end())
 | 
						|
    {
 | 
						|
        // Not found in the map. This must be a new extent. Add it to the list.
 | 
						|
//        cout << "Adding lbid " << startingLBID << " to txn " << txnid << endl;
 | 
						|
        spTxnLBIDRec->AddLBID(startingLBID);
 | 
						|
        lbids.push_back((BRM::LBID_t)startingLBID);
 | 
						|
        colDataTypes.push_back(colStruct.colDataType);
 | 
						|
    }
 | 
						|
    else
 | 
						|
    {
 | 
						|
        ++spTxnLBIDRec->m_squashedLbids;
 | 
						|
    }
 | 
						|
 | 
						|
    // If the starting LBID list has grown to more than 2000, truncate.
 | 
						|
    // This is the purpose of the seqnum. If spTxnLBIDRec->m_lastSeqnum
 | 
						|
    // is divisible by 1000 and size() > 1000, get rid of everything older
 | 
						|
    // than the last 1000 entries. This is to save memory in large
 | 
						|
    // transactions. We assume older extents are unlikely to be hit again.
 | 
						|
    if (spTxnLBIDRec->m_lastSeqnum % 1000 == 0
 | 
						|
            && spTxnLBIDRec->m_LBIDMap.size() > 1000)
 | 
						|
    {
 | 
						|
//        cout << "Trimming the LBID list for " << txnid << ". LBID count is " << spTxnLBIDRec->m_LBIDMap.size() << endl;
 | 
						|
        uint32_t firstDrop = spTxnLBIDRec->m_lastSeqnum - 1000;
 | 
						|
        std::tr1::unordered_map<BRM::LBID_t, uint32_t>::iterator iter;
 | 
						|
 | 
						|
        for (iter = spTxnLBIDRec->m_LBIDMap.begin(); iter != spTxnLBIDRec->m_LBIDMap.end();)
 | 
						|
        {
 | 
						|
            if ((*iter).second < firstDrop)
 | 
						|
            {
 | 
						|
                iter = spTxnLBIDRec->m_LBIDMap.erase(iter);
 | 
						|
            }
 | 
						|
            else
 | 
						|
            {
 | 
						|
                ++iter;
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
//        cout << "LBID count is now" << spTxnLBIDRec->m_LBIDMap.size() << endl;
 | 
						|
    }
 | 
						|
 | 
						|
    return rtn;
 | 
						|
}
 | 
						|
 | 
						|
void WriteEngineWrapper::RemoveTxnFromDictMap(const TxnID txnid)
 | 
						|
{
 | 
						|
    std::tr1::unordered_map<TxnID, dictLBIDRec_t>::iterator mapIter;
 | 
						|
 | 
						|
    mapIter = m_dictLBIDMap.find(txnid);
 | 
						|
 | 
						|
    if (mapIter != m_dictLBIDMap.end())
 | 
						|
    {
 | 
						|
        m_dictLBIDMap.erase(txnid);
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
/***********************************************************
 | 
						|
 * DESCRIPTION:
 | 
						|
 *    Remove a transaction LBID list from the LBID map
 | 
						|
 *    Called when a transaction ends, either commit or rollback
 | 
						|
 * PARAMETERS:
 | 
						|
 *    txnid - the transaction to remove.
 | 
						|
 * RETURN:
 | 
						|
 *    0 => success or not found, -1 => error
 | 
						|
 ***********************************************************/
 | 
						|
int WriteEngineWrapper::RemoveTxnFromLBIDMap(const TxnID txnid)
 | 
						|
{
 | 
						|
    int rtn = 0;
 | 
						|
    std::tr1::unordered_map<TxnID, SP_TxnLBIDRec_t>::iterator mapIter;
 | 
						|
 | 
						|
    // Find the set of extent starting LBIDs for this transaction. If not found, then create it.
 | 
						|
    try
 | 
						|
    {
 | 
						|
        mapIter = m_txnLBIDMap.find(txnid);
 | 
						|
 | 
						|
        if (mapIter != m_txnLBIDMap.end())
 | 
						|
        {
 | 
						|
            SP_TxnLBIDRec_t spTxnLBIDRec = (*mapIter).second;
 | 
						|
            // Debug
 | 
						|
//            cout << "Remove transaction entry " << txnid << " transaction count " << m_txnLBIDMap.size() << endl;
 | 
						|
//            cout << "    count = " << spTxnLBIDRec->m_LBIDMap.size() <<
 | 
						|
//                    ", lastSeqnum = " <<  spTxnLBIDRec->m_lastSeqnum <<
 | 
						|
//                    ", squashed lbids = " << spTxnLBIDRec->m_squashedLbids << endl;
 | 
						|
            m_txnLBIDMap.erase(txnid);   // spTxnLBIDRec is auto-destroyed
 | 
						|
        }
 | 
						|
    }
 | 
						|
    catch (...)
 | 
						|
    {
 | 
						|
        rtn = -1;
 | 
						|
    }
 | 
						|
 | 
						|
    return rtn;
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
} //end of namespace
 | 
						|
// vim:ts=4 sw=4:
 | 
						|
 |