mariadb-columnstore-engine/writeengine/splitter/we_cmdargs.cpp

/* Copyright (C) 2014 InfiniDB, Inc.
   Copyright (C) 2016 MariaDB Corporation

   This program is free software; you can redistribute it and/or
   modify it under the terms of the GNU General Public License
   as published by the Free Software Foundation; version 2 of
   the License.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
   Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
   MA 02110-1301, USA. */

#include <unistd.h>
#include <cstdlib>
#include <cstdio>
#include <cstring>
#include <ctime>

#include <vector>
#include <string>
#include <sstream>
#include <iostream>
#include <exception>
#include <stdexcept>
#include <cerrno>
using namespace std;

#include <boost/uuid/uuid.hpp>
#include <boost/uuid/uuid_generators.hpp>
#include <boost/uuid/uuid_io.hpp>
#include <boost/filesystem.hpp>

#include "dataconvert.h"
#include "liboamcpp.h"
using namespace oam;

#include "we_cmdargs.h"

#include "installdir.h"

namespace WriteEngine
{

//----------------------------------------------------------------------
//----------------------------------------------------------------------
// Constructs the argument holder with its default option values and then
// parses the command line.
//
// argc, argv  the process arguments, forwarded unchanged to
//             parseCmdLineArgs().
//
// Any std::exception raised while parsing is rethrown as a runtime_error
// whose message is the original text followed by a hint to run
// 'cpimport -h'.
WECmdArgs::WECmdArgs(int argc, char** argv) :
    fMultiTableCount(0),
    fJobLogOnly(false),
    fHelp(false),
    fMode(1),
    fArgMode(-1),
    fQuiteMode(true),
    fConsoleLog(false),
    fVerbose(0),
    fBatchQty(10000),
    fNoOfReadThrds(0),
    fDebugLvl(0),
    fMaxErrors(-1),
    fReadBufSize(0),
    fIOReadBufSize(0),
    fSetBufSize(0),
    fColDelim('|'),
    fEnclosedChar(0),
    fEscChar(0),
    fNoOfWriteThrds(0),
    fNullStrMode(false),
    fImportDataMode(IMPORT_DATA_TEXT),
    fCpiInvoke(false),
    fBlockMode3(false),
    fbTruncationAsError(false),
    fUUID(boost::uuids::nil_generator()()),
    fConsoleOutput(true),
    fTimeZone("SYSTEM")
{
    try
    {
        appTestFunction();
        parseCmdLineArgs(argc, argv);
    }
    catch (const std::exception& aCaught)
    {
        // Decorate the original message so the user knows where to look next.
        std::string aMsg(aCaught.what());
        aMsg.append("\nTry 'cpimport -h' for more information.");
        throw runtime_error(aMsg);
    }
}

//----------------------------------------------------------------------

// Developer test hook that the constructor calls before parsing the command
// line.  Every experiment below is commented out, so the function currently
// does nothing.
void WECmdArgs::appTestFunction()
{
    // ---- testing begins ----
    //std::string aJobFile("/home/bpaul/Calpont/data/bulk/job/Job_1234.xml");
    //std::string aJobFile("/usr/local/mariadb/columnstore/data/bulk/job/Job_1234.xml");
    //setSchemaAndTableFromJobFile(aJobFile);
    //setEnclByAndEscCharFromJobFile(aJobFile);
    //exit(1);
    // ---- testing ends ----
}

//----------------------------------------------------------------------
std::string WECmdArgs::getCpImportCmdLine()
{
    std::ostringstream aSS;
    std::string aCmdLine;


    aSS << fPrgmName;	//prgm name as arg[0]

    if (fHelp)
    {
        aSS << " -h ";
        aCmdLine = aSS.str();
        return aCmdLine;
    }

    //checkJobIdCase();			// check if JobID


    if ((fPmFile.length() > 0) && (0 == getMode()))
        aSS << " -l " << fPmFile;

    //BUG 4379 if -m is not given while prep args, default is m=1 but
    //on single node -m will set it to 3, after prep args.
    //if((fPmFilePath.length()>0)&&(1!=getMode()))
    //	aSS << " -f " << fPmFilePath;
    if ((fPmFilePath.length() > 0) && (1 != getMode()))
    {
        if (fPmFilePath == "STDIN")	//if stdin, must pass it
            aSS << " -f " << fPmFilePath;
        else if (2 == getArgMode())	//Mode 2 we need to pass the -f option
            aSS << " -f " << fPmFilePath;
        else if (3 == getArgMode()) 	//-m given, -f built in already.
            aSS << " -f " << fPmFilePath;
        else if (0 == fLocFile.length()) //No filename given, from job file
            aSS << " -f " << fPmFilePath;
    }

    if (fUsername.length() > 0)
        aSS << " -U " << fUsername;

    if (fJobId.length() > 0)
        aSS << " -j " << fJobId;

    if (fNoOfReadThrds > 0)
        aSS << " -r " << fNoOfReadThrds;

    if (fNoOfWriteThrds > 0)
        aSS << " -w " << fNoOfWriteThrds;

    if (fMaxErrors >= 0)
        aSS << " -e " << fMaxErrors;

    // BUG 5088
    if (fDebugLvl > 0)
        aSS << " -d " << fDebugLvl;

    if (fSetBufSize > 0)
        aSS << " -B " << fSetBufSize;

    if (fColDelim != '|')
    {
        if (fColDelim == '\t')
            aSS << " -s " << "\\t"; //- working with user '\t'
        // NONE of the following will work.
        //aSS << " -s " << "\t"; //aSS << " -s " << "\"\\t\""; //aSS << " -s " << "'\\t'";
        else
            aSS << " -s " << fColDelim;
    }

    if (fEnclosedChar != 0)
        aSS << " -E " << fEnclosedChar;

    if (fEscChar != 0)
        aSS << " -C " << fEscChar;

    if (fNullStrMode)
        aSS << " -n " << '1';

    if (fImportDataMode != IMPORT_DATA_TEXT)
        aSS << " -I " << fImportDataMode;

    //if(fConfig.length()>0)
    //	aSS << " -c " << fConfig;
    if (fReadBufSize > 0)
    {
        cout << "setting fReadBufSize = " << fReadBufSize;
        aSS << " -c " << fReadBufSize;
    }

    if (fIOReadBufSize > 0)
        aSS << " -b " << fIOReadBufSize;


    if ((fJobPath.length() > 0) && (fMode == 3))
        aSS << " -p " << fJobPath;


    if (fConsoleLog)
        aSS << " -i ";

    if ((fMode == 1) || (fMode == 2))
    {
        aSS << " -R " << getBrmRptFileName();
        aSS << " -m " << fMode;
    }

    aSS << " -P " << getModuleID();
    aSS << " -T " << fTimeZone;

    if (fbTruncationAsError)
        aSS << " -S ";

    if (!fS3Key.empty() && !(fMode == 0 || fMode == 1))
    {
        if (fS3Secret.empty() || fS3Bucket.empty() || fS3Region.empty())
            throw (runtime_error("Not all required S3 options provided"));
        aSS << " -y " << fS3Key;
        aSS << " -K " << fS3Secret;
        aSS << " -t " << fS3Bucket;
        aSS << " -g " << fS3Region;

        if (!fS3Host.empty())
        {
            aSS << " -H " << fS3Host;
        }
    }

    if ((fJobId.length() > 0) && (fMode == 1) && (!fJobLogOnly))
    {
        // if JobPath provided, make it w.r.t WES
        aSS << " -p " << fTmpFileDir;
        aSS << " -fSTDIN";
    }
    else if ((fJobId.length() > 0) && (fMode == 2) && (!fJobLogOnly))
    {
        // if JobPath provided, make it w.r.t WES
        aSS << " -p " << fTmpFileDir;

        if (fPmFile.length() > 0)
            aSS << " -l " << fPmFile;

        if (fPmFilePath.length() > 0)
            aSS << " -f " << fPmFilePath;
    }
    else	// do not provide schema & table with JobId
    {

        if (!fUUID.is_nil())
            aSS << " -u" << boost::uuids::to_string(fUUID);

        if (fSchema.length() > 0)
            aSS << " " << fSchema;
        //else if((fMode != 0)||(fMode==3))	//TODO make it mode3 + jobID
        else if (fJobId.length() > 0)
        { }// may or may not contain Schema.
        //else if((fMode == 1)||(fMode==2))	//TODO make it mode3 + jobID
        else if (fMode != 0)
            throw (runtime_error("Schema not available"));

        if (fTable.length() > 0)
            aSS << " " << fTable;
        else if (fJobId.length() > 0)
        {} //may or may not contain Table.
        else if (fMode != 0)
            throw (runtime_error("Tablename not available"));

        //else if((fMode != 0)||(fMode==3))	//TODO make it mode3 + jobID
        //else if((fMode == 1)||(fMode == 2))	//TODO make it mode3 + jobID
        //    throw (runtime_error("Tablename not available"));
        if ((fPmFile.length() > 0) && (2 == getMode()))
        {
            //if(fPmFilePath.length()>0)
            //	aSS << " " << fPmFilePath;
            aSS << " " << fPmFile;
        }
        else if (2 == getMode())
            throw (runtime_error("loadFile [-l ] not available"));

    }

    if ((fLocFile.length() > 0) && (fLocFile != "STDIN") && (3 == getMode()))
    {
        //Bug 4342 multi-files mode 3 support
        //convert all the spaces into 'commas'
        if (fLocFile.find_first_of(' ') == string::npos)
            aSS << " " << fLocFile;
        else
        {
            std::string aLocFiles = replaceCharInStr(fLocFile, ' ', ',');
            aSS << " " << aLocFiles;
        }
    }

    try
    {
        aCmdLine = aSS.str();
    }
    catch (exception&)
    {
        throw runtime_error("getcpImportCmdLine failed");
    }

    return aCmdLine;
}


//----------------------------------------------------------------------

//BUG 4205 (part FIX) - need to implement more into it
bool WECmdArgs::checkForCornerCases()
{
    //BUG 4210
    this->checkJobIdCase();		//Need to do this before we go further


    if (fMode == 0)
    {
        if (!fJobId.empty())
        {
            //cout << "Invalid option mode 0 with a Job File" << endl;
            throw (runtime_error("Mode 0 with a Job file option is not valid!!"
                                 "\nTry 'cpimport -h' for more information."));
        }
        else if (!fJobPath.empty())
        {
            cout << "Invalid option mode 0 with a Job Path" << endl;
            throw (runtime_error("Mismatched options"
                                 "\nTry 'cpimport -h' for more information."));
        }
        else if (!fSchema.empty())
        {
            cout << "Invalid option in mode 0 with a schema name" << endl;
            throw (runtime_error("Mismatched options."));
        }
        else if (!fTable.empty())
        {
            cout << "Invalid option in mode 0 with a table name" << endl;
            throw (runtime_error("Mismatched options."));
        }
        else if ((!fPmFilePath.empty()) && (fPmFilePath != "STDIN"))
        {
            cout << "Invalid option -f in Mode 0 with value other than STDIN" << endl;
            throw (runtime_error("Mismatched options."));
        }

        if (fSetBufSize)
        {
            cout << "Invalid option -B with Mode 0" << endl;
            throw (runtime_error("Mismatched options."));
        }
        else if (fIOReadBufSize)
        {
            cout << "Invalid option -b with Mode 0" << endl;
            throw (runtime_error("Mismatched options."));
        }
        else if (fMaxErrors >= 0)
        {
            cout << "Invalid option -e with Mode 0" << endl;
            throw (runtime_error("Mismatched options."));
        }
        else if (fConsoleLog)
        {
            cout << "Invalid option -i with Mode 0" << endl;
            throw (runtime_error("Mismatched options."));
        }
        else if (fReadBufSize)
        {
            cout << "Invalid option -c with Mode 0" << endl;
            throw (runtime_error("Mismatched options."));
        }
        else if (fNoOfReadThrds)
        {
            cout << "Invalid option -r with Mode 0" << endl;
            throw (runtime_error("Mismatched options."));
        }
        else if (fNoOfWriteThrds)
        {
            cout << "Invalid option -w with Mode 0" << endl;
            throw (runtime_error("Mismatched options."));
        }

        if (fImportDataMode != IMPORT_DATA_TEXT)
        {
            cout << "Invalid option -I with Mode 0" << endl;
            throw (runtime_error("Mismatched options."));
        }

    }

    if (fMode == 1)
    {
        if (!fJobId.empty())
        {
            if ((!fPmFilePath.empty()) && (fPmFilePath == "STDIN"))
            {
                // do not do anything.. this is good.
            }
        }
        // Mode 1, if Input Path is existing and input file is not existing
        // it is an error, bce it assumes all the files in directory.
        // In mode 2, we are passing info to cpimport.bin, which will take care
        // of it, as in Mode 3.
        else if ((!fPmFilePath.empty()) && (fPmFile.empty()))
        {
            // assumed since position param is missing
            if ((fLocFile == "STDIN") && (fPmFilePath != "STDIN"))
            {
                cout << "Invalid options in Mode 1 : option -l " << endl;
                cout << " or input file position parameter needed" << endl;
                //cout << "\tOption (-j) should follow with option -l option or "
                //		"an input file position parameter" << endl;
                throw (runtime_error("In Mode 1 Error occurred!! "
                                     "\nTry 'cpimport -h' for more information."));
            }
        }
    }

    if (fMode == 2)
    {
        if (fPmFile.empty())
            throw(runtime_error("Mode 2 require PM based filename [-l]"
                                "\nTry 'cpimport -h' for more information."));

        if ((fPmFilePath.empty()) && (fPmFile.at(0) != '/'))
            throw(runtime_error("Mode 2 require remote file opts -f and -l or "\
                                "a fully qualified path for the remote file."
                                "\nTry 'cpimport -h' for more information."));
        if (!fS3Key.empty())
            throw(runtime_error("Mode 2 & an input file from S3 does not make sense."));
    }

    if (fMode == 3)
    {
        if (fPmVec.size())
        {
            cout << "Invalid option -P with Mode 3" << endl;
            throw (runtime_error("Mismatched options."));
        }

    }

    return true;
}

//----------------------------------------------------------------------

// Parses a comma separated list of PM ids (for example "1,2,3") and appends
// every id to V in the order it appears.
//
// PmList  the text to parse; it is read but not modified.
// V       receives the parsed ids; ids parsed before a bad entry stay in V.
//
// Returns false when PmList is empty, true otherwise.  Empty entries, as in
// "1,,2" or a leading/trailing comma, are skipped.
//
// Throws runtime_error ("Wrong PM id format : <entry>") when an entry is not
// a decimal integer that fits in an int.  Blanks before the number and blanks
// or tabs after it are tolerated.
bool WECmdArgs::str2PmList(std::string& PmList, VecInts& V)
{
    if (PmList.empty())
        return false;

    const std::string::size_type aLen = PmList.length();
    std::string::size_type aPos = 0;

    while (aPos < aLen)
    {
        std::string::size_type aComma = PmList.find(',', aPos);

        if (aComma == std::string::npos)
            aComma = aLen;

        if (aComma > aPos)  // skip empty entries between adjacent commas
        {
            const std::string aTok = PmList.substr(aPos, aComma - aPos);
            const char* aBegin = aTok.c_str();
            char* aStop = NULL;

            errno = 0;
            const long aVal = strtol(aBegin, &aStop, 10);

            // strtol leaves aStop at aBegin when it found no digits at all;
            // record that before trailing blanks are skipped.
            const bool aNoDigits = (aStop == aBegin);

            while ((*aStop == ' ') || (*aStop == '\t'))
                ++aStop;

            if (aNoDigits || (*aStop != '\0') || (errno != 0) ||
                    (aVal < INT_MIN) || (aVal > INT_MAX))
            {
                throw runtime_error(std::string("Wrong PM id format : ") + aTok);
            }

            const int aPmId = static_cast<int>(aVal);
            V.push_back(aPmId);
        }

        aPos = aComma + 1;
    }

    return true;
}

//----------------------------------------------------------------------

// Prints the cpimport help text (synopsis, positional parameters, options and
// examples) on stdout and then terminates the process with exit status 1.
// This function does not return.
void WECmdArgs::usage()
{
    cout << "Simple usage using positional parameters (no XML job file):\n";
    cout << "\tcpimport dbName tblName [loadFile] [-h] [-m mode]\n";
    cout << "\t\t [-f path] [-d debugLevel] [-c readbufSize] [-b readBufs] \n";
    cout << "\t\t [-r readers] [-j JobID] [-e maxErrs] [-B libBufSize] [-w parsers]\n";
    cout << "\t\t [-s c] [-E enclosedChar] [-C escapeChar] [-n NullOption]\n";
    cout << "\t\t [-q batchQty] [-p jobPath] [-P list of PMs] [-S] [-i] [-v verbose]\n";
    cout << "\t\t [-I binaryOpt] [-T timeZone]\n";


    cout << "Traditional usage without positional parameters (XML job file required):\n";
    cout << "\tcpimport -j jobID\n";
    cout << "\t\t [-h] [-m mode] [-r readers] [-w parsers] [-s c] [-f path]\n";
    cout << "\t\t [-b readBufs] [-p path] [-c readBufSize] [-e maxErrs] [-B libBufSize]\n";
    cout << "\t\t [-n NullOption] [-E encloseChar] [-C escapeChar] [-i] [-v verbose]\n";
    cout << "\t\t [-d debugLevel] [-q batchQty] [-l loadFile] [-P list of PMs] [-S]\n";
    cout << "\t\t [-I binaryOpt] [-T timeZone]\n";

    cout << "\n\nPositional parameters:\n";
    cout << "\tdbName     Name of the database to load\n";
    cout << "\ttblName    Name of table to load\n";
    cout << "\tloadFile   Optional input file name in current directory,\n";
    cout << "\t\t\tunless a fully qualified name is given.\n";
    cout << "\t\t\tIf not given, input read from STDIN.\n";

    // The "unless a fully qualified input file name is given." line continues
    // the -l description, so it is printed directly after it.
    cout << "\n\nOptions:\n"
         << "\t-b\tNumber of read buffers\n"
         << "\t-c\tApplication read buffer size(in bytes)\n"
         << "\t-d\tPrint different level(1-3) debug message\n"
         << "\t-e\tMax number of allowable error per table per PM\n"
         << "\t-f\tData file directory path.\n"
         << "\t\t\tDefault is current working directory.\n"
         << "\t\t\tIn Mode 1, -f represents the local input file path.\n"
         << "\t\t\tIn Mode 2, -f represents the PM based input file path.\n"
         << "\t\t\tIn Mode 3, -f represents the local input file path.\n"
         << "\t-l\tName of import file to be loaded, relative to -f path,\n"
         << "\t\t\tunless a fully qualified input file name is given.\n"
         << "\t-h\tPrint this message.\n"
         << "\t-q\tBatch Quantity, Number of rows distributed per batch in Mode 1\n"
         << "\t-i\tPrint extended info to console in Mode 3.\n"
         << "\t-j\tJob ID. In simple usage, default is the table OID.\n"
         << "\t-n\tNullOption (0-treat the string NULL as data (default);\n"
         << "\t\t\t1-treat the string NULL as a NULL value)\n"
         << "\t-p\tPath for XML job description file.\n"
         << "\t-r\tNumber of readers.\n"
         << "\t-s\t'c' is the delimiter between column values.\n"
         << "\t-B\tI/O library read buffer size (in bytes)\n"
         << "\t-w\tNumber of parsers.\n"
         << "\t-E\tEnclosed by character if field values are enclosed.\n"
         << "\t-C\tEscape character used in conjunction with 'enclosed by'\n"
         << "\t\t\tcharacter, or as part of NULL escape sequence ('\\N');\n"
         << "\t\t\tdefault is '\\'\n"
         << "\t-I\tImport binary data; how to treat NULL values:\n"
         << "\t\t\t1 - import NULL values\n"
         << "\t\t\t2 - saturate NULL values\n"
         << "\t-P\tList of PMs ex: -P 1,2,3. Default is all PMs.\n"
         << "\t-S\tTreat string truncations as errors.\n"
         << "\t-m\tmode\n"
         << "\t\t\t1 - rows will be loaded in a distributed manner across PMs.\n"
         << "\t\t\t2 - PM based input files loaded onto their respective PM.\n"
         << "\t\t\t3 - input files will be loaded on the local PM.\n"
         << "\t-T\tTimezone used for TIMESTAMP datatype.\n"
         << "\t\tPossible values: \"SYSTEM\" (default)\n"
         << "\t\t               : Offset in the form +/-HH:MM\n"
         << "\t-y\tS3 Authentication Key (for S3 imports)\n"
         << "\t-K\tS3 Authentication Secret (for S3 imports)\n"
         << "\t-t\tS3 Bucket (for S3 imports)\n"
         << "\t-H\tS3 Hostname (for S3 imports, Amazon's S3 default)\n"
         << "\t-g\tS3 Region (for S3 imports)\n";

    // Examples are numbered consecutively, 1 through 7.
    cout << "\nExample1: Traditional usage\n"
         << "\tcpimport -j 1234";
    cout << "\nExample2: Some column values are enclosed within double quotes.\n"
         << "\tcpimport -j 3000 -E '\"'";
    cout << "\nExample3: Import a nation table without a Job XML file\n"
         << "\tcpimport -j 301 tpch nation nation.tbl";
    cout << "\nExample4: Import a nation table to all PMs in Mode 1\n"
         << "\tcpimport -m 1 tpch nation nation.tbl";
    cout << "\nExample5: Import a nation table to only PM1 and PM2 in Mode 1\n"
         << "\tcpimport -m 1 -P 1,2 tpch nation nation.tbl";
    cout << "\nExample6: Import nation.tbl from PMs to nation table in Mode 2\n"
         << "\tcpimport -m 2 tpch nation -f /var/lib/columnstore/data/bulk/data/import/ -l nation.tbl";
    cout << "\nExample7: Import nation.tbl in mode 3\n"
         << "\tcpimport -m 3 tpch nation nation.tbl\n\n";


    exit(1);
}


//-----------------------------------------------------------------------------

void WECmdArgs::parseCmdLineArgs(int argc, char** argv)
{
    int aCh;
    std::string importPath;
    bool aJobType = false;


    if (argc > 0)
        fPrgmName = "cpimport.bin"; //argv[0] is splitter but we need cpimport

    while ((aCh = getopt(argc, argv,
                         "d:j:w:s:v:l:r:b:e:B:f:q:ihm:E:C:P:I:n:p:c:ST:Ny:K:t:H:g:U:"))
            != EOF)
    {
        switch (aCh)
        {
            case 'm':
            {
                fArgMode = atoi(optarg);

                //cout << "Mode level set to " << fMode << endl;
                if ((fArgMode > -1) && (fArgMode <= 3)) {}
                else
                    throw runtime_error("Wrong Mode level");

                break;
            }

            case 'B':
            {
                errno = 0;
                long lValue = strtol(optarg, 0, 10);

                if ((errno != 0) || (lValue < 1) || (lValue > INT_MAX))
                    throw runtime_error("Option -B is invalid or out of range");

                fSetBufSize = lValue;
                break;
            }

            case 'b':
            {
                errno = 0;
                long lValue = strtol(optarg, 0, 10);

                if ((errno != 0) || (lValue < 1) || (lValue > INT_MAX))
                    throw runtime_error("Option -b is invalid or out of range");

                fIOReadBufSize = lValue;
                break;
            }

            case 'e':
            {
                errno = 0;
                long lValue = strtol(optarg, 0, 10);

                if ((errno != 0) || (lValue < 0) || (lValue > INT_MAX))
                    throw runtime_error("Option -e is invalid or out of range");

                fMaxErrors = lValue;
                break;
            }

            case 'i':
            {
                fConsoleLog = true;
                break;
            }

            case 'c':
            {
                errno = 0;
                long lValue = strtol(optarg, 0, 10);

                if ((errno != 0) || (lValue < 1) || (lValue > INT_MAX))
                    throw runtime_error("Option -c is invalid or out of range");

                fReadBufSize = lValue;
                break;
            }

            case 'j': // -j: jobID
            {
                errno = 0;
                long lValue = strtol(optarg, 0, 10);

                if ((errno != 0) || (lValue < 0) || (lValue > INT_MAX))
                    throw runtime_error("Option -j is invalid or out of range");

                fJobId = optarg;
                fOrigJobId = fJobId;	// in case if we need to split it.

                if (0 == fJobId.length()) throw runtime_error("Wrong JobID Value");

                aJobType = true;
                break;
            }

            case 'v': // verbose
            {
                string aVerbLen = optarg;
                fVerbose = aVerbLen.length();
                fDebugLvl = fVerbose;
                break;
            }

            case 'd': // -d debug
            {
                errno = 0;
                long lValue = strtol(optarg, 0, 10);

                if ((errno != 0) || (lValue < 1) || (lValue > INT_MAX))
                    throw runtime_error("Option -d is invalid or out of range");

                fDebugLvl = lValue;

                if (fDebugLvl > 0 && fDebugLvl <= 3)
                {
                    cout << "\nDebug level set to " << fDebugLvl << endl;
                }
                else
                {
                    throw runtime_error("Wrong Debug level");
                }

                break;
            }

            case 'r': // -r: num read threads
            {
                errno = 0;
                long lValue = strtol(optarg, 0, 10);

                if ((errno != 0) || (lValue < 1) || (lValue > INT_MAX))
                    throw runtime_error("Option -r is invalid or out of range");

                fNoOfReadThrds = lValue;
                break;
            }

            case 'w': // -w: num parse threads
            {
                errno = 0;
                long lValue = strtol(optarg, 0, 10);

                if ((errno != 0) || (lValue < 1) || (lValue > INT_MAX))
                    throw runtime_error("Option -w is invalid or out of range");

                fNoOfWriteThrds = lValue;
                break;
            }

            case 's': // -s: column delimiter
            {
                if (!strcmp(optarg, "\\t"))
                {
                    fColDelim = '\t';

                    if (fDebugLvl) cout << "Column delimiter : " << "\\t" << endl;
                }
                else
                {
                    fColDelim = optarg[0];

                    if (fDebugLvl) cout << "Column delimiter : " << fColDelim << endl;
                }

                break;
            }

            case 'l': // -l: if JobId (-j), it can be input file
            {
                fPmFile = optarg;

                if (0 == fPmFile.length()) throw runtime_error("Wrong local filename");

                break;
            }

            case 'f': // -f: import file path
            {
                fPmFilePath = optarg;
                break;
            }

            case 'n': // -n: treat "NULL" as null
            {
                // default is 0, ie it is equal to not giving this option
                int nullStringMode = atoi(optarg);

                if ((nullStringMode != 0) && (nullStringMode != 1))
                {
                    throw (runtime_error(
                               "Invalid NULL option; value can be 0 or 1"));
                }

                if (nullStringMode)
                    fNullStrMode = true;
                else
                    fNullStrMode = false; // This is default

                break;
            }

            case 'P': // -p: list of PM's
            {
                try
                {
                    std::string aPmList = optarg;

                    if (!str2PmList(aPmList, fPmVec))
                        throw(runtime_error("PM list is wrong"));
                }
                catch (runtime_error& ex)
                {
                    throw (ex);
                }

                break;
            }

            case 'p':
            {
                fJobPath = optarg;
                break;
            }

            case 'E': // -E: enclosed by char
            {
                fEnclosedChar = optarg[0];
                //cout << "Enclosed by Character : " << optarg[0] << endl;
                break;
            }

            case 'C': // -C: enclosed escape char
            {
                fEscChar = optarg[0];
                //cout << "Escape Character  : " << optarg[0] << endl;
                break;
            }

            case 'h': // -h: help
            {
                //usage(); // will exit(1) here
                fHelp = true;
                break;
            }

            case 'I': // -I: binary mode (null handling)
            {
                // default is text mode, unless -I option is specified
                int binaryMode = atoi(optarg);

                if (binaryMode == 1)
                {
                    fImportDataMode = IMPORT_DATA_BIN_ACCEPT_NULL;
                }
                else if (binaryMode == 2)
                {
                    fImportDataMode = IMPORT_DATA_BIN_SAT_NULL;
                }
                else
                {
                    throw (runtime_error(
                               "Invalid Binary mode; value can be 1 or 2"));
                }

                break;
            }

            case 'S': // -S: Treat string truncations as errors
            {
                setTruncationAsError(true);
                //cout << "TruncationAsError  : true" << endl;
                break;
            }

            case 'T':
            {
                std::string timeZone = optarg;
                long offset;

                if (timeZone != "SYSTEM" && dataconvert::timeZoneToOffset(timeZone.c_str(), timeZone.size(), &offset))
                {
                    throw (runtime_error(
                               "Value for option -T is invalid"));
                }

                fTimeZone = timeZone;
                break;
            }

            case 'q': // -q: batch quantity - default value is 10000
            {
                errno = 0;
                long long lValue = strtoll(optarg, 0, 10);

                if ((errno != 0) || (lValue < 1) || (lValue > UINT_MAX))
                    throw runtime_error("Option -q is invalid or out of range");

                fBatchQty = lValue;

                if (fBatchQty < 10000) fBatchQty = 10000;
                else if (fBatchQty > 100000) fBatchQty = 10000;

                break;
            }

            case 'N': //-N no console output
            {
                fConsoleOutput = false;
                break;
            }

            case 'y': //-y S3 Key
            {
                fS3Key = optarg;
                break;
            }

            case 'K': //-K S3 Secret
            {
                fS3Secret = optarg;
                break;
            }

            case 'H': //-H S3 Host
            {
                fS3Host = optarg;
                break;
            }

            case 't': //-t S3 bucket
            {
                fS3Bucket = optarg;
                break;
            }

            case 'g': //-g S3 Region
            {
                fS3Region = optarg;
                break;
            }

            case 'U': //-U username of the files owner
            {
                fUsername = optarg;
                break;
            }

            default:
            {
                std::string aErr = "Unknown command line option " + aCh;
                //cout << "Unknown command line option " << aCh << endl;
                throw (runtime_error(aErr));
            }
        }
    }

    if (fHelp) usage();	//BUG 4210

    if (fArgMode != -1) fMode = fArgMode;	//BUG 4210

    std::string bulkRootPath = getBulkRootDir();

    checkForBulkLogDir(bulkRootPath);

    if (2 == fArgMode && fPmFilePath.empty())
        throw runtime_error("-f option is mandatory with mode 2.");

    if (aJobType)
    {
        if (0 == fArgMode) throw runtime_error("Incompatible mode and option types");

        if (optind < argc)
        {
            fSchema = argv[optind]; // 1st pos parm
            optind++;

            if (optind < argc)
            {
                fTable = argv[optind]; // 2nd pos parm
                optind++;
            }
            else
            {
                // if schema is there, table name should be there
                throw runtime_error("No table name specified with schema.");
            }

            if (optind < argc) // see if input file name is given
            {
                // 3rd pos parm
                fLocFile = argv[optind];

                if ((fLocFile.at(0) != '/') && (fLocFile != "STDIN"))
                {
                    std::string aTmp = fLocFile;

                    // BUG 4379 -f given? use that
                    if ((!fPmFilePath.empty()) && (fMode == 1))
                        fLocFile = fPmFilePath + "/" + aTmp;
                    else if (fPmFilePath.empty())
                        fLocFile = bulkRootPath + "/data/import/" + aTmp;
                }
            }
            else
            {
                if (!fPmFile.empty())
                    fLocFile = fPmFile;
                //BUG 4186
                //else  // else take it from the jobxml file
                //	fLocFile = "STDIN";
                //Historically cpimport works with jobfile as
                // -l <fileName> && -f <filePath>   or
                // -fSTDIN as the stdin, it will override colxml loadfile entry
                // if -fSTDIN is not provided get i/p file from jobfile
                else if ((!fPmFilePath.empty()) && (fPmFilePath == "STDIN"))
                    fLocFile = "STDIN";

                // else take it from the jobxml file
            }

            if ((fSchema.length() > 0) && (fTable.length() > 0) && (fLocFile.length() > 0))
                fJobLogOnly = true;
        }
        else
        {
            if (!fPmFile.empty())
            {
                fLocFile = fPmFile;

                if (!fPmFilePath.empty())
                {
                    if (fPmFilePath == "STDIN")
                    {
                        throw runtime_error("Conflicting options -l and -fSTDIN");
                    }
                    else
                    {
                        std::string aTmp = fLocFile;

                        if ((!fPmFilePath.empty()) && (fMode == 1)) //BUG 4379 -f given? use that
                            fLocFile = fPmFilePath + "/" + aTmp;
                        else if (!fPmFilePath.empty())
                            fLocFile = bulkRootPath + "/data/import/" + aTmp;
                    }

                }

                if ((fLocFile.at(0) != '/') && (fLocFile != "STDIN") && (fPmFilePath.empty()))
                {
                    std::string aTmp = fLocFile;
                    fLocFile = bulkRootPath + "/data/import/" + aTmp;
                }
            }
            //BUG 4186
            //else
            //	fLocFile = "STDIN";
            //Historically cpimport works with jobfile as
            // -l <fileName> && -f <filePath>   or
            // -fSTDIN as the stdin, it will override colxml loadfile entry
            // if -fSTDIN is not provided get i/p file from jobfile
            else if ((!fPmFilePath.empty()) && (fPmFilePath == "STDIN"))
                fLocFile = "STDIN";

            // else take it from the jobxml file
        }

    }
    // Get positional arguments, User can provide:
    // 1. no positional parameters	- Mode 0 & stdin
    // 2. Two positional parameters (schema and table names) - Mode 1/2, stdin
    // 3. Three positional parameters (schema, table, and import file name)
    else if (optind < argc) // see if db schema name is given
    {
        if (fArgMode == 0)
        {
            //added the code as per BUG 4245
            if (!fPmFilePath.empty())
            {
                fLocFile = fPmFilePath;

                if (fLocFile != "STDIN")
                    throw(runtime_error("ERROR: In Mode 0, -f option can only have value STDIN"));
            }
            else
            {
                fLocFile = argv[optind];
                optind++;
            }

            if (optind < argc) //dest filename provided
            {
                fPmFile = argv[optind];

                if ((fPmFile.at(0) != '/') && (fS3Key.empty()))
                {
                    std::string aTmp = fPmFile;
                    fPmFile = bulkRootPath + "/data/import/" + aTmp;
                }
            }
            else // no dest filename
            {
                if (fLocFile == "STDIN")
                    throw(runtime_error("ERROR: Destination file name required!!"));

                if (fLocFile.at(0) == '/')	//local FQ-filename,parse out filename
                    fPmFile = getFileNameFromPath(fLocFile);
                else
                    fPmFile = fLocFile;

                if ((fPmFile.at(0) != '/') && (fS3Key.empty()))	//should be true all the time
                {
                    std::string aTmp = fPmFile;
                    fPmFile = bulkRootPath + "/data/import/" + aTmp;
                }
            }

            /* commented out for BUG 4245
            if(fPmFilePath.empty())
            	fLocFile = argv[optind];
            else
            	fLocFile = fPmFilePath +"/"+ argv[optind];

            if (fPmFile.empty()) //BUG 4200
            {
            	//if(fLocFile.at(0)== '/')
            	//	fPmFile = fLocFile;
            	//else
            	if(fLocFile.at(0)!='/')
            		fPmFile = bulkRootPath + "/data/import/"+ fLocFile;
            }
            else
            {
            	if(fPmFile.at(0)!='/')
            	{
            		std::string aTmp = fPmFile;
            		fPmFile = bulkRootPath + "/data/import/"+aTmp;
            	}
            }
            */
        }
        else
            fSchema = argv[optind]; // 1st pos parm

        optind++;

        if (optind < argc) // see if table name is given
        {
            fTable = argv[optind]; // 2nd pos parm
            optind++;

            if (optind < argc) // see if input file name is given
            {
                // 3rd pos parm
                fLocFile = argv[optind];

                //BUG 4379 if -f option given we need to use that path,
                //over riding bug 4231. look at the code below
                //BUG 4231 - This bug over writes 4199 and commenting out changes
                //BUG 4199
                //Path not provided, not fully qualified, Look in import dir
                //if((fLocFile.at(0)!= '/')&&(fLocFile != "STDIN"))
                //{
                //	std::string aTmp = fLocFile;
                //	fLocFile = bulkRootPath + "/data/import/"+ aTmp;
                //}
                //BUG 4379 if -f option given we need to use that path
                if ((fLocFile.at(0) != '/') && (fLocFile != "STDIN"))
                {
                    std::string aTmp = fLocFile;

                    //if -f given? use that otherwise just go ahead with CWD
                    if ((!fPmFilePath.empty()) && (fMode == 1))
                        fLocFile = fPmFilePath + "/" + aTmp;

                    // TODO - if -f option is given and a list of files are
                    // are provided, we need to be able to import all that.
                }


            }
            else
            {
                if (fPmFile.length() > 0)
                {
                    // BUG 4210
                    //if (fPmFilePath.length() > 0)
                    //{
                    //	fLocFile = fPmFilePath +"/"+ fPmFile;
                    //}
                    //else
                    if (fPmFilePath.empty())
                    {
                        //NOTE - un-commenting with an if statement for Mode 2
                        //BUG 4231 makes it comment out the below changes,
                        //This will not change even though directly, to be
                        //on safer side, we should take out this too.
                        //check path fully qualified? then set as data import
                        if (2 == fArgMode)
                        {
                            //BUG 4342
                            if ((fPmFile.at(0) != '/') && (fS3Key.empty()))
                            {
                                std::string aTmp = fPmFile;
                                fPmFile = PrepMode2ListOfFiles(aTmp);
                            }
                            else
                            {
                                if (fPmFile.find_first_of(' ') != string::npos)
                                {
                                    std::string aPmFiles = replaceCharInStr(fPmFile, ' ', ',');
                                    fPmFile = aPmFiles;
                                }
                            }
                        }

                        fLocFile = fPmFile;
                    }
                }
                else
                {
                    fLocFile = "STDIN";
                }

                //cout << "LocFile set as stdin" << endl;
            }
        }
        else
        {
            // If Mode is not 0 and table name is a required argument
            if (fArgMode != 0)
                throw(runtime_error("No table name specified with schema."));
        }

    }
    else
    {
        // for testing we are allowing data from stdin even with Mode 0
        // that is without LocFileName
        if (0 == fArgMode)
        {
            fLocFile = "STDIN";	//cout << "LocFile set as stdin" << endl;
        }
        else
        {
            // If Mode 0, LocFileName is reqd and otherwies Schema is required
            throw (runtime_error("No schema or local filename specified."));
        }
    }

    /* check for all-or-nothing cmdline args to enable S3 import */
    int s3Tmp = (fS3Key.empty() ? 0 : 1) + (fS3Bucket.empty() ? 0 : 1) +
        (fS3Secret.empty() ? 0 : 1) + (fS3Region.empty() ? 0 : 1);
    if (s3Tmp != 0 && s3Tmp != 4)
        throw runtime_error("The access key, secret, bucket, and region are all required to import from S3");
}

// Build the full path of the job XML file for the current job id:
// "<job dir>/Job_<fJobId>.xml". Returns an empty string when no job id is set.
// When fJobPath is empty it is derived from the configured BulkRoot and
// stored in fJobPath. The sub-directory is spelled "job" (lower case) so that
// it agrees with the directory created by checkForBulkLogDir() and with the
// path built by checkJobIdCase(); the former "/Job" spelling named a
// directory that is never created on a case-sensitive file system.
std::string WECmdArgs::getJobFileName()
{
    if (fJobId.empty())
        return std::string();

    if (fJobPath.empty())
    {
        fJobPath = config::Config::makeConfig()->getConfig("WriteEngine",
                   "BulkRoot") + "/job";
    }

    return fJobPath + "/Job_" + fJobId + ".xml";
}

bool WECmdArgs::getPmStatus(int Id)
{
    // if no PMID's provided on cmdline, return true;
    if (0 == fPmVec.size()) return true;

    VecInts::iterator aIt = fPmVec.begin();

    while (aIt != fPmVec.end())
    {
        if (*aIt == static_cast<unsigned int>(Id))
            return true;

        ++aIt;
    }

    return false;
}


//------------------------------------------------------------------------------
// It is a recursive call.
std::string WECmdArgs::getBrmRptFileName()
{
    if (!fBrmRptFile.empty())
        return fBrmRptFile;

    string brmRptFileName = getTmpFileDir();

    if (!brmRptFileName.empty())
    {
        fTmpFileDir = brmRptFileName;
        char aBuff[64];
        time_t aTime;
        struct tm pTm;
        time(&aTime);
        localtime_r(&aTime, &pTm);

        // BUG 4424
        //			M   D   H   M   S
        snprintf(aBuff, sizeof(aBuff), "/BrmRpt%02d%02d%02d%02d%02d%d.rpt",
                 pTm.tm_mon, pTm.tm_mday, pTm.tm_hour,
                 pTm.tm_min, pTm.tm_sec, getpid());
        brmRptFileName += aBuff;
    }
    else
    {
        //cout << "ERROR: Could not find TempFileDir in Columnstore.xml" << endl;
        throw (runtime_error("Could not find TempFileDir in Columnstore.xml"));
    }

    setBrmRptFileName(brmRptFileName);

    return brmRptFileName;

}
//------------------------------------------------------------------------------

void WECmdArgs::addJobFilesToVector(std::string& JobName)
{
    //if((!fSchema.empty())&&(!fTable.empty())&&(!fLocFile.empty())) return;

    WEXmlgetter aXmlGetter(JobName);
    vector<string> aSections;
    aSections.push_back("BulkJob");
    aSections.push_back("Schema");
    aSections.push_back("Table");

    //BUG 4163
    typedef std::vector<string> TableVec;
    TableVec aTableVec;
    aXmlGetter.getConfig(aSections[1], aSections[2], aTableVec);
    setMultiTableCount(aTableVec.size());

    if (getMultiTableCount() > 1)
    {
        splitConfigFilePerTable(JobName, aTableVec.size());
    }
    else
    {
        fVecJobFiles.push_back(JobName);
    }

}

//------------------------------------------------------------------------------
// Set the schema, table, and loadfile name from the xml job file.
// If running in binary mode, we also get the list of columns for the table,
// so that we can determine the exact fixed record length of the incoming data.
//------------------------------------------------------------------------------
void WECmdArgs::setSchemaAndTableFromJobFile(std::string& JobName)
{
    if (((fVecJobFiles.size() == 1) && (!fSchema.empty()) &&
            (!fTable.empty()) && (!fLocFile.empty()))  &&
            (fImportDataMode == IMPORT_DATA_TEXT)) return;

    WEXmlgetter aXmlGetter(JobName);
    vector<string> aSections;
    aSections.push_back("BulkJob");
    aSections.push_back("Schema");
    aSections.push_back("Table");

    // Reset the fSchema, fTable, and FLocFile
    if ((fVecJobFiles.size() > 1) ||
            (fSchema.empty()) || (fTable.empty()) || (fLocFile.empty()))
    {
        std::string aSchemaTable;
        std::string aInputFile;

        aSchemaTable = aXmlGetter.getAttribute(aSections, "tblName");

        if (getDebugLvl() > 1) cout << "schema.table = " << aSchemaTable << endl;

        aInputFile = aXmlGetter.getAttribute(aSections, "loadName");

        if (getDebugLvl() > 1) cout << "xml::InputFile = " << aInputFile << endl;

        if (aSchemaTable.length() > 0)
        {
            char aSchema[64];
            char aTable[64];
            int aRet = aSchemaTable.find('.');

            if (aRet > 0)
            {
                int aLen = aSchemaTable.copy(aSchema, aRet);

                if (getDebugLvl() > 1) cout << "Schema: " << aSchema << endl;

                aSchema[aLen] = 0;

                if (fSchema.empty()) fSchema = aSchema;

                aLen = aSchemaTable.copy(aTable, aSchemaTable.length(), aRet + 1 );
                aTable[aLen] = 0;

                if (getDebugLvl() > 1) cout << "Table: " << aTable << endl;

                fTable = aTable;
            }
            else
                throw runtime_error(
                    "JobFile ERROR: Can't get Schema and Table Name");
        }
        else
        {
            throw runtime_error(
                "JobFile ERROR: Can't get Schema and Table Name");
        }

        if ((fLocFile.empty()) && (!aInputFile.empty()))
        {
            string bulkRootPath = config::Config::makeConfig()->getConfig(
                                      "WriteEngine", "BulkRoot");

            if (aInputFile.at(0) == '/')
                fLocFile = aInputFile;
            else if ((!fPmFilePath.empty()) && (fMode == 1))
                fLocFile = fPmFilePath + "/" + aInputFile;
            else if ((!bulkRootPath.empty()) && (fPmFilePath.empty()))
                fLocFile = bulkRootPath + "/data/import/" + aInputFile;
            else
                fLocFile = aInputFile;

            if (fArgMode == 2) fPmFile = fLocFile;
        }

        if (getDebugLvl() > 1) cout << "schema = " << fSchema << endl;

        if (getDebugLvl() > 1) cout << "TableName = " << fTable << endl;

        if (getDebugLvl() > 1) cout << "Input File = " << fLocFile << endl;
    }

    // Reset the list of columns we will be importing from the input data
    fColFldsFromJobFile.clear();

    if (fImportDataMode != IMPORT_DATA_TEXT)
    {
        aSections.push_back("Column");
        aXmlGetter.getAttributeListForAllChildren(
            aSections, "colName", fColFldsFromJobFile);
    }
}

//------------------------------------------------------------------------------
void WECmdArgs::checkJobIdCase()
{
    if ((fJobId.empty()) || (fJobLogOnly) || (fMode == 3) || (fMode == 0)) return;

    if (fJobPath.empty())
    {
        string bulkRootPath = config::Config::makeConfig()->getConfig(
                                  "WriteEngine", "BulkRoot");
        //cout << "checkJobIdCase::BulkRoot: " << bulkRootPath << endl;

        if (!bulkRootPath.empty())
            fJobPath = bulkRootPath + "/job";
        else
            throw runtime_error("Config Error: BulkRoot not found in Columnstore.xml");
    }

    char aBuff[256];

    if (!fJobPath.empty())
        snprintf(aBuff, sizeof(aBuff), "%s/Job_%s.xml", fJobPath.c_str(),
                 fJobId.c_str());
    else	// for time being
        snprintf(aBuff, sizeof(aBuff), "/var/lib/columnstore/data/bulk/job/Job_%s.xml",
                 fJobId.c_str());

    std::string aJobFileName(aBuff);

    //cout << "checkJobIdCase::aJobFileName: " << aJobFileName << endl;


    //BUG 4171
    addJobFilesToVector(aJobFileName);

    aJobFileName =  fVecJobFiles[0];
    setSchemaAndTableFromJobFile(aJobFileName);
    setEnclByAndEscCharFromJobFile(aJobFileName);

}

//------------------------------------------------------------------------------

// Return the temp file directory. The value is taken from fTmpFileDir when
// set; otherwise it is read from startup::StartUp::tmpDir() and kept in
// fTmpFileDir. Throws runtime_error when the directory is still empty.
std::string WECmdArgs::getTmpFileDir()
{
    if (fTmpFileDir.empty())
    {
        fTmpFileDir = startup::StartUp::tmpDir();

        if (fTmpFileDir.empty())
            throw( runtime_error("Config ERROR: TmpFileDir not found!!"));
    }

    return fTmpFileDir;
}

//------------------------------------------------------------------------------

// Return the bulk root directory. The value is taken from fBulkRoot when
// set; otherwise the WriteEngine/BulkRoot configuration entry is read and
// kept in fBulkRoot. Throws runtime_error when the entry is empty.
std::string WECmdArgs::getBulkRootDir()
{
    if (fBulkRoot.empty())
    {
        fBulkRoot = config::Config::makeConfig()->getConfig("WriteEngine",
                    "BulkRoot");

        if (fBulkRoot.empty())
            throw( runtime_error("Config ERROR: <BulkRoot> not found!!"));
    }

    return fBulkRoot;
}

//------------------------------------------------------------------------------

// Return the batch quantity; values below 10000 are reported as 10000.
unsigned int WECmdArgs::getBatchQuantity()
{
    if (fBatchQty < 10000)
        return 10000;	//default Batch Qty is 10000

    return fBatchQty;
}

//------------------------------------------------------------------------------

void WECmdArgs::setEnclByAndEscCharFromJobFile(std::string& JobName)
{
    if ((fEnclosedChar == 0))	// check anything in Jobxml file
    {
        WEXmlgetter aXmlGetter(JobName);
        vector<string> aSections;
        aSections.push_back("BulkJob");
        aSections.push_back("EnclosedByChar");

        try
        {
            //std::string aTable = aXmlGetter.getConfig(aSection, aElement);
            std::string aEnclosedBy = aXmlGetter.getValue(aSections);

            if (getDebugLvl() > 1)cout << "aEncloseBy = " << aEnclosedBy << endl;

            if (!aEnclosedBy.empty())
            {
                fEnclosedChar = aEnclosedBy.at(0);
            }
        }
        catch (std::runtime_error&)
        {
            // do not do anything
        }
    }

    if (fEscChar == 0)	// check anything in Jobxml file
    {
        WEXmlgetter aXmlGetter(JobName);
        vector<string> aSections;
        aSections.push_back("BulkJob");
        aSections.push_back("EscapeChar");

        try
        {
            //std::string aTable = aXmlGetter.getConfig(aSection, aElement);
            std::string aEscChar = aXmlGetter.getValue(aSections);

            if (getDebugLvl() > 1) cout << "aEscapeChar = " << aEscChar << endl;

            if (!aEscChar.empty())
            {
                fEscChar = aEscChar.at(0);
            }
        }
        catch (std::runtime_error&)
        {
            // do not do anything
        }
    }

}

//------------------------------------------------------------------------------
// Return the part of Path that follows the last '/'; the whole of Path when
// it contains no '/', and an empty string when Path ends with '/'.
// Uses substr() instead of a fixed 64-byte buffer, which was overrun by file
// names of 64 or more characters.
std::string WECmdArgs::getFileNameFromPath(const std::string& Path) const
{
    const std::string::size_type aSlashPos = Path.find_last_of('/');

    if (aSlashPos == std::string::npos)
        return Path;

    return Path.substr(aSlashPos + 1);
}

//------------------------------------------------------------------------------
std::string WECmdArgs::getModuleID()
{
    oam::Oam oam;
    oam::oamModuleInfo_t sModInfo;
    std::string sModuleID;
    char szModuleIDandPID[64];
    int nModuleNumber;

    try
    {
        sModInfo = oam.getModuleInfo();
        sModuleID = boost::get < 1 > (sModInfo);
        nModuleNumber = boost::get < 2 > (sModInfo);
        snprintf(szModuleIDandPID, sizeof(szModuleIDandPID), "%s%d-%d",
                 sModuleID.c_str(), nModuleNumber, getpid());
        sModuleID = szModuleIDandPID;
    }
    catch (exception&)
    {
        sModuleID = "unknown";
    }

    return sModuleID;
}

//------------------------------------------------------------------------------


void WECmdArgs::splitConfigFilePerTable(std::string& ConfigName, int tblCount)
{
    std::string aOpenTag = "<Table ";
    std::string aCloseTag = "</Table>";
    std::string aCloseSchemaTag = "</Schema>";

    std::vector<std::ofstream*> aVecFiles;

    //std::vector<std::string> aVecConfigs;
    for (int aIdx = 1; aIdx <= tblCount; aIdx++)
    {
        char aConfName[128];
        snprintf(aConfName, sizeof(aConfName), "%s_%d.xml", ConfigName.c_str(), aIdx);
        //aVecConfigs.push_back(aConfName);
        fVecJobFiles.push_back(aConfName);
        std::ofstream* pCopy = new std::ofstream;
        //pCopy->open(aConfName, std::ios_base::app);
        pCopy->open(aConfName);
        aVecFiles.push_back(pCopy);
    }


    std::ifstream aMaster;
    aMaster.open(ConfigName.c_str());

    if (aMaster.is_open())
    {
        char aBuff[256];
        int aTblNo = 0;
        size_t aStrPos = std::string::npos;
        bool aOpenFound = false;
        bool aCloseFound = false;

        while (!aMaster.eof())
        {
            aMaster.getline(aBuff, sizeof(aBuff) - 1);
            unsigned int aLen = aMaster.gcount();

            if ((aLen < (sizeof(aBuff) - 2)) && (aLen > 0))
            {
                aBuff[aLen - 1] = '\n';
                aBuff[aLen] = 0;
                string aData = aBuff;
                //cout << "Data Read " << aBuff;

                if (!aOpenFound)
                {
                    aStrPos = aData.find(aOpenTag);

                    if (aStrPos != std::string::npos)
                    {
                        aOpenFound = true;
                        aTblNo++;
                        write2ConfigFiles(aVecFiles, aBuff, aTblNo);
                    }
                    else
                    {
                        if ((!aOpenFound) && (aCloseFound))
                        {
                            aStrPos = aData.find(aCloseSchemaTag);

                            if (aStrPos != std::string::npos)
                            {
                                aOpenFound = false;
                                aCloseFound = false;
                                aTblNo = 0;
                            }
                        }

                        write2ConfigFiles(aVecFiles, aBuff, aTblNo);
                    }
                }
                else
                {
                    aStrPos = aData.find(aCloseTag);

                    if (aStrPos != std::string::npos)
                    {
                        aOpenFound = false;
                        aCloseFound = true;
                        write2ConfigFiles(aVecFiles, aBuff, aTblNo);
                    }
                    else
                    {
                        write2ConfigFiles(aVecFiles, aBuff, aTblNo);
                    }
                }
            }
        }//while Master.eof
    }
    else
    {
        throw runtime_error("Could not open Job Config file");
    }


    for (unsigned int Idx = 0; Idx < aVecFiles.size(); Idx++)
    {
        aVecFiles[Idx]->close();
        delete aVecFiles[Idx];
    }

    aVecFiles.clear();

}

//------------------------------------------------------------------------------

// Write the NUL-terminated text pBuff to the split job files.
//   FileIdx == 0 : write to every stream in Files;
//   FileIdx >= 1 : write to Files[FileIdx - 1] only.
// Throws std::out_of_range when FileIdx is negative or larger than
// Files.size(); the index was previously used unchecked.
void WECmdArgs::write2ConfigFiles(std::vector<std::ofstream*>& Files,
                                  char* pBuff, int FileIdx)
{
    const std::streamsize aLen = static_cast<std::streamsize>(strlen(pBuff));

    if (FileIdx == 0)
    {
        for (std::vector<std::ofstream*>::iterator aIt = Files.begin();
                aIt != Files.end(); ++aIt)
        {
            (*aIt)->write(pBuff, aLen);
        }

        return;
    }

    // A negative FileIdx - 1 converts to a huge unsigned index, which at()
    // rejects as well.
    Files.at(FileIdx - 1)->write(pBuff, aLen);
}

//------------------------------------------------------------------------------

void WECmdArgs::updateWithJobFile(int Idx)
{
    setLocFile("");	// resetting the from the previous import
    std::string aJobFileName =  fVecJobFiles[Idx];
    setSchemaAndTableFromJobFile(aJobFileName);
    setEnclByAndEscCharFromJobFile(aJobFileName);
    setJobFileName(aJobFileName);

    std::ostringstream aSS;
    aSS << fOrigJobId << ".xml_" << (Idx + 1);
    fJobId = aSS.str();
}


//------------------------------------------------------------------------------

// Return a copy of Str in which every occurrence of C is replaced by R.
// The previous find-based loop stopped at the first pair of adjacent C
// characters and dropped the remainder of the string (e.g. "a  b" with
// ' ' -> ',' produced "a,"); every character is now visited.
std::string WECmdArgs::replaceCharInStr(const std::string& Str, char C, char R)
{
    std::string aResult(Str);

    for (std::string::size_type aPos = 0; aPos < aResult.size(); ++aPos)
    {
        if (aResult[aPos] == C)
            aResult[aPos] = R;
    }

    return aResult;
}

//------------------------------------------------------------------------------
// Introduced to handle Bug 4342 with Mode 2

std::string WECmdArgs::PrepMode2ListOfFiles(std::string& FileName)
{
    // FileName holds one or more file names separated by ' ', ',' or '|'.
    // Returns the names joined with ','; a name that does not start with '/'
    // is prefixed with "<bulk root>/data/import/".
    //
    // Empty names (adjacent, leading or trailing separators) are skipped.
    // Previously two adjacent separators (e.g. "a, b") ended the scan and
    // dropped the remaining files, and a leading or trailing separator made
    // at(0) throw std::out_of_range on an empty name.
    const std::string bulkRootPath = getBulkRootDir();
    const char* sep = " ,|";
    const bool aDebug = (getDebugLvl() > 1);

    VecArgs aInfileList;
    std::string::size_type aStart = 0;

    for (;;)
    {
        const std::string::size_type aEnd = FileName.find_first_of(sep, aStart);
        const bool aLast = (aEnd == std::string::npos);
        const std::string aFile = aLast ? FileName.substr(aStart)
                                  : FileName.substr(aStart, aEnd - aStart);

        if (!aFile.empty())
        {
            if (aDebug)
            {
                if (aLast)
                    cout << "Next Input File " << aFile << endl;
                else
                    cout << "File: " << aFile << endl;
            }

            aInfileList.push_back(aFile);
        }

        if (aLast)
            break;

        aStart = aEnd + 1;	// at most FileName.size(), valid for substr
    }

    // Take file list one by one and append it to one string
    std::ostringstream aSS;

    for (size_t aIdx = 0; aIdx < aInfileList.size(); aIdx++)
    {
        const std::string aNextFile = aInfileList[aIdx];

        if (aIdx > 0)
            aSS << ",";

        // aNextFile is never empty here
        if (aNextFile[0] != '/')
            aSS << bulkRootPath << "/data/import/" << aNextFile;
        else
            aSS << aNextFile;
    }

    //cout << "File list are = " << aSS.str() << endl;

    return aSS.str();
}

//------------------------------------------------------------------------------
// Get set of column names in the "current" table being processed from the
// Job xml file.
//------------------------------------------------------------------------------
void WECmdArgs::getColumnList( std::set<std::string>& columnList ) const
{
    // Replace the caller's set with the names held in fColFldsFromJobFile;
    // duplicates collapse because the target is a set.
    columnList.clear();
    columnList.insert( fColFldsFromJobFile.begin(), fColFldsFromJobFile.end() );
}

//-----------------------------------------------------------------------------
// Check for the bulk load directory tree. The bulk root and its job and log
// subdirectories are created when they do not exist (Bug 6137).
//-----------------------------------------------------------------------------

void WECmdArgs::checkForBulkLogDir(const std::string& BulkRoot)
{
    if ( !boost::filesystem::exists(BulkRoot.c_str()) )
    {
        cout << "Creating directory : " << BulkRoot << endl;
        boost::filesystem::create_directories(BulkRoot.c_str());
    }

    if ( boost::filesystem::exists(BulkRoot.c_str()) )
    {
        // create the job directory also if not existing
        std::ostringstream aSS;
        aSS << BulkRoot;
        aSS << "/job";
        std::string jobDir = aSS.str();

        if ( !boost::filesystem::exists(jobDir.c_str()) )
        {
            cout << "Creating directory : " << jobDir << endl;
            bool aSuccess = boost::filesystem::create_directories(jobDir.c_str());

            if (!aSuccess)
            {
                cout << "\nFailed to create job directory, check permissions\n" << endl;
                throw runtime_error("Failed to create job directory, check permissions");
            }
        }

        std::ostringstream aSS2;
        aSS2 << BulkRoot;
        aSS2 << "/log";
        std::string logDir = aSS2.str();

        if ( !boost::filesystem::exists(logDir.c_str()) )
        {
            cout << "Creating directory : " << logDir << endl;
            bool aSuccess = boost::filesystem::create_directories(logDir.c_str());

            if (!aSuccess)
            {
                cout << "\nFailed to create bulk log directory, check permissions\n" << endl;
                throw runtime_error("Failed to create bulk log directory, check permissions");
            }
        }
    }
    else
    {
        cout << "\nFailed to create bulk directory, check permissions\n" << endl;
        throw runtime_error("Failed to create bulk directory, check permissions");
    }
}


} /* namespace WriteEngine */