You've already forked mariadb-columnstore-engine
							
							
				mirror of
				https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
				synced 2025-10-31 18:30:33 +03:00 
			
		
		
		
	* feat(cpimport): MCOL-4882 add a parameter to skip header rows * chore(cpimport): MCOL-4882 Use boost::program_options to arguments parsing * feat(cpimport.bin): MCOL-4882 Add missing changes * add test * fix clang * add missing cmdline argument * fix bug * Fix double lines skipping * Fix incorrect --silent (-N) parsing * fix default --max-errors processing * fix overwriting default username * move initialization to members declaration
		
			
				
	
	
		
			370 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			370 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /* Copyright (C) 2014 InfiniDB, Inc.
 | |
| 
 | |
|    This program is free software; you can redistribute it and/or
 | |
|    modify it under the terms of the GNU General Public License
 | |
|    as published by the Free Software Foundation; version 2 of
 | |
|    the License.
 | |
| 
 | |
|    This program is distributed in the hope that it will be useful,
 | |
|    but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|    GNU General Public License for more details.
 | |
| 
 | |
|    You should have received a copy of the GNU General Public License
 | |
|    along with this program; if not, write to the Free Software
 | |
|    Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 | |
|    MA 02110-1301, USA. */
 | |
| 
 | |
| /*******************************************************************************
 | |
|  * $Id$
 | |
|  *
 | |
|  *******************************************************************************/
 | |
| 
 | |
| /*
 | |
|  * we_xmlgetter.cpp
 | |
|  *
 | |
|  *  Created on: Feb 7, 2012
 | |
|  *      Author: bpaul
 | |
|  */
 | |
| 
 | |
| #include <stdio.h>
 | |
| #include <string.h>
 | |
| #include <unistd.h>
 | |
| #include <stdexcept>
 | |
| #include <iostream>
 | |
| 
 | |
| #include <string>
 | |
| #include <vector>
 | |
| using namespace std;
 | |
| 
 | |
| #include "we_xmlgetter.h"
 | |
| 
 | |
| using namespace std;
 | |
| 
 | |
| namespace WriteEngine
 | |
| {
 | |
| //------------------------------------------------------------------------------
 | |
| // WEXmlgetter constructor
 | |
| //------------------------------------------------------------------------------
 | |
| WEXmlgetter::WEXmlgetter(const std::string& ConfigName)
 | |
|  : fConfigName(ConfigName)
 | |
|  , fDoc(nullptr)
 | |
|  , fpRoot(nullptr)
 | |
| {
 | |
|   //  xmlNodePtr curPtr;
 | |
|   fDoc = xmlParseFile(ConfigName.c_str());
 | |
| 
 | |
|   if (fDoc == nullptr)
 | |
|     throw runtime_error("WEXmlgetter::getConfig(): no XML document!");
 | |
| 
 | |
|   fpRoot = xmlDocGetRootElement(fDoc);
 | |
| 
 | |
|   if (fpRoot == nullptr)
 | |
|   {
 | |
|     xmlFreeDoc(fDoc);
 | |
|     fDoc = nullptr;
 | |
|     throw runtime_error("WEXmlgetter::getConfig(): no XML Root Tag!");
 | |
|   }
 | |
| }
 | |
| 
 | |
| //------------------------------------------------------------------------------
 | |
| // WEXmlgetter destructor
 | |
| //------------------------------------------------------------------------------
 | |
| WEXmlgetter::~WEXmlgetter()
 | |
| {
 | |
|   xmlFreeDoc(fDoc);
 | |
|   fDoc = nullptr;
 | |
| }
 | |
| 
 | |
| //------------------------------------------------------------------------------
 | |
| // Get/return the property or attribute value (strVal) for the specified xml tag
 | |
| // (pNode) and property/attribute (pTag)
 | |
| //------------------------------------------------------------------------------
 | |
| bool WEXmlgetter::getNodeAttribute(const xmlNode* pNode, const char* pTag, std::string& strVal)
 | |
| {
 | |
|   xmlChar* pTmp = nullptr;
 | |
|   bool bFound = false;
 | |
| 
 | |
|   pTmp = xmlGetProp(pNode, reinterpret_cast<const xmlChar*>(pTag));
 | |
| 
 | |
|   if (pTmp)
 | |
|   {
 | |
|     bFound = true;
 | |
|     strVal = reinterpret_cast<char*>(pTmp);
 | |
|     xmlFree(pTmp);
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     strVal.clear();
 | |
|   }  // end if
 | |
| 
 | |
|   return bFound;
 | |
| }
 | |
| 
 | |
| //------------------------------------------------------------------------------
 | |
| // Get/return the node content (strVal) for the specified xml tag (pNode)
 | |
| //------------------------------------------------------------------------------
 | |
| bool WEXmlgetter::getNodeContent(const xmlNode* pNode, std::string& strVal)
 | |
| {
 | |
|   xmlChar* pTmp = nullptr;
 | |
|   bool bFound = false;
 | |
| 
 | |
|   if (pNode->children != nullptr)
 | |
|   {
 | |
|     pTmp = xmlNodeGetContent(pNode->children);
 | |
| 
 | |
|     if (pTmp)
 | |
|     {
 | |
|       bFound = true;
 | |
|       strVal = reinterpret_cast<char*>(pTmp);
 | |
|       xmlFree(pTmp);
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       strVal.clear();
 | |
|     }
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     strVal.clear();
 | |
|   }
 | |
| 
 | |
|   return bFound;
 | |
| }
 | |
| 
 | |
| //------------------------------------------------------------------------------
 | |
| // Get/returns node content for the "first" child node under each section/name.
 | |
| // Example:
 | |
| //   <section>
 | |
| //     <name>
 | |
| //       <subname1>
 | |
| //       </subname1>
 | |
| //     </name>
 | |
| //     <name>
 | |
| //       <subname1>
 | |
| //       </subname1>
 | |
| //     </name>
 | |
| //   </section>
 | |
| //
 | |
| // Looks like xml2 is currently returning the text node as the first child
 | |
| // node under a node.  So in the example above, this function is currently
 | |
| // always returning the text node content inside each <name> rather than
 | |
| // any <subname1> node that might be within each <name> tag.
 | |
| //------------------------------------------------------------------------------
 | |
| void WEXmlgetter::getConfig(const string& section, const string& name, vector<string>& values) const
 | |
| {
 | |
|   string res;
 | |
| 
 | |
|   if (section.empty())
 | |
|     throw invalid_argument("Config::getConfig: section must have a length");
 | |
| 
 | |
|   const xmlNode* pPtr = fpRoot->xmlChildrenNode;
 | |
| 
 | |
|   while (pPtr != nullptr)
 | |
|   {
 | |
|     // cout << "pPtr->name:    " <<
 | |
|     //	(const xmlChar*)pPtr->name << std::endl;
 | |
| 
 | |
|     if ((!xmlStrcmp(pPtr->name, reinterpret_cast<const xmlChar*>(section.c_str()))))
 | |
|     {
 | |
|       xmlNodePtr pPtr2 = pPtr->xmlChildrenNode;
 | |
| 
 | |
|       while (pPtr2 != nullptr)
 | |
|       {
 | |
|         // cout << "  pPtr2->name: " <<
 | |
|         //	(const xmlChar*)pPtr2->name << std::endl;
 | |
| 
 | |
|         if ((!xmlStrcmp(pPtr2->name, reinterpret_cast<const xmlChar*>(name.c_str()))))
 | |
|         {
 | |
|           xmlNodePtr pPtr3 = pPtr2->xmlChildrenNode;
 | |
|           values.emplace_back(reinterpret_cast<const char*>(pPtr3->content));
 | |
| 
 | |
|           // cout << "    pPtr3->name: " <<
 | |
|           //	(const xmlChar*)pPtr3->name <<
 | |
|           //	"; content: " << (const xmlChar*)pPtr3->content <<
 | |
|           //	"; len: " << strlen((char*)pPtr3->content) << std::endl;
 | |
|         }
 | |
| 
 | |
|         pPtr2 = pPtr2->next;
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     pPtr = pPtr->next;
 | |
|   }
 | |
| }
 | |
| 
 | |
| //------------------------------------------------------------------------------
 | |
| // Returns node content for the last node in the node tree defined by
 | |
| // "sections".  So if sections[] were:
 | |
| //   sections[0] = "house"
 | |
| //   sections[1] = "room"
 | |
| // Then this function would return the node content for the first <room>
 | |
| // tag found under the first <house> tag.
 | |
| // Function assumes that the desired node has no children nodes other than
 | |
| // the text content node.
 | |
| //------------------------------------------------------------------------------
 | |
| std::string WEXmlgetter::getValue(const vector<string>& sections) const
 | |
| {
 | |
|   std::string aRet;
 | |
|   const xmlNode* pPtr = fpRoot;
 | |
|   auto aSize = sections.size();
 | |
|   size_t aIdx = 0;
 | |
| 
 | |
|   // cout << aSize << endl;
 | |
|   while (aIdx < aSize)
 | |
|   {
 | |
|     // cout << aIdx <<" "<< sections[aIdx] << endl;
 | |
|     pPtr = getNode(pPtr, sections[aIdx]);
 | |
| 
 | |
|     if ((pPtr == nullptr) || (aIdx == aSize - 1))
 | |
|       break;
 | |
|     else
 | |
|     {
 | |
|       // cout << "getValue Name " << (const char*)pPtr->name << endl;
 | |
|       pPtr = pPtr->xmlChildrenNode;
 | |
|       aIdx++;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (pPtr != nullptr)
 | |
|   {
 | |
|     // aRet = (const char*)pPtr->content;
 | |
|     std::string aBuff;
 | |
| 
 | |
|     if (getNodeContent(pPtr, aBuff))
 | |
|       aRet = aBuff;
 | |
|   }
 | |
| 
 | |
|   return aRet;
 | |
| }
 | |
| 
 | |
| //------------------------------------------------------------------------------
 | |
| // Iterate through the sibling nodes starting with pParent, looking for
 | |
| // a node with the specified name (section).  The xmlNode (if found) is
 | |
| // returned.
 | |
| //------------------------------------------------------------------------------
 | |
| const xmlNode* WEXmlgetter::getNode(const xmlNode* pParent, const string& section)
 | |
| {
 | |
|   if (pParent == nullptr)
 | |
|     return nullptr;
 | |
| 
 | |
|   const xmlNode* pPtr = pParent;
 | |
| 
 | |
|   while (pPtr != nullptr)
 | |
|   {
 | |
|     // cout << "getNode Name " << (const char*)pPtr->name << endl;
 | |
|     if (!xmlStrcmp(pPtr->name, reinterpret_cast<const xmlChar*>(section.c_str())))
 | |
|       return pPtr;
 | |
|     else
 | |
|       pPtr = pPtr->next;
 | |
|   }
 | |
| 
 | |
|   return pPtr;
 | |
| }
 | |
| 
 | |
| //------------------------------------------------------------------------------
 | |
| // Iterate down through the node tree represented by the sections vector.
 | |
| // In the last child of this tree, we look for the specified attribute tag,
 | |
| // and return its value.
 | |
| //------------------------------------------------------------------------------
 | |
| std::string WEXmlgetter::getAttribute(const vector<string>& sections, const string& Tag) const
 | |
| {
 | |
|   std::string aRet;
 | |
|   const xmlNode* pPtr = fpRoot;
 | |
|   auto aSize = sections.size();
 | |
| 
 | |
|   if (aSize == 0)
 | |
|     throw invalid_argument("WEXmlgetter::getAttribute(): section must be valid");
 | |
| 
 | |
|   size_t aIdx = 0;
 | |
| 
 | |
|   // cout << aSize << endl;
 | |
|   while (aIdx < aSize)
 | |
|   {
 | |
|     // cout << aIdx <<" "<< sections[aIdx] << endl;
 | |
|     pPtr = getNode(pPtr, sections[aIdx]);
 | |
| 
 | |
|     if ((pPtr == nullptr) || (aIdx == aSize - 1))
 | |
|       break;
 | |
|     else
 | |
|     {
 | |
|       // cout << "getValue Name " << (const char*)pPtr->name << endl;
 | |
|       pPtr = pPtr->xmlChildrenNode;
 | |
|       aIdx++;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (pPtr != nullptr)
 | |
|   {
 | |
|     std::string aBuff;
 | |
| 
 | |
|     // cout << "attrTagNode Name " << (const char*)pPtr->name << endl;
 | |
|     if (getNodeAttribute(pPtr, Tag.c_str(), aBuff))
 | |
|       aRet = aBuff;
 | |
| 
 | |
|     // aRet = (const char*)pPtr->content;
 | |
|     // cout << "Attribute("<<Tag<<") = "<< aRet<< endl;
 | |
|   }
 | |
| 
 | |
|   return aRet;
 | |
| }
 | |
| 
 | |
| //------------------------------------------------------------------------------
 | |
| // Iterate down through the node tree represented by the sections vector.
 | |
| // At the end of the branch, there may be several sibling nodes matching
 | |
| // the node search vector.
 | |
| // For each of the matching children nodes found, we look for the specified
 | |
| // attribute tag, and return its value.  Hence a vector of attribute values
 | |
| // is returned.
 | |
| //------------------------------------------------------------------------------
 | |
| void WEXmlgetter::getAttributeListForAllChildren(const vector<string>& sections, const string& attributeTag,
 | |
|                                                  vector<string>& attributeValues) const
 | |
| {
 | |
|   const xmlNode* pPtr = fpRoot;
 | |
|   auto aSize = sections.size();
 | |
| 
 | |
|   if (aSize == 0)
 | |
|   {
 | |
|     throw invalid_argument(
 | |
|         "WEXmlgetter::getAttributeListForAllChildren():"
 | |
|         " No XML nodes specified in section search list");
 | |
|   }
 | |
| 
 | |
|   // Step down the branch that has the nodes of interest
 | |
|   size_t aIdx = 0;
 | |
| 
 | |
|   while (aIdx < aSize)
 | |
|   {
 | |
|     pPtr = getNode(pPtr, sections[aIdx]);
 | |
| 
 | |
|     if ((pPtr == nullptr) || (aIdx == aSize - 1))
 | |
|     {
 | |
|       break;
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       pPtr = pPtr->xmlChildrenNode;
 | |
|       aIdx++;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   // Look for all the "matching" nodes at the end of the branch, and
 | |
|   // get the requested attribute value for each matching node.
 | |
|   if (pPtr != nullptr)
 | |
|   {
 | |
|     while (pPtr != nullptr)
 | |
|     {
 | |
|       std::string attrib;
 | |
| 
 | |
|       if (getNodeAttribute(pPtr, attributeTag.c_str(), attrib))
 | |
|       {
 | |
|         attributeValues.push_back(attrib);
 | |
|       }
 | |
| 
 | |
|       pPtr = pPtr->next;
 | |
|     }
 | |
|   }
 | |
| }
 | |
| 
 | |
| } /* namespace WriteEngine */
 |