You've already forked mariadb-columnstore-engine
							
							
				mirror of
				https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
				synced 2025-11-03 17:13:17 +03:00 
			
		
		
		
	* MSan added with fixes for libc++ * libc++ sepatare build * add libc++ to ci * libstdc++ in CI * libcpp and msan to external projects * std::sqrt * awful_hack(ci): install whole llvm instead of libc++ in terrible way for test containers * Adding ddeb packages for teststages and repos * libc++ more for test container * save some money on debug * colored coredumps * revert ci * chore(ci): collect asan ubsan and libc++ build with mtr and regression status ignored
		
			
				
	
	
		
			253 lines
		
	
	
		
			8.9 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			253 lines
		
	
	
		
			8.9 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
/* Copyright (C) 2014 InfiniDB, Inc.
 | 
						|
 | 
						|
   This program is free software; you can redistribute it and/or
 | 
						|
   modify it under the terms of the GNU General Public License
 | 
						|
   as published by the Free Software Foundation; version 2 of
 | 
						|
   the License.
 | 
						|
 | 
						|
   This program is distributed in the hope that it will be useful,
 | 
						|
   but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
						|
   GNU General Public License for more details.
 | 
						|
 | 
						|
   You should have received a copy of the GNU General Public License
 | 
						|
   along with this program; if not, write to the Free Software
 | 
						|
   Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 | 
						|
   MA 02110-1301, USA. */
 | 
						|
 | 
						|
/*******************************************************************************
 | 
						|
 * $Id: we_colextinf.h 4501 2013-01-31 21:15:58Z dcathey $
 | 
						|
 *
 | 
						|
 ******************************************************************************/
 | 
						|
 | 
						|
/** @file
 | 
						|
 * Contains class to track column information per extent.
 | 
						|
 * For ex: this is where we track the min/max values per extent for a column.
 | 
						|
 */
 | 
						|
 | 
						|
#pragma once
 | 
						|
 | 
						|
#include <limits>
 | 
						|
#include <stdint.h>
 | 
						|
#include <set>
 | 
						|
#include <unordered.h>
 | 
						|
 | 
						|
#include <boost/thread/mutex.hpp>
 | 
						|
 | 
						|
#include "brmtypes.h"
 | 
						|
#include "we_type.h"
 | 
						|
#include "dataconvert.h"
 | 
						|
 | 
						|
namespace WriteEngine
 | 
						|
{
 | 
						|
class Log;
 | 
						|
class BRMReporter;
 | 
						|
typedef execplan::CalpontSystemCatalog::ColDataType ColDataType;
 | 
						|
//------------------------------------------------------------------------------
 | 
						|
/** @brief Class to store min/max and LBID information for an extent.
 | 
						|
 *  For character data, the min and max values are maintained in reverse
 | 
						|
 *  order to facilitate string comparisons.  When the range is sent to
 | 
						|
 *  BRM, the bytes will be swapped back into the correct order.
 | 
						|
 *  BRM will need to be told when the column carries character data, so
 | 
						|
 *  that BRM can do the correct binary comparisons of the char data.
 | 
						|
 */
 | 
						|
//------------------------------------------------------------------------------
 | 
						|
class ColExtInfEntry
 | 
						|
{
 | 
						|
 public:
 | 
						|
  // Default constructor
 | 
						|
  ColExtInfEntry() : fLbid(INVALID_LBID), fMinVal(LLONG_MIN), fMaxVal(LLONG_MIN), fNewExtent(true)
 | 
						|
  {
 | 
						|
    utils::int128Min(fbigMaxVal);
 | 
						|
    utils::int128Max(fbigMinVal);
 | 
						|
  }
 | 
						|
 | 
						|
  // Used to create entry for an existing extent we are going to add data to.
 | 
						|
  ColExtInfEntry(BRM::LBID_t lbid, bool bIsNewExtent)
 | 
						|
   : fLbid(lbid), fMinVal(LLONG_MIN), fMaxVal(LLONG_MIN), fNewExtent(bIsNewExtent)
 | 
						|
  {
 | 
						|
    utils::int128Min(fbigMaxVal);
 | 
						|
    utils::int128Max(fbigMinVal);
 | 
						|
  }
 | 
						|
 | 
						|
  // Used to create entry for a new extent, with LBID not yet allocated
 | 
						|
  ColExtInfEntry(int64_t minVal, int64_t maxVal)
 | 
						|
   : fLbid(INVALID_LBID), fMinVal(minVal), fMaxVal(maxVal), fNewExtent(true)
 | 
						|
  {
 | 
						|
  }
 | 
						|
 | 
						|
  // Used to create entry for a new extent, with LBID not yet allocated
 | 
						|
  ColExtInfEntry(int128_t bigMinVal, int128_t bigMaxVal)
 | 
						|
   : fLbid(INVALID_LBID), fNewExtent(true), fbigMinVal(bigMinVal), fbigMaxVal(bigMaxVal)
 | 
						|
  {
 | 
						|
  }
 | 
						|
 | 
						|
  // Used to create entry for a new extent, with LBID not yet allocated
 | 
						|
  ColExtInfEntry(uint64_t minVal, uint64_t maxVal)
 | 
						|
   : fLbid(INVALID_LBID)
 | 
						|
   , fMinVal(static_cast<int64_t>(minVal))
 | 
						|
   , fMaxVal(static_cast<int64_t>(maxVal))
 | 
						|
   , fNewExtent(true)
 | 
						|
  {
 | 
						|
  }
 | 
						|
 | 
						|
  // Used to create entry for a new extent, with LBID not yet allocated
 | 
						|
  ColExtInfEntry(uint128_t bigMinVal, uint128_t bigMaxVal)
 | 
						|
   : fLbid(INVALID_LBID)
 | 
						|
   , fNewExtent(true)
 | 
						|
   , fbigMinVal(static_cast<int128_t>(bigMinVal))
 | 
						|
   , fbigMaxVal(static_cast<int128_t>(bigMaxVal))
 | 
						|
  {
 | 
						|
  }
 | 
						|
 | 
						|
  BRM::LBID_t fLbid;  // LBID for an extent; should be the starting LBID
 | 
						|
  int64_t fMinVal;    // minimum value for extent associated with LBID
 | 
						|
  int64_t fMaxVal;    // maximum value for extent associated with LBID
 | 
						|
  bool fNewExtent;    // is this a new extent
 | 
						|
  union
 | 
						|
  {
 | 
						|
    int128_t fbigMinVal;
 | 
						|
    int64_t fMinVal_;
 | 
						|
  };
 | 
						|
  union
 | 
						|
  {
 | 
						|
    int128_t fbigMaxVal;
 | 
						|
    int64_t fMaxVal_;
 | 
						|
  };
 | 
						|
};
 | 
						|
 | 
						|
//------------------------------------------------------------------------------
 | 
						|
/** @brief Hash function used to store ColExtInfEntry objects into a map; using
 | 
						|
 *  the last input Row number in the extent, as the key.
 | 
						|
 */
 | 
						|
//------------------------------------------------------------------------------
 | 
						|
struct uint64Hasher
 | 
						|
{
 | 
						|
  std::size_t operator()(RID val) const
 | 
						|
  {
 | 
						|
    return static_cast<std::size_t>(val);
 | 
						|
  }
 | 
						|
};
 | 
						|
 | 
						|
//------------------------------------------------------------------------------
 | 
						|
/** @brief Stub base class for ColExtInf; used for column data types that do
 | 
						|
 *  not need the functionality of ColExtInf (ex: floats and dictionaries).
 | 
						|
 */
 | 
						|
//------------------------------------------------------------------------------
 | 
						|
class ColExtInfBase
 | 
						|
{
 | 
						|
 public:
 | 
						|
  ColExtInfBase() = default;
 | 
						|
  virtual ~ColExtInfBase() = default;
 | 
						|
 | 
						|
  virtual void addFirstEntry(RID /*lastInputRow*/, BRM::LBID_t /*lbid*/, bool /*bIsNewExtent*/)
 | 
						|
  {
 | 
						|
  }
 | 
						|
 | 
						|
  virtual void addOrUpdateEntry(RID /*lastInputRow*/, int64_t /*minVal*/, int64_t /*maxVal*/,
 | 
						|
                                ColDataType /*colDataType*/, int /*width*/)
 | 
						|
  {
 | 
						|
  }
 | 
						|
 | 
						|
  virtual void addOrUpdateEntry(RID /*lastInputRow*/, int128_t /*minVal*/, int128_t /*maxVal*/,
 | 
						|
                                ColDataType /*colDataType*/, int /*width*/)
 | 
						|
  {
 | 
						|
  }
 | 
						|
 | 
						|
  virtual void getCPInfoForBRM(JobColumn /*column*/, BRMReporter& /*brmReporter*/)
 | 
						|
  {
 | 
						|
  }
 | 
						|
  virtual void print(const JobColumn& /*column*/)
 | 
						|
  {
 | 
						|
  }
 | 
						|
  virtual int updateEntryLbid(BRM::LBID_t /*startLbid*/)
 | 
						|
  {
 | 
						|
    return NO_ERROR;
 | 
						|
  }
 | 
						|
};
 | 
						|
 | 
						|
//------------------------------------------------------------------------------
 | 
						|
/** @brief Collects LBID and min/max info about the extents that are loaded.
 | 
						|
 *
 | 
						|
 *  As a Read buffer is parsed, addOrUpdateEntry() is called to add the extent,
 | 
						|
 *  and its information to the collection.  For new extents, we have to add
 | 
						|
 *  the LBID later, when the extent is allocated, since the extent's first
 | 
						|
 *  buffer will be finished before the extent is allocated from BRM.  In this
 | 
						|
 *  case, updateEntryLbid() is called to add the LBID.  The specified LBID is
 | 
						|
 *  assigned to the extent with the lowest Row id that is awaiting an LBID.
 | 
						|
 *  This should be a safe assumption to make, that the extents will be allocated
 | 
						|
 *  in Row id order.   lastInputRow numbers are relative to the first row in
 | 
						|
 *  the import (ie: Row 0 is the first row in the *.tbl file).
 | 
						|
 */
 | 
						|
//------------------------------------------------------------------------------
 | 
						|
class ColExtInf : public ColExtInfBase
 | 
						|
{
 | 
						|
 public:
 | 
						|
  /** @brief Constructor
 | 
						|
   *  @param logger Log object using for debug logging.
 | 
						|
   */
 | 
						|
  ColExtInf(OID oid, Log* logger) : fColOid(oid), fLog(logger)
 | 
						|
  {
 | 
						|
  }
 | 
						|
  ~ColExtInf() override = default;
 | 
						|
 | 
						|
  /** @brief Add an entry for first extent, for the specified Row and LBID.
 | 
						|
   *  @param lastInputRow Last input Row for old extent we are adding data to
 | 
						|
   *  @param lbid         LBID of the relevant extent.
 | 
						|
   *  @param bIsNewExtent Treat as new or existing extent when CP min/max is
 | 
						|
   *                      sent to BRM
 | 
						|
   */
 | 
						|
  void addFirstEntry(RID lastInputRow, BRM::LBID_t lbid, bool bIsNewExtent) override;
 | 
						|
 | 
						|
  /** @brief Add or update an entry for the specified Row and its min/max val.
 | 
						|
   *         If new extent, LBID will be added later when extent is allocated.
 | 
						|
   *  @param lastInputRow Last input Row for a new extent being loaded.
 | 
						|
   *  @param minVal       Minimum value for the latest buffer read
 | 
						|
   *  @param maxVal       Maximum value for the latest buffer read
 | 
						|
   */
 | 
						|
  template <typename T>
 | 
						|
  void addOrUpdateEntryTemplate(RID lastInputRow, T minVal, T maxVal, ColDataType colDataType, int width);
 | 
						|
 | 
						|
  void addOrUpdateEntry(RID lastInputRow, int64_t minVal, int64_t maxVal, ColDataType colDataType,
 | 
						|
                        int width) override
 | 
						|
  {
 | 
						|
    addOrUpdateEntryTemplate(lastInputRow, minVal, maxVal, colDataType, width);
 | 
						|
  }
 | 
						|
 | 
						|
  void addOrUpdateEntry(RID lastInputRow, int128_t minVal, int128_t maxVal, ColDataType colDataType,
 | 
						|
                        int width) override
 | 
						|
  {
 | 
						|
    addOrUpdateEntryTemplate(lastInputRow, minVal, maxVal, colDataType, width);
 | 
						|
  }
 | 
						|
 | 
						|
  /** @brief Send updated Casual Partition (CP) info to BRM.
 | 
						|
   */
 | 
						|
  void getCPInfoForBRM(JobColumn column, BRMReporter& brmReporter) override;
 | 
						|
 | 
						|
  /** @brief Debug print function.
 | 
						|
   */
 | 
						|
  void print(const JobColumn& column) override;
 | 
						|
 | 
						|
  /** @brief Add extent's LBID to the oldest entry that is awaiting an LBID
 | 
						|
   *  @param startLbid Starting LBID for a pending extent.
 | 
						|
   *  @return NO_ERROR upon success; else error if extent entry not found
 | 
						|
   */
 | 
						|
  int updateEntryLbid(BRM::LBID_t startLbid) override;
 | 
						|
 | 
						|
 private:
 | 
						|
  OID fColOid;                       // Column OID for the relevant extents
 | 
						|
  Log* fLog;                         // Log used for debug logging
 | 
						|
  boost::mutex fMapMutex;            // protects unordered map access
 | 
						|
  std::set<RID> fPendingExtentRows;  // list of lastInputRow entries that
 | 
						|
  // are awaiting an LBID assignment.
 | 
						|
 | 
						|
  // unordered map where we collect the min/max values per extent
 | 
						|
  std::tr1::unordered_map<RID, ColExtInfEntry, uint64Hasher> fMap;
 | 
						|
 | 
						|
  // disable copy constructor and assignment operator
 | 
						|
  ColExtInf(const ColExtInf&);
 | 
						|
  ColExtInf& operator=(const ColExtInf&);
 | 
						|
};
 | 
						|
 | 
						|
}  // namespace WriteEngine
 |