You've already forked mariadb-columnstore-engine
							
							
				mirror of
				https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
				synced 2025-10-31 18:30:33 +03:00 
			
		
		
		
	* Fix clang warnings * Remove vim tab guides * initialize variables * 'strncpy' output truncated before terminating nul copying as many bytes from a string as its length * Fix ISO C++17 does not allow 'register' storage class specifier for outdated bison * chars are unsigned on ARM, having if (ival < 0) always false * chars are unsigned by default on ARM and comparison with -1 if always true
		
			
				
	
	
		
			262 lines
		
	
	
		
			7.3 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			262 lines
		
	
	
		
			7.3 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
|    Copyright (c) 2017, MariaDB
 | |
|    Copyright (C) 2014 InfiniDB, Inc.
 | |
| 
 | |
|    This program is free software; you can redistribute it and/or
 | |
|    modify it under the terms of the GNU General Public License
 | |
|    as published by the Free Software Foundation; version 2 of
 | |
|    the License.
 | |
| 
 | |
|    This program is distributed in the hope that it will be useful,
 | |
|    but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|    GNU General Public License for more details.
 | |
| 
 | |
|    You should have received a copy of the GNU General Public License
 | |
|    along with this program; if not, write to the Free Software
 | |
|    Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 | |
|    MA 02110-1301, USA.
 | |
| */
 | |
| 
 | |
| //#define NDEBUG
 | |
| #include <cassert>
 | |
| #include <sstream>
 | |
| #include <iomanip>
 | |
| using namespace std;
 | |
| 
 | |
| #include <boost/shared_ptr.hpp>
 | |
| 
 | |
| #include "loggingid.h"
 | |
| #include "errorcodes.h"
 | |
| #include "idberrorinfo.h"
 | |
| using namespace logging;
 | |
| 
 | |
| #include "rowgroup.h"
 | |
| using namespace rowgroup;
 | |
| 
 | |
| #include "idborderby.h"
 | |
| using namespace ordering;
 | |
| 
 | |
| #include "windowfunctionstep.h"
 | |
| using namespace joblist;
 | |
| 
 | |
| #include "windowfunctiontype.h"
 | |
| #include "framebound.h"
 | |
| #include "windowframe.h"
 | |
| #include "windowfunction.h"
 | |
| 
 | |
| namespace windowfunction
 | |
| {
 | |
| WindowFunction::WindowFunction(boost::shared_ptr<WindowFunctionType>& f,
 | |
|                                boost::shared_ptr<ordering::EqualCompData>& p,
 | |
|                                boost::shared_ptr<OrderByData>& o, boost::shared_ptr<WindowFrame>& w,
 | |
|                                const RowGroup& g, const Row& r)
 | |
|  : fFunctionType(f), fPartitionBy(p), fOrderBy(o), fFrame(w), fRowGroup(g), fRow(r)
 | |
| {
 | |
| }
 | |
| 
 | |
| WindowFunction::~WindowFunction()
 | |
| {
 | |
| }
 | |
| 
 | |
| void WindowFunction::operator()()
 | |
| {
 | |
|   try
 | |
|   {
 | |
|     fRowData.reset(new vector<RowPosition>(fStep->getRowData()));
 | |
| 
 | |
|     if (fOrderBy->rule().fCompares.size() > 0)
 | |
|       sort(fRowData->begin(), fRowData->size());
 | |
| 
 | |
|     // get partitions
 | |
|     if (fPartitionBy.get() != NULL && !fStep->cancelled())
 | |
|     {
 | |
|       int64_t i = 0;
 | |
|       int64_t j = 1;
 | |
|       int64_t rowCnt = fRowData->size();
 | |
| 
 | |
|       for (j = 1; j < rowCnt; j++)
 | |
|       {
 | |
|         if ((*(fPartitionBy.get()))(getPointer((*fRowData)[j - 1]), getPointer((*fRowData)[j])))
 | |
|           continue;
 | |
| 
 | |
|         fPartition.push_back(make_pair(i, j - 1));
 | |
|         i = j;
 | |
|       }
 | |
| 
 | |
|       fPartition.push_back(make_pair(i, j - 1));
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       fPartition.push_back(make_pair(0, fRowData->size()));
 | |
|     }
 | |
| 
 | |
|     // compute partition by partition
 | |
|     int64_t uft = fFrame->upper()->boundType();
 | |
|     int64_t lft = fFrame->lower()->boundType();
 | |
|     bool upperUbnd = (uft == WF__UNBOUNDED_PRECEDING || uft == WF__UNBOUNDED_FOLLOWING);
 | |
|     bool lowerUbnd = (lft == WF__UNBOUNDED_PRECEDING || lft == WF__UNBOUNDED_FOLLOWING);
 | |
|     bool upperCnrw = (uft == WF__CURRENT_ROW);
 | |
|     bool lowerCnrw = (lft == WF__CURRENT_ROW);
 | |
|     fFunctionType->setRowData(fRowData);
 | |
|     fFunctionType->setRowMetaData(fRowGroup, fRow);
 | |
|     fFrame->setRowData(fRowData);
 | |
|     fFrame->setRowMetaData(fRowGroup, fRow);
 | |
| 
 | |
|     for (uint64_t k = 0; k < fPartition.size() && !fStep->cancelled(); k++)
 | |
|     {
 | |
|       fFunctionType->resetData();
 | |
|       fFunctionType->partition(fPartition[k]);
 | |
| 
 | |
|       int64_t begin = fPartition[k].first;
 | |
|       int64_t end = fPartition[k].second;
 | |
| 
 | |
|       if (upperUbnd && lowerUbnd)
 | |
|       {
 | |
|         fFunctionType->operator()(begin, end, WF__BOUND_ALL);
 | |
|       }
 | |
|       else if (upperUbnd && lowerCnrw)
 | |
|       {
 | |
|         if (fFrame->unit() == WF__FRAME_ROWS)
 | |
|         {
 | |
|           for (int64_t i = begin; i <= end && !fStep->cancelled(); i++)
 | |
|           {
 | |
|             fFunctionType->operator()(begin, i, i);
 | |
|           }
 | |
|         }
 | |
|         else
 | |
|         {
 | |
|           for (int64_t i = begin; i <= end && !fStep->cancelled(); i++)
 | |
|           {
 | |
|             pair<int64_t, int64_t> w = fFrame->getWindow(begin, end, i);
 | |
|             int64_t j = i;
 | |
| 
 | |
|             if (w.second > i)
 | |
|               j = w.second;
 | |
| 
 | |
|             fFunctionType->operator()(begin, j, i);
 | |
|           }
 | |
|         }
 | |
|       }
 | |
|       else if (upperCnrw && lowerUbnd)
 | |
|       {
 | |
|         if (fFrame->unit() == WF__FRAME_ROWS)
 | |
|         {
 | |
|           for (int64_t i = end; i >= begin && !fStep->cancelled(); i--)
 | |
|           {
 | |
|             fFunctionType->operator()(i, end, i);
 | |
|           }
 | |
|         }
 | |
|         else
 | |
|         {
 | |
|           for (int64_t i = end; i >= begin && !fStep->cancelled(); i--)
 | |
|           {
 | |
|             pair<int64_t, int64_t> w = fFrame->getWindow(begin, end, i);
 | |
|             int64_t j = i;
 | |
| 
 | |
|             if (w.first < i)
 | |
|               j = w.first;
 | |
| 
 | |
|             fFunctionType->operator()(j, end, i);
 | |
|           }
 | |
|         }
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         pair<int64_t, int64_t> w;
 | |
|         pair<int64_t, int64_t> prevFrame;
 | |
|         int64_t b, e;
 | |
|         bool firstTime = true;
 | |
| 
 | |
|         for (int64_t i = begin; i <= end && !fStep->cancelled(); i++)
 | |
|         {
 | |
|           w = fFrame->getWindow(begin, end, i);
 | |
|           b = w.first;
 | |
|           e = w.second;
 | |
| 
 | |
|           if (firstTime)
 | |
|           {
 | |
|             prevFrame = w;
 | |
|           }
 | |
| 
 | |
|           // UDAnF functions may have a dropValue function implemented.
 | |
|           // If they do, we can optimize by calling dropValue() for those
 | |
|           // values leaving the window and nextValue for those entering, rather
 | |
|           // than a resetData() and then iterating over the entire window.
 | |
|           // Built-in functions may have this functionality added in the future.
 | |
|           // If b > e then the frame is entirely outside of the partition
 | |
|           // and there's no values to drop
 | |
|           if (!firstTime && (b <= e) && fFunctionType->dropValues(prevFrame.first, w.first))
 | |
|           {
 | |
|             // Adjust the beginning of the frame for nextValue
 | |
|             // to start where the previous frame left off.
 | |
|             b = prevFrame.second + 1;
 | |
|           }
 | |
|           else
 | |
|           {
 | |
|             // If dropValues failed or doesn't exist,
 | |
|             // calculate the entire frame.
 | |
|             fFunctionType->resetData();
 | |
|           }
 | |
|           fFunctionType->operator()(b, e, i);  // UDAnF: Calls nextValue and evaluate
 | |
|           prevFrame = w;
 | |
|           firstTime = false;
 | |
|         }
 | |
|       }
 | |
|     }
 | |
|   }
 | |
|   catch (...)
 | |
|   {
 | |
|     fStep->handleException(std::current_exception(), logging::ERR_EXECUTE_WINDOW_FUNCTION,
 | |
|                            logging::ERR_WF_DATA_SET_TOO_BIG, "WindowFunction::operator()");
 | |
|   }
 | |
| }
 | |
| 
 | |
| void WindowFunction::setCallback(joblist::WindowFunctionStep* step, int id)
 | |
| {
 | |
|   fStep = step;
 | |
|   fId = id;
 | |
|   fFunctionType->setCallback(step);
 | |
|   fFrame->setCallback(step);
 | |
| }
 | |
| 
 | |
| const Row& WindowFunction::getRow() const
 | |
| {
 | |
|   return fRow;
 | |
| }
 | |
| 
 | |
| void WindowFunction::sort(std::vector<RowPosition>::iterator v, uint64_t n)
 | |
| {
 | |
|   // recursive function termination condition.
 | |
|   if (n < 2 || fStep->cancelled())
 | |
|     return;
 | |
| 
 | |
|   RowPosition p = *(v + n / 2);                   // pivot value
 | |
|   vector<RowPosition>::iterator l = v;            // low   address
 | |
|   vector<RowPosition>::iterator h = v + (n - 1);  // high  address
 | |
| 
 | |
|   while (l <= h && !(fStep->cancelled()))
 | |
|   {
 | |
|     // Can use while here, but need check boundary and cancel status.
 | |
|     if (fOrderBy->operator()(getPointer(*l), getPointer(p)))
 | |
|     {
 | |
|       l++;
 | |
|     }
 | |
|     else if (fOrderBy->operator()(getPointer(p), getPointer(*h)))
 | |
|     {
 | |
|       h--;
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       RowPosition t = *l;  // temp value for swap
 | |
|       *l++ = *h;
 | |
|       *h-- = t;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   sort(v, std::distance(v, h) + 1);
 | |
|   sort(l, std::distance(l, v) + n);
 | |
| }
 | |
| 
 | |
| }  // namespace windowfunction
 |