You've already forked mariadb-columnstore-engine
							
							
				mirror of
				https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
				synced 2025-10-31 18:30:33 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			332 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			332 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /* Copyright (C) 2017 MariaDB Corporaton
 | |
| 
 | |
|    This program is free software; you can redistribute it and/or
 | |
|    modify it under the terms of the GNU General Public License
 | |
|    as published by the Free Software Foundation; version 2 of
 | |
|    the License.
 | |
| 
 | |
|    This program is distributed in the hope that it will be useful,
 | |
|    but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|    GNU General Public License for more details.
 | |
| 
 | |
|    You should have received a copy of the GNU General Public License
 | |
|    along with this program; if not, write to the Free Software
 | |
|    Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 | |
|    MA 02110-1301, USA. */
 | |
| 
 | |
| #include <sstream>
 | |
| #include <cstring>
 | |
| #include <typeinfo>
 | |
| #include "median.h"
 | |
| #include "bytestream.h"
 | |
| #include "objectreader.h"
 | |
| 
 | |
| using namespace mcsv1sdk;
 | |
| 
 | |
| mcsv1_UDAF::ReturnCode median::init(mcsv1Context* context,
 | |
|                                     COL_TYPES& colTypes)
 | |
| {
 | |
|     if (colTypes.size() < 1)
 | |
|     {
 | |
|         // The error message will be prepended with
 | |
|         // "The storage engine for the table doesn't support "
 | |
|         context->setErrorMessage("median() with 0 arguments");
 | |
|         return mcsv1_UDAF::ERROR;
 | |
|     }
 | |
| 
 | |
|     if (colTypes.size() > 1)
 | |
|     {
 | |
|         context->setErrorMessage("median() with more than 1 argument");
 | |
|         return mcsv1_UDAF::ERROR;
 | |
|     }
 | |
| 
 | |
|     if (!(isNumeric(colTypes[0].second)))
 | |
|     {
 | |
|         // The error message will be prepended with
 | |
|         // "The storage engine for the table doesn't support "
 | |
|         context->setErrorMessage("median() with non-numeric argument");
 | |
|         return mcsv1_UDAF::ERROR;
 | |
|     }
 | |
| 
 | |
|     context->setResultType(CalpontSystemCatalog::DOUBLE);
 | |
|     context->setColWidth(8);
 | |
|     context->setScale(context->getScale() * 2);
 | |
|     context->setPrecision(19);
 | |
|     context->setRunFlag(mcsv1sdk::UDAF_IGNORE_NULLS);
 | |
|     return mcsv1_UDAF::SUCCESS;
 | |
| 
 | |
| }
 | |
| 
 | |
| mcsv1_UDAF::ReturnCode median::reset(mcsv1Context* context)
 | |
| {
 | |
|     MedianData* data = static_cast<MedianData*>(context->getUserData());
 | |
|     data->mData.clear();
 | |
|     return mcsv1_UDAF::SUCCESS;
 | |
| }
 | |
| 
 | |
| mcsv1_UDAF::ReturnCode median::nextValue(mcsv1Context* context,
 | |
|         std::vector<ColumnDatum>& valsIn)
 | |
| {
 | |
|     static_any::any& valIn = valsIn[0].columnData;
 | |
|     MEDIAN_DATA& data = static_cast<MedianData*>(context->getUserData())->mData;
 | |
|     DATATYPE val = 0.0;
 | |
| 
 | |
|     if (valIn.empty())
 | |
|     {
 | |
|         return mcsv1_UDAF::SUCCESS; // Ought not happen when UDAF_IGNORE_NULLS is on.
 | |
|     }
 | |
| 
 | |
|     if (valIn.compatible(charTypeId))
 | |
|     {
 | |
|         val = valIn.cast<char>();
 | |
|     }
 | |
|     else if (valIn.compatible(scharTypeId))
 | |
|     {
 | |
|         val = valIn.cast<signed char>();
 | |
|     }
 | |
|     else if (valIn.compatible(shortTypeId))
 | |
|     {
 | |
|         val = valIn.cast<short>();
 | |
|     }
 | |
|     else if (valIn.compatible(intTypeId))
 | |
|     {
 | |
|         val = valIn.cast<int>();
 | |
|     }
 | |
|     else if (valIn.compatible(longTypeId))
 | |
|     {
 | |
|         val = valIn.cast<long>();
 | |
|     }
 | |
|     else if (valIn.compatible(llTypeId))
 | |
|     {
 | |
|         val = valIn.cast<long long>();
 | |
|     }
 | |
|     else if (valIn.compatible(ucharTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned char>();
 | |
|     }
 | |
|     else if (valIn.compatible(ushortTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned short>();
 | |
|     }
 | |
|     else if (valIn.compatible(uintTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned int>();
 | |
|     }
 | |
|     else if (valIn.compatible(ulongTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned long>();
 | |
|     }
 | |
|     else if (valIn.compatible(ullTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned long long>();
 | |
|     }
 | |
|     else if (valIn.compatible(floatTypeId))
 | |
|     {
 | |
|         val = valIn.cast<float>();
 | |
|     }
 | |
|     else if (valIn.compatible(doubleTypeId))
 | |
|     {
 | |
|         val = valIn.cast<double>();
 | |
|     }
 | |
| 
 | |
|     // For decimal types, we need to move the decimal point.
 | |
|     uint32_t scale = valsIn[0].scale;
 | |
| 
 | |
|     if (val != 0 && scale > 0)
 | |
|     {
 | |
|         val /= pow(10.0, (double)scale);
 | |
|     }
 | |
| 
 | |
|     data[val]++;
 | |
| 
 | |
|     return mcsv1_UDAF::SUCCESS;
 | |
| }
 | |
| 
 | |
| mcsv1_UDAF::ReturnCode median::subEvaluate(mcsv1Context* context, const UserData* userDataIn)
 | |
| {
 | |
|     if (!userDataIn)
 | |
|     {
 | |
|         return mcsv1_UDAF::SUCCESS;
 | |
|     }
 | |
| 
 | |
|     MEDIAN_DATA& outData = static_cast<MedianData*>(context->getUserData())->mData;
 | |
|     const MEDIAN_DATA& inData = static_cast<const MedianData*>(userDataIn)->mData;
 | |
|     MEDIAN_DATA::const_iterator iter = inData.begin();
 | |
| 
 | |
|     for (; iter != inData.end(); ++iter)
 | |
|     {
 | |
|         outData[iter->first] += iter->second;
 | |
|     }
 | |
| 
 | |
|     return mcsv1_UDAF::SUCCESS;
 | |
| }
 | |
| 
 | |
| mcsv1_UDAF::ReturnCode median::evaluate(mcsv1Context* context, static_any::any& valOut)
 | |
| {
 | |
|     uint64_t cnt1 = 0, cnt2 = 0;
 | |
|     MEDIAN_DATA& data = static_cast<MedianData*>(context->getUserData())->mData;
 | |
| 
 | |
|     if (data.size() == 0)
 | |
|     {
 | |
|         valOut = (DATATYPE)0;
 | |
|         return mcsv1_UDAF::SUCCESS;
 | |
|     }
 | |
| 
 | |
|     MEDIAN_DATA::iterator iter(data.begin());
 | |
|     MEDIAN_DATA::iterator revfrom(data.end());
 | |
|     MEDIAN_DATA::reverse_iterator riter(revfrom);
 | |
|     cnt1 += iter->second;
 | |
|     cnt2 += riter->second;
 | |
| 
 | |
|     while (iter->first < riter->first)
 | |
|     {
 | |
|         while (cnt1 < cnt2 && iter->first < riter->first)
 | |
|         {
 | |
|             ++iter;
 | |
|             cnt1 += iter->second;
 | |
|         }
 | |
| 
 | |
|         while (cnt2 < cnt1 && iter->first < riter->first)
 | |
|         {
 | |
|             ++riter;
 | |
|             cnt2 += riter->second;
 | |
|         }
 | |
| 
 | |
|         while (cnt1 == cnt2 && iter->first < riter->first)
 | |
|         {
 | |
|             ++iter;
 | |
|             cnt1 += iter->second;
 | |
| 
 | |
|             if (iter->first > riter->first)
 | |
|             {
 | |
|                 break;
 | |
|             }
 | |
| 
 | |
|             ++riter;
 | |
|             cnt2 += riter->second;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     valOut = (iter->first + riter->first) / 2;
 | |
|     return mcsv1_UDAF::SUCCESS;
 | |
| }
 | |
| 
 | |
| mcsv1_UDAF::ReturnCode median::dropValue(mcsv1Context* context,
 | |
|         std::vector<ColumnDatum>& valsDropped)
 | |
| {
 | |
|     static_any::any& valIn = valsDropped[0].columnData;
 | |
|     MEDIAN_DATA& data = static_cast<MedianData*>(context->getUserData())->mData;
 | |
|     DATATYPE val = 0.0;
 | |
| 
 | |
|     if (valIn.empty())
 | |
|     {
 | |
|         return mcsv1_UDAF::SUCCESS; // Ought not happen when UDAF_IGNORE_NULLS is on.
 | |
|     }
 | |
| 
 | |
|     if (valIn.compatible(charTypeId))
 | |
|     {
 | |
|         val = valIn.cast<char>();
 | |
|     }
 | |
|     else if (valIn.compatible(scharTypeId))
 | |
|     {
 | |
|         val = valIn.cast<signed char>();
 | |
|     }
 | |
|     else if (valIn.compatible(shortTypeId))
 | |
|     {
 | |
|         val = valIn.cast<short>();
 | |
|     }
 | |
|     else if (valIn.compatible(intTypeId))
 | |
|     {
 | |
|         val = valIn.cast<int>();
 | |
|     }
 | |
|     else if (valIn.compatible(longTypeId))
 | |
|     {
 | |
|         val = valIn.cast<long>();
 | |
|     }
 | |
|     else if (valIn.compatible(llTypeId))
 | |
|     {
 | |
|         val = valIn.cast<long long>();
 | |
|     }
 | |
|     else if (valIn.compatible(ucharTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned char>();
 | |
|     }
 | |
|     else if (valIn.compatible(ushortTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned short>();
 | |
|     }
 | |
|     else if (valIn.compatible(uintTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned int>();
 | |
|     }
 | |
|     else if (valIn.compatible(ulongTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned long>();
 | |
|     }
 | |
|     else if (valIn.compatible(ullTypeId))
 | |
|     {
 | |
|         val = valIn.cast<unsigned long long>();
 | |
|     }
 | |
|     else if (valIn.compatible(floatTypeId))
 | |
|     {
 | |
|         val = valIn.cast<float>();
 | |
|     }
 | |
|     else if (valIn.compatible(doubleTypeId))
 | |
|     {
 | |
|         val = valIn.cast<double>();
 | |
|     }
 | |
| 
 | |
|     // For decimal types, we need to move the decimal point.
 | |
|     uint32_t scale = valsDropped[0].scale;
 | |
| 
 | |
|     if (val != 0 && scale > 0)
 | |
|     {
 | |
|         val /= pow(10.0, (double)scale);
 | |
|     }
 | |
| 
 | |
|     data[val]--;
 | |
| 
 | |
|     return mcsv1_UDAF::SUCCESS;
 | |
| }
 | |
| 
 | |
| mcsv1_UDAF::ReturnCode median::createUserData(UserData*& userData, int32_t& length)
 | |
| {
 | |
|     userData = new MedianData;
 | |
|     length = sizeof(MedianData);
 | |
|     return mcsv1_UDAF::SUCCESS;
 | |
| }
 | |
| 
 | |
| void MedianData::serialize(messageqcpp::ByteStream& bs) const
 | |
| {
 | |
|     MEDIAN_DATA::const_iterator iter = mData.begin();
 | |
|     DATATYPE num;
 | |
|     uint32_t cnt;
 | |
|     bs << (int32_t)mData.size();
 | |
| 
 | |
|     for (; iter != mData.end(); ++iter)
 | |
|     {
 | |
|         num = iter->first;
 | |
|         bs << num;
 | |
|         cnt = iter->second;
 | |
|         bs << cnt;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void MedianData::unserialize(messageqcpp::ByteStream& bs)
 | |
| {
 | |
|     mData.clear();
 | |
|     int32_t sz;
 | |
|     DATATYPE num;
 | |
|     uint32_t cnt;
 | |
|     bs >> sz;
 | |
| 
 | |
|     for (int i = 0; i < sz; ++i)
 | |
|     {
 | |
|         bs >> num;
 | |
|         bs >> cnt;
 | |
|         mData[num] = cnt;
 | |
|     }
 | |
| }
 | |
| 
 |