You've already forked mariadb-columnstore-engine
mirror of
https://github.com/mariadb-corporation/mariadb-columnstore-engine.git
synced 2025-07-30 19:23:07 +03:00
158 lines
4.7 KiB
C++
158 lines
4.7 KiB
C++
/* Copyright (C) 2017 MariaDB Corporation
|
|
|
|
This program is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU General Public License
|
|
as published by the Free Software Foundation; version 2 of
|
|
the License.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
|
|
MA 02110-1301, USA. */
|
|
|
|
#include <sstream>
|
|
#include <cstring>
|
|
#include <typeinfo>
|
|
#include "regr_intercept.h"
|
|
#include "bytestream.h"
|
|
#include "objectreader.h"
|
|
|
|
using namespace mcsv1sdk;
|
|
|
|
class Add_regr_intercept_ToUDAFMap
|
|
{
|
|
public:
|
|
Add_regr_intercept_ToUDAFMap()
|
|
{
|
|
UDAFMap::getMap()["regr_intercept"] = new regr_intercept();
|
|
}
|
|
};
|
|
|
|
static Add_regr_intercept_ToUDAFMap addToMap;
|
|
|
|
// Use the simple data model
|
|
struct regr_intercept_data
|
|
{
|
|
uint64_t cnt;
|
|
long double sumx;
|
|
long double sumx2; // sum of (x squared)
|
|
long double sumy;
|
|
long double sumxy; // sum of x * y
|
|
};
|
|
|
|
mcsv1_UDAF::ReturnCode regr_intercept::init(mcsv1Context* context, ColumnDatum* colTypes)
|
|
{
|
|
if (context->getParameterCount() != 2)
|
|
{
|
|
// The error message will be prepended with
|
|
// "The storage engine for the table doesn't support "
|
|
context->setErrorMessage("regr_intercept() with other than 2 arguments");
|
|
return mcsv1_UDAF::ERROR;
|
|
}
|
|
if (!(isNumeric(colTypes[0].dataType) && isNumeric(colTypes[1].dataType)))
|
|
{
|
|
// The error message will be prepended with
|
|
// "The storage engine for the table doesn't support "
|
|
context->setErrorMessage("regr_intercept() with non-numeric arguments");
|
|
return mcsv1_UDAF::ERROR;
|
|
}
|
|
|
|
context->setUserDataSize(sizeof(regr_intercept_data));
|
|
context->setResultType(execplan::CalpontSystemCatalog::DOUBLE);
|
|
context->setColWidth(8);
|
|
context->setScale(DECIMAL_NOT_SPECIFIED);
|
|
context->setPrecision(0);
|
|
context->setRunFlag(mcsv1sdk::UDAF_IGNORE_NULLS);
|
|
return mcsv1_UDAF::SUCCESS;
|
|
}
|
|
|
|
mcsv1_UDAF::ReturnCode regr_intercept::reset(mcsv1Context* context)
|
|
{
|
|
struct regr_intercept_data* data = (struct regr_intercept_data*)context->getUserData()->data;
|
|
data->cnt = 0;
|
|
data->sumx = 0.0;
|
|
data->sumx2 = 0.0;
|
|
data->sumy = 0.0;
|
|
data->sumxy = 0.0;
|
|
return mcsv1_UDAF::SUCCESS;
|
|
}
|
|
|
|
mcsv1_UDAF::ReturnCode regr_intercept::nextValue(mcsv1Context* context, ColumnDatum* valsIn)
|
|
{
|
|
double valy = toDouble(valsIn[0]);
|
|
double valx = toDouble(valsIn[1]);
|
|
struct regr_intercept_data* data = (struct regr_intercept_data*)context->getUserData()->data;
|
|
|
|
data->sumy += valy;
|
|
data->sumx += valx;
|
|
data->sumx2 += valx * valx;
|
|
|
|
data->sumxy += valx * valy;
|
|
++data->cnt;
|
|
|
|
return mcsv1_UDAF::SUCCESS;
|
|
}
|
|
|
|
mcsv1_UDAF::ReturnCode regr_intercept::subEvaluate(mcsv1Context* context, const UserData* userDataIn)
|
|
{
|
|
if (!userDataIn)
|
|
{
|
|
return mcsv1_UDAF::SUCCESS;
|
|
}
|
|
|
|
struct regr_intercept_data* outData = (struct regr_intercept_data*)context->getUserData()->data;
|
|
struct regr_intercept_data* inData = (struct regr_intercept_data*)userDataIn->data;
|
|
|
|
outData->sumx += inData->sumx;
|
|
outData->sumx2 += inData->sumx2;
|
|
outData->sumy += inData->sumy;
|
|
outData->sumxy += inData->sumxy;
|
|
outData->cnt += inData->cnt;
|
|
|
|
return mcsv1_UDAF::SUCCESS;
|
|
}
|
|
|
|
mcsv1_UDAF::ReturnCode regr_intercept::evaluate(mcsv1Context* context, static_any::any& valOut)
|
|
{
|
|
struct regr_intercept_data* data = (struct regr_intercept_data*)context->getUserData()->data;
|
|
long double N = data->cnt;
|
|
if (N > 1)
|
|
{
|
|
long double sumx = data->sumx;
|
|
long double sumy = data->sumy;
|
|
long double sumx2 = data->sumx2;
|
|
long double sumxy = data->sumxy;
|
|
// regr_intercept is AVG(y) - slope(y,x)*avg(x)
|
|
// We do some algebra and we can get a slightly smaller calculation
|
|
long double numerator = sumy * sumx2 - sumx * sumxy;
|
|
long double var_pop =
|
|
(N * sumx2) - (sumx * sumx); // Not realy var_pop, but sort of after some reductions
|
|
if (var_pop > 0)
|
|
{
|
|
valOut = static_cast<double>(numerator / var_pop);
|
|
}
|
|
}
|
|
return mcsv1_UDAF::SUCCESS;
|
|
}
|
|
|
|
mcsv1_UDAF::ReturnCode regr_intercept::dropValue(mcsv1Context* context, ColumnDatum* valsDropped)
|
|
{
|
|
double valy = toDouble(valsDropped[0]);
|
|
double valx = toDouble(valsDropped[1]);
|
|
struct regr_intercept_data* data = (struct regr_intercept_data*)context->getUserData()->data;
|
|
|
|
data->sumy -= valy;
|
|
data->sumx -= valx;
|
|
data->sumx2 -= valx * valx;
|
|
|
|
data->sumxy -= valx * valy;
|
|
--data->cnt;
|
|
|
|
return mcsv1_UDAF::SUCCESS;
|
|
}
|