/* Copyright (C) 2017 MariaDB Corporation This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; version 2 of the License. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */ #include #include #include #include "regr_intercept.h" #include "bytestream.h" #include "objectreader.h" using namespace mcsv1sdk; class Add_regr_intercept_ToUDAFMap { public: Add_regr_intercept_ToUDAFMap() { UDAFMap::getMap()["regr_intercept"] = new regr_intercept(); } }; static Add_regr_intercept_ToUDAFMap addToMap; // Use the simple data model struct regr_intercept_data { uint64_t cnt; long double sumx; long double sumx2; // sum of (x squared) long double sumy; long double sumxy; // sum of x * y }; mcsv1_UDAF::ReturnCode regr_intercept::init(mcsv1Context* context, ColumnDatum* colTypes) { if (context->getParameterCount() != 2) { // The error message will be prepended with // "The storage engine for the table doesn't support " context->setErrorMessage("regr_intercept() with other than 2 arguments"); return mcsv1_UDAF::ERROR; } if (!(isNumeric(colTypes[0].dataType) && isNumeric(colTypes[1].dataType))) { // The error message will be prepended with // "The storage engine for the table doesn't support " context->setErrorMessage("regr_intercept() with non-numeric arguments"); return mcsv1_UDAF::ERROR; } context->setUserDataSize(sizeof(regr_intercept_data)); context->setResultType(execplan::CalpontSystemCatalog::DOUBLE); context->setColWidth(8); context->setScale(DECIMAL_NOT_SPECIFIED); context->setPrecision(0); context->setRunFlag(mcsv1sdk::UDAF_IGNORE_NULLS); return mcsv1_UDAF::SUCCESS; } mcsv1_UDAF::ReturnCode regr_intercept::reset(mcsv1Context* context) { struct regr_intercept_data* data = (struct regr_intercept_data*)context->getUserData()->data; data->cnt = 0; data->sumx = 0.0; data->sumx2 = 0.0; data->sumy = 0.0; data->sumxy = 0.0; return mcsv1_UDAF::SUCCESS; } mcsv1_UDAF::ReturnCode regr_intercept::nextValue(mcsv1Context* context, ColumnDatum* valsIn) { double valy = toDouble(valsIn[0]); double valx = toDouble(valsIn[1]); struct regr_intercept_data* data = (struct regr_intercept_data*)context->getUserData()->data; data->sumy += valy; data->sumx += valx; data->sumx2 += valx * valx; data->sumxy += valx * valy; ++data->cnt; return mcsv1_UDAF::SUCCESS; } mcsv1_UDAF::ReturnCode regr_intercept::subEvaluate(mcsv1Context* context, const UserData* userDataIn) { if (!userDataIn) { return mcsv1_UDAF::SUCCESS; } struct regr_intercept_data* outData = (struct regr_intercept_data*)context->getUserData()->data; struct regr_intercept_data* inData = (struct regr_intercept_data*)userDataIn->data; outData->sumx += inData->sumx; outData->sumx2 += inData->sumx2; outData->sumy += inData->sumy; outData->sumxy += inData->sumxy; outData->cnt += inData->cnt; return mcsv1_UDAF::SUCCESS; } mcsv1_UDAF::ReturnCode regr_intercept::evaluate(mcsv1Context* context, static_any::any& valOut) { struct regr_intercept_data* data = (struct regr_intercept_data*)context->getUserData()->data; long double N = data->cnt; if (N > 1) { long double sumx = data->sumx; long double sumy = data->sumy; long double sumx2 = data->sumx2; long double sumxy = data->sumxy; // regr_intercept is AVG(y) - slope(y,x)*avg(x) // We do some algebra and we can get a slightly smaller calculation long double numerator = sumy * sumx2 - sumx * sumxy; long double var_pop = (N * sumx2) - (sumx * sumx); // Not realy var_pop, but sort of after some reductions if (var_pop > 0) { valOut = static_cast(numerator / var_pop); } } return mcsv1_UDAF::SUCCESS; } mcsv1_UDAF::ReturnCode regr_intercept::dropValue(mcsv1Context* context, ColumnDatum* valsDropped) { double valy = toDouble(valsDropped[0]); double valx = toDouble(valsDropped[1]); struct regr_intercept_data* data = (struct regr_intercept_data*)context->getUserData()->data; data->sumy -= valy; data->sumx -= valx; data->sumx2 -= valx * valx; data->sumxy -= valx * valy; --data->cnt; return mcsv1_UDAF::SUCCESS; }