1
0
mirror of https://github.com/mariadb-corporation/mariadb-columnstore-engine.git synced 2025-04-18 21:44:02 +03:00
Andrey Piskunov b6808c97f1
MCOL-4530: common conjuction top rewrite (#2673)
Added logical transformation of the execplan::ParseTrees with the taking out the common factor in expression of the form "(A and B) or (A and C)" for the purposes of passing a TPCH 19 query.

Co-authored-by: Leonid Fedorov <leonid.fedorov@mariadb.com>
2023-02-27 19:23:19 +03:00

617 lines
12 KiB
C++
Executable File

/* Copyright (C) 2022 MariaDB Corporation
This program is free software; you can redistribute it and/or modify it under the terms of the GNU General
Public License as published by the Free Software Foundation; version 2 of the License. This program is
distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty
of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
You should have received a copy of the GNU General Public License along with this program; if not, write to
the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
#include <gtest/gtest.h>
#include <algorithm>
#include <memory>
#include "rewrites.h"
#include "bytestream.h"
#include "objectreader.h"
#include "unitqueries_before.h"
#include "unitqueries_after.h"
#include "query19_init.h"
#include "query19_fixed.h"
using TreePtr = std::unique_ptr<execplan::ParseTree>;
bool treeEqual(execplan::ParseTree* fst, execplan::ParseTree* snd, int depth = 0)
{
if (fst == nullptr)
{
return snd == nullptr;
}
if (snd == nullptr)
{
return fst == nullptr;
}
auto comp = execplan::NodeSemanticComparator();
if (comp(fst, snd) || comp(fst, snd))
{
std::cerr << "Data " << fst->data()->data() << " differs from " << snd->data()->data() << " at level " << depth << '\n';
return false;
}
return (treeEqual(fst->left(), snd->left(), depth + 1) && treeEqual(fst->right(), snd->right(), depth + 1)) ||
(treeEqual(fst->left(), snd->right(), depth + 1) && treeEqual(fst->right(), snd->left(), depth + 1));
}
#define REWRITE_TREE_TEST_DEBUG false
void printTree(const std::string& queryName, execplan::ParseTree* tree, const std::string& treeName)
{
#if REWRITE_TREE_TEST_DEBUG
std::string dotPath = std::string("/tmp/") + queryName;
std::string dotFile = dotPath + "." + treeName + ".dot";
tree->drawTree(dotFile);
std::string dotInvoke = "dot -Tpng ";
std::string convertCommand = dotInvoke + dotFile + " -o " + dotFile + ".png";
[[maybe_unused]] auto _ = std::system(convertCommand.c_str());
#endif
}
struct ParseTreeTestParam
{
std::string queryName;
std::vector<unsigned char>* query = nullptr;
std::vector<unsigned char>* manually_rewritten_query = nullptr;
friend std::ostream& operator<<(std::ostream& os, const ParseTreeTestParam& bar)
{
return os << bar.queryName;
}
};
class ParseTreeTest : public testing::TestWithParam<::ParseTreeTestParam> {};
TEST_P(ParseTreeTest, Rewrite)
{
messageqcpp::ByteStream stream;
stream.load(GetParam().query->data(), GetParam().query->size());
execplan::ParseTree* initialTree = execplan::ObjectReader::createParseTree(stream);
printTree(GetParam().queryName, initialTree, "initial");
TreePtr rewrittenTree;
rewrittenTree.reset(execplan::extractCommonLeafConjunctionsToRoot<true>(initialTree));
if (GetParam().manually_rewritten_query)
{
stream.load(GetParam().manually_rewritten_query->data(), GetParam().manually_rewritten_query->size());
TreePtr manuallyRewrittenTree;
manuallyRewrittenTree.reset(execplan::ObjectReader::createParseTree(stream));
bool result = treeEqual(manuallyRewrittenTree.get(), rewrittenTree.get());
printTree(GetParam().queryName, rewrittenTree.get(), "rewritten");
printTree(GetParam().queryName, manuallyRewrittenTree.get(), "reference");
EXPECT_TRUE(result);
}
else
{
bool result = treeEqual(initialTree, rewrittenTree.get());
printTree(GetParam().queryName, rewrittenTree.get(), "rewritten");
EXPECT_TRUE(result);
}
}
INSTANTIATE_TEST_SUITE_P(TreeRewrites, ParseTreeTest, testing::Values(
/*
select t1.posname, t2.posname from t1,t2
where
(
t1.id = t2.id
and t1.pos + t2.pos < 1000
)
or
(
t1.id = t2.id
and t1.pos + t2.pos > 15000
);
*/
ParseTreeTestParam{"Query_1", &__test_query_before_1, &__test_query_after_1},
/*
select t1.posname, t2.posname
from t1,t2
where
t1.id = t2.id
and (t1.pos + t2.pos < 1000);
*/
ParseTreeTestParam{"Query_2", &__test_query_before_2},
/*
select t1.posname, t2.posname
from t1,t2
where
(t1.pos + t2.pos < 1000)
or
(t1.pos + t2.pos > 16000)
or
(t1.posname < dcba);
*/
ParseTreeTestParam{"Query_3", &__test_query_before_3},
/*
select t1.posname, t2.posname
from t1,t2
where
(t1.pos > 20)
or
(t2.posname in (select t1.posname from t1 where t1.pos > 20));
*/
ParseTreeTestParam{"Query_4", &__test_query_before_4},
/*select t1.posname, t2.posname from t1,t2
where
(
t1.id = t2.id
or t1.pos + t2.pos < 1000
)
and
(
t1.id = t2.id
or t1.pos + t2.pos > 15000
);
*/
ParseTreeTestParam{"Query_5", &__test_query_before_5},
/*select t1.posname, t2.posname from t1,t2
where
(
t1.id = t2.rid
or t1.pos + t2.pos < 1000
)
and
(
t1.id = t2.id
or t1.pos + t2.pos > 15000
);
*/
ParseTreeTestParam{"Query_6", &__test_query_before_6},
/*
select t1.posname
from t1
where
t1.posname in
(
select t1.posname
from t1
where posname > 'qwer'
and
id < 30
);
*/
ParseTreeTestParam{"Query_7", &__test_query_before_7},
/*select t1.posname, t2.posname
from t1,t2
where t1.posname in
(
select t1.posname
from t1
where posname > 'qwer'
and id < 30
)
and t1.id = t2.id;
*/
ParseTreeTestParam{"Query_8", &__test_query_before_8},
/*select t1.posname, t2.posname
from t1,t2
where t1.posname in
(
select t1.posname
from t1
where posname > 'qwer'
and id < 30
) and
(
t1.id = t2.id
and t1.id = t2.rid
);
*/
ParseTreeTestParam{"Query_9", &__test_query_before_9},
/*select * from t1
where
(
posname > 'qwer'
and id < 30
)
or
(
pos > 5000
and place > 'abcdefghij'
);
*/
ParseTreeTestParam{"Query_10", &__test_query_before_10},
/*select *
from t1
where
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
);
*/
ParseTreeTestParam{"Query_11", &__test_query_before_11, &__test_query_after_11},
/*select *
from t1
where
(
pos > 5000
and id < 30
)
and
(
pos > 5000
and id < 30
);
*/
ParseTreeTestParam{"Query_12", &__test_query_before_12},
/*select *
from t1
where
(
pos > 5000
or id < 30
)
or
(
pos > 5000
or id < 30
);
*/
ParseTreeTestParam{"Query_13", &__test_query_before_13},
/*select *
from t1
where
(
id in
(
select id
from t2
where posname > 'qwer'
and rid > 10
)
)
and
(
pos > 5000
or id < 30
);
*/
ParseTreeTestParam{"Query_14", &__test_query_before_14},
/*select *
from t1
where
(
id in
(
select id
from t2
where
(
posname > 'qwer'
and rid < 10
)
or
(
posname > 'qwer'
and rid > 40
)
)
)
and
(
pos > 5000
or id < 30);
*/
ParseTreeTestParam{"Query_15", &__test_query_before_15, &__test_query_after_15},
/*
select *
from t1
where
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
);
*/
ParseTreeTestParam{"Query_16", &__test_query_before_16, &__test_query_after_16},
/*
select *
from t1
where
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
);
*/
ParseTreeTestParam{"Query_17", &__test_query_before_17, &__test_query_after_17},
/*
select *
from t1
where
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
);
*/
ParseTreeTestParam{"Query_18", &__test_query_before_18, &__test_query_after_18},
/*
select *
from t1
where
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
)
or
(
pos > 5000
and id < 30
);
*/
ParseTreeTestParam{"Query_19", &__test_query_before_19, &__test_query_after_19},
/*
select *
from t1
where
(
pos > 5000
and id < 30
)
or
(
posname > 'qwer'
and
id < 30
and
place > 'abcdefghij'
);
*/
ParseTreeTestParam{"Query_20", &__test_query_before_20, &__test_query_after_20},
/*
select *
from t1
where
(
pos > 5000
and id < 30
)
or
(
posname > 'qwer'
and
id < 30
and
place > 'abcdefghij'
)
or
(
id < 30
and
place < 'zyxqwertyu'
);
*/
ParseTreeTestParam{"Query_21", &__test_query_before_21, &__test_query_after_21},
/*
select *
from t1
where
(pos > 5000 and id < 30)
or
(posname > 'qwer' and id < 30 and place > 'abcdefghij' and pos > 5000)
or
(id < 30 and place < 'zyxqwertyu' and pos > 5000)
or
(pos > 5000 and id < 30);
*/
ParseTreeTestParam{"Query_22", &__test_query_before_22, &__test_query_after_22},
/*
select *
from t1
where
(5000 < pos and id < 30)
or
(posname > 'qwer' and id < 30 and place > 'abcdefghij' and 5000 < pos)
or
(30 > id and place < 'zyxqwertyu' and pos > 5000)
or
(pos > 5000 and id < 30);
*/
ParseTreeTestParam{"Query_23", &__test_query_before_23, &__test_query_after_23},
/*
select *
from t1
where
(pos > 5000 and id < 30 and rid > 20)
or
(posname > 'qwer' and id < 30 and place > 'abcdefghij' and pos > 5000 and rid > 20)
or
(id < 30 and place < 'zyxqwertyu' and pos > 5000 and rid > 20)
or
(pos > 5000 and id < 30 and rid > 20)
or
(pos > 5000 and id < 30 and place < 'zyxqwertyu' and rid > 20);
*/
ParseTreeTestParam{"Query_27", &__test_query_before_27, &__test_query_after_27},
/*
select *
from t1
where
(pos > 5000 and id < 30 and rid > 20 and place < 'zyxqwertyu')
or
(posname > 'qwer' and id < 30 and place > 'abcdefghij' and place < 'zyxqwertyu' and pos > 5000 and rid > 20)
or
(id < 30 and place < 'zyxqwertyu' and pos > 5000 and rid > 20)
or
(pos > 5000 and id < 30 and rid > 20 and place < 'zyxqwertyu' and place < 'zyxqwertyu');
*/
ParseTreeTestParam{"Query_28", &__test_query_before_28, &__test_query_after_28},
ParseTreeTestParam{"TPCH_19", &__query19_tree_init, &__query19_tree_fixed}
),
[](const ::testing::TestParamInfo<ParseTreeTest::ParamType>& info) {
return info.param.queryName;
}
);
struct ComparatorTestParam
{
std::string queryName;
std::string filter;
std::vector<std::string> existingFilters;
bool contains;
friend std::ostream& operator<<(std::ostream& os, const ComparatorTestParam& bar)
{
return os << bar.queryName;
}
};
class ParseTreeComparatorTest : public testing::TestWithParam<ComparatorTestParam> {};
struct TestComparator
{
bool operator()(std::unique_ptr<execplan::ParseTree> const& left,
std::unique_ptr<execplan::ParseTree> const& right) const
{
execplan::NodeSemanticComparator comp;
return comp(left.get(), right.get());
}
};
TEST_P(ParseTreeComparatorTest, CompareContains)
{
std::set<std::unique_ptr<execplan::ParseTree>, TestComparator> container;
for (auto const& f : GetParam().existingFilters)
{
container.insert(std::make_unique<execplan::ParseTree>(new execplan::SimpleFilter(f, execplan::SimpleFilter::ForTestPurposesWithoutColumnsOIDS{})));
}
auto filter = std::make_unique<execplan::ParseTree>(new execplan::SimpleFilter(
GetParam().filter, execplan::SimpleFilter::ForTestPurposesWithoutColumnsOIDS{}));
ASSERT_EQ(GetParam().contains, container.contains(filter));
}
INSTANTIATE_TEST_SUITE_P(
Comparator, ParseTreeComparatorTest,
testing::Values(ComparatorTestParam{"SimpleInverse1", "a=b", {"b=a", "a=a"}, true},
ComparatorTestParam{"SimpleInverse2", "acb=bdd", {"b>a", "a=b", "bdd=acb"}, true},
ComparatorTestParam{"SimpleInverseOpposite", "a<b", {"b>a"}, true},
ComparatorTestParam{"SimpleInverseOpposite2", "a<b", {"a=c", "d=e", "b>a", "a<=b"}, true},
ComparatorTestParam{"SimpleContains", "a<b", {"a<b", "a=b", "acb=bdd"}, true},
ComparatorTestParam{"SimpleNotContains", "a<b", {"a<b1", "a=b", "acb=bdd"}, false}),
[](const ::testing::TestParamInfo<ParseTreeComparatorTest::ParamType>& info)
{ return info.param.queryName; });