1
0
mirror of https://github.com/mariadb-corporation/mariadb-columnstore-engine.git synced 2025-10-30 07:25:34 +03:00
Files
mariadb-columnstore-engine/tests/rbo_hybrid.cpp

534 lines
20 KiB
C++

/*
* Unit tests for RBO parallel rewrite functionality using hybrid real/mock approach
* Uses real MariaDB ColumnStore classes where practical, minimal mocks where system infrastructure is
* required
*/
#include <gtest/gtest.h>
#include <memory>
#include <vector>
#include <string>
#include <dbcon/rbo/rbo_apply_parallel_ces.h>
#include <dbcon/execplan/calpontselectexecutionplan.h>
#include <dbcon/execplan/simplecolumn.h>
#include <dbcon/mysql/ha_mcs_impl_if.h>
class RBOHybridTest : public ::testing::Test
{
protected:
void SetUp() override
{
}
void TearDown() override
{
}
// Mock SimpleColumn that doesn't require Syscat infrastructure
class MockSimpleColumn : public execplan::SimpleColumn
{
public:
MockSimpleColumn(const std::string& schema, const std::string& table, const std::string& column)
: execplan::SimpleColumn()
{
// Set basic properties without requiring Syscat
schemaName(schema);
tableName(table);
columnName(column);
// Note: OID and other system-dependent properties are not set
}
};
// Helper to create a mock SimpleColumn
boost::shared_ptr<MockSimpleColumn> createMockSimpleColumn(const std::string& schema,
const std::string& table,
const std::string& column)
{
return boost::shared_ptr<MockSimpleColumn>(new MockSimpleColumn(schema, table, column));
}
// Helper to create a real CalpontSelectExecutionPlan
boost::shared_ptr<execplan::CalpontSelectExecutionPlan> createCSEP()
{
return boost::shared_ptr<execplan::CalpontSelectExecutionPlan>(
new execplan::CalpontSelectExecutionPlan());
}
// Helper to create a real TableAliasName (this is just a struct, no system dependencies)
execplan::CalpontSystemCatalog::TableAliasName createTableAlias(const std::string& schema,
const std::string& table,
const std::string& alias = "",
bool isColumnStore = true)
{
execplan::CalpontSystemCatalog::TableAliasName tableAlias;
tableAlias.schema = schema;
tableAlias.table = table;
tableAlias.alias = alias.empty() ? table : alias;
tableAlias.view = "";
tableAlias.fisColumnStore = isColumnStore;
return tableAlias;
}
// Mock structures needed for RBOptimizerContext
struct MockTHD
{
// Minimal THD mock for testing
uint64_t thread_id = 1;
// Add other fields as needed
};
struct MockGatewayInfo
{
std::unordered_map<
cal_impl_if::SchemaAndTableName,
std::map<std::string, std::pair<execplan::SimpleColumn, std::vector<Histogram_json_hb*>>>,
cal_impl_if::SchemaAndTableNameHash>
tableStatisticsMap;
// Helper method to find statistics for a table
std::map<std::string, std::pair<execplan::SimpleColumn, std::vector<Histogram_json_hb*>>>*
findStatisticsForATable(const cal_impl_if::SchemaAndTableName& schemaAndTable)
{
auto it = tableStatisticsMap.find(schemaAndTable);
return (it != tableStatisticsMap.end()) ? &(it->second) : nullptr;
}
};
// Create a simplified mock approach since RBOptimizerContext is complex to mock properly
// We'll create a wrapper that provides the interface we need for testing
class MockRBOptimizerContextWrapper
{
private:
MockTHD mockTHD;
MockGatewayInfo mockGWI;
public:
MockRBOptimizerContextWrapper()
{
}
// Helper to add test statistics
void addTableStatistics(const std::string& schema, const std::string& table, const std::string& column,
Histogram_json_hb* histogram)
{
cal_impl_if::SchemaAndTableName schemaAndTable = {schema, table};
execplan::SimpleColumn simpleCol; // Mock column
std::vector<Histogram_json_hb*> histograms = {histogram};
mockGWI.tableStatisticsMap[schemaAndTable][column] = std::make_pair(simpleCol, histograms);
}
// Get the mock gateway info for testing helper functions
MockGatewayInfo& getGWI()
{
return mockGWI;
}
};
// Helper to create a mock optimizer context
std::unique_ptr<MockRBOptimizerContextWrapper> createMockOptimizerContext()
{
return std::make_unique<MockRBOptimizerContextWrapper>();
}
// Mock histogram for testing (Histogram_json_hb is final, so we can't inherit)
// We'll use a simple wrapper approach instead
struct MockHistogramData
{
std::vector<uint32_t> testValues;
MockHistogramData(const std::vector<uint32_t>& values) : testValues(values)
{
}
};
boost::shared_ptr<MockHistogramData> createMockHistogram(const std::vector<uint32_t>& values)
{
return boost::shared_ptr<MockHistogramData>(new MockHistogramData(values));
}
};
// Test helper functions that work with real data structures
TEST_F(RBOHybridTest, HelperFunctionsWithRealStructures)
{
// Test someAreForeignTables with real CSEP and real TableAliasName structures
auto csep = createCSEP();
// Initially empty, should return false
EXPECT_FALSE(optimizer::details::someAreForeignTables(*csep));
// Create table lists using real TableAliasName structures
execplan::CalpontSelectExecutionPlan::TableList tables;
// Add ColumnStore table (real structure)
auto csTable = createTableAlias("test_schema", "cs_table", "", true);
tables.push_back(csTable);
csep->tableList(tables);
EXPECT_FALSE(optimizer::details::someAreForeignTables(*csep));
// Add foreign table (real structure)
auto foreignTable = createTableAlias("test_schema", "foreign_table", "", false);
tables.push_back(foreignTable);
csep->tableList(tables);
EXPECT_TRUE(optimizer::details::someAreForeignTables(*csep));
}
// Test tableIsInUnion with real CSEP and TableAliasName
TEST_F(RBOHybridTest, TableIsInUnionWithRealStructures)
{
auto csep = createCSEP();
auto testTable = createTableAlias("test_schema", "test_table");
// Test with no unions
EXPECT_FALSE(optimizer::details::tableIsInUnion(testTable, *csep));
// Create a union subquery using real CSEP
auto unionPlan = createCSEP();
execplan::CalpontSelectExecutionPlan::TableList unionTables;
unionTables.push_back(testTable);
unionPlan->tableList(unionTables);
// Add to union vector
execplan::CalpontSelectExecutionPlan::SelectList unions;
boost::shared_ptr<execplan::CalpontExecutionPlan> unionPlanBase = unionPlan;
unions.push_back(unionPlanBase);
csep->unionVec(unions);
// Test with table present in union
EXPECT_TRUE(optimizer::details::tableIsInUnion(testTable, *csep));
// Test with table not present in union
auto otherTable = createTableAlias("test_schema", "other_table");
EXPECT_FALSE(optimizer::details::tableIsInUnion(otherTable, *csep));
}
// Test real TableAliasName structure functionality
TEST_F(RBOHybridTest, RealTableAliasNameBasics)
{
// Test creating and manipulating real TableAliasName structures
auto table1 = createTableAlias("schema1", "table1", "alias1", true);
auto table2 = createTableAlias("schema2", "table2", "", false);
EXPECT_EQ("schema1", table1.schema);
EXPECT_EQ("table1", table1.table);
EXPECT_EQ("alias1", table1.alias);
EXPECT_TRUE(table1.fisColumnStore);
EXPECT_EQ("schema2", table2.schema);
EXPECT_EQ("table2", table2.table);
EXPECT_EQ("table2", table2.alias); // Should default to table name
EXPECT_FALSE(table2.fisColumnStore);
}
// Test real CalpontSelectExecutionPlan functionality
TEST_F(RBOHybridTest, RealCSEPBasics)
{
auto csep = createCSEP();
// Test table list operations with real structures
execplan::CalpontSelectExecutionPlan::TableList tables;
auto table1 = createTableAlias("schema1", "table1");
auto table2 = createTableAlias("schema2", "table2");
tables.push_back(table1);
tables.push_back(table2);
csep->tableList(tables);
const auto& retrievedTables = csep->tableList();
EXPECT_EQ(2u, retrievedTables.size());
EXPECT_EQ("schema1", retrievedTables[0].schema);
EXPECT_EQ("table1", retrievedTables[0].table);
EXPECT_EQ("schema2", retrievedTables[1].schema);
EXPECT_EQ("table2", retrievedTables[1].table);
}
// Test with mock SimpleColumn (since real one requires Syscat)
TEST_F(RBOHybridTest, MockSimpleColumnBasics)
{
auto column = createMockSimpleColumn("test_schema", "test_table", "test_column");
EXPECT_EQ("test_schema", column->schemaName());
EXPECT_EQ("test_table", column->tableName());
EXPECT_EQ("test_column", column->columnName());
// Test that we can modify column properties
column->schemaName("new_schema");
column->tableName("new_table");
column->columnName("new_column");
EXPECT_EQ("new_schema", column->schemaName());
EXPECT_EQ("new_table", column->tableName());
EXPECT_EQ("new_column", column->columnName());
}
// Test integration with real CSEP and mock columns
TEST_F(RBOHybridTest, CSEPWithMockColumns)
{
auto csep = createCSEP();
// Test returned columns operations with mock SimpleColumns
execplan::CalpontSelectExecutionPlan::ReturnedColumnList cols;
auto column1 = createMockSimpleColumn("schema1", "table1", "col1");
auto column2 = createMockSimpleColumn("schema2", "table2", "col2");
boost::shared_ptr<execplan::ReturnedColumn> col1Base = column1;
boost::shared_ptr<execplan::ReturnedColumn> col2Base = column2;
cols.push_back(col1Base);
cols.push_back(col2Base);
csep->returnedCols(cols);
const auto& retrievedCols = csep->returnedCols();
EXPECT_EQ(2u, retrievedCols.size());
// Test casting back to MockSimpleColumn
auto mockCol1 = boost::dynamic_pointer_cast<MockSimpleColumn>(retrievedCols[0]);
EXPECT_NE(nullptr, mockCol1);
if (mockCol1)
{
EXPECT_EQ("schema1", mockCol1->schemaName());
EXPECT_EQ("table1", mockCol1->tableName());
EXPECT_EQ("col1", mockCol1->columnName());
}
}
// Test helper functions that can work with mock context
TEST_F(RBOHybridTest, HelperFunctionsWithMockContext)
{
auto csep = createCSEP();
auto mockCtx = createMockOptimizerContext();
// Add mixed table types
execplan::CalpontSelectExecutionPlan::TableList tables;
auto csTable = createTableAlias("test_schema", "cs_table", "", true);
auto foreignTable = createTableAlias("test_schema", "foreign_table", "", false);
tables.push_back(csTable);
tables.push_back(foreignTable);
csep->tableList(tables);
// Test someAreForeignTables (doesn't need context)
EXPECT_TRUE(optimizer::details::someAreForeignTables(*csep));
// Note: Functions that require real RBOptimizerContext would need to be tested
// with actual system infrastructure or more sophisticated mocking
}
// Test edge cases with real structures
TEST_F(RBOHybridTest, EdgeCasesWithRealStructures)
{
// Test with empty execution plan
auto emptyCSEP = createCSEP();
EXPECT_FALSE(optimizer::details::someAreForeignTables(*emptyCSEP));
// Test with empty table alias
auto emptyTable = createTableAlias("", "", "");
EXPECT_TRUE(emptyTable.schema.empty());
EXPECT_TRUE(emptyTable.table.empty());
// Test TableAliasName comparison (if TableAliasLessThan is accessible)
auto table1 = createTableAlias("schema1", "table1");
auto table2 = createTableAlias("schema2", "table2");
// These are real structures that can be compared
EXPECT_NE(table1.schema, table2.schema);
EXPECT_NE(table1.table, table2.table);
}
// Test parallelCESFilter logic through helper functions (since direct testing requires complex
// RBOptimizerContext)
TEST_F(RBOHybridTest, ParallelCESFilterLogicTesting)
{
auto csep = createCSEP();
// Test the first condition: someAreForeignTables
// Test 1: All ColumnStore tables - should return false
execplan::CalpontSelectExecutionPlan::TableList csOnlyTables;
auto csTable1 = createTableAlias("test_schema", "cs_table1", "", true);
auto csTable2 = createTableAlias("test_schema", "cs_table2", "", true);
csOnlyTables.push_back(csTable1);
csOnlyTables.push_back(csTable2);
csep->tableList(csOnlyTables);
EXPECT_FALSE(optimizer::details::someAreForeignTables(*csep));
// Test 2: Mixed tables with foreign tables
execplan::CalpontSelectExecutionPlan::TableList mixedTables;
auto foreignTable = createTableAlias("test_schema", "foreign_table", "", false);
mixedTables.push_back(csTable1);
mixedTables.push_back(foreignTable);
csep->tableList(mixedTables);
EXPECT_TRUE(optimizer::details::someAreForeignTables(*csep));
// Test 3: Only foreign tables
execplan::CalpontSelectExecutionPlan::TableList foreignOnlyTables;
auto foreignTable1 = createTableAlias("test_schema", "foreign_table1", "", false);
auto foreignTable2 = createTableAlias("test_schema", "foreign_table2", "", false);
foreignOnlyTables.push_back(foreignTable1);
foreignOnlyTables.push_back(foreignTable2);
csep->tableList(foreignOnlyTables);
EXPECT_TRUE(optimizer::details::someAreForeignTables(*csep));
// Note: Testing the full parallelCESFilter function would require a real RBOptimizerContext
// with proper statistics setup, which is not feasible in unit tests without system infrastructure
}
// Test applyParallelCES prerequisites and data structure setup
TEST_F(RBOHybridTest, ApplyParallelCESPrerequisites)
{
auto csep = createCSEP();
// Set up a realistic test scenario that would be suitable for parallel rewrite
execplan::CalpontSelectExecutionPlan::TableList tables;
auto csTable = createTableAlias("test_schema", "cs_table", "", true);
auto foreignTable = createTableAlias("test_schema", "foreign_table", "", false);
tables.push_back(csTable);
tables.push_back(foreignTable);
csep->tableList(tables);
// Add some mock columns
execplan::CalpontSelectExecutionPlan::ReturnedColumnList cols;
auto column = createMockSimpleColumn("test_schema", "foreign_table", "id");
boost::shared_ptr<execplan::ReturnedColumn> columnBase = column;
cols.push_back(columnBase);
csep->returnedCols(cols);
// Verify the setup meets the basic requirements for parallel rewrite consideration
EXPECT_TRUE(optimizer::details::someAreForeignTables(*csep)); // Has foreign tables
EXPECT_EQ(2u, csep->tableList().size()); // Has multiple tables
EXPECT_EQ(1u, csep->returnedCols().size()); // Has columns
EXPECT_EQ(0u, csep->unionVec().size()); // No existing unions
// Verify table types are correctly identified
const auto& retrievedTables = csep->tableList();
EXPECT_TRUE(retrievedTables[0].fisColumnStore); // cs_table
EXPECT_FALSE(retrievedTables[1].fisColumnStore); // foreign_table
// Verify column can be cast back to SimpleColumn
const auto& retrievedCols = csep->returnedCols();
auto simpleCol = boost::dynamic_pointer_cast<MockSimpleColumn>(retrievedCols[0]);
EXPECT_NE(nullptr, simpleCol);
if (simpleCol)
{
EXPECT_EQ("test_schema", simpleCol->schemaName());
EXPECT_EQ("foreign_table", simpleCol->tableName());
EXPECT_EQ("id", simpleCol->columnName());
}
// Note: Testing the actual applyParallelCES function would require a real RBOptimizerContext
// with proper statistics setup, which is not feasible in unit tests without system infrastructure
}
// Test parallelCESFilter edge cases through helper functions
TEST_F(RBOHybridTest, ParallelCESFilterEdgeCases)
{
// Test 1: Empty execution plan
auto emptyCSEP = createCSEP();
EXPECT_FALSE(optimizer::details::someAreForeignTables(*emptyCSEP)); // Should return false for empty plan
// Test 2: Only foreign tables (no ColumnStore tables)
auto foreignOnlyCSEP = createCSEP();
execplan::CalpontSelectExecutionPlan::TableList foreignTables;
auto foreignTable1 = createTableAlias("test_schema", "foreign_table1", "", false);
auto foreignTable2 = createTableAlias("test_schema", "foreign_table2", "", false);
foreignTables.push_back(foreignTable1);
foreignTables.push_back(foreignTable2);
foreignOnlyCSEP->tableList(foreignTables);
// Verify that someAreForeignTables returns true
EXPECT_TRUE(optimizer::details::someAreForeignTables(*foreignOnlyCSEP));
// Test 3: Tables with union subqueries
auto unionCSEP = createCSEP();
auto mainTable = createTableAlias("test_schema", "main_table", "", false);
execplan::CalpontSelectExecutionPlan::TableList mainTables;
mainTables.push_back(mainTable);
unionCSEP->tableList(mainTables);
// Add union subquery
auto unionSubquery = createCSEP();
auto unionTable = createTableAlias("test_schema", "union_table", "", true);
execplan::CalpontSelectExecutionPlan::TableList unionTables;
unionTables.push_back(unionTable);
unionSubquery->tableList(unionTables);
execplan::CalpontSelectExecutionPlan::SelectList unions;
boost::shared_ptr<execplan::CalpontExecutionPlan> unionBase = unionSubquery;
unions.push_back(unionBase);
unionCSEP->unionVec(unions);
// Test tableIsInUnion functionality
EXPECT_TRUE(optimizer::details::tableIsInUnion(unionTable, *unionCSEP));
EXPECT_FALSE(optimizer::details::tableIsInUnion(mainTable, *unionCSEP));
}
// Test applyParallelCES scenarios through data structure validation
TEST_F(RBOHybridTest, ApplyParallelCESScenarios)
{
// Scenario 1: Query that should not be rewritten (all ColumnStore tables)
auto csOnlyCSEP = createCSEP();
execplan::CalpontSelectExecutionPlan::TableList csTables;
auto csTable1 = createTableAlias("test_schema", "cs_table1", "", true);
auto csTable2 = createTableAlias("test_schema", "cs_table2", "", true);
csTables.push_back(csTable1);
csTables.push_back(csTable2);
csOnlyCSEP->tableList(csTables);
// Should not apply parallel rewrite
EXPECT_FALSE(optimizer::details::someAreForeignTables(*csOnlyCSEP));
// Scenario 2: Query with foreign tables but no statistics
auto noStatsCSEP = createCSEP();
execplan::CalpontSelectExecutionPlan::TableList mixedTables;
auto foreignTable = createTableAlias("test_schema", "foreign_table", "", false);
mixedTables.push_back(csTable1);
mixedTables.push_back(foreignTable);
noStatsCSEP->tableList(mixedTables);
// Has foreign tables but no statistics in mock context
EXPECT_TRUE(optimizer::details::someAreForeignTables(*noStatsCSEP));
// Scenario 3: Complex query with multiple foreign tables and columns
auto complexCSEP = createCSEP();
execplan::CalpontSelectExecutionPlan::TableList complexTables;
auto foreignTable1 = createTableAlias("schema1", "foreign_table1", "ft1", false);
auto foreignTable2 = createTableAlias("schema2", "foreign_table2", "ft2", false);
auto csTable = createTableAlias("schema1", "cs_table", "ct", true);
complexTables.push_back(foreignTable1);
complexTables.push_back(foreignTable2);
complexTables.push_back(csTable);
complexCSEP->tableList(complexTables);
// Add multiple columns
execplan::CalpontSelectExecutionPlan::ReturnedColumnList complexCols;
auto col1 = createMockSimpleColumn("schema1", "foreign_table1", "id");
auto col2 = createMockSimpleColumn("schema1", "foreign_table1", "name");
auto col3 = createMockSimpleColumn("schema2", "foreign_table2", "value");
auto col4 = createMockSimpleColumn("schema1", "cs_table", "cs_id");
boost::shared_ptr<execplan::ReturnedColumn> col1Base = col1;
boost::shared_ptr<execplan::ReturnedColumn> col2Base = col2;
boost::shared_ptr<execplan::ReturnedColumn> col3Base = col3;
boost::shared_ptr<execplan::ReturnedColumn> col4Base = col4;
complexCols.push_back(col1Base);
complexCols.push_back(col2Base);
complexCols.push_back(col3Base);
complexCols.push_back(col4Base);
complexCSEP->returnedCols(complexCols);
// Verify the setup
EXPECT_TRUE(optimizer::details::someAreForeignTables(*complexCSEP));
EXPECT_EQ(3u, complexCSEP->tableList().size());
EXPECT_EQ(4u, complexCSEP->returnedCols().size());
// Test that we can identify foreign vs ColumnStore tables
const auto& retrievedTables = complexCSEP->tableList();
EXPECT_FALSE(retrievedTables[0].fisColumnStore); // foreign_table1
EXPECT_FALSE(retrievedTables[1].fisColumnStore); // foreign_table2
EXPECT_TRUE(retrievedTables[2].fisColumnStore); // cs_table
}