Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Support aggregation function in window #9758

Merged
merged 72 commits into from
Feb 14, 2025
Merged
Changes from 1 commit
Commits
Show all changes
72 commits
Select commit Hold shift + click to select a range
3f80eed
init
xzhangxian1008 Nov 26, 2024
171fd46
add gtest
xzhangxian1008 Nov 27, 2024
943c578
add ft
xzhangxian1008 Nov 27, 2024
e0b05a2
refine test framework
xzhangxian1008 Nov 27, 2024
75d2f12
fix compilation phase
xzhangxian1008 Nov 27, 2024
7022607
init
xzhangxian1008 Dec 4, 2024
b011bfa
codes done, need tests
xzhangxian1008 Dec 5, 2024
8628a2e
save
xzhangxian1008 Dec 12, 2024
db4e399
add tests
xzhangxian1008 Dec 13, 2024
a9360da
add sum tests
xzhangxian1008 Dec 17, 2024
e3c31bd
refine tests
xzhangxian1008 Dec 17, 2024
e3b9756
format
xzhangxian1008 Dec 17, 2024
a159857
fix bugs
xzhangxian1008 Dec 18, 2024
0d4401d
refine test
xzhangxian1008 Dec 18, 2024
9ff2bd3
fix tests
xzhangxian1008 Dec 18, 2024
a9aa879
add test for string type
xzhangxian1008 Dec 19, 2024
bf652bf
add test for SingleValueDataGeneric type
xzhangxian1008 Dec 19, 2024
61eaef0
tweaking
xzhangxian1008 Dec 20, 2024
6017780
Merge branch 'master' into wagg
xzhangxian1008 Dec 20, 2024
42a4736
tweaking
xzhangxian1008 Dec 20, 2024
df199b6
fix bugs
xzhangxian1008 Dec 23, 2024
69b766f
fix
xzhangxian1008 Dec 23, 2024
4e9d5ae
add ut
xzhangxian1008 Dec 24, 2024
5dfa63a
add ut
xzhangxian1008 Dec 24, 2024
3d912d9
cherry pick 2b9e991cdef
xzhangxian1008 Dec 26, 2024
9d37608
format
xzhangxian1008 Dec 27, 2024
95d0d1d
add ut tests
xzhangxian1008 Dec 27, 2024
a5bd59e
add test and fix bug
xzhangxian1008 Dec 27, 2024
f7c5bfb
add ut tests
xzhangxian1008 Dec 27, 2024
5abdc73
refactor tests
xzhangxian1008 Dec 30, 2024
34ea791
add tests
xzhangxian1008 Dec 30, 2024
a7ca693
add test
xzhangxian1008 Dec 30, 2024
164129a
add tests and remove cout
xzhangxian1008 Dec 31, 2024
9914549
tweaking
xzhangxian1008 Dec 31, 2024
8051af1
add ft
xzhangxian1008 Dec 31, 2024
88a7805
add tests
xzhangxian1008 Jan 2, 2025
9d8689c
add tests
xzhangxian1008 Jan 2, 2025
2eb5984
address comments
xzhangxian1008 Jan 7, 2025
f8c5d3b
address comments
xzhangxian1008 Jan 7, 2025
235f348
cp
xzhangxian1008 Jan 9, 2025
b478254
remove useless codes
xzhangxian1008 Jan 9, 2025
70c0b43
add decrease judge
xzhangxian1008 Jan 9, 2025
9d34dd6
add tests
xzhangxian1008 Jan 9, 2025
1faf815
remove useless
xzhangxian1008 Jan 13, 2025
0b6374c
change ft
xzhangxian1008 Jan 13, 2025
32e62cb
Merge branch 'master' into wagg
xzhangxian1008 Jan 13, 2025
8c75dd9
address some comments
xzhangxian1008 Jan 14, 2025
8c040db
cp
xzhangxian1008 Jan 14, 2025
d709ed2
merge
xzhangxian1008 Jan 17, 2025
18a2f3e
remove useless codes
xzhangxian1008 Jan 17, 2025
b1c77b0
refine codes
xzhangxian1008 Jan 17, 2025
c4c8237
remove useless todo
xzhangxian1008 Jan 17, 2025
c586ac6
tweaking
xzhangxian1008 Jan 20, 2025
a77fef5
merge master
xzhangxian1008 Jan 21, 2025
4a58f2e
Merge branch 'master' of ssh://github.com/pingcap/tiflash into wagg
xzhangxian1008 Jan 26, 2025
abc3cdd
fix
xzhangxian1008 Jan 26, 2025
b67a4a1
fix
xzhangxian1008 Jan 26, 2025
1814034
fix ci
xzhangxian1008 Feb 5, 2025
6655e5c
tweaking
xzhangxian1008 Feb 7, 2025
7ede92f
tweaking
xzhangxian1008 Feb 10, 2025
d71c52b
tweaking
xzhangxian1008 Feb 11, 2025
d1069fd
address comments
xzhangxian1008 Feb 11, 2025
555e17c
address comment
xzhangxian1008 Feb 12, 2025
b0e2c3f
Merge branch 'master' into wagg
xzhangxian1008 Feb 12, 2025
a6ad301
address comment
xzhangxian1008 Feb 12, 2025
868f64e
tweaking
xzhangxian1008 Feb 13, 2025
4888bf5
address comments
xzhangxian1008 Feb 13, 2025
0ac9726
tweaking
xzhangxian1008 Feb 13, 2025
94d69a6
fix
xzhangxian1008 Feb 13, 2025
f3b3f81
address comment
xzhangxian1008 Feb 13, 2025
f0d0919
Merge branch 'master' into wagg
xzhangxian1008 Feb 14, 2025
d3876a6
tweaking
xzhangxian1008 Feb 14, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Prev Previous commit
Next Next commit
add ut
xzhangxian1008 committed Dec 24, 2024
commit 5dfa63a8f1e6104a590ecf2dbae3139f784b63b5
6 changes: 6 additions & 0 deletions dbms/src/DataStreams/WindowBlockInputStream.cpp
Original file line number Diff line number Diff line change
@@ -1457,25 +1457,31 @@ void WindowTransformAction::tryCalculate()
}
peer_group_last = current_row;

RowNumber tmp = frame_start;
// Advance the frame start.
advanceFrameStart();
std::cout << "frame start: " << tmp.toString() << " -> " << frame_start.toString() << std::endl;

if (!frame_started)
{
// Wait for more input data to find the start of frame.
assert(!input_is_finished);
assert(!partition_ended);
std::cout << "frame start return" << std::endl;
return;
}

// Advance the frame end.
tmp = frame_end;
advanceFrameEnd();
std::cout << "frame end: " << tmp.toString() << " -> " << frame_end.toString() << std::endl;

if (!frame_ended)
{
// Wait for more input data to find the end of frame.
assert(!input_is_finished);
assert(!partition_ended);
std::cout << "frame end return" << std::endl;
return;
}

180 changes: 96 additions & 84 deletions dbms/src/WindowFunctions/tests/gtest_agg.cpp
Original file line number Diff line number Diff line change
@@ -36,11 +36,17 @@ class WindowAggFuncTest : public DB::tests::WindowTest
static std::vector<Int64> int_value;
};

// TODO uncomment them
std::vector<Int64> WindowAggFuncTest::partition = {0, 1, 1, 1, 1, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 4, 5, 6, 6, 6};
std::vector<Int64> WindowAggFuncTest::order = {0, 0, 1, 2, 3, 0, 1, 2, 3, 4, 0, 1, 2, 3, 4, 5, 6, 0, 0, 0, 1, 2};
std::vector<Int64> WindowAggFuncTest::order = {0, 0, 1, 3, 6, 0, 1, 4, 7, 8, 0, 4, 6, 10, 20, 40, 41, 0, 0, 0, 10, 30};
std::vector<Int64> WindowAggFuncTest::int_value
= {0, -1, 0, 4, 6, 2, 0, -4, -2, 1, 7, -3, 9, -9, -3, 2, 1, 4, -5, 2, 5, 0};

// std::vector<Int64> WindowAggFuncTest::partition = {2, 2};
// std::vector<Int64> WindowAggFuncTest::order = {7, 8};
// std::vector<Int64> WindowAggFuncTest::int_value
// = {-2, 1};

// TODO test frame position list:
// 1. prev_start = frame_start, prev_end = frame_end
// 2. prev_start < frame_start, prev_end = frame_end
@@ -55,118 +61,124 @@ std::vector<Int64> WindowAggFuncTest::int_value
// 5. add = 0

// TODO maybe we need to reset null flag for AggregateFunctionNull
TEST_F(WindowAggFuncTest, windowAggSumTests)
// TODO test duplicate order by values in range frame
TEST_F(WindowAggFuncTest, Sum)
try
{
{
// rows frame
MockWindowFrame frame;
frame.type = tipb::WindowFrameType::Rows;
frame.end = mock::MockWindowFrameBound(tipb::WindowBoundType::Following, false, 0);
std::vector<Int64> frame_start_offset{0, 1, 3, 10};
std::vector<Int64> frame_end_offset{0, 1, 3, 10};

std::vector<std::vector<std::optional<Int64>>> res{
{0, -1, 0, 4, 6, 2, 0, -4, -2, 1, 7, -3, 9, -9, -3, 2, 1, 4, -5, 2, 5, 0},
{0, -1, -1, 4, 10, 2, 2, -4, -6, -1, 7, 4, 6, 0, -12, -1, 3, 4, -5, 2, 7, 5},
{0, -1, -1, 3, 9, 2, 2, -2, -4, -5, 7, 4, 13, 4, -6, -1, -9, 4, -5, 2, 7, 7},
{0, -1, -1, 3, 9, 2, 2, -2, -4, -3, 7, 4, 13, 4, 1, 3, 4, 4, -5, 2, 7, 7}};

for (size_t i = 0; i < frame_start_offset.size(); ++i)
{
std::cout << "--------- i: " << i << std::endl;
frame.start = mock::MockWindowFrameBound(tipb::WindowBoundType::Preceding, false, frame_start_offset[i]);

executeFunctionAndAssert(
toNullableVec<Int64>(res[i]),
Sum(value_col),
{toVec<Int64>(partition), toVec<Int64>(order), toVec<Int64>(int_value)},
frame);
}

res
= {{0, -1, 0, 4, 6, 2, 0, -4, -2, 1, 7, -3, 9, -9, -3, 2, 1, 4, -5, 2, 5, 0},
{0, -1, 4, 10, 6, 2, -4, -6, -1, 1, 4, 6, 0, -12, -1, 3, 1, 4, -5, 7, 5, 0},
{0, 9, 10, 10, 6, -4, -5, -5, -1, 1, 4, -6, -1, -9, 0, 3, 1, 4, -5, 7, 5, 0},
{0, 9, 10, 10, 6, -3, -5, -5, -1, 1, 4, -3, 0, -9, 0, 3, 1, 4, -5, 7, 5, 0}};

frame.start = mock::MockWindowFrameBound(tipb::WindowBoundType::Preceding, false, 0);
for (size_t i = 0; i < frame_end_offset.size(); ++i)
{
std::cout << "--------- i: " << i << std::endl;
frame.end = mock::MockWindowFrameBound(tipb::WindowBoundType::Following, false, frame_end_offset[i]);

executeFunctionAndAssert(
toNullableVec<Int64>(res[i]),
Sum(value_col),
{toVec<Int64>(partition), toVec<Int64>(order), toVec<Int64>(int_value)},
frame);
}
}


// TODO uncomment these test after range frame is merged
// {
// // range frame
// // rows frame
// MockWindowFrame frame;
// frame.type = tipb::WindowFrameType::Rows;
// frame.start = buildRangeFrameBound(tipb::WindowBoundType::Preceding, tipb::RangeCmpDataType::Int, ORDER_COL_NAME, false, 0);
// frame.end = buildRangeFrameBound(tipb::WindowBoundType::Following, tipb::RangeCmpDataType::Int, ORDER_COL_NAME, true, 3);
// frame.end = mock::MockWindowFrameBound(tipb::WindowBoundType::Following, false, 0);
// std::vector<Int64> frame_start_offset{0, 1, 3, 10};
// std::vector<Int64> frame_end_offset{0, 1, 3, 10};

// std::vector<std::vector<Int64>> res_not_null{
// {0, 7, 6, 4, 8, 3, 3, 23, 28, 15, 4, 8, 5, 9, 15, 20, 31},
// {0, 7, 7, 4, 8, 3, 3, 23, 28, 15, 4, 8, 5, 9, 15, 20, 31},
// {0, 7, 7, 7, 8, 3, 3, 23, 38, 28, 4, 9, 8, 9, 15, 20, 31},
// {0, 7, 7, 7, 15, 3, 3, 26, 41, 38, 4, 9, 9, 18, 29, 35, 31}};
// std::vector<std::vector<std::optional<Int64>>> res{
// {0, -1, 0, 4, 6, 2, 0, -4, -2, 1, 7, -3, 9, -9, -3, 2, 1, 4, -5, 2, 5, 0},
// {0, -1, -1, 4, 10, 2, 2, -4, -6, -1, 7, 4, 6, 0, -12, -1, 3, 4, -5, 2, 7, 5},
// {0, -1, -1, 3, 9, 2, 2, -2, -4, -5, 7, 4, 13, 4, -6, -1, -9, 4, -5, 2, 7, 7},
// {0, -1, -1, 3, 9, 2, 2, -2, -4, -3, 7, 4, 13, 4, 1, 3, 4, 4, -5, 2, 7, 7}};

// for (size_t i = 0; i < frame_start_offset.size(); ++i)
// {
// frame.start = buildRangeFrameBound(tipb::WindowBoundType::Preceding, tipb::RangeCmpDataType::Int, ORDER_COL_NAME, false, 0);
// std::cout << "--------- i: " << i << std::endl;
// frame.start = mock::MockWindowFrameBound(tipb::WindowBoundType::Preceding, false, frame_start_offset[i]);

// executeFunctionAndAssert(
// toVec<Int64>(res_not_null[i]),
// toNullableVec<Int64>(res[i]),
// Sum(value_col),
// {toVec<Int64>(/*partition*/ {0, 1, 1, 1, 1, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3}),
// toVec<Int64>(/*order*/ {0, 1, 2, 4, 8, 0, 3, 10, 13, 15, 1, 3, 5, 9, 15, 20, 31}),
// toVec<Int64>(/*value*/ {0, 1, 2, 4, 8, 0, 3, 10, 13, 15, 1, 3, 5, 9, 15, 20, 31})},
// {toVec<Int64>(partition), toVec<Int64>(order), toVec<Int64>(int_value)},
// frame);
// }

// res
// = {{0, -1, 0, 4, 6, 2, 0, -4, -2, 1, 7, -3, 9, -9, -3, 2, 1, 4, -5, 2, 5, 0},
// {0, -1, 4, 10, 6, 2, -4, -6, -1, 1, 4, 6, 0, -12, -1, 3, 1, 4, -5, 7, 5, 0},
// {0, 9, 10, 10, 6, -4, -5, -5, -1, 1, 4, -6, -1, -9, 0, 3, 1, 4, -5, 7, 5, 0},
// {0, 9, 10, 10, 6, -3, -5, -5, -1, 1, 4, -3, 0, -9, 0, 3, 1, 4, -5, 7, 5, 0}};

// frame.start = mock::MockWindowFrameBound(tipb::WindowBoundType::Preceding, false, 0);
// for (size_t i = 0; i < frame_end_offset.size(); ++i)
// {
// std::cout << "--------- i: " << i << std::endl;
// frame.end = mock::MockWindowFrameBound(tipb::WindowBoundType::Following, false, frame_end_offset[i]);

// executeFunctionAndAssert(
// toNullableVec<Int64>(res[i]),
// Sum(value_col),
// {toVec<Int64>(partition), toVec<Int64>(order), toVec<Int64>(int_value)},
// frame);
// }
// }
}
CATCH
}

TEST_F(WindowAggFuncTest, windowAggCountTests)
try
{
{
// rows frame
// range frame
MockWindowFrame frame;
frame.type = tipb::WindowFrameType::Rows;
frame.start = mock::MockWindowFrameBound(tipb::WindowBoundType::Preceding, false, 0);
frame.end = mock::MockWindowFrameBound(tipb::WindowBoundType::Following, false, 3);
std::vector<Int64> frame_start_offset{0, 1, 3, 10};
frame.type = tipb::WindowFrameType::Ranges;
frame.start = buildRangeFrameBound<Int64>(tipb::WindowBoundType::Preceding, tipb::RangeCmpDataType::Int, ORDER_COL_NAME, false, 0);
frame.end = buildRangeFrameBound<Int64>(tipb::WindowBoundType::Following, tipb::RangeCmpDataType::Int, ORDER_COL_NAME, true, 0);
// std::vector<Int64> frame_end_offset{0, 1, 3, 10}; // TODO uncomment it
std::vector<Int64> frame_end_offset{0, 1, 3, 10};

// TODO uncomment it
std::vector<std::vector<std::optional<Int64>>> res{
{1, 4, 3, 2, 1, 4, 4, 3, 2, 1, 4, 4, 4, 4, 3, 2, 1},
{1, 4, 4, 3, 2, 4, 5, 4, 3, 2, 4, 5, 5, 5, 4, 3, 2},
{1, 4, 4, 4, 4, 4, 5, 5, 5, 4, 4, 5, 6, 7, 6, 5, 4},
{1, 4, 4, 4, 4, 4, 5, 5, 5, 5, 4, 5, 6, 7, 7, 7, 7}};

for (size_t i = 0; i < frame_start_offset.size(); ++i)
{0, -1, 0, 4, 6, 2, 0, -4, -2, 1, 7, -3, 9, -9, -3, 2, 1, 4, -5, 2, 5, 0},
{0, -1, 0, 4, 6, 2, 0, -4, -1, 1, 7, -3, 9, -9, -3, 3, 1, 4, -5, 2, 5, 0},
{0, 3, 4, 10, 6, 2, -4, -6, -1, 1, 7, 6, 9, -9, -3, 3, 1, 4, -5, 2, 5, 0},
{0, 9, 10, 10, 6, -3, -5, -5, -1, 1, 4, -3, 0, -12, -3, 3, 1, 4, -5, 7, 5, 0}
};

// std::vector<std::vector<std::optional<Int64>>> res{
// // {0, -1, 0, 4, 6, 2, 0, -4, -2, 1, 7, -3, 9, -9, -3, 2, 1, 4, -5, 2, 5, 0},
// {-1, 1},
// // {0, 3, 4, 10, 6, 2, -4, -6, -1, 1, 7, 6, 9, -9, -3, 3, 1, 4, -5, 2, 5, 0},
// // {0, 9, 10, 10, 6, -3, -5, -5, -1, 1, 4, -3, 0, -12, -3, 3, 1, 4, -5, 7, 5, 0}
// };

for (size_t i = 0; i < frame_end_offset.size(); i++)
{
frame.start = mock::MockWindowFrameBound(tipb::WindowBoundType::Preceding, false, frame_start_offset[i]);
std::cout << "-------- i: " << i << std::endl;
frame.end = buildRangeFrameBound<Int64>(tipb::WindowBoundType::Following, tipb::RangeCmpDataType::Int, ORDER_COL_NAME, true, frame_end_offset[i]);

executeFunctionAndAssert(
toNullableVec<Int64>(res[i]),
Count(value_col),
{toVec<Int64>(/*partition*/ {0, 1, 1, 1, 1, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3}),
toVec<Int64>(/*order*/ {0, 1, 2, 4, 8, 0, 3, 10, 13, 15, 1, 3, 5, 9, 15, 20, 31}),
toVec<Int64>(/*value*/ {0, 1, 2, 4, 8, 0, 3, 10, 13, 15, 1, 3, 5, 9, 15, 20, 31})},
Sum(value_col),
{toVec<Int64>(partition),
toVec<Int64>(order),
toVec<Int64>(int_value)},
frame);
}
}
// TODO add range frame tests after that is merged
}
CATCH

// Placeholder for the Count window-aggregation test: the body is currently
// empty, so no Count behavior is exercised here yet.
TEST_F(WindowAggFuncTest, Count)
try
{
// TODO add tests
}
CATCH

// Placeholder for the Avg window-aggregation test: the body is currently
// empty, so no Avg behavior is exercised here yet.
TEST_F(WindowAggFuncTest, Avg)
try
{
// TODO add tests
}
CATCH

// Placeholder for the Min window-aggregation test: the body is currently
// empty, so no Min behavior is exercised here yet.
TEST_F(WindowAggFuncTest, Min)
try
{
// TODO add tests
}
CATCH

// Placeholder for the Max window-aggregation test: the body is currently
// empty, so no Max behavior is exercised here yet.
TEST_F(WindowAggFuncTest, Max)
try
{
// TODO add tests
}
CATCH
} // namespace DB::tests
4 changes: 3 additions & 1 deletion tests/fullstack-test/mpp/window_agg.test
Original file line number Diff line number Diff line change
@@ -21,7 +21,9 @@ func> wait_table test test.agg

mysql> use test; set tidb_enforce_mpp=1;

//TODO ast.AggFuncSum, ast.AggFuncCount, ast.AggFuncAvg, ast.AggFuncMax, ast.AggFuncMin ...
// TODO ast.AggFuncSum, ast.AggFuncCount, ast.AggFuncAvg, ast.AggFuncMax, ast.AggFuncMin
// TODO int decimal64 decimal256 should be tested for add agg
// TODO string and duration should be tested for min/max

mysql> use test; set tidb_enforce_mpp=1; select *, sum(v) over (partition by p order by o rows between 1 preceding and 1 following) as a from test.agg;
+---+----+----+------+