1 | #include "duckdb/execution/window_segment_tree.hpp" |
2 | |
3 | #include "duckdb/common/vector_operations/vector_operations.hpp" |
4 | |
5 | #include <cmath> |
6 | |
7 | using namespace duckdb; |
8 | using namespace std; |
9 | |
10 | WindowSegmentTree::WindowSegmentTree(AggregateFunction &aggregate, TypeId result_type, ChunkCollection *input) |
11 | : aggregate(aggregate), state(aggregate.state_size()), statep(TypeId::POINTER), result_type(result_type), |
12 | input_ref(input) { |
13 | statep.SetCount(STANDARD_VECTOR_SIZE); |
14 | Value ptr_val = Value::POINTER((idx_t)state.data()); |
15 | statep.Reference(ptr_val); |
16 | statep.Normalify(STANDARD_VECTOR_SIZE); |
17 | |
18 | if (input_ref && input_ref->column_count() > 0) { |
19 | inputs.Initialize(input_ref->types); |
20 | if (aggregate.combine) { |
21 | ConstructTree(); |
22 | } |
23 | } |
24 | } |
25 | |
26 | void WindowSegmentTree::AggregateInit() { |
27 | aggregate.initialize(state.data()); |
28 | } |
29 | |
30 | Value WindowSegmentTree::AggegateFinal() { |
31 | Vector statev(Value::POINTER((idx_t)state.data())); |
32 | Vector result(result_type); |
33 | result.vector_type = VectorType::CONSTANT_VECTOR; |
34 | ConstantVector::SetNull(result, false); |
35 | aggregate.finalize(statev, result, 1); |
36 | |
37 | return result.GetValue(0); |
38 | } |
39 | |
40 | void WindowSegmentTree::WindowSegmentValue(idx_t l_idx, idx_t begin, idx_t end) { |
41 | assert(begin <= end); |
42 | if (begin == end) { |
43 | return; |
44 | } |
45 | inputs.SetCardinality(end - begin); |
46 | |
47 | idx_t start_in_vector = begin % STANDARD_VECTOR_SIZE; |
48 | Vector s; |
49 | s.Slice(statep, start_in_vector); |
50 | if (l_idx == 0) { |
51 | const auto input_count = input_ref->column_count(); |
52 | auto &chunk = input_ref->GetChunk(begin); |
53 | for (idx_t i = 0; i < input_count; ++i) { |
54 | auto &v = inputs.data[i]; |
55 | auto &vec = chunk.data[i]; |
56 | v.Slice(vec, start_in_vector); |
57 | v.Verify(inputs.size()); |
58 | } |
59 | aggregate.update(&inputs.data[0], input_count, s, inputs.size()); |
60 | } else { |
61 | assert(end - begin <= STANDARD_VECTOR_SIZE); |
62 | data_ptr_t ptr = levels_flat_native.get() + state.size() * (begin + levels_flat_start[l_idx - 1]); |
63 | Vector v(result_type, ptr); |
64 | v.Verify(inputs.size()); |
65 | aggregate.combine(v, s, inputs.size()); |
66 | } |
67 | } |
68 | |
69 | void WindowSegmentTree::ConstructTree() { |
70 | assert(input_ref); |
71 | assert(inputs.column_count() > 0); |
72 | |
73 | // compute space required to store internal nodes of segment tree |
74 | idx_t internal_nodes = 0; |
75 | idx_t level_nodes = input_ref->count; |
76 | do { |
77 | level_nodes = (idx_t)ceil((double)level_nodes / TREE_FANOUT); |
78 | internal_nodes += level_nodes; |
79 | } while (level_nodes > 1); |
80 | levels_flat_native = unique_ptr<data_t[]>(new data_t[internal_nodes * state.size()]); |
81 | levels_flat_start.push_back(0); |
82 | |
83 | idx_t levels_flat_offset = 0; |
84 | idx_t level_current = 0; |
85 | // level 0 is data itself |
86 | idx_t level_size; |
87 | while ((level_size = (level_current == 0 ? input_ref->count |
88 | : levels_flat_offset - levels_flat_start[level_current - 1])) > 1) { |
89 | for (idx_t pos = 0; pos < level_size; pos += TREE_FANOUT) { |
90 | AggregateInit(); |
91 | WindowSegmentValue(level_current, pos, min(level_size, pos + TREE_FANOUT)); |
92 | |
93 | memcpy(levels_flat_native.get() + (levels_flat_offset * state.size()), state.data(), state.size()); |
94 | |
95 | levels_flat_offset++; |
96 | } |
97 | |
98 | levels_flat_start.push_back(levels_flat_offset); |
99 | level_current++; |
100 | } |
101 | } |
102 | |
103 | Value WindowSegmentTree::Compute(idx_t begin, idx_t end) { |
104 | assert(input_ref); |
105 | |
106 | // No arguments, so just count |
107 | if (inputs.column_count() == 0) { |
108 | return Value::Numeric(result_type, end - begin); |
109 | } |
110 | |
111 | AggregateInit(); |
112 | |
113 | // Aggregate everything at once if we can't combine states |
114 | if (!aggregate.combine) { |
115 | WindowSegmentValue(0, begin, end); |
116 | return AggegateFinal(); |
117 | } |
118 | |
119 | for (idx_t l_idx = 0; l_idx < levels_flat_start.size() + 1; l_idx++) { |
120 | idx_t parent_begin = begin / TREE_FANOUT; |
121 | idx_t parent_end = end / TREE_FANOUT; |
122 | if (parent_begin == parent_end) { |
123 | WindowSegmentValue(l_idx, begin, end); |
124 | return AggegateFinal(); |
125 | } |
126 | idx_t group_begin = parent_begin * TREE_FANOUT; |
127 | if (begin != group_begin) { |
128 | WindowSegmentValue(l_idx, begin, group_begin + TREE_FANOUT); |
129 | parent_begin++; |
130 | } |
131 | idx_t group_end = parent_end * TREE_FANOUT; |
132 | if (end != group_end) { |
133 | WindowSegmentValue(l_idx, group_end, end); |
134 | } |
135 | begin = parent_begin; |
136 | end = parent_end; |
137 | } |
138 | |
139 | return AggegateFinal(); |
140 | } |
141 | |