1 | /* Copyright (c) 2010, Oracle and/or its affiliates. All rights reserved. |
2 | |
3 | This program is free software; you can redistribute it and/or modify |
4 | it under the terms of the GNU General Public License as published by |
5 | the Free Software Foundation; version 2 of the License. |
6 | |
7 | This program is distributed in the hope that it will be useful, |
8 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
9 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
10 | GNU General Public License for more details. |
11 | |
12 | You should have received a copy of the GNU General Public License |
13 | along with this program; if not, write to the Free Software |
14 | Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111-1301 USA */ |
15 | |
16 | #include "mariadb.h" |
17 | #include "filesort_utils.h" |
18 | #include "sql_const.h" |
19 | #include "sql_sort.h" |
20 | #include "table.h" |
21 | |
22 | |
23 | namespace { |
24 | /** |
25 | A local helper function. See comments for get_merge_buffers_cost(). |
26 | */ |
27 | double get_merge_cost(ha_rows num_elements, ha_rows num_buffers, uint elem_size) |
28 | { |
29 | return |
30 | 2.0 * ((double) num_elements * elem_size) / IO_SIZE |
31 | + (double) num_elements * log((double) num_buffers) / |
32 | (TIME_FOR_COMPARE_ROWID * M_LN2); |
33 | } |
34 | } |
35 | |
36 | /** |
37 | This is a simplified, and faster version of @see get_merge_many_buffs_cost(). |
38 | We calculate the cost of merging buffers, by simulating the actions |
39 | of @see merge_many_buff. For explanations of formulas below, |
40 | see comments for get_merge_buffers_cost(). |
41 | TODO: Use this function for Unique::get_use_cost(). |
42 | */ |
43 | double get_merge_many_buffs_cost_fast(ha_rows num_rows, |
44 | ha_rows num_keys_per_buffer, |
45 | uint elem_size) |
46 | { |
47 | ha_rows num_buffers= num_rows / num_keys_per_buffer; |
48 | ha_rows last_n_elems= num_rows % num_keys_per_buffer; |
49 | double total_cost; |
50 | |
51 | // Calculate CPU cost of sorting buffers. |
52 | total_cost= |
53 | ( num_buffers * num_keys_per_buffer * log(1.0 + num_keys_per_buffer) + |
54 | last_n_elems * log(1.0 + last_n_elems) ) |
55 | / TIME_FOR_COMPARE_ROWID; |
56 | |
57 | // Simulate behavior of merge_many_buff(). |
58 | while (num_buffers >= MERGEBUFF2) |
59 | { |
60 | // Calculate # of calls to merge_buffers(). |
61 | const ha_rows loop_limit= num_buffers - MERGEBUFF*3/2; |
62 | const ha_rows num_merge_calls= 1 + loop_limit/MERGEBUFF; |
63 | const ha_rows num_remaining_buffs= |
64 | num_buffers - num_merge_calls * MERGEBUFF; |
65 | |
66 | // Cost of merge sort 'num_merge_calls'. |
67 | total_cost+= |
68 | num_merge_calls * |
69 | get_merge_cost(num_keys_per_buffer * MERGEBUFF, MERGEBUFF, elem_size); |
70 | |
71 | // # of records in remaining buffers. |
72 | last_n_elems+= num_remaining_buffs * num_keys_per_buffer; |
73 | |
74 | // Cost of merge sort of remaining buffers. |
75 | total_cost+= |
76 | get_merge_cost(last_n_elems, 1 + num_remaining_buffs, elem_size); |
77 | |
78 | num_buffers= num_merge_calls; |
79 | num_keys_per_buffer*= MERGEBUFF; |
80 | } |
81 | |
82 | // Simulate final merge_buff call. |
83 | last_n_elems+= num_keys_per_buffer * num_buffers; |
84 | total_cost+= get_merge_cost(last_n_elems, 1 + num_buffers, elem_size); |
85 | return total_cost; |
86 | } |
87 | |
88 | /* |
89 | alloc_sort_buffer() |
90 | |
91 | Allocate buffer for sorting keys. |
92 | Try to reuse old buffer if possible. |
93 | |
94 | @return |
95 | 0 Error |
96 | # Pointer to allocated buffer |
97 | */ |
98 | |
99 | uchar **Filesort_buffer::alloc_sort_buffer(uint num_records, |
100 | uint record_length) |
101 | { |
102 | size_t buff_size; |
103 | uchar **sort_keys, **start_of_data; |
104 | DBUG_ENTER("alloc_sort_buffer" ); |
105 | DBUG_EXECUTE_IF("alloc_sort_buffer_fail" , |
106 | DBUG_SET("+d,simulate_out_of_memory" );); |
107 | |
108 | buff_size= ((size_t)num_records) * (record_length + sizeof(uchar*)); |
109 | set_if_bigger(buff_size, record_length * MERGEBUFF2); |
110 | |
111 | if (!m_idx_array.is_null()) |
112 | { |
113 | /* |
114 | Reuse old buffer if exists and is large enough |
115 | Note that we don't make the buffer smaller, as we want to be |
116 | prepared for next subquery iteration. |
117 | */ |
118 | |
119 | sort_keys= m_idx_array.array(); |
120 | if (buff_size > allocated_size) |
121 | { |
122 | /* |
123 | Better to free and alloc than realloc as we don't have to remember |
124 | the old values |
125 | */ |
126 | my_free(sort_keys); |
127 | if (!(sort_keys= (uchar**) my_malloc(buff_size, |
128 | MYF(MY_THREAD_SPECIFIC)))) |
129 | { |
130 | reset(); |
131 | DBUG_RETURN(0); |
132 | } |
133 | allocated_size= buff_size; |
134 | } |
135 | } |
136 | else |
137 | { |
138 | if (!(sort_keys= (uchar**) my_malloc(buff_size, MYF(MY_THREAD_SPECIFIC)))) |
139 | DBUG_RETURN(0); |
140 | allocated_size= buff_size; |
141 | } |
142 | |
143 | m_idx_array= Idx_array(sort_keys, num_records); |
144 | m_record_length= record_length; |
145 | start_of_data= m_idx_array.array() + m_idx_array.size(); |
146 | m_start_of_data= reinterpret_cast<uchar*>(start_of_data); |
147 | |
148 | DBUG_RETURN(m_idx_array.array()); |
149 | } |
150 | |
151 | |
152 | void Filesort_buffer::free_sort_buffer() |
153 | { |
154 | my_free(m_idx_array.array()); |
155 | m_idx_array.reset(); |
156 | m_start_of_data= NULL; |
157 | } |
158 | |
159 | |
160 | void Filesort_buffer::sort_buffer(const Sort_param *param, uint count) |
161 | { |
162 | size_t size= param->sort_length; |
163 | if (count <= 1 || size == 0) |
164 | return; |
165 | uchar **keys= get_sort_keys(); |
166 | uchar **buffer= NULL; |
167 | if (radixsort_is_appliccable(count, param->sort_length) && |
168 | (buffer= (uchar**) my_malloc(count*sizeof(char*), |
169 | MYF(MY_THREAD_SPECIFIC)))) |
170 | { |
171 | radixsort_for_str_ptr(keys, count, param->sort_length, buffer); |
172 | my_free(buffer); |
173 | return; |
174 | } |
175 | |
176 | my_qsort2(keys, count, sizeof(uchar*), get_ptr_compare(size), &size); |
177 | } |
178 | |