1 | /* -*- c-basic-offset: 2; indent-tabs-mode: nil -*- */ |
2 | /* |
3 | Copyright(C) 2010 Tetsuro IKEDA |
4 | Copyright(C) 2010-2013 Kentoku SHIBA |
5 | Copyright(C) 2011-2017 Kouhei Sutou <kou@clear-code.com> |
6 | |
7 | This library is free software; you can redistribute it and/or |
8 | modify it under the terms of the GNU Lesser General Public |
9 | License as published by the Free Software Foundation; either |
10 | version 2.1 of the License, or (at your option) any later version. |
11 | |
12 | This library is distributed in the hope that it will be useful, |
13 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
15 | Lesser General Public License for more details. |
16 | |
17 | You should have received a copy of the GNU Lesser General Public |
18 | License along with this library; if not, write to the Free Software |
19 | Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
20 | */ |
21 | |
22 | #include <mrn_mysql.h> |
23 | #include <mrn_mysql_compat.h> |
24 | #include <mrn_err.h> |
25 | #include <mrn_encoding.hpp> |
26 | #include <mrn_windows.hpp> |
27 | #include <mrn_table.hpp> |
28 | #include <mrn_macro.hpp> |
29 | #include <mrn_database_manager.hpp> |
30 | #include <mrn_context_pool.hpp> |
31 | #include <mrn_variables.hpp> |
32 | #include <mrn_current_thread.hpp> |
33 | |
34 | MRN_BEGIN_DECLS |
35 | |
/* Defined elsewhere in the plugin. Used below to open the Groonga database
   that belongs to the current thread's database path. */
extern mrn::DatabaseManager *mrn_db_manager;
/* Defined elsewhere in the plugin. Used below to borrow a grn_ctx with pull()
   and to hand it back with release(). */
extern mrn::ContextPool *mrn_context_pool;
38 | |
39 | struct st_mrn_snip_info |
40 | { |
41 | grn_ctx *ctx; |
42 | grn_obj *db; |
43 | bool use_shared_db; |
44 | grn_obj *snippet; |
45 | String result_str; |
46 | }; |
47 | |
48 | static my_bool mrn_snippet_prepare(st_mrn_snip_info *snip_info, UDF_ARGS *args, |
49 | char *message, grn_obj **snippet) |
50 | { |
51 | unsigned int i; |
52 | CHARSET_INFO *cs; |
53 | grn_ctx *ctx = snip_info->ctx; |
54 | long long snip_max_len; |
55 | long long snip_max_num; |
56 | long long skip_leading_spaces; |
57 | long long html_escape; |
58 | int flags = GRN_SNIP_COPY_TAG; |
59 | grn_snip_mapping *mapping = NULL; |
60 | grn_rc rc; |
61 | String *result_str = &snip_info->result_str; |
62 | |
63 | *snippet = NULL; |
64 | snip_max_len = *((long long *) args->args[1]); |
65 | snip_max_num = *((long long *) args->args[2]); |
66 | |
67 | if (args->arg_type[3] == STRING_RESULT) { |
68 | if (!(cs = get_charset_by_name(args->args[3], MYF(0)))) { |
69 | snprintf(message, MYSQL_ERRMSG_SIZE, |
70 | "Unknown charset: <%s>" , args->args[3]); |
71 | goto error; |
72 | } |
73 | } else { |
74 | uint charset_id = static_cast<uint>(*((long long *) args->args[3])); |
75 | if (!(cs = get_charset(charset_id, MYF(0)))) { |
76 | snprintf(message, MYSQL_ERRMSG_SIZE, |
77 | "Unknown charset ID: <%u>" , charset_id); |
78 | goto error; |
79 | } |
80 | } |
81 | if (!mrn::encoding::set_raw(ctx, cs)) { |
82 | snprintf(message, MYSQL_ERRMSG_SIZE, |
83 | "Unsupported charset: <%s>" , cs->name); |
84 | goto error; |
85 | } |
86 | |
87 | if (!(cs->state & (MY_CS_BINSORT | MY_CS_CSSORT))) { |
88 | flags |= GRN_SNIP_NORMALIZE; |
89 | } |
90 | |
91 | skip_leading_spaces = *((long long *) args->args[4]); |
92 | if (skip_leading_spaces) { |
93 | flags |= GRN_SNIP_SKIP_LEADING_SPACES; |
94 | } |
95 | |
96 | html_escape = *((long long *) args->args[5]); |
97 | if (html_escape) { |
98 | mapping = (grn_snip_mapping *) -1; |
99 | } |
100 | |
101 | *snippet = grn_snip_open(ctx, flags, static_cast<unsigned int>(snip_max_len), |
102 | static_cast<unsigned int>(snip_max_num), |
103 | "" , 0, "" , 0, mapping); |
104 | if (ctx->rc) { |
105 | snprintf(message, MYSQL_ERRMSG_SIZE, |
106 | "Failed to open grn_snip: <%s>" , ctx->errbuf); |
107 | goto error; |
108 | } |
109 | |
110 | for (i = 8; i < args->arg_count; i += 3) { |
111 | rc = grn_snip_add_cond(ctx, *snippet, |
112 | args->args[i], args->lengths[i], |
113 | args->args[i + 1], args->lengths[i + 1], |
114 | args->args[i + 2], args->lengths[i + 2]); |
115 | if (rc) { |
116 | snprintf(message, MYSQL_ERRMSG_SIZE, |
117 | "Failed to add a condition to grn_snip: <%s>" , ctx->errbuf); |
118 | goto error; |
119 | } |
120 | } |
121 | |
122 | result_str->set_charset(cs); |
123 | return FALSE; |
124 | |
125 | error: |
126 | if (*snippet) { |
127 | grn_obj_close(ctx, *snippet); |
128 | } |
129 | return TRUE; |
130 | } |
131 | |
132 | MRN_API my_bool mroonga_snippet_init(UDF_INIT *init, UDF_ARGS *args, char *message) |
133 | { |
134 | uint i; |
135 | st_mrn_snip_info *snip_info = NULL; |
136 | bool can_open_snippet = TRUE; |
137 | init->ptr = NULL; |
138 | if (args->arg_count < 11 || (args->arg_count - 11) % 3) |
139 | { |
140 | sprintf(message, "Incorrect number of arguments for mroonga_snippet(): %u" , |
141 | args->arg_count); |
142 | goto error; |
143 | } |
144 | if (args->arg_type[0] != STRING_RESULT) { |
145 | strcpy(message, "mroonga_snippet() requires string for 1st argument" ); |
146 | goto error; |
147 | } |
148 | if (args->arg_type[1] != INT_RESULT) { |
149 | strcpy(message, "mroonga_snippet() requires int for 2nd argument" ); |
150 | goto error; |
151 | } |
152 | if (args->arg_type[2] != INT_RESULT) { |
153 | strcpy(message, "mroonga_snippet() requires int for 3rd argument" ); |
154 | goto error; |
155 | } |
156 | if ( |
157 | args->arg_type[3] != STRING_RESULT && |
158 | args->arg_type[3] != INT_RESULT |
159 | ) { |
160 | strcpy(message, |
161 | "mroonga_snippet() requires string or int for 4th argument" ); |
162 | goto error; |
163 | } |
164 | if (args->arg_type[4] != INT_RESULT) { |
165 | strcpy(message, "mroonga_snippet() requires int for 5th argument" ); |
166 | goto error; |
167 | } |
168 | if (args->arg_type[5] != INT_RESULT) { |
169 | strcpy(message, "mroonga_snippet() requires int for 6th argument" ); |
170 | goto error; |
171 | } |
172 | for (i = 6; i < args->arg_count; i++) { |
173 | if (args->arg_type[i] != STRING_RESULT) { |
174 | sprintf(message, "mroonga_snippet() requires string for %uth argument" , |
175 | i); |
176 | goto error; |
177 | } |
178 | } |
179 | init->maybe_null = 1; |
180 | |
181 | if (!(snip_info = (st_mrn_snip_info *) mrn_my_malloc(sizeof(st_mrn_snip_info), |
182 | MYF(MY_WME | MY_ZEROFILL)))) |
183 | { |
184 | strcpy(message, "mroonga_snippet() out of memory" ); |
185 | goto error; |
186 | } |
187 | snip_info->ctx = mrn_context_pool->pull(); |
188 | { |
189 | const char *current_db_path = MRN_THD_DB_PATH(current_thd); |
190 | const char *action; |
191 | if (current_db_path) { |
192 | action = "open database" ; |
193 | mrn::Database *db; |
194 | int error = mrn_db_manager->open(current_db_path, &db); |
195 | if (error == 0) { |
196 | snip_info->db = db->get(); |
197 | grn_ctx_use(snip_info->ctx, snip_info->db); |
198 | snip_info->use_shared_db = true; |
199 | } |
200 | } else { |
201 | action = "create anonymous database" ; |
202 | snip_info->db = grn_db_create(snip_info->ctx, NULL, NULL); |
203 | snip_info->use_shared_db = false; |
204 | } |
205 | if (!snip_info->db) { |
206 | sprintf(message, |
207 | "mroonga_snippet(): failed to %s: %s" , |
208 | action, |
209 | snip_info->ctx->errbuf); |
210 | goto error; |
211 | } |
212 | } |
213 | |
214 | for (i = 1; i < args->arg_count; i++) { |
215 | if (!args->args[i]) { |
216 | can_open_snippet = FALSE; |
217 | break; |
218 | } |
219 | } |
220 | if (can_open_snippet) { |
221 | if (mrn_snippet_prepare(snip_info, args, message, &snip_info->snippet)) { |
222 | goto error; |
223 | } |
224 | } |
225 | init->ptr = (char *) snip_info; |
226 | |
227 | return FALSE; |
228 | |
229 | error: |
230 | if (snip_info) { |
231 | if (!snip_info->use_shared_db) { |
232 | grn_obj_close(snip_info->ctx, snip_info->db); |
233 | } |
234 | mrn_context_pool->release(snip_info->ctx); |
235 | my_free(snip_info); |
236 | } |
237 | return TRUE; |
238 | } |
239 | |
240 | MRN_API char *mroonga_snippet(UDF_INIT *init, UDF_ARGS *args, char *result, |
241 | unsigned long *length, char *is_null, char *error) |
242 | { |
243 | st_mrn_snip_info *snip_info = (st_mrn_snip_info *) init->ptr; |
244 | grn_ctx *ctx = snip_info->ctx; |
245 | String *result_str = &snip_info->result_str; |
246 | char *target; |
247 | unsigned int target_length; |
248 | grn_obj *snippet = NULL; |
249 | grn_rc rc; |
250 | unsigned int i, n_results, max_tagged_length, result_length; |
251 | |
252 | if (!args->args[0]) { |
253 | *is_null = 1; |
254 | return NULL; |
255 | } |
256 | *is_null = 0; |
257 | target = args->args[0]; |
258 | target_length = args->lengths[0]; |
259 | |
260 | if (!snip_info->snippet) { |
261 | for (i = 1; i < args->arg_count; i++) { |
262 | if (!args->args[i]) { |
263 | my_printf_error(ER_MRN_INVALID_NULL_VALUE_NUM, |
264 | ER_MRN_INVALID_NULL_VALUE_STR, MYF(0), |
265 | "mroonga_snippet() arguments" ); |
266 | goto error; |
267 | } |
268 | } |
269 | |
270 | if (mrn_snippet_prepare(snip_info, args, NULL, &snippet)) { |
271 | goto error; |
272 | } |
273 | } else { |
274 | snippet = snip_info->snippet; |
275 | } |
276 | |
277 | rc = grn_snip_exec(ctx, snippet, target, target_length, |
278 | &n_results, &max_tagged_length); |
279 | if (rc) { |
280 | my_printf_error(ER_MRN_ERROR_FROM_GROONGA_NUM, |
281 | ER_MRN_ERROR_FROM_GROONGA_STR, MYF(0), ctx->errbuf); |
282 | goto error; |
283 | } |
284 | |
285 | result_str->length(0); |
286 | if (result_str->reserve((args->lengths[6] + args->lengths[7] + |
287 | max_tagged_length) * n_results)) { |
288 | my_error(ER_OUT_OF_RESOURCES, MYF(0), HA_ERR_OUT_OF_MEM); |
289 | goto error; |
290 | } |
291 | for (i = 0; i < n_results; i++) { |
292 | result_str->q_append(args->args[6], args->lengths[6]); |
293 | rc = grn_snip_get_result(ctx, snippet, i, |
294 | (char *) result_str->ptr() + result_str->length(), |
295 | &result_length); |
296 | if (rc) { |
297 | my_printf_error(ER_MRN_ERROR_FROM_GROONGA_NUM, |
298 | ER_MRN_ERROR_FROM_GROONGA_STR, MYF(0), ctx->errbuf); |
299 | goto error; |
300 | } |
301 | result_str->length(result_str->length() + result_length); |
302 | result_str->q_append(args->args[7], args->lengths[7]); |
303 | } |
304 | |
305 | if (!snip_info->snippet) { |
306 | rc = grn_obj_close(ctx, snippet); |
307 | if (rc) { |
308 | my_printf_error(ER_MRN_ERROR_FROM_GROONGA_NUM, |
309 | ER_MRN_ERROR_FROM_GROONGA_STR, MYF(0), ctx->errbuf); |
310 | goto error; |
311 | } |
312 | } |
313 | |
314 | *length = result_str->length(); |
315 | return (char *) result_str->ptr(); |
316 | |
317 | error: |
318 | *error = 1; |
319 | return NULL; |
320 | } |
321 | |
322 | MRN_API void mroonga_snippet_deinit(UDF_INIT *init) |
323 | { |
324 | st_mrn_snip_info *snip_info = (st_mrn_snip_info *) init->ptr; |
325 | if (snip_info) { |
326 | if (snip_info->snippet) { |
327 | grn_obj_close(snip_info->ctx, snip_info->snippet); |
328 | } |
329 | MRN_STRING_FREE(snip_info->result_str); |
330 | if (!snip_info->use_shared_db) { |
331 | grn_obj_close(snip_info->ctx, snip_info->db); |
332 | } |
333 | mrn_context_pool->release(snip_info->ctx); |
334 | my_free(snip_info); |
335 | } |
336 | } |
337 | |
338 | MRN_END_DECLS |
339 | |