1 | /* |
2 | * Copyright (c) 2016, 2019, Oracle and/or its affiliates. All rights reserved. |
3 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
4 | * |
5 | * This code is free software; you can redistribute it and/or modify it |
6 | * under the terms of the GNU General Public License version 2 only, as |
7 | * published by the Free Software Foundation. |
8 | * |
9 | * This code is distributed in the hope that it will be useful, but WITHOUT |
10 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
11 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
12 | * version 2 for more details (a copy is included in the LICENSE file that |
13 | * accompanied this code). |
14 | * |
15 | * You should have received a copy of the GNU General Public License version |
16 | * 2 along with this work; if not, write to the Free Software Foundation, |
17 | * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
18 | * |
19 | * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
20 | * or visit www.oracle.com if you need additional information or have any |
21 | * questions. |
22 | * |
23 | */ |
24 | |
25 | #include "precompiled.hpp" |
26 | #include "classfile/symbolTable.hpp" |
27 | #include "compiler/methodMatcher.hpp" |
28 | #include "memory/oopFactory.hpp" |
29 | #include "memory/resourceArea.hpp" |
30 | #include "oops/oop.inline.hpp" |
31 | |
32 | // The JVM specification defines the allowed characters. |
33 | // Tokens that are disallowed by the JVM specification can have |
34 | // a meaning to the parser so we need to include them here. |
35 | // The parser does not enforce all rules of the JVMS - a successful parse |
36 | // does not mean that it is an allowed name. Illegal names will |
37 | // be ignored since they never can match a class or method. |
38 | // |
39 | // '\0' and 0xf0-0xff are disallowed in constant string values |
// 0x20 ' ', 0x09 '\t' and 0x2c ',' are used in the matching
41 | // 0x5b '[' and 0x5d ']' can not be used because of the matcher |
42 | // 0x28 '(' and 0x29 ')' are used for the signature |
43 | // 0x2e '.' is always replaced before the matching |
44 | // 0x2f '/' is only used in the class name as package separator |
45 | |
// RANGEBASE is the list of raw byte values that the scanf scansets below
// accept. It enumerates 0x01-0xef but leaves out 0x09 ('\t'), 0x20 (' '),
// 0x28 '(', 0x29 ')', 0x2e '.', 0x2f '/', 0x5b '[' and 0x5d ']'.
// It has no enclosing brackets of its own so that it can be pasted into
// different scansets via string literal concatenation.
#define RANGEBASE "\x1\x2\x3\x4\x5\x6\x7\x8\xa\xb\xc\xd\xe\xf" \
    "\x10\x11\x12\x13\x14\x15\x16\x17\x18\x19\x1a\x1b\x1c\x1d\x1e\x1f" \
    "\x21\x22\x23\x24\x25\x26\x27\x2a\x2b\x2c\x2d" \
    "\x30\x31\x32\x33\x34\x35\x36\x37\x38\x39\x3a\x3b\x3c\x3d\x3e\x3f" \
    "\x40\x41\x42\x43\x44\x45\x46\x47\x48\x49\x4a\x4b\x4c\x4d\x4e\x4f" \
    "\x50\x51\x52\x53\x54\x55\x56\x57\x58\x59\x5a\x5c\x5e\x5f" \
    "\x60\x61\x62\x63\x64\x65\x66\x67\x68\x69\x6a\x6b\x6c\x6d\x6e\x6f" \
    "\x70\x71\x72\x73\x74\x75\x76\x77\x78\x79\x7a\x7b\x7c\x7d\x7e\x7f" \
    "\x80\x81\x82\x83\x84\x85\x86\x87\x88\x89\x8a\x8b\x8c\x8d\x8e\x8f" \
    "\x90\x91\x92\x93\x94\x95\x96\x97\x98\x99\x9a\x9b\x9c\x9d\x9e\x9f" \
    "\xa0\xa1\xa2\xa3\xa4\xa5\xa6\xa7\xa8\xa9\xaa\xab\xac\xad\xae\xaf" \
    "\xb0\xb1\xb2\xb3\xb4\xb5\xb6\xb7\xb8\xb9\xba\xbb\xbc\xbd\xbe\xbf" \
    "\xc0\xc1\xc2\xc3\xc4\xc5\xc6\xc7\xc8\xc9\xca\xcb\xcc\xcd\xce\xcf" \
    "\xd0\xd1\xd2\xd3\xd4\xd5\xd6\xd7\xd8\xd9\xda\xdb\xdc\xdd\xde\xdf" \
    "\xe0\xe1\xe2\xe3\xe4\xe5\xe6\xe7\xe8\xe9\xea\xeb\xec\xed\xee\xef"

// Scanset accepting '*' plus every RANGEBASE character.
#define RANGE0 "[*" RANGEBASE "]"
// Same as RANGE0 but additionally accepts '/'.
#define RANGESLASH "[*" RANGEBASE "/]"
64 | |
65 | MethodMatcher::MethodMatcher(): |
66 | _class_name(NULL) |
67 | , _method_name(NULL) |
68 | , _signature(NULL) |
69 | , _class_mode(Exact) |
70 | , _method_mode(Exact) { |
71 | } |
72 | |
73 | MethodMatcher::~MethodMatcher() { |
74 | if (_class_name != NULL) { |
75 | _class_name->decrement_refcount(); |
76 | } |
77 | if (_method_name != NULL) { |
78 | _method_name->decrement_refcount(); |
79 | } |
80 | if (_signature != NULL) { |
81 | _signature->decrement_refcount(); |
82 | } |
83 | } |
84 | |
85 | void MethodMatcher::init(Symbol* class_name, Mode class_mode, |
86 | Symbol* method_name, Mode method_mode, |
87 | Symbol* signature) { |
88 | _class_mode = class_mode; |
89 | _method_mode = method_mode; |
90 | _class_name = class_name; |
91 | _method_name = method_name; |
92 | _signature = signature; |
93 | } |
94 | |
95 | bool MethodMatcher::canonicalize(char * line, const char *& error_msg) { |
96 | char* colon = strstr(line, "::" ); |
97 | bool have_colon = (colon != NULL); |
98 | if (have_colon) { |
99 | // Don't allow multiple '::' |
100 | if (colon[2] != '\0') { |
101 | if (strstr(colon+2, "::" )) { |
102 | error_msg = "Method pattern only allows one '::' allowed" ; |
103 | return false; |
104 | } |
105 | } |
106 | |
107 | bool in_signature = false; |
108 | char* pos = line; |
109 | if (pos != NULL) { |
110 | for (char* lp = pos + 1; *lp != '\0'; lp++) { |
111 | if (*lp == '(') { |
112 | break; |
113 | } |
114 | |
115 | if (*lp == '/') { |
116 | error_msg = "Method pattern uses '/' together with '::'" ; |
117 | return false; |
118 | } |
119 | } |
120 | } |
121 | } else { |
122 | // Don't allow mixed package separators |
123 | char* pos = strchr(line, '.'); |
124 | bool in_signature = false; |
125 | if (pos != NULL) { |
126 | for (char* lp = pos + 1; *lp != '\0'; lp++) { |
127 | if (*lp == '(') { |
128 | in_signature = true; |
129 | } |
130 | |
131 | // After any comma the method pattern has ended |
132 | if (*lp == ',') { |
133 | break; |
134 | } |
135 | |
136 | if (!in_signature && (*lp == '/')) { |
137 | error_msg = "Method pattern uses mixed '/' and '.' package separators" ; |
138 | return false; |
139 | } |
140 | |
141 | if (*lp == '.') { |
142 | error_msg = "Method pattern uses multiple '.' in pattern" ; |
143 | return false; |
144 | } |
145 | } |
146 | } |
147 | } |
148 | |
149 | for (char* lp = line; *lp != '\0'; lp++) { |
150 | // Allow '.' to separate the class name from the method name. |
151 | // This is the preferred spelling of methods: |
152 | // exclude java/lang/String.indexOf(I)I |
153 | // Allow ',' for spaces (eases command line quoting). |
154 | // exclude,java/lang/String.indexOf |
155 | // For backward compatibility, allow space as separator also. |
156 | // exclude java/lang/String indexOf |
157 | // exclude,java/lang/String,indexOf |
158 | // For easy cut-and-paste of method names, allow VM output format |
159 | // as produced by Method::print_short_name: |
160 | // exclude java.lang.String::indexOf |
161 | // For simple implementation convenience here, convert them all to space. |
162 | |
163 | if (have_colon) { |
164 | if (*lp == '.') *lp = '/'; // dots build the package prefix |
165 | if (*lp == ':') *lp = ' '; |
166 | } |
167 | if (*lp == ',' || *lp == '.') *lp = ' '; |
168 | } |
169 | return true; |
170 | } |
171 | |
172 | bool MethodMatcher::match(Symbol* candidate, Symbol* match, Mode match_mode) const { |
173 | if (match_mode == Any) { |
174 | return true; |
175 | } |
176 | |
177 | if (match_mode == Exact) { |
178 | return candidate == match; |
179 | } |
180 | |
181 | ResourceMark rm; |
182 | const char * candidate_string = candidate->as_C_string(); |
183 | const char * match_string = match->as_C_string(); |
184 | |
185 | switch (match_mode) { |
186 | case Prefix: |
187 | return strstr(candidate_string, match_string) == candidate_string; |
188 | |
189 | case Suffix: { |
190 | size_t clen = strlen(candidate_string); |
191 | size_t mlen = strlen(match_string); |
192 | return clen >= mlen && strcmp(candidate_string + clen - mlen, match_string) == 0; |
193 | } |
194 | |
195 | case Substring: |
196 | return strstr(candidate_string, match_string) != NULL; |
197 | |
198 | default: |
199 | return false; |
200 | } |
201 | } |
202 | |
203 | static MethodMatcher::Mode check_mode(char name[], const char*& error_msg) { |
204 | int match = MethodMatcher::Exact; |
205 | if (name[0] == '*') { |
206 | if (strlen(name) == 1) { |
207 | return MethodMatcher::Any; |
208 | } |
209 | match |= MethodMatcher::Suffix; |
210 | memmove(name, name + 1, strlen(name + 1) + 1); |
211 | } |
212 | |
213 | size_t len = strlen(name); |
214 | if (len > 0 && name[len - 1] == '*') { |
215 | match |= MethodMatcher::Prefix; |
216 | name[--len] = '\0'; |
217 | } |
218 | |
219 | if (strlen(name) == 0) { |
220 | error_msg = "** Not a valid pattern" ; |
221 | return MethodMatcher::Any; |
222 | } |
223 | |
224 | if (strstr(name, "*" ) != NULL) { |
225 | error_msg = " Embedded * not allowed" ; |
226 | return MethodMatcher::Unknown; |
227 | } |
228 | return (MethodMatcher::Mode)match; |
229 | } |
230 | |
// Advances 'line' past any leading blanks (' ' or '\t') and adds the number
// of characters skipped to *total_bytes_read. When nothing is skipped neither
// argument is modified.
void skip_leading_spaces(char*& line, int* total_bytes_read) {
  int skipped = 0;
  while (line[skipped] == ' ' || line[skipped] == '\t') {
    skipped++;
  }
  if (skipped == 0) {
    return;
  }
  line += skipped;
  *total_bytes_read += skipped;
}
240 | |
241 | PRAGMA_DIAG_PUSH |
242 | // warning C4189: The file contains a character that cannot be represented |
243 | // in the current code page |
244 | PRAGMA_DISABLE_MSVC_WARNING(4819) |
245 | void MethodMatcher::parse_method_pattern(char*& line, const char*& error_msg, MethodMatcher* matcher) { |
246 | MethodMatcher::Mode c_match; |
247 | MethodMatcher::Mode m_match; |
248 | char class_name[256] = {0}; |
249 | char method_name[256] = {0}; |
250 | char sig[1024] = {0}; |
251 | int bytes_read = 0; |
252 | int total_bytes_read = 0; |
253 | |
254 | assert(error_msg == NULL, "Dont call here with error_msg already set" ); |
255 | |
256 | if (!MethodMatcher::canonicalize(line, error_msg)) { |
257 | assert(error_msg != NULL, "Message must be set if parsing failed" ); |
258 | return; |
259 | } |
260 | |
261 | skip_leading_spaces(line, &total_bytes_read); |
262 | |
263 | if (2 == sscanf(line, "%255" RANGESLASH "%*[ ]" "%255" RANGE0 "%n" , class_name, method_name, &bytes_read)) { |
264 | c_match = check_mode(class_name, error_msg); |
265 | m_match = check_mode(method_name, error_msg); |
266 | |
267 | if ((strchr(class_name, '<') != NULL) || (strchr(class_name, '>') != NULL)) { |
268 | error_msg = "Chars '<' and '>' not allowed in class name" ; |
269 | return; |
270 | } |
271 | if ((strchr(method_name, '<') != NULL) || (strchr(method_name, '>') != NULL)) { |
272 | if ((strncmp("<init>" , method_name, 255) != 0) && (strncmp("<clinit>" , method_name, 255) != 0)) { |
273 | error_msg = "Chars '<' and '>' only allowed in <init> and <clinit>" ; |
274 | return; |
275 | } |
276 | } |
277 | |
278 | if (c_match == MethodMatcher::Unknown || m_match == MethodMatcher::Unknown) { |
279 | assert(error_msg != NULL, "Must have been set by check_mode()" ); |
280 | return; |
281 | } |
282 | |
283 | EXCEPTION_MARK; |
284 | Symbol* signature = NULL; |
285 | line += bytes_read; |
286 | bytes_read = 0; |
287 | |
288 | skip_leading_spaces(line, &total_bytes_read); |
289 | |
290 | // there might be a signature following the method. |
291 | // signatures always begin with ( so match that by hand |
292 | if (line[0] == '(') { |
293 | line++; |
294 | sig[0] = '('; |
295 | // scan the rest |
296 | if (1 == sscanf(line, "%1022[[);/" RANGEBASE "]%n" , sig+1, &bytes_read)) { |
297 | if (strchr(sig, '*') != NULL) { |
298 | error_msg = " Wildcard * not allowed in signature" ; |
299 | return; |
300 | } |
301 | line += bytes_read; |
302 | } |
303 | signature = SymbolTable::new_symbol(sig); |
304 | } |
305 | Symbol* c_name = SymbolTable::new_symbol(class_name); |
306 | Symbol* m_name = SymbolTable::new_symbol(method_name); |
307 | |
308 | matcher->init(c_name, c_match, m_name, m_match, signature); |
309 | return; |
310 | } else { |
311 | error_msg = "Could not parse method pattern" ; |
312 | } |
313 | } |
314 | PRAGMA_DIAG_POP |
315 | |
316 | bool MethodMatcher::matches(const methodHandle& method) const { |
317 | Symbol* class_name = method->method_holder()->name(); |
318 | Symbol* method_name = method->name(); |
319 | Symbol* signature = method->signature(); |
320 | |
321 | if (match(class_name, this->class_name(), _class_mode) && |
322 | match(method_name, this->method_name(), _method_mode) && |
323 | ((this->signature() == NULL) || match(signature, this->signature(), Prefix))) { |
324 | return true; |
325 | } |
326 | return false; |
327 | } |
328 | |
329 | void MethodMatcher::print_symbol(outputStream* st, Symbol* h, Mode mode) { |
330 | if (mode == Suffix || mode == Substring || mode == Any) { |
331 | st->print("*" ); |
332 | } |
333 | if (mode != Any) { |
334 | h->print_utf8_on(st); |
335 | } |
336 | if (mode == Prefix || mode == Substring) { |
337 | st->print("*" ); |
338 | } |
339 | } |
340 | |
341 | void MethodMatcher::print_base(outputStream* st) { |
342 | ResourceMark rm; |
343 | |
344 | print_symbol(st, class_name(), _class_mode); |
345 | st->print("." ); |
346 | print_symbol(st, method_name(), _method_mode); |
347 | if (signature() != NULL) { |
348 | signature()->print_utf8_on(st); |
349 | } |
350 | } |
351 | |
352 | BasicMatcher* BasicMatcher::parse_method_pattern(char* line, const char*& error_msg) { |
353 | assert(error_msg == NULL, "Don't call here with error_msg already set" ); |
354 | BasicMatcher* bm = new BasicMatcher(); |
355 | MethodMatcher::parse_method_pattern(line, error_msg, bm); |
356 | if (error_msg != NULL) { |
357 | delete bm; |
358 | return NULL; |
359 | } |
360 | |
361 | // check for bad trailing characters |
362 | int bytes_read = 0; |
363 | sscanf(line, "%*[ \t]%n" , &bytes_read); |
364 | if (line[bytes_read] != '\0') { |
365 | error_msg = "Unrecognized trailing text after method pattern" ; |
366 | delete bm; |
367 | return NULL; |
368 | } |
369 | return bm; |
370 | } |
371 | |
372 | bool BasicMatcher::match(const methodHandle& method) { |
373 | for (BasicMatcher* current = this; current != NULL; current = current->next()) { |
374 | if (current->matches(method)) { |
375 | return true; |
376 | } |
377 | } |
378 | return false; |
379 | } |
380 | |
381 | void InlineMatcher::print(outputStream* st) { |
382 | if (_inline_action == InlineMatcher::force_inline) { |
383 | st->print("+" ); |
384 | } else { |
385 | st->print("-" ); |
386 | } |
387 | print_base(st); |
388 | } |
389 | |
390 | InlineMatcher* InlineMatcher::parse_method_pattern(char* line, const char*& error_msg) { |
391 | assert(error_msg == NULL, "Dont call here with error_msg already set" ); |
392 | InlineMatcher* im = new InlineMatcher(); |
393 | MethodMatcher::parse_method_pattern(line, error_msg, im); |
394 | if (error_msg != NULL) { |
395 | delete im; |
396 | return NULL; |
397 | } |
398 | return im; |
399 | } |
400 | |
401 | bool InlineMatcher::match(const methodHandle& method, int inline_action) { |
402 | for (InlineMatcher* current = this; current != NULL; current = current->next()) { |
403 | if (current->matches(method)) { |
404 | return (current->_inline_action == inline_action); |
405 | } |
406 | } |
407 | return false; |
408 | } |
409 | |
410 | InlineMatcher* InlineMatcher::parse_inline_pattern(char* str, const char*& error_msg) { |
411 | // check first token is +/- |
412 | InlineType _inline_action; |
413 | switch (str[0]) { |
414 | case '-': |
415 | _inline_action = InlineMatcher::dont_inline; |
416 | break; |
417 | case '+': |
418 | _inline_action = InlineMatcher::force_inline; |
419 | break; |
420 | default: |
421 | error_msg = "Missing leading inline type (+/-)" ; |
422 | return NULL; |
423 | } |
424 | str++; |
425 | |
426 | int bytes_read = 0; |
427 | assert(error_msg== NULL, "error_msg must not be set yet" ); |
428 | InlineMatcher* im = InlineMatcher::parse_method_pattern(str, error_msg); |
429 | if (im == NULL) { |
430 | assert(error_msg != NULL, "Must have error message" ); |
431 | return NULL; |
432 | } |
433 | im->set_action(_inline_action); |
434 | return im; |
435 | } |
436 | |
437 | InlineMatcher* InlineMatcher::clone() { |
438 | InlineMatcher* m = new InlineMatcher(); |
439 | m->_class_mode = _class_mode; |
440 | m->_method_mode = _method_mode; |
441 | m->_inline_action = _inline_action; |
442 | m->_class_name = _class_name; |
443 | if(_class_name != NULL) { |
444 | _class_name->increment_refcount(); |
445 | } |
446 | m->_method_name = _method_name; |
447 | if (_method_name != NULL) { |
448 | _method_name->increment_refcount(); |
449 | } |
450 | m->_signature = _signature; |
451 | if (_signature != NULL) { |
452 | _signature->increment_refcount(); |
453 | } |
454 | return m; |
455 | } |
456 | |