| 1 | #include "duckdb/function/scalar/string_functions.hpp" |
| 2 | |
| 3 | #include "duckdb/common/exception.hpp" |
| 4 | #include "duckdb/common/vector_operations/vector_operations.hpp" |
| 5 | #include "duckdb/common/vector_operations/unary_executor.hpp" |
| 6 | #include "utf8proc.hpp" |
| 7 | |
| 8 | #include <cstring> |
| 9 | |
| 10 | using namespace std; |
| 11 | |
| 12 | namespace duckdb { |
| 13 | |
| 14 | static int64_t instr(string_t haystack, string_t needle) { |
| 15 | int64_t string_position = 0; |
| 16 | |
| 17 | // Getting information about the needle and the haystack |
| 18 | auto haystack_data = haystack.GetData(); |
| 19 | auto needle_data = needle.GetData(); |
| 20 | auto location_data = strstr(haystack_data, needle_data); |
| 21 | if (location_data) { |
| 22 | auto str = reinterpret_cast<const utf8proc_uint8_t *>(haystack_data); |
| 23 | utf8proc_ssize_t len = location_data - haystack_data; |
| 24 | for (++string_position; len > 0; ++string_position) { |
| 25 | utf8proc_int32_t codepoint; |
| 26 | const auto bytes = utf8proc_iterate(str, len, &codepoint); |
| 27 | str += bytes; |
| 28 | len -= bytes; |
| 29 | } |
| 30 | } |
| 31 | |
| 32 | return string_position; |
| 33 | } |
| 34 | |
//! Binary operator adapter: forwards both arguments to instr and returns its result as TR
struct InstrOperator {
	template <class TA, class TB, class TR>
	static inline TR Operation(TA left, TB right) {
		const TR position = instr(left, right);
		return position;
	}
};
| 40 | |
| 41 | void InstrFun::RegisterFunction(BuiltinFunctions &set) { |
| 42 | set.AddFunction(ScalarFunction("instr" , // name of the function |
| 43 | {SQLType::VARCHAR, SQLType::VARCHAR}, // argument list |
| 44 | SQLType::BIGINT, // return type |
| 45 | ScalarFunction::BinaryFunction<string_t, string_t, int64_t, InstrOperator, true>)); |
| 46 | } |
| 47 | |
| 48 | } // namespace duckdb |
| 49 | |