1#ifndef SIMDJSON_ARM64_STRINGPARSING_H
2#define SIMDJSON_ARM64_STRINGPARSING_H
3
4#include "simdjson/base.h"
5#include "simdjson/arm64/simd.h"
6#include "simdjson/arm64/bitmanipulation.h"
7
8namespace simdjson {
9namespace SIMDJSON_IMPLEMENTATION {
10namespace {
11
12using namespace simd;
13
14// Holds backslashes and quotes locations.
15struct backslash_and_quote {
16public:
17 static constexpr uint32_t BYTES_PROCESSED = 32;
18 simdjson_inline static backslash_and_quote copy_and_find(const uint8_t *src, uint8_t *dst);
19
20 simdjson_inline bool has_quote_first() { return ((bs_bits - 1) & quote_bits) != 0; }
21 simdjson_inline bool has_backslash() { return bs_bits != 0; }
22 simdjson_inline int quote_index() { return trailing_zeroes(input_num: quote_bits); }
23 simdjson_inline int backslash_index() { return trailing_zeroes(input_num: bs_bits); }
24
25 uint32_t bs_bits;
26 uint32_t quote_bits;
27}; // struct backslash_and_quote
28
29simdjson_inline backslash_and_quote backslash_and_quote::copy_and_find(const uint8_t *src, uint8_t *dst) {
30 // this can read up to 31 bytes beyond the buffer size, but we require
31 // SIMDJSON_PADDING of padding
32 static_assert(SIMDJSON_PADDING >= (BYTES_PROCESSED - 1), "backslash and quote finder must process fewer than SIMDJSON_PADDING bytes");
33 simd8<uint8_t> v0(src);
34 simd8<uint8_t> v1(src + sizeof(v0));
35 v0.store(dst);
36 v1.store(dst: dst + sizeof(v0));
37
38 // Getting a 64-bit bitmask is much cheaper than multiple 16-bit bitmasks on ARM; therefore, we
39 // smash them together into a 64-byte mask and get the bitmask from there.
40 uint64_t bs_and_quote = simd8x64<bool>(v0 == '\\', v1 == '\\', v0 == '"', v1 == '"').to_bitmask();
41 return {
42 .bs_bits: uint32_t(bs_and_quote), // bs_bits
43 .quote_bits: uint32_t(bs_and_quote >> 32) // quote_bits
44 };
45}
46
47} // unnamed namespace
48} // namespace SIMDJSON_IMPLEMENTATION
49} // namespace simdjson
50
51#endif // SIMDJSON_ARM64_STRINGPARSING_H
52