1 | // Copyright 2018 Google LLC. |
2 | // Use of this source code is governed by a BSD-style license that can be found in the LICENSE file. |
3 | #ifndef SkUTF_DEFINED |
4 | #define SkUTF_DEFINED |
5 | |
6 | #include "include/core/SkTypes.h" |
7 | #include <cstddef> |
8 | #include <cstdint> |
9 | |
10 | typedef int32_t SkUnichar; /* holds one unicode codepoint; the SkUTF::Next functions return -1 in this type on invalid input */ |
11 | |
12 | namespace SkUTF { |
13 | |
14 | /** Given `byteLength` bytes of UTF-8 starting at `utf8`, return the number of unicode |
15 | codepoints they encode. If the sequence is invalid UTF-8, return -1 instead of a count. |
16 | */ |
17 | SK_SPI int CountUTF8(const char* utf8, size_t byteLength); |
18 | |
19 | /** Given a sequence of aligned UTF-16 code units in machine-endian form starting at `utf16`, |
20 | return the number of unicode codepoints, or -1 if the sequence is invalid UTF-16. |
21 | NOTE(review): the name `byteLength` suggests a size in bytes, not in uint16_t units; confirm. |
22 | */ |
23 | SK_SPI int CountUTF16(const uint16_t* utf16, size_t byteLength); |
24 | |
25 | /** Given a sequence of aligned UTF-32 values in machine-endian form starting at `utf32`, |
26 | return the number of unicode codepoints, or -1 if the sequence is invalid UTF-32. |
27 | NOTE(review): the name `byteLength` suggests a size in bytes, not in int32_t units; confirm. |
28 | */ |
29 | SK_SPI int CountUTF32(const int32_t* utf32, size_t byteLength); |
30 | |
31 | /** Given a sequence of UTF-8 bytes beginning at `*ptr`, return the first unicode codepoint. |
32 | `*ptr` (not `ptr` itself) will be incremented to point at the next codepoint's start. If |
33 | invalid UTF-8 is encountered, `*ptr` is set to `end` and -1 is returned. |
34 | */ |
35 | SK_SPI SkUnichar NextUTF8(const char** ptr, const char* end); |
36 | |
37 | /** Given a sequence of aligned UTF-16 code units in machine-endian form beginning at `*ptr`, |
38 | return the first unicode codepoint. `*ptr` (not `ptr` itself) will be incremented to |
39 | point at the next codepoint's start. If invalid UTF-16 is encountered, |
40 | `*ptr` is set to `end` and -1 is returned. |
41 | */ |
42 | SK_SPI SkUnichar NextUTF16(const uint16_t** ptr, const uint16_t* end); |
43 | |
44 | /** Given a sequence of aligned UTF-32 values in machine-endian form beginning at `*ptr`, |
45 | return the first unicode codepoint. `*ptr` (not `ptr` itself) will be incremented to |
46 | point at the next codepoint's start. If invalid UTF-32 is encountered, |
47 | `*ptr` is set to `end` and -1 is returned. |
48 | */ |
49 | SK_SPI SkUnichar NextUTF32(const int32_t** ptr, const int32_t* end); |
50 | |
51 | constexpr unsigned kMaxBytesInUTF8Sequence = 4; /* array bound declared for the `utf8` output parameter of ToUTF8() */ |
52 | |
53 | /** Convert the unicode codepoint `uni` into UTF-8. If `utf8` is non-null, place the |
54 | result in that array (declared with room for kMaxBytesInUTF8Sequence bytes) and return the |
55 | number of bytes in the result. If `utf8` is null, simply return the number of bytes that |
56 | would be used. For invalid unicode codepoints, return 0. |
57 | */ |
58 | SK_SPI size_t ToUTF8(SkUnichar uni, char utf8[kMaxBytesInUTF8Sequence] = nullptr); |
59 | |
60 | /** Convert the unicode codepoint `uni` into UTF-16. If `utf16` is non-null, place |
61 | the result in that array (declared with room for 2 code units). Return the number of |
62 | UTF-16 code units in the result (1 or 2). If `utf16` is null, simply return the number |
63 | of code units that would be used. For invalid unicode codepoints, return 0. |
64 | */ |
65 | SK_SPI size_t ToUTF16(SkUnichar uni, uint16_t utf16[2] = nullptr); |
66 | |
67 | /** Returns the number of resulting UTF-16 values needed to convert the UTF-8 sequence in `src`. |
68 | * If `dst` is not null, it is filled with the corresponding values up to its capacity (`dstCapacity`). |
69 | * If there is an error, -1 is returned and the contents of the `dst` buffer are undefined. |
70 | */ |
71 | SK_SPI int UTF8ToUTF16(uint16_t dst[], int dstCapacity, const char src[], size_t srcByteLength); |
72 | |
73 | } // namespace SkUTF |
74 | |
75 | #endif // SkUTF_DEFINED |
76 | |