google-protobuf 3.22.2 → 4.30.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (69) hide show
  1. checksums.yaml +4 -4
  2. data/ext/google/protobuf_c/Rakefile +3 -0
  3. data/ext/google/protobuf_c/convert.c +60 -86
  4. data/ext/google/protobuf_c/convert.h +3 -28
  5. data/ext/google/protobuf_c/defs.c +692 -72
  6. data/ext/google/protobuf_c/defs.h +3 -28
  7. data/ext/google/protobuf_c/extconf.rb +14 -1
  8. data/ext/google/protobuf_c/glue.c +135 -0
  9. data/ext/google/protobuf_c/map.c +89 -45
  10. data/ext/google/protobuf_c/map.h +12 -30
  11. data/ext/google/protobuf_c/message.c +169 -169
  12. data/ext/google/protobuf_c/message.h +11 -33
  13. data/ext/google/protobuf_c/protobuf.c +65 -188
  14. data/ext/google/protobuf_c/protobuf.h +27 -39
  15. data/ext/google/protobuf_c/repeated_field.c +72 -38
  16. data/ext/google/protobuf_c/repeated_field.h +11 -29
  17. data/ext/google/protobuf_c/ruby-upb.c +15064 -11220
  18. data/ext/google/protobuf_c/ruby-upb.h +10643 -5403
  19. data/ext/google/protobuf_c/shared_convert.c +69 -0
  20. data/ext/google/protobuf_c/shared_convert.h +26 -0
  21. data/ext/google/protobuf_c/shared_message.c +37 -0
  22. data/ext/google/protobuf_c/shared_message.h +21 -0
  23. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range.c +207 -0
  24. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range.h +9 -8
  25. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range_neon.inc +117 -0
  26. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range_sse.inc +272 -0
  27. data/ext/google/protobuf_c/wrap_memcpy.c +3 -26
  28. data/lib/google/protobuf/any_pb.rb +6 -8
  29. data/lib/google/protobuf/api_pb.rb +6 -26
  30. data/lib/google/protobuf/descriptor_pb.rb +21 -252
  31. data/lib/google/protobuf/duration_pb.rb +6 -8
  32. data/lib/google/protobuf/empty_pb.rb +6 -6
  33. data/lib/google/protobuf/ffi/descriptor.rb +175 -0
  34. data/lib/google/protobuf/ffi/descriptor_pool.rb +77 -0
  35. data/lib/google/protobuf/ffi/enum_descriptor.rb +183 -0
  36. data/lib/google/protobuf/ffi/ffi.rb +214 -0
  37. data/lib/google/protobuf/ffi/field_descriptor.rb +340 -0
  38. data/lib/google/protobuf/ffi/file_descriptor.rb +59 -0
  39. data/lib/google/protobuf/ffi/internal/arena.rb +60 -0
  40. data/lib/google/protobuf/ffi/internal/convert.rb +292 -0
  41. data/lib/google/protobuf/ffi/internal/pointer_helper.rb +35 -0
  42. data/lib/google/protobuf/ffi/internal/type_safety.rb +25 -0
  43. data/lib/google/protobuf/ffi/map.rb +433 -0
  44. data/lib/google/protobuf/ffi/message.rb +783 -0
  45. data/lib/google/protobuf/ffi/method_descriptor.rb +124 -0
  46. data/lib/google/protobuf/ffi/object_cache.rb +30 -0
  47. data/lib/google/protobuf/ffi/oneof_descriptor.rb +107 -0
  48. data/lib/google/protobuf/ffi/repeated_field.rb +411 -0
  49. data/lib/google/protobuf/ffi/service_descriptor.rb +117 -0
  50. data/lib/google/protobuf/field_mask_pb.rb +6 -7
  51. data/lib/google/protobuf/internal/object_cache.rb +99 -0
  52. data/lib/google/protobuf/message_exts.rb +3 -26
  53. data/lib/google/protobuf/plugin_pb.rb +6 -31
  54. data/lib/google/protobuf/repeated_field.rb +7 -31
  55. data/lib/google/protobuf/source_context_pb.rb +6 -7
  56. data/lib/google/protobuf/struct_pb.rb +6 -23
  57. data/lib/google/protobuf/timestamp_pb.rb +6 -8
  58. data/lib/google/protobuf/type_pb.rb +6 -71
  59. data/lib/google/protobuf/well_known_types.rb +5 -34
  60. data/lib/google/protobuf/wrappers_pb.rb +6 -31
  61. data/lib/google/protobuf.rb +27 -45
  62. data/lib/google/protobuf_ffi.rb +52 -0
  63. data/lib/google/protobuf_native.rb +19 -0
  64. data/lib/google/tasks/ffi.rake +100 -0
  65. metadata +92 -9
  66. data/ext/google/protobuf_c/third_party/utf8_range/naive.c +0 -92
  67. data/ext/google/protobuf_c/third_party/utf8_range/range2-neon.c +0 -157
  68. data/ext/google/protobuf_c/third_party/utf8_range/range2-sse.c +0 -170
  69. data/lib/google/protobuf/descriptor_dsl.rb +0 -465
@@ -0,0 +1,69 @@
1
+ // Protocol Buffers - Google's data interchange format
2
+ // Copyright 2023 Google Inc. All rights reserved.
3
+ //
4
+ // Use of this source code is governed by a BSD-style
5
+ // license that can be found in the LICENSE file or at
6
+ // https://developers.google.com/open-source/licenses/bsd
7
+
8
+ // -----------------------------------------------------------------------------
9
+ // Ruby <-> upb data conversion functions. Strictly free of dependencies on
10
+ // Ruby interpreter internals.
11
+
12
+ #include "shared_convert.h"
13
+
14
+ bool shared_Msgval_IsEqual(upb_MessageValue val1, upb_MessageValue val2,
15
+ upb_CType type, const upb_MessageDef* msgdef,
16
+ upb_Status* status) {
17
+ switch (type) {
18
+ case kUpb_CType_Bool:
19
+ return memcmp(&val1, &val2, 1) == 0;
20
+ case kUpb_CType_Float:
21
+ case kUpb_CType_Int32:
22
+ case kUpb_CType_UInt32:
23
+ case kUpb_CType_Enum:
24
+ return memcmp(&val1, &val2, 4) == 0;
25
+ case kUpb_CType_Double:
26
+ case kUpb_CType_Int64:
27
+ case kUpb_CType_UInt64:
28
+ return memcmp(&val1, &val2, 8) == 0;
29
+ case kUpb_CType_String:
30
+ case kUpb_CType_Bytes:
31
+ return val1.str_val.size == val2.str_val.size &&
32
+ memcmp(val1.str_val.data, val2.str_val.data, val1.str_val.size) ==
33
+ 0;
34
+ case kUpb_CType_Message: {
35
+ const upb_MiniTable* m = upb_MessageDef_MiniTable(msgdef);
36
+ const int options = 0;
37
+ return upb_Message_IsEqual(val1.msg_val, val2.msg_val, m, options);
38
+ }
39
+ default:
40
+ upb_Status_SetErrorMessage(status, "Internal error, unexpected type");
41
+ return false;
42
+ }
43
+ }
44
+
45
+ uint64_t shared_Msgval_GetHash(upb_MessageValue val, upb_CType type,
46
+ const upb_MessageDef* msgdef, uint64_t seed,
47
+ upb_Status* status) {
48
+ switch (type) {
49
+ case kUpb_CType_Bool:
50
+ return _upb_Hash(&val, 1, seed);
51
+ case kUpb_CType_Float:
52
+ case kUpb_CType_Int32:
53
+ case kUpb_CType_UInt32:
54
+ case kUpb_CType_Enum:
55
+ return _upb_Hash(&val, 4, seed);
56
+ case kUpb_CType_Double:
57
+ case kUpb_CType_Int64:
58
+ case kUpb_CType_UInt64:
59
+ return _upb_Hash(&val, 8, seed);
60
+ case kUpb_CType_String:
61
+ case kUpb_CType_Bytes:
62
+ return _upb_Hash(val.str_val.data, val.str_val.size, seed);
63
+ case kUpb_CType_Message:
64
+ return shared_Message_Hash(val.msg_val, msgdef, seed, status);
65
+ default:
66
+ upb_Status_SetErrorMessage(status, "Internal error, unexpected type");
67
+ return 0;
68
+ }
69
+ }
@@ -0,0 +1,26 @@
1
+ // Protocol Buffers - Google's data interchange format
2
+ // Copyright 2023 Google Inc. All rights reserved.
3
+ //
4
+ // Use of this source code is governed by a BSD-style
5
+ // license that can be found in the LICENSE file or at
6
+ // https://developers.google.com/open-source/licenses/bsd
7
+
8
+ // -----------------------------------------------------------------------------
9
+ // Ruby <-> upb data conversion functions. Strictly free of dependencies on
10
+ // Ruby interpreter internals.
11
+
12
+ #ifndef RUBY_PROTOBUF_SHARED_CONVERT_H_
13
+ #define RUBY_PROTOBUF_SHARED_CONVERT_H_
14
+
15
+ #include "ruby-upb.h"
16
+ #include "shared_message.h"
17
+
18
+ bool shared_Msgval_IsEqual(upb_MessageValue val1, upb_MessageValue val2,
19
+ upb_CType type, const upb_MessageDef* msgdef,
20
+ upb_Status* status);
21
+
22
+ uint64_t shared_Msgval_GetHash(upb_MessageValue val, upb_CType type,
23
+ const upb_MessageDef* msgdef, uint64_t seed,
24
+ upb_Status* status);
25
+
26
+ #endif // RUBY_PROTOBUF_SHARED_CONVERT_H_
@@ -0,0 +1,37 @@
1
+ // Protocol Buffers - Google's data interchange format
2
+ // Copyright 2023 Google Inc. All rights reserved.
3
+ //
4
+ // Use of this source code is governed by a BSD-style
5
+ // license that can be found in the LICENSE file or at
6
+ // https://developers.google.com/open-source/licenses/bsd
7
+
8
+ // -----------------------------------------------------------------------------
9
+ // Ruby Message functions. Strictly free of dependencies on
10
+ // Ruby interpreter internals.
11
+
12
+ #include "shared_message.h"
13
+
14
+ // Support function for Message_Hash. Returns a hash value for the given
15
+ // message.
16
+ uint64_t shared_Message_Hash(const upb_Message* msg, const upb_MessageDef* m,
17
+ uint64_t seed, upb_Status* status) {
18
+ upb_Arena* arena = upb_Arena_New();
19
+ char* data;
20
+ size_t size;
21
+
22
+ // Hash a deterministically serialized payloads with no unknown fields.
23
+ upb_EncodeStatus encode_status = upb_Encode(
24
+ msg, upb_MessageDef_MiniTable(m),
25
+ kUpb_EncodeOption_SkipUnknown | kUpb_EncodeOption_Deterministic, arena,
26
+ &data, &size);
27
+
28
+ if (encode_status == kUpb_EncodeStatus_Ok) {
29
+ uint64_t ret = _upb_Hash(data, size, seed);
30
+ upb_Arena_Free(arena);
31
+ return ret;
32
+ }
33
+
34
+ upb_Arena_Free(arena);
35
+ upb_Status_SetErrorMessage(status, "Error calculating hash");
36
+ return 0;
37
+ }
@@ -0,0 +1,21 @@
1
+ // Protocol Buffers - Google's data interchange format
2
+ // Copyright 2023 Google Inc. All rights reserved.
3
+ //
4
+ // Use of this source code is governed by a BSD-style
5
+ // license that can be found in the LICENSE file or at
6
+ // https://developers.google.com/open-source/licenses/bsd
7
+
8
+ // -----------------------------------------------------------------------------
9
+ // Ruby Message functions. Strictly free of dependencies on
10
+ // Ruby interpreter internals.
11
+
12
+ #ifndef RUBY_PROTOBUF_SHARED_MESSAGE_H_
13
+ #define RUBY_PROTOBUF_SHARED_MESSAGE_H_
14
+
15
+ #include "ruby-upb.h"
16
+
17
+ // Returns a hash value for the given message.
18
+ uint64_t shared_Message_Hash(const upb_Message* msg, const upb_MessageDef* m,
19
+ uint64_t seed, upb_Status* status);
20
+
21
+ #endif // RUBY_PROTOBUF_SHARED_MESSAGE_H_
@@ -0,0 +1,207 @@
1
+ // Copyright 2023 Google LLC
2
+ //
3
+ // Use of this source code is governed by an MIT-style
4
+ // license that can be found in the LICENSE file or at
5
+ // https://opensource.org/licenses/MIT.
6
+
7
+ /* This is a wrapper for the Google range-sse.cc algorithm which checks whether
8
+ * a sequence of bytes is a valid UTF-8 sequence and finds the longest valid
9
+ * prefix of the UTF-8 sequence.
10
+ *
11
+ * The key difference is that it checks for as much ASCII symbols as possible
12
+ * and then falls back to the range-sse.cc algorithm. The changes to the
13
+ * algorithm are cosmetic, mostly to trick the clang compiler to produce optimal
14
+ * code.
15
+ *
16
+ * For API see the utf8_validity.h header.
17
+ */
18
+ #include "utf8_range.h"
19
+
20
+ #include <stddef.h>
21
+ #include <stdint.h>
22
+ #include <string.h>
23
+
24
+ #if defined(__GNUC__)
25
+ #define FORCE_INLINE_ATTR __attribute__((always_inline))
26
+ #elif defined(_MSC_VER)
27
+ #define FORCE_INLINE_ATTR __forceinline
28
+ #else
29
+ #define FORCE_INLINE_ATTR
30
+ #endif
31
+
32
+ static FORCE_INLINE_ATTR inline uint64_t utf8_range_UnalignedLoad64(
33
+ const void* p) {
34
+ uint64_t t;
35
+ memcpy(&t, p, sizeof t);
36
+ return t;
37
+ }
38
+
39
+ static FORCE_INLINE_ATTR inline int utf8_range_AsciiIsAscii(unsigned char c) {
40
+ return c < 128;
41
+ }
42
+
43
+ static FORCE_INLINE_ATTR inline int utf8_range_IsTrailByteOk(const char c) {
44
+ return (int8_t)(c) <= (int8_t)(0xBF);
45
+ }
46
+
47
+ /* If return_position is false then it returns 1 if |data| is a valid utf8
48
+ * sequence, otherwise returns 0.
49
+ * If return_position is set to true, returns the length in bytes of the prefix
50
+ of |data| that is all structurally valid UTF-8.
51
+ */
52
+ static size_t utf8_range_ValidateUTF8Naive(const char* data, const char* end,
53
+ int return_position) {
54
+ /* We return err_pos in the loop which is always 0 if !return_position */
55
+ size_t err_pos = 0;
56
+ size_t codepoint_bytes = 0;
57
+ /* The early check is done because of early continue's on codepoints of all
58
+ * sizes, i.e. we first check for ascii and if it is, we call continue, then
59
+ * for 2 byte codepoints, etc. This is done in order to reduce indentation and
60
+ * improve readability of the codepoint validity check.
61
+ */
62
+ while (data + codepoint_bytes < end) {
63
+ if (return_position) {
64
+ err_pos += codepoint_bytes;
65
+ }
66
+ data += codepoint_bytes;
67
+ const size_t len = end - data;
68
+ const unsigned char byte1 = data[0];
69
+
70
+ /* We do not skip many ascii bytes at the same time as this function is
71
+ used for tail checking (< 16 bytes) and for non x86 platforms. We also
72
+ don't think that cases where non-ASCII codepoints are followed by ascii
73
+ happen often. For small strings it also introduces some penalty. For
74
+ purely ascii UTF8 strings (which is the overwhelming case) we call
75
+ SkipAscii function which is multiplatform and extremely fast.
76
+ */
77
+ /* [00..7F] ASCII -> 1 byte */
78
+ if (utf8_range_AsciiIsAscii(byte1)) {
79
+ codepoint_bytes = 1;
80
+ continue;
81
+ }
82
+ /* [C2..DF], [80..BF] -> 2 bytes */
83
+ if (len >= 2 && byte1 >= 0xC2 && byte1 <= 0xDF &&
84
+ utf8_range_IsTrailByteOk(data[1])) {
85
+ codepoint_bytes = 2;
86
+ continue;
87
+ }
88
+ if (len >= 3) {
89
+ const unsigned char byte2 = data[1];
90
+ const unsigned char byte3 = data[2];
91
+
92
+ /* Is byte2, byte3 between [0x80, 0xBF]
93
+ * Check for 0x80 was done above.
94
+ */
95
+ if (!utf8_range_IsTrailByteOk(byte2) ||
96
+ !utf8_range_IsTrailByteOk(byte3)) {
97
+ return err_pos;
98
+ }
99
+
100
+ if (/* E0, A0..BF, 80..BF */
101
+ ((byte1 == 0xE0 && byte2 >= 0xA0) ||
102
+ /* E1..EC, 80..BF, 80..BF */
103
+ (byte1 >= 0xE1 && byte1 <= 0xEC) ||
104
+ /* ED, 80..9F, 80..BF */
105
+ (byte1 == 0xED && byte2 <= 0x9F) ||
106
+ /* EE..EF, 80..BF, 80..BF */
107
+ (byte1 >= 0xEE && byte1 <= 0xEF))) {
108
+ codepoint_bytes = 3;
109
+ continue;
110
+ }
111
+ if (len >= 4) {
112
+ const unsigned char byte4 = data[3];
113
+ /* Is byte4 between 0x80 ~ 0xBF */
114
+ if (!utf8_range_IsTrailByteOk(byte4)) {
115
+ return err_pos;
116
+ }
117
+
118
+ if (/* F0, 90..BF, 80..BF, 80..BF */
119
+ ((byte1 == 0xF0 && byte2 >= 0x90) ||
120
+ /* F1..F3, 80..BF, 80..BF, 80..BF */
121
+ (byte1 >= 0xF1 && byte1 <= 0xF3) ||
122
+ /* F4, 80..8F, 80..BF, 80..BF */
123
+ (byte1 == 0xF4 && byte2 <= 0x8F))) {
124
+ codepoint_bytes = 4;
125
+ continue;
126
+ }
127
+ }
128
+ }
129
+ return err_pos;
130
+ }
131
+ if (return_position) {
132
+ err_pos += codepoint_bytes;
133
+ }
134
+ /* if return_position is false, this returns 1.
135
+ * if return_position is true, this returns err_pos.
136
+ */
137
+ return err_pos + (1 - return_position);
138
+ }
139
+
140
+ #if defined(__SSE4_1__) || (defined(__ARM_NEON) && defined(__ARM_64BIT_STATE))
141
+ /* Returns the number of bytes needed to skip backwards to get to the first
142
+ byte of codepoint.
143
+ */
144
+ static inline int utf8_range_CodepointSkipBackwards(int32_t codepoint_word) {
145
+ const int8_t* const codepoint = (const int8_t*)(&codepoint_word);
146
+ if (!utf8_range_IsTrailByteOk(codepoint[3])) {
147
+ return 1;
148
+ } else if (!utf8_range_IsTrailByteOk(codepoint[2])) {
149
+ return 2;
150
+ } else if (!utf8_range_IsTrailByteOk(codepoint[1])) {
151
+ return 3;
152
+ }
153
+ return 0;
154
+ }
155
+ #endif // __SSE4_1__
156
+
157
+ /* Skipping over ASCII as much as possible, per 8 bytes. It is intentional
158
+ as most strings to check for validity consist only of 1 byte codepoints.
159
+ */
160
+ static inline const char* utf8_range_SkipAscii(const char* data,
161
+ const char* end) {
162
+ while (8 <= end - data &&
163
+ (utf8_range_UnalignedLoad64(data) & 0x8080808080808080) == 0) {
164
+ data += 8;
165
+ }
166
+ while (data < end && utf8_range_AsciiIsAscii(*data)) {
167
+ ++data;
168
+ }
169
+ return data;
170
+ }
171
+
172
+ #if defined(__SSE4_1__)
173
+ #include "utf8_range_sse.inc"
174
+ #elif defined(__ARM_NEON) && defined(__ARM_64BIT_STATE)
175
+ #include "utf8_range_neon.inc"
176
+ #endif
177
+
178
+ static FORCE_INLINE_ATTR inline size_t utf8_range_Validate(
179
+ const char* data, size_t len, int return_position) {
180
+ if (len == 0) return 1 - return_position;
181
+ // Save buffer start address for later use
182
+ const char* const data_original = data;
183
+ const char* const end = data + len;
184
+ data = utf8_range_SkipAscii(data, end);
185
+ /* SIMD algorithm always outperforms the naive version for any data of
186
+ length >=16.
187
+ */
188
+ if (end - data < 16) {
189
+ return (return_position ? (data - data_original) : 0) +
190
+ utf8_range_ValidateUTF8Naive(data, end, return_position);
191
+ }
192
+ #if defined(__SSE4_1__) || (defined(__ARM_NEON) && defined(__ARM_64BIT_STATE))
193
+ return utf8_range_ValidateUTF8Simd(
194
+ data_original, data, end, return_position);
195
+ #else
196
+ return (return_position ? (data - data_original) : 0) +
197
+ utf8_range_ValidateUTF8Naive(data, end, return_position);
198
+ #endif
199
+ }
200
+
201
+ int utf8_range_IsValid(const char* data, size_t len) {
202
+ return utf8_range_Validate(data, len, /*return_position=*/0) != 0;
203
+ }
204
+
205
+ size_t utf8_range_ValidPrefix(const char* data, size_t len) {
206
+ return utf8_range_Validate(data, len, /*return_position=*/1);
207
+ }
@@ -1,18 +1,19 @@
1
1
  #ifndef THIRD_PARTY_UTF8_RANGE_UTF8_RANGE_H_
2
2
  #define THIRD_PARTY_UTF8_RANGE_UTF8_RANGE_H_
3
3
 
4
+ #include <stddef.h>
5
+
4
6
  #ifdef __cplusplus
5
7
  extern "C" {
6
8
  #endif
7
9
 
8
- #if (defined(__ARM_NEON) && defined(__aarch64__)) || defined(__SSE4_1__)
9
- int utf8_range2(const unsigned char* data, int len);
10
- #else
11
- int utf8_naive(const unsigned char* data, int len);
12
- static inline int utf8_range2(const unsigned char* data, int len) {
13
- return utf8_naive(data, len);
14
- }
15
- #endif
10
+ // Returns 1 if the sequence of characters is a valid UTF-8 sequence, otherwise
11
+ // 0.
12
+ int utf8_range_IsValid(const char* data, size_t len);
13
+
14
+ // Returns the length in bytes of the prefix of str that is all
15
+ // structurally valid UTF-8.
16
+ size_t utf8_range_ValidPrefix(const char* data, size_t len);
16
17
 
17
18
  #ifdef __cplusplus
18
19
  } // extern "C"
@@ -0,0 +1,117 @@
1
+ #include <arm_neon.h>
2
+
3
+ /* This code is almost the same as SSE implementation, please reference
4
+ * utf8-range-sse.inc for detailed explanation.
5
+ * The only difference is the range adjustment step. NEON code is more
6
+ * straightforward.
7
+ */
8
+
9
+ static FORCE_INLINE_ATTR inline size_t utf8_range_ValidateUTF8Simd(
10
+ const char* data_original, const char* data, const char* end,
11
+ int return_position) {
12
+ const uint8x16_t first_len_tbl = {
13
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 2, 3,
14
+ };
15
+ const uint8x16_t first_range_tbl = {
16
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 8, 8, 8,
17
+ };
18
+ const uint8x16_t range_min_tbl = {
19
+ 0x00, 0x80, 0x80, 0x80, 0xA0, 0x80, 0x90, 0x80,
20
+ 0xC2, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF,
21
+ };
22
+ const uint8x16_t range_max_tbl = {
23
+ 0x7F, 0xBF, 0xBF, 0xBF, 0xBF, 0x9F, 0xBF, 0x8F,
24
+ 0xF4, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
25
+ };
26
+ /* Range adjustment in NEON uint8x16x2 table. Note that lanes are interleaved
27
+ * in register. The table below is plotted vertically to ease understanding.
28
+ * The 1st column is for E0~EF, 2nd column for F0~FF.
29
+ */
30
+ // clang-format off
31
+ const uint8_t range_adjust_tbl_data[] = {
32
+ /* index -> 0~15 16~31 <- index */
33
+ /* E0 -> */ 2, 3, /* <- F0 */
34
+ 0, 0,
35
+ 0, 0,
36
+ 0, 0,
37
+ 0, 4, /* <- F4 */
38
+ 0, 0,
39
+ 0, 0,
40
+ 0, 0,
41
+ 0, 0,
42
+ 0, 0,
43
+ 0, 0,
44
+ 0, 0,
45
+ 0, 0,
46
+ /* ED -> */ 3, 0,
47
+ 0, 0,
48
+ 0, 0,
49
+ };
50
+ // clang-format on
51
+ const uint8x16x2_t range_adjust_tbl = vld2q_u8(range_adjust_tbl_data);
52
+
53
+ const uint8x16_t const_1 = vdupq_n_u8(1);
54
+ const uint8x16_t const_2 = vdupq_n_u8(2);
55
+ const uint8x16_t const_e0 = vdupq_n_u8(0xE0);
56
+
57
+ uint8x16_t prev_input = vdupq_n_u8(0);
58
+ uint8x16_t prev_first_len = vdupq_n_u8(0);
59
+ uint8x16_t error = vdupq_n_u8(0);
60
+
61
+ while (end - data >= 16) {
62
+ const uint8x16_t input = vld1q_u8((const uint8_t*)data);
63
+
64
+ const uint8x16_t high_nibbles = vshrq_n_u8(input, 4);
65
+
66
+ const uint8x16_t first_len = vqtbl1q_u8(first_len_tbl, high_nibbles);
67
+
68
+ uint8x16_t range = vqtbl1q_u8(first_range_tbl, high_nibbles);
69
+
70
+ range = vorrq_u8(range, vextq_u8(prev_first_len, first_len, 15));
71
+
72
+ uint8x16_t shift2 = vextq_u8(prev_first_len, first_len, 14);
73
+ shift2 = vqsubq_u8(shift2, const_1);
74
+ range = vorrq_u8(range, shift2);
75
+
76
+ uint8x16_t shift3 = vextq_u8(prev_first_len, first_len, 13);
77
+ shift3 = vqsubq_u8(shift3, const_2);
78
+ range = vorrq_u8(range, shift3);
79
+
80
+ uint8x16_t shift1 = vextq_u8(prev_input, input, 15);
81
+ shift1 = vsubq_u8(shift1, const_e0);
82
+ range = vaddq_u8(range, vqtbl2q_u8(range_adjust_tbl, shift1));
83
+
84
+ const uint8x16_t min_range = vqtbl1q_u8(range_min_tbl, range);
85
+ const uint8x16_t max_range = vqtbl1q_u8(range_max_tbl, range);
86
+
87
+ if (return_position) {
88
+ error = vcltq_u8(input, min_range);
89
+ error = vorrq_u8(error, vcgtq_u8(input, max_range));
90
+ if (vmaxvq_u32(vreinterpretq_u32_u8(error))) {
91
+ break;
92
+ }
93
+ } else {
94
+ error = vorrq_u8(error, vcltq_u8(input, min_range));
95
+ error = vorrq_u8(error, vcgtq_u8(input, max_range));
96
+ }
97
+
98
+ prev_input = input;
99
+ prev_first_len = first_len;
100
+
101
+ data += 16;
102
+ }
103
+
104
+ if (return_position && data == data_original) {
105
+ return utf8_range_ValidateUTF8Naive(data, end, return_position);
106
+ }
107
+ const int32_t prev = vgetq_lane_s32(vreinterpretq_s32_u8(prev_input), 3);
108
+ data -= utf8_range_CodepointSkipBackwards(prev);
109
+ if (return_position) {
110
+ return (data - data_original) +
111
+ utf8_range_ValidateUTF8Naive(data, end, return_position);
112
+ }
113
+ if (vmaxvq_u32(vreinterpretq_u32_u8(error))) {
114
+ return 0;
115
+ }
116
+ return utf8_range_ValidateUTF8Naive(data, end, return_position);
117
+ }