google-protobuf 3.22.2 → 4.30.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (69) hide show
  1. checksums.yaml +4 -4
  2. data/ext/google/protobuf_c/Rakefile +3 -0
  3. data/ext/google/protobuf_c/convert.c +60 -86
  4. data/ext/google/protobuf_c/convert.h +3 -28
  5. data/ext/google/protobuf_c/defs.c +692 -72
  6. data/ext/google/protobuf_c/defs.h +3 -28
  7. data/ext/google/protobuf_c/extconf.rb +14 -1
  8. data/ext/google/protobuf_c/glue.c +135 -0
  9. data/ext/google/protobuf_c/map.c +89 -45
  10. data/ext/google/protobuf_c/map.h +12 -30
  11. data/ext/google/protobuf_c/message.c +169 -169
  12. data/ext/google/protobuf_c/message.h +11 -33
  13. data/ext/google/protobuf_c/protobuf.c +65 -188
  14. data/ext/google/protobuf_c/protobuf.h +27 -39
  15. data/ext/google/protobuf_c/repeated_field.c +72 -38
  16. data/ext/google/protobuf_c/repeated_field.h +11 -29
  17. data/ext/google/protobuf_c/ruby-upb.c +15064 -11220
  18. data/ext/google/protobuf_c/ruby-upb.h +10643 -5403
  19. data/ext/google/protobuf_c/shared_convert.c +69 -0
  20. data/ext/google/protobuf_c/shared_convert.h +26 -0
  21. data/ext/google/protobuf_c/shared_message.c +37 -0
  22. data/ext/google/protobuf_c/shared_message.h +21 -0
  23. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range.c +207 -0
  24. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range.h +9 -8
  25. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range_neon.inc +117 -0
  26. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range_sse.inc +272 -0
  27. data/ext/google/protobuf_c/wrap_memcpy.c +3 -26
  28. data/lib/google/protobuf/any_pb.rb +6 -8
  29. data/lib/google/protobuf/api_pb.rb +6 -26
  30. data/lib/google/protobuf/descriptor_pb.rb +21 -252
  31. data/lib/google/protobuf/duration_pb.rb +6 -8
  32. data/lib/google/protobuf/empty_pb.rb +6 -6
  33. data/lib/google/protobuf/ffi/descriptor.rb +175 -0
  34. data/lib/google/protobuf/ffi/descriptor_pool.rb +77 -0
  35. data/lib/google/protobuf/ffi/enum_descriptor.rb +183 -0
  36. data/lib/google/protobuf/ffi/ffi.rb +214 -0
  37. data/lib/google/protobuf/ffi/field_descriptor.rb +340 -0
  38. data/lib/google/protobuf/ffi/file_descriptor.rb +59 -0
  39. data/lib/google/protobuf/ffi/internal/arena.rb +60 -0
  40. data/lib/google/protobuf/ffi/internal/convert.rb +292 -0
  41. data/lib/google/protobuf/ffi/internal/pointer_helper.rb +35 -0
  42. data/lib/google/protobuf/ffi/internal/type_safety.rb +25 -0
  43. data/lib/google/protobuf/ffi/map.rb +433 -0
  44. data/lib/google/protobuf/ffi/message.rb +783 -0
  45. data/lib/google/protobuf/ffi/method_descriptor.rb +124 -0
  46. data/lib/google/protobuf/ffi/object_cache.rb +30 -0
  47. data/lib/google/protobuf/ffi/oneof_descriptor.rb +107 -0
  48. data/lib/google/protobuf/ffi/repeated_field.rb +411 -0
  49. data/lib/google/protobuf/ffi/service_descriptor.rb +117 -0
  50. data/lib/google/protobuf/field_mask_pb.rb +6 -7
  51. data/lib/google/protobuf/internal/object_cache.rb +99 -0
  52. data/lib/google/protobuf/message_exts.rb +3 -26
  53. data/lib/google/protobuf/plugin_pb.rb +6 -31
  54. data/lib/google/protobuf/repeated_field.rb +7 -31
  55. data/lib/google/protobuf/source_context_pb.rb +6 -7
  56. data/lib/google/protobuf/struct_pb.rb +6 -23
  57. data/lib/google/protobuf/timestamp_pb.rb +6 -8
  58. data/lib/google/protobuf/type_pb.rb +6 -71
  59. data/lib/google/protobuf/well_known_types.rb +5 -34
  60. data/lib/google/protobuf/wrappers_pb.rb +6 -31
  61. data/lib/google/protobuf.rb +27 -45
  62. data/lib/google/protobuf_ffi.rb +52 -0
  63. data/lib/google/protobuf_native.rb +19 -0
  64. data/lib/google/tasks/ffi.rake +100 -0
  65. metadata +92 -9
  66. data/ext/google/protobuf_c/third_party/utf8_range/naive.c +0 -92
  67. data/ext/google/protobuf_c/third_party/utf8_range/range2-neon.c +0 -157
  68. data/ext/google/protobuf_c/third_party/utf8_range/range2-sse.c +0 -170
  69. data/lib/google/protobuf/descriptor_dsl.rb +0 -465
@@ -1,32 +1,9 @@
1
1
  // Protocol Buffers - Google's data interchange format
2
2
  // Copyright 2014 Google Inc. All rights reserved.
3
- // https://developers.google.com/protocol-buffers/
4
3
  //
5
- // Redistribution and use in source and binary forms, with or without
6
- // modification, are permitted provided that the following conditions are
7
- // met:
8
- //
9
- // * Redistributions of source code must retain the above copyright
10
- // notice, this list of conditions and the following disclaimer.
11
- // * Redistributions in binary form must reproduce the above
12
- // copyright notice, this list of conditions and the following disclaimer
13
- // in the documentation and/or other materials provided with the
14
- // distribution.
15
- // * Neither the name of Google Inc. nor the names of its
16
- // contributors may be used to endorse or promote products derived from
17
- // this software without specific prior written permission.
18
- //
19
- // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20
- // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21
- // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22
- // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
23
- // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24
- // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
25
- // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26
- // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27
- // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28
- // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29
- // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
4
+ // Use of this source code is governed by a BSD-style
5
+ // license that can be found in the LICENSE file or at
6
+ // https://developers.google.com/open-source/licenses/bsd
30
7
 
31
8
  #include "message.h"
32
9
 
@@ -35,6 +12,7 @@
35
12
  #include "map.h"
36
13
  #include "protobuf.h"
37
14
  #include "repeated_field.h"
15
+ #include "shared_message.h"
38
16
 
39
17
  static VALUE cParseError = Qnil;
40
18
  static VALUE cAbstractMessage = Qnil;
@@ -53,6 +31,8 @@ VALUE MessageOrEnum_GetDescriptor(VALUE klass) {
53
31
  // -----------------------------------------------------------------------------
54
32
 
55
33
  typedef struct {
34
+ // IMPORTANT: WB_PROTECTED objects must only use the RB_OBJ_WRITE()
35
+ // macro to update VALUE references, as to trigger write barriers.
56
36
  VALUE arena;
57
37
  const upb_Message* msg; // Can get as mutable when non-frozen.
58
38
  const upb_MessageDef*
@@ -64,10 +44,12 @@ static void Message_mark(void* _self) {
64
44
  rb_gc_mark(self->arena);
65
45
  }
66
46
 
47
+ static size_t Message_memsize(const void* _self) { return sizeof(Message); }
48
+
67
49
  static rb_data_type_t Message_type = {
68
- "Message",
69
- {Message_mark, RUBY_DEFAULT_FREE, NULL},
70
- .flags = RUBY_TYPED_FREE_IMMEDIATELY,
50
+ "Google::Protobuf::Message",
51
+ {Message_mark, RUBY_DEFAULT_FREE, Message_memsize},
52
+ .flags = RUBY_TYPED_FREE_IMMEDIATELY | RUBY_TYPED_WB_PROTECTED,
71
53
  };
72
54
 
73
55
  static Message* ruby_to_Message(VALUE msg_rb) {
@@ -98,15 +80,19 @@ const upb_Message* Message_Get(VALUE msg_rb, const upb_MessageDef** m) {
98
80
  }
99
81
 
100
82
  upb_Message* Message_GetMutable(VALUE msg_rb, const upb_MessageDef** m) {
101
- rb_check_frozen(msg_rb);
102
- return (upb_Message*)Message_Get(msg_rb, m);
83
+ const upb_Message* upb_msg = Message_Get(msg_rb, m);
84
+ Protobuf_CheckNotFrozen(msg_rb, upb_Message_IsFrozen(upb_msg));
85
+ return (upb_Message*)upb_msg;
103
86
  }
104
87
 
105
- void Message_InitPtr(VALUE self_, upb_Message* msg, VALUE arena) {
88
+ void Message_InitPtr(VALUE self_, const upb_Message* msg, VALUE arena) {
89
+ PBRUBY_ASSERT(arena != Qnil);
106
90
  Message* self = ruby_to_Message(self_);
107
91
  self->msg = msg;
108
- self->arena = arena;
109
- ObjectCache_Add(msg, self_);
92
+ RB_OBJ_WRITE(self_, &self->arena, arena);
93
+ VALUE stored = ObjectCache_TryAdd(msg, self_);
94
+ (void)stored;
95
+ PBRUBY_ASSERT(stored == self_);
110
96
  }
111
97
 
112
98
  VALUE Message_GetArena(VALUE msg_rb) {
@@ -121,7 +107,7 @@ void Message_CheckClass(VALUE klass) {
121
107
  }
122
108
  }
123
109
 
124
- VALUE Message_GetRubyWrapper(upb_Message* msg, const upb_MessageDef* m,
110
+ VALUE Message_GetRubyWrapper(const upb_Message* msg, const upb_MessageDef* m,
125
111
  VALUE arena) {
126
112
  if (msg == NULL) return Qnil;
127
113
 
@@ -132,7 +118,6 @@ VALUE Message_GetRubyWrapper(upb_Message* msg, const upb_MessageDef* m,
132
118
  val = Message_alloc(klass);
133
119
  Message_InitPtr(val, msg, arena);
134
120
  }
135
-
136
121
  return val;
137
122
  }
138
123
 
@@ -264,7 +249,7 @@ static int extract_method_call(VALUE method_name, Message* self,
264
249
  static VALUE Message_oneof_accessor(VALUE _self, const upb_OneofDef* o,
265
250
  int accessor_type) {
266
251
  Message* self = ruby_to_Message(_self);
267
- const upb_FieldDef* oneof_field = upb_Message_WhichOneof(self->msg, o);
252
+ const upb_FieldDef* oneof_field = upb_Message_WhichOneofByDef(self->msg, o);
268
253
 
269
254
  switch (accessor_type) {
270
255
  case METHOD_PRESENCE:
@@ -304,13 +289,42 @@ static void Message_setfield(upb_Message* msg, const upb_FieldDef* f, VALUE val,
304
289
  upb_Message_SetFieldByDef(msg, f, msgval, arena);
305
290
  }
306
291
 
292
+ VALUE Message_getfield_frozen(const upb_Message* msg, const upb_FieldDef* f,
293
+ VALUE arena) {
294
+ upb_MessageValue msgval = upb_Message_GetFieldByDef(msg, f);
295
+ if (upb_FieldDef_IsMap(f)) {
296
+ if (msgval.map_val == NULL) {
297
+ return Map_EmptyFrozen(f);
298
+ }
299
+ const upb_FieldDef* key_f = map_field_key(f);
300
+ const upb_FieldDef* val_f = map_field_value(f);
301
+ upb_CType key_type = upb_FieldDef_CType(key_f);
302
+ TypeInfo value_type_info = TypeInfo_get(val_f);
303
+ return Map_GetRubyWrapper(msgval.map_val, key_type, value_type_info, arena);
304
+ }
305
+ if (upb_FieldDef_IsRepeated(f)) {
306
+ if (msgval.array_val == NULL) {
307
+ return RepeatedField_EmptyFrozen(f);
308
+ }
309
+ return RepeatedField_GetRubyWrapper(msgval.array_val, TypeInfo_get(f),
310
+ arena);
311
+ }
312
+ VALUE ret;
313
+ if (upb_FieldDef_IsSubMessage(f)) {
314
+ const upb_MessageDef* m = upb_FieldDef_MessageSubDef(f);
315
+ ret = Message_GetRubyWrapper(msgval.msg_val, m, arena);
316
+ } else {
317
+ ret = Convert_UpbToRuby(msgval, TypeInfo_get(f), Qnil);
318
+ }
319
+ return ret;
320
+ }
321
+
307
322
  VALUE Message_getfield(VALUE _self, const upb_FieldDef* f) {
308
323
  Message* self = ruby_to_Message(_self);
309
- // This is a special-case: upb_Message_Mutable() for map & array are logically
310
- // const (they will not change what is serialized) but physically
311
- // non-const, as they do allocate a repeated field or map. The logical
312
- // constness means it's ok to do even if the message is frozen.
313
- upb_Message* msg = (upb_Message*)self->msg;
324
+ if (upb_Message_IsFrozen(self->msg)) {
325
+ return Message_getfield_frozen(self->msg, f, self->arena);
326
+ }
327
+ upb_Message* msg = Message_GetMutable(_self, NULL);
314
328
  upb_Arena* arena = Arena_get(self->arena);
315
329
  if (upb_FieldDef_IsMap(f)) {
316
330
  upb_Map* map = upb_Message_Mutable(msg, f, arena).map;
@@ -323,12 +337,12 @@ VALUE Message_getfield(VALUE _self, const upb_FieldDef* f) {
323
337
  upb_Array* arr = upb_Message_Mutable(msg, f, arena).array;
324
338
  return RepeatedField_GetRubyWrapper(arr, TypeInfo_get(f), self->arena);
325
339
  } else if (upb_FieldDef_IsSubMessage(f)) {
326
- if (!upb_Message_HasFieldByDef(self->msg, f)) return Qnil;
340
+ if (!upb_Message_HasFieldByDef(msg, f)) return Qnil;
327
341
  upb_Message* submsg = upb_Message_Mutable(msg, f, arena).msg;
328
342
  const upb_MessageDef* m = upb_FieldDef_MessageSubDef(f);
329
343
  return Message_GetRubyWrapper(submsg, m, self->arena);
330
344
  } else {
331
- upb_MessageValue msgval = upb_Message_GetFieldByDef(self->msg, f);
345
+ upb_MessageValue msgval = upb_Message_GetFieldByDef(msg, f);
332
346
  return Convert_UpbToRuby(msgval, TypeInfo_get(f), self->arena);
333
347
  }
334
348
  }
@@ -348,7 +362,8 @@ static VALUE Message_field_accessor(VALUE _self, const upb_FieldDef* f,
348
362
  if (!upb_FieldDef_HasPresence(f)) {
349
363
  rb_raise(rb_eRuntimeError, "Field does not have presence.");
350
364
  }
351
- return upb_Message_HasFieldByDef(Message_Get(_self, NULL), f);
365
+ return upb_Message_HasFieldByDef(Message_Get(_self, NULL), f) ? Qtrue
366
+ : Qfalse;
352
367
  case METHOD_WRAPPER_GETTER: {
353
368
  Message* self = ruby_to_Message(_self);
354
369
  if (upb_Message_HasFieldByDef(self->msg, f)) {
@@ -452,7 +467,6 @@ static VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
452
467
  if (argc != 2) {
453
468
  rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
454
469
  }
455
- rb_check_frozen(_self);
456
470
  break;
457
471
  default:
458
472
  if (argc != 1) {
@@ -506,7 +520,8 @@ static int Map_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
506
520
  k = Convert_RubyToUpb(key, "", map_init->key_type, NULL);
507
521
 
508
522
  if (map_init->val_type.type == kUpb_CType_Message && TYPE(val) == T_HASH) {
509
- upb_MiniTable* t = upb_MessageDef_MiniTable(map_init->val_type.def.msgdef);
523
+ const upb_MiniTable* t =
524
+ upb_MessageDef_MiniTable(map_init->val_type.def.msgdef);
510
525
  upb_Message* msg = upb_Message_New(t, map_init->arena);
511
526
  Message_InitFromValue(msg, map_init->val_type.def.msgdef, val,
512
527
  map_init->arena);
@@ -537,7 +552,7 @@ static upb_MessageValue MessageValue_FromValue(VALUE val, TypeInfo info,
537
552
  upb_Arena* arena) {
538
553
  if (info.type == kUpb_CType_Message) {
539
554
  upb_MessageValue msgval;
540
- upb_MiniTable* t = upb_MessageDef_MiniTable(info.def.msgdef);
555
+ const upb_MiniTable* t = upb_MessageDef_MiniTable(info.def.msgdef);
541
556
  upb_Message* msg = upb_Message_New(t, arena);
542
557
  Message_InitFromValue(msg, info.def.msgdef, val, arena);
543
558
  msgval.msg_val = msg;
@@ -653,7 +668,7 @@ static VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
653
668
  Message* self = ruby_to_Message(_self);
654
669
  VALUE arena_rb = Arena_new();
655
670
  upb_Arena* arena = Arena_get(arena_rb);
656
- upb_MiniTable* t = upb_MessageDef_MiniTable(self->msgdef);
671
+ const upb_MiniTable* t = upb_MessageDef_MiniTable(self->msgdef);
657
672
  upb_Message* msg = upb_Message_New(t, arena);
658
673
 
659
674
  Message_InitPtr(_self, msg, arena_rb);
@@ -678,44 +693,12 @@ static VALUE Message_dup(VALUE _self) {
678
693
  Message* self = ruby_to_Message(_self);
679
694
  VALUE new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
680
695
  Message* new_msg_self = ruby_to_Message(new_msg);
681
- size_t size = upb_MessageDef_MiniTable(self->msgdef)->size;
682
-
683
- // TODO(copy unknown fields?)
684
- // TODO(use official upb msg copy function)
685
- memcpy((upb_Message*)new_msg_self->msg, self->msg, size);
696
+ const upb_MiniTable* m = upb_MessageDef_MiniTable(self->msgdef);
697
+ upb_Message_ShallowCopy((upb_Message*)new_msg_self->msg, self->msg, m);
686
698
  Arena_fuse(self->arena, Arena_get(new_msg_self->arena));
687
699
  return new_msg;
688
700
  }
689
701
 
690
- // Support function for Message_eq, and also used by other #eq functions.
691
- bool Message_Equal(const upb_Message* m1, const upb_Message* m2,
692
- const upb_MessageDef* m) {
693
- if (m1 == m2) return true;
694
-
695
- size_t size1, size2;
696
- int encode_opts =
697
- kUpb_EncodeOption_SkipUnknown | kUpb_EncodeOption_Deterministic;
698
- upb_Arena* arena_tmp = upb_Arena_New();
699
- const upb_MiniTable* layout = upb_MessageDef_MiniTable(m);
700
-
701
- // Compare deterministically serialized payloads with no unknown fields.
702
- char* data1;
703
- char* data2;
704
- upb_EncodeStatus status1 =
705
- upb_Encode(m1, layout, encode_opts, arena_tmp, &data1, &size1);
706
- upb_EncodeStatus status2 =
707
- upb_Encode(m2, layout, encode_opts, arena_tmp, &data2, &size2);
708
-
709
- if (status1 == kUpb_EncodeStatus_Ok && status2 == kUpb_EncodeStatus_Ok) {
710
- bool ret = (size1 == size2) && (memcmp(data1, data2, size1) == 0);
711
- upb_Arena_Free(arena_tmp);
712
- return ret;
713
- } else {
714
- upb_Arena_Free(arena_tmp);
715
- rb_raise(cParseError, "Error comparing messages");
716
- }
717
- }
718
-
719
702
  /*
720
703
  * call-seq:
721
704
  * Message.==(other) => boolean
@@ -732,28 +715,22 @@ static VALUE Message_eq(VALUE _self, VALUE _other) {
732
715
  Message* other = ruby_to_Message(_other);
733
716
  assert(self->msgdef == other->msgdef);
734
717
 
735
- return Message_Equal(self->msg, other->msg, self->msgdef) ? Qtrue : Qfalse;
718
+ const upb_MiniTable* m = upb_MessageDef_MiniTable(self->msgdef);
719
+ const int options = 0;
720
+ return upb_Message_IsEqual(self->msg, other->msg, m, options) ? Qtrue
721
+ : Qfalse;
736
722
  }
737
723
 
738
724
  uint64_t Message_Hash(const upb_Message* msg, const upb_MessageDef* m,
739
725
  uint64_t seed) {
740
- upb_Arena* arena = upb_Arena_New();
741
- char* data;
742
- size_t size;
743
-
744
- // Hash a deterministically serialized payloads with no unknown fields.
745
- upb_EncodeStatus status = upb_Encode(
746
- msg, upb_MessageDef_MiniTable(m),
747
- kUpb_EncodeOption_SkipUnknown | kUpb_EncodeOption_Deterministic, arena,
748
- &data, &size);
749
-
750
- if (status == kUpb_EncodeStatus_Ok) {
751
- uint64_t ret = _upb_Hash(data, size, seed);
752
- upb_Arena_Free(arena);
753
- return ret;
726
+ upb_Status status;
727
+ upb_Status_Clear(&status);
728
+ uint64_t return_value = shared_Message_Hash(msg, m, seed, &status);
729
+ if (upb_Status_IsOk(&status)) {
730
+ return return_value;
754
731
  } else {
755
- upb_Arena_Free(arena);
756
- rb_raise(cParseError, "Error calculating hash");
732
+ rb_raise(cParseError, "Message_Hash(): %s",
733
+ upb_Status_ErrorMessage(&status));
757
734
  }
758
735
  }
759
736
 
@@ -810,58 +787,34 @@ static VALUE Message_CreateHash(const upb_Message* msg,
810
787
  if (!msg) return Qnil;
811
788
 
812
789
  VALUE hash = rb_hash_new();
813
- int n = upb_MessageDef_FieldCount(m);
814
- bool is_proto2;
815
-
816
- // We currently have a few behaviors that are specific to proto2.
817
- // This is unfortunate, we should key behaviors off field attributes (like
818
- // whether a field has presence), not proto2 vs. proto3. We should see if we
819
- // can change this without breaking users.
820
- is_proto2 = upb_MessageDef_Syntax(m) == kUpb_Syntax_Proto2;
821
-
822
- for (int i = 0; i < n; i++) {
823
- const upb_FieldDef* field = upb_MessageDef_Field(m, i);
824
- TypeInfo type_info = TypeInfo_get(field);
825
- upb_MessageValue msgval;
826
- VALUE msg_value;
827
- VALUE msg_key;
828
-
829
- if (!is_proto2 && upb_FieldDef_IsSubMessage(field) &&
830
- !upb_FieldDef_IsRepeated(field) &&
831
- !upb_Message_HasFieldByDef(msg, field)) {
832
- // TODO: Legacy behavior, remove when we fix the is_proto2 differences.
833
- msg_key = ID2SYM(rb_intern(upb_FieldDef_Name(field)));
834
- rb_hash_aset(hash, msg_key, Qnil);
835
- continue;
836
- }
790
+ size_t iter = kUpb_Message_Begin;
791
+ const upb_DefPool* pool = upb_FileDef_Pool(upb_MessageDef_File(m));
792
+ const upb_FieldDef* field;
793
+ upb_MessageValue val;
837
794
 
838
- // Do not include fields that are not present (oneof or optional fields).
839
- if (is_proto2 && upb_FieldDef_HasPresence(field) &&
840
- !upb_Message_HasFieldByDef(msg, field)) {
795
+ while (upb_Message_Next(msg, m, pool, &field, &val, &iter)) {
796
+ if (upb_FieldDef_IsExtension(field)) {
797
+ // TODO: allow extensions once we have decided what naming scheme the
798
+ // symbol should use. eg. :"[pkg.ext]"
841
799
  continue;
842
800
  }
843
801
 
844
- msg_key = ID2SYM(rb_intern(upb_FieldDef_Name(field)));
845
- msgval = upb_Message_GetFieldByDef(msg, field);
846
-
847
- // Proto2 omits empty map/repeated filds also.
802
+ TypeInfo type_info = TypeInfo_get(field);
803
+ VALUE msg_value;
848
804
 
849
805
  if (upb_FieldDef_IsMap(field)) {
850
806
  const upb_MessageDef* entry_m = upb_FieldDef_MessageSubDef(field);
851
807
  const upb_FieldDef* key_f = upb_MessageDef_FindFieldByNumber(entry_m, 1);
852
808
  const upb_FieldDef* val_f = upb_MessageDef_FindFieldByNumber(entry_m, 2);
853
809
  upb_CType key_type = upb_FieldDef_CType(key_f);
854
- msg_value = Map_CreateHash(msgval.map_val, key_type, TypeInfo_get(val_f));
810
+ msg_value = Map_CreateHash(val.map_val, key_type, TypeInfo_get(val_f));
855
811
  } else if (upb_FieldDef_IsRepeated(field)) {
856
- if (is_proto2 &&
857
- (!msgval.array_val || upb_Array_Size(msgval.array_val) == 0)) {
858
- continue;
859
- }
860
- msg_value = RepeatedField_CreateArray(msgval.array_val, type_info);
812
+ msg_value = RepeatedField_CreateArray(val.array_val, type_info);
861
813
  } else {
862
- msg_value = Scalar_CreateHash(msgval, type_info);
814
+ msg_value = Scalar_CreateHash(val, type_info);
863
815
  }
864
816
 
817
+ VALUE msg_key = ID2SYM(rb_intern(upb_FieldDef_Name(field)));
865
818
  rb_hash_aset(hash, msg_key, msg_value);
866
819
  }
867
820
 
@@ -887,19 +840,44 @@ static VALUE Message_to_h(VALUE _self) {
887
840
  return Message_CreateHash(self->msg, self->msgdef);
888
841
  }
889
842
 
843
+ /*
844
+ * call-seq:
845
+ * Message.frozen? => bool
846
+ *
847
+ * Returns true if the message is frozen in either Ruby or the underlying
848
+ * representation. Freezes the Ruby message object if it is not already frozen
849
+ * in Ruby but it is frozen in the underlying representation.
850
+ */
851
+ VALUE Message_frozen(VALUE _self) {
852
+ Message* self = ruby_to_Message(_self);
853
+ if (!upb_Message_IsFrozen(self->msg)) {
854
+ PBRUBY_ASSERT(!RB_OBJ_FROZEN(_self));
855
+ return Qfalse;
856
+ }
857
+
858
+ // Lazily freeze the Ruby wrapper.
859
+ if (!RB_OBJ_FROZEN(_self)) RB_OBJ_FREEZE(_self);
860
+ return Qtrue;
861
+ }
862
+
890
863
  /*
891
864
  * call-seq:
892
865
  * Message.freeze => self
893
866
  *
894
- * Freezes the message object. We have to intercept this so we can pin the
895
- * Ruby object into memory so we don't forget it's frozen.
867
+ * Freezes the message object. We have to intercept this so we can freeze the
868
+ * underlying representation, not just the Ruby wrapper.
896
869
  */
897
- static VALUE Message_freeze(VALUE _self) {
870
+ VALUE Message_freeze(VALUE _self) {
898
871
  Message* self = ruby_to_Message(_self);
899
- if (!RB_OBJ_FROZEN(_self)) {
900
- Arena_Pin(self->arena, _self);
901
- RB_OBJ_FREEZE(_self);
872
+ if (RB_OBJ_FROZEN(_self)) {
873
+ PBRUBY_ASSERT(upb_Message_IsFrozen(self->msg));
874
+ return _self;
875
+ }
876
+ if (!upb_Message_IsFrozen(self->msg)) {
877
+ upb_Message_Freeze(Message_GetMutable(_self, NULL),
878
+ upb_MessageDef_MiniTable(self->msgdef));
902
879
  }
880
+ RB_OBJ_FREEZE(_self);
903
881
  return _self;
904
882
  }
905
883
 
@@ -955,7 +933,7 @@ static VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
955
933
  * MessageClass.decode(data, options) => message
956
934
  *
957
935
  * Decodes the given data (as a string containing bytes in protocol buffers wire
958
- * format) under the interpretration given by this message class's definition
936
+ * format) under the interpretation given by this message class's definition
959
937
  * and returns a message object with the corresponding field values.
960
938
  * @param options [Hash] options for the decoder
961
939
  * recursion_limit: set to maximum decoding depth for message (default is 64)
@@ -978,7 +956,7 @@ static VALUE Message_decode(int argc, VALUE* argv, VALUE klass) {
978
956
  rb_hash_lookup(hash_args, ID2SYM(rb_intern("recursion_limit")));
979
957
 
980
958
  if (depth != Qnil && TYPE(depth) == T_FIXNUM) {
981
- options |= UPB_DECODE_MAXDEPTH(FIX2INT(depth));
959
+ options |= upb_DecodeOptions_MaxDepth(FIX2INT(depth));
982
960
  }
983
961
  }
984
962
 
@@ -986,18 +964,27 @@ static VALUE Message_decode(int argc, VALUE* argv, VALUE klass) {
986
964
  rb_raise(rb_eArgError, "Expected string for binary protobuf data.");
987
965
  }
988
966
 
967
+ return Message_decode_bytes(RSTRING_LEN(data), RSTRING_PTR(data), options,
968
+ klass, /*freeze*/ false);
969
+ }
970
+
971
+ VALUE Message_decode_bytes(int size, const char* bytes, int options,
972
+ VALUE klass, bool freeze) {
989
973
  VALUE msg_rb = initialize_rb_class_with_no_args(klass);
990
974
  Message* msg = ruby_to_Message(msg_rb);
991
975
 
992
- upb_DecodeStatus status =
993
- upb_Decode(RSTRING_PTR(data), RSTRING_LEN(data), (upb_Message*)msg->msg,
994
- upb_MessageDef_MiniTable(msg->msgdef), NULL, options,
995
- Arena_get(msg->arena));
996
-
976
+ const upb_FileDef* file = upb_MessageDef_File(msg->msgdef);
977
+ const upb_ExtensionRegistry* extreg =
978
+ upb_DefPool_ExtensionRegistry(upb_FileDef_Pool(file));
979
+ upb_DecodeStatus status = upb_Decode(bytes, size, (upb_Message*)msg->msg,
980
+ upb_MessageDef_MiniTable(msg->msgdef),
981
+ extreg, options, Arena_get(msg->arena));
997
982
  if (status != kUpb_DecodeStatus_Ok) {
998
983
  rb_raise(cParseError, "Error occurred during parsing");
999
984
  }
1000
-
985
+ if (freeze) {
986
+ Message_freeze(msg_rb);
987
+ }
1001
988
  return msg_rb;
1002
989
  }
1003
990
 
@@ -1018,9 +1005,6 @@ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
1018
1005
  int options = 0;
1019
1006
  upb_Status status;
1020
1007
 
1021
- // TODO(haberman): use this message's pool instead.
1022
- const upb_DefPool* symtab = DescriptorPool_GetSymtab(generated_pool);
1023
-
1024
1008
  if (argc < 1 || argc > 2) {
1025
1009
  rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1026
1010
  }
@@ -1041,7 +1025,7 @@ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
1041
1025
  rb_raise(rb_eArgError, "Expected string for JSON data.");
1042
1026
  }
1043
1027
 
1044
- // TODO(cfallin): Check and respect string encoding. If not UTF-8, we need to
1028
+ // TODO: Check and respect string encoding. If not UTF-8, we need to
1045
1029
  // convert, because string handlers pass data directly to message string
1046
1030
  // fields.
1047
1031
 
@@ -1054,11 +1038,19 @@ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
1054
1038
  }
1055
1039
 
1056
1040
  upb_Status_Clear(&status);
1057
- if (!upb_JsonDecode(RSTRING_PTR(data), RSTRING_LEN(data),
1058
- (upb_Message*)msg->msg, msg->msgdef, symtab, options,
1059
- Arena_get(msg->arena), &status)) {
1060
- rb_raise(cParseError, "Error occurred during parsing: %s",
1061
- upb_Status_ErrorMessage(&status));
1041
+ const upb_DefPool* pool = upb_FileDef_Pool(upb_MessageDef_File(msg->msgdef));
1042
+
1043
+ int result = upb_JsonDecodeDetectingNonconformance(
1044
+ RSTRING_PTR(data), RSTRING_LEN(data), (upb_Message*)msg->msg,
1045
+ msg->msgdef, pool, options, Arena_get(msg->arena), &status);
1046
+
1047
+ switch (result) {
1048
+ case kUpb_JsonDecodeResult_Ok:
1049
+ break;
1050
+ case kUpb_JsonDecodeResult_Error:
1051
+ rb_raise(cParseError, "Error occurred during parsing: %s",
1052
+ upb_Status_ErrorMessage(&status));
1053
+ break;
1062
1054
  }
1063
1055
 
1064
1056
  return msg_rb;
@@ -1096,7 +1088,7 @@ static VALUE Message_encode(int argc, VALUE* argv, VALUE klass) {
1096
1088
  rb_hash_lookup(hash_args, ID2SYM(rb_intern("recursion_limit")));
1097
1089
 
1098
1090
  if (depth != Qnil && TYPE(depth) == T_FIXNUM) {
1099
- options |= UPB_DECODE_MAXDEPTH(FIX2INT(depth));
1091
+ options |= upb_DecodeOptions_MaxDepth(FIX2INT(depth));
1100
1092
  }
1101
1093
  }
1102
1094
 
@@ -1134,9 +1126,6 @@ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1134
1126
  size_t size;
1135
1127
  upb_Status status;
1136
1128
 
1137
- // TODO(haberman): use this message's pool instead.
1138
- const upb_DefPool* symtab = DescriptorPool_GetSymtab(generated_pool);
1139
-
1140
1129
  if (argc < 1 || argc > 2) {
1141
1130
  rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1142
1131
  }
@@ -1162,11 +1151,18 @@ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1162
1151
  Qfalse))) {
1163
1152
  options |= upb_JsonEncode_EmitDefaults;
1164
1153
  }
1154
+
1155
+ if (RTEST(rb_hash_lookup2(hash_args,
1156
+ ID2SYM(rb_intern("format_enums_as_integers")),
1157
+ Qfalse))) {
1158
+ options |= upb_JsonEncode_FormatEnumsAsIntegers;
1159
+ }
1165
1160
  }
1166
1161
 
1167
1162
  upb_Status_Clear(&status);
1168
- size = upb_JsonEncode(msg->msg, msg->msgdef, symtab, options, buf,
1169
- sizeof(buf), &status);
1163
+ const upb_DefPool* pool = upb_FileDef_Pool(upb_MessageDef_File(msg->msgdef));
1164
+ size = upb_JsonEncode(msg->msg, msg->msgdef, pool, options, buf, sizeof(buf),
1165
+ &status);
1170
1166
 
1171
1167
  if (!upb_Status_IsOk(&status)) {
1172
1168
  rb_raise(cParseError, "Error occurred during encoding: %s",
@@ -1176,7 +1172,7 @@ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1176
1172
  VALUE ret;
1177
1173
  if (size >= sizeof(buf)) {
1178
1174
  char* buf2 = malloc(size + 1);
1179
- upb_JsonEncode(msg->msg, msg->msgdef, symtab, options, buf2, size + 1,
1175
+ upb_JsonEncode(msg->msg, msg->msgdef, pool, options, buf2, size + 1,
1180
1176
  &status);
1181
1177
  ret = rb_str_new(buf2, size);
1182
1178
  free(buf2);
@@ -1309,9 +1305,12 @@ upb_Message* Message_deep_copy(const upb_Message* msg, const upb_MessageDef* m,
1309
1305
  upb_Message* new_msg = upb_Message_New(layout, arena);
1310
1306
  char* data;
1311
1307
 
1308
+ const upb_FileDef* file = upb_MessageDef_File(m);
1309
+ const upb_ExtensionRegistry* extreg =
1310
+ upb_DefPool_ExtensionRegistry(upb_FileDef_Pool(file));
1312
1311
  if (upb_Encode(msg, layout, 0, tmp_arena, &data, &size) !=
1313
1312
  kUpb_EncodeStatus_Ok ||
1314
- upb_Decode(data, size, new_msg, layout, NULL, 0, arena) !=
1313
+ upb_Decode(data, size, new_msg, layout, extreg, 0, arena) !=
1315
1314
  kUpb_DecodeStatus_Ok) {
1316
1315
  upb_Arena_Free(tmp_arena);
1317
1316
  rb_raise(cParseError, "Error occurred copying proto");
@@ -1399,6 +1398,7 @@ static void Message_define_class(VALUE klass) {
1399
1398
  rb_define_method(klass, "==", Message_eq, 1);
1400
1399
  rb_define_method(klass, "eql?", Message_eq, 1);
1401
1400
  rb_define_method(klass, "freeze", Message_freeze, 0);
1401
+ rb_define_method(klass, "frozen?", Message_frozen, 0);
1402
1402
  rb_define_method(klass, "hash", Message_hash, 0);
1403
1403
  rb_define_method(klass, "to_h", Message_to_h, 0);
1404
1404
  rb_define_method(klass, "inspect", Message_inspect, 0);
@@ -1,38 +1,13 @@
1
1
  // Protocol Buffers - Google's data interchange format
2
2
  // Copyright 2008 Google Inc. All rights reserved.
3
- // https://developers.google.com/protocol-buffers/
4
3
  //
5
- // Redistribution and use in source and binary forms, with or without
6
- // modification, are permitted provided that the following conditions are
7
- // met:
8
- //
9
- // * Redistributions of source code must retain the above copyright
10
- // notice, this list of conditions and the following disclaimer.
11
- // * Redistributions in binary form must reproduce the above
12
- // copyright notice, this list of conditions and the following disclaimer
13
- // in the documentation and/or other materials provided with the
14
- // distribution.
15
- // * Neither the name of Google Inc. nor the names of its
16
- // contributors may be used to endorse or promote products derived from
17
- // this software without specific prior written permission.
18
- //
19
- // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20
- // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21
- // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22
- // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
23
- // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24
- // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
25
- // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26
- // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27
- // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28
- // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29
- // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
4
+ // Use of this source code is governed by a BSD-style
5
+ // license that can be found in the LICENSE file or at
6
+ // https://developers.google.com/open-source/licenses/bsd
30
7
 
31
8
  #ifndef RUBY_PROTOBUF_MESSAGE_H_
32
9
  #define RUBY_PROTOBUF_MESSAGE_H_
33
10
 
34
- #include <ruby/ruby.h>
35
-
36
11
  #include "protobuf.h"
37
12
  #include "ruby-upb.h"
38
13
 
@@ -61,7 +36,7 @@ const upb_Message* Message_GetUpbMessage(VALUE value, const upb_MessageDef* m,
61
36
 
62
37
  // Gets or constructs a Ruby wrapper object for the given message. The wrapper
63
38
  // object will reference |arena| and ensure that it outlives this object.
64
- VALUE Message_GetRubyWrapper(upb_Message* msg, const upb_MessageDef* m,
39
+ VALUE Message_GetRubyWrapper(const upb_Message* msg, const upb_MessageDef* m,
65
40
  VALUE arena);
66
41
 
67
42
  // Gets the given field from this message.
@@ -79,10 +54,6 @@ uint64_t Message_Hash(const upb_Message* msg, const upb_MessageDef* m,
79
54
  upb_Message* Message_deep_copy(const upb_Message* msg, const upb_MessageDef* m,
80
55
  upb_Arena* arena);
81
56
 
82
- // Returns true if these two messages are equal.
83
- bool Message_Equal(const upb_Message* m1, const upb_Message* m2,
84
- const upb_MessageDef* m);
85
-
86
57
  // Checks that this Ruby object is a message, and raises an exception if not.
87
58
  void Message_CheckClass(VALUE klass);
88
59
 
@@ -98,6 +69,13 @@ VALUE build_module_from_enumdesc(VALUE _enumdesc);
98
69
  // module.
99
70
  VALUE MessageOrEnum_GetDescriptor(VALUE klass);
100
71
 
72
+ // Decodes a Message from a byte sequence.
73
+ VALUE Message_decode_bytes(int size, const char* bytes, int options,
74
+ VALUE klass, bool freeze);
75
+
76
+ // Recursively freeze message
77
+ VALUE Message_freeze(VALUE _self);
78
+
101
79
  // Call at startup to register all types in this module.
102
80
  void Message_register(VALUE protobuf);
103
81