google-protobuf 3.25.6 → 4.30.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (61) hide show
  1. checksums.yaml +4 -4
  2. data/ext/google/protobuf_c/convert.c +33 -15
  3. data/ext/google/protobuf_c/defs.c +526 -29
  4. data/ext/google/protobuf_c/extconf.rb +13 -1
  5. data/ext/google/protobuf_c/glue.c +79 -0
  6. data/ext/google/protobuf_c/map.c +72 -27
  7. data/ext/google/protobuf_c/map.h +7 -3
  8. data/ext/google/protobuf_c/message.c +113 -116
  9. data/ext/google/protobuf_c/message.h +2 -6
  10. data/ext/google/protobuf_c/protobuf.c +32 -18
  11. data/ext/google/protobuf_c/protobuf.h +3 -7
  12. data/ext/google/protobuf_c/repeated_field.c +58 -23
  13. data/ext/google/protobuf_c/repeated_field.h +6 -2
  14. data/ext/google/protobuf_c/ruby-upb.c +14926 -11596
  15. data/ext/google/protobuf_c/ruby-upb.h +8701 -5832
  16. data/ext/google/protobuf_c/shared_convert.c +7 -2
  17. data/ext/google/protobuf_c/shared_message.c +3 -32
  18. data/ext/google/protobuf_c/shared_message.h +0 -4
  19. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range.c +207 -0
  20. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range.h +9 -8
  21. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range_neon.inc +117 -0
  22. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range_sse.inc +272 -0
  23. data/lib/google/protobuf/any_pb.rb +1 -22
  24. data/lib/google/protobuf/api_pb.rb +1 -24
  25. data/lib/google/protobuf/descriptor_pb.rb +4 -23
  26. data/lib/google/protobuf/duration_pb.rb +1 -22
  27. data/lib/google/protobuf/empty_pb.rb +1 -22
  28. data/lib/google/protobuf/ffi/descriptor.rb +14 -4
  29. data/lib/google/protobuf/ffi/descriptor_pool.rb +3 -1
  30. data/lib/google/protobuf/ffi/enum_descriptor.rb +13 -1
  31. data/lib/google/protobuf/ffi/ffi.rb +7 -6
  32. data/lib/google/protobuf/ffi/field_descriptor.rb +23 -2
  33. data/lib/google/protobuf/ffi/file_descriptor.rb +13 -13
  34. data/lib/google/protobuf/ffi/internal/arena.rb +0 -6
  35. data/lib/google/protobuf/ffi/internal/convert.rb +17 -30
  36. data/lib/google/protobuf/ffi/map.rb +50 -24
  37. data/lib/google/protobuf/ffi/message.rb +188 -67
  38. data/lib/google/protobuf/ffi/method_descriptor.rb +124 -0
  39. data/lib/google/protobuf/ffi/object_cache.rb +3 -3
  40. data/lib/google/protobuf/ffi/oneof_descriptor.rb +13 -1
  41. data/lib/google/protobuf/ffi/repeated_field.rb +47 -19
  42. data/lib/google/protobuf/ffi/service_descriptor.rb +117 -0
  43. data/lib/google/protobuf/field_mask_pb.rb +1 -22
  44. data/lib/google/protobuf/internal/object_cache.rb +99 -0
  45. data/lib/google/protobuf/plugin_pb.rb +2 -24
  46. data/lib/google/protobuf/repeated_field.rb +4 -5
  47. data/lib/google/protobuf/source_context_pb.rb +1 -22
  48. data/lib/google/protobuf/struct_pb.rb +1 -22
  49. data/lib/google/protobuf/timestamp_pb.rb +1 -22
  50. data/lib/google/protobuf/type_pb.rb +1 -24
  51. data/lib/google/protobuf/wrappers_pb.rb +1 -22
  52. data/lib/google/protobuf.rb +1 -1
  53. data/lib/google/protobuf_ffi.rb +5 -3
  54. data/lib/google/protobuf_native.rb +0 -1
  55. data/lib/google/tasks/ffi.rake +1 -3
  56. metadata +28 -13
  57. data/ext/google/protobuf_c/third_party/utf8_range/naive.c +0 -92
  58. data/ext/google/protobuf_c/third_party/utf8_range/range2-neon.c +0 -157
  59. data/ext/google/protobuf_c/third_party/utf8_range/range2-sse.c +0 -170
  60. data/lib/google/protobuf/descriptor_dsl.rb +0 -465
  61. data/lib/google/protobuf/object_cache.rb +0 -97
@@ -44,9 +44,11 @@ static void Message_mark(void* _self) {
44
44
  rb_gc_mark(self->arena);
45
45
  }
46
46
 
47
+ static size_t Message_memsize(const void* _self) { return sizeof(Message); }
48
+
47
49
  static rb_data_type_t Message_type = {
48
50
  "Google::Protobuf::Message",
49
- {Message_mark, RUBY_DEFAULT_FREE, NULL},
51
+ {Message_mark, RUBY_DEFAULT_FREE, Message_memsize},
50
52
  .flags = RUBY_TYPED_FREE_IMMEDIATELY | RUBY_TYPED_WB_PROTECTED,
51
53
  };
52
54
 
@@ -78,11 +80,13 @@ const upb_Message* Message_Get(VALUE msg_rb, const upb_MessageDef** m) {
78
80
  }
79
81
 
80
82
  upb_Message* Message_GetMutable(VALUE msg_rb, const upb_MessageDef** m) {
81
- rb_check_frozen(msg_rb);
82
- return (upb_Message*)Message_Get(msg_rb, m);
83
+ const upb_Message* upb_msg = Message_Get(msg_rb, m);
84
+ Protobuf_CheckNotFrozen(msg_rb, upb_Message_IsFrozen(upb_msg));
85
+ return (upb_Message*)upb_msg;
83
86
  }
84
87
 
85
- void Message_InitPtr(VALUE self_, upb_Message* msg, VALUE arena) {
88
+ void Message_InitPtr(VALUE self_, const upb_Message* msg, VALUE arena) {
89
+ PBRUBY_ASSERT(arena != Qnil);
86
90
  Message* self = ruby_to_Message(self_);
87
91
  self->msg = msg;
88
92
  RB_OBJ_WRITE(self_, &self->arena, arena);
@@ -103,7 +107,7 @@ void Message_CheckClass(VALUE klass) {
103
107
  }
104
108
  }
105
109
 
106
- VALUE Message_GetRubyWrapper(upb_Message* msg, const upb_MessageDef* m,
110
+ VALUE Message_GetRubyWrapper(const upb_Message* msg, const upb_MessageDef* m,
107
111
  VALUE arena) {
108
112
  if (msg == NULL) return Qnil;
109
113
 
@@ -114,7 +118,6 @@ VALUE Message_GetRubyWrapper(upb_Message* msg, const upb_MessageDef* m,
114
118
  val = Message_alloc(klass);
115
119
  Message_InitPtr(val, msg, arena);
116
120
  }
117
-
118
121
  return val;
119
122
  }
120
123
 
@@ -246,7 +249,7 @@ static int extract_method_call(VALUE method_name, Message* self,
246
249
  static VALUE Message_oneof_accessor(VALUE _self, const upb_OneofDef* o,
247
250
  int accessor_type) {
248
251
  Message* self = ruby_to_Message(_self);
249
- const upb_FieldDef* oneof_field = upb_Message_WhichOneof(self->msg, o);
252
+ const upb_FieldDef* oneof_field = upb_Message_WhichOneofByDef(self->msg, o);
250
253
 
251
254
  switch (accessor_type) {
252
255
  case METHOD_PRESENCE:
@@ -286,13 +289,42 @@ static void Message_setfield(upb_Message* msg, const upb_FieldDef* f, VALUE val,
286
289
  upb_Message_SetFieldByDef(msg, f, msgval, arena);
287
290
  }
288
291
 
292
+ VALUE Message_getfield_frozen(const upb_Message* msg, const upb_FieldDef* f,
293
+ VALUE arena) {
294
+ upb_MessageValue msgval = upb_Message_GetFieldByDef(msg, f);
295
+ if (upb_FieldDef_IsMap(f)) {
296
+ if (msgval.map_val == NULL) {
297
+ return Map_EmptyFrozen(f);
298
+ }
299
+ const upb_FieldDef* key_f = map_field_key(f);
300
+ const upb_FieldDef* val_f = map_field_value(f);
301
+ upb_CType key_type = upb_FieldDef_CType(key_f);
302
+ TypeInfo value_type_info = TypeInfo_get(val_f);
303
+ return Map_GetRubyWrapper(msgval.map_val, key_type, value_type_info, arena);
304
+ }
305
+ if (upb_FieldDef_IsRepeated(f)) {
306
+ if (msgval.array_val == NULL) {
307
+ return RepeatedField_EmptyFrozen(f);
308
+ }
309
+ return RepeatedField_GetRubyWrapper(msgval.array_val, TypeInfo_get(f),
310
+ arena);
311
+ }
312
+ VALUE ret;
313
+ if (upb_FieldDef_IsSubMessage(f)) {
314
+ const upb_MessageDef* m = upb_FieldDef_MessageSubDef(f);
315
+ ret = Message_GetRubyWrapper(msgval.msg_val, m, arena);
316
+ } else {
317
+ ret = Convert_UpbToRuby(msgval, TypeInfo_get(f), Qnil);
318
+ }
319
+ return ret;
320
+ }
321
+
289
322
  VALUE Message_getfield(VALUE _self, const upb_FieldDef* f) {
290
323
  Message* self = ruby_to_Message(_self);
291
- // This is a special-case: upb_Message_Mutable() for map & array are logically
292
- // const (they will not change what is serialized) but physically
293
- // non-const, as they do allocate a repeated field or map. The logical
294
- // constness means it's ok to do even if the message is frozen.
295
- upb_Message* msg = (upb_Message*)self->msg;
324
+ if (upb_Message_IsFrozen(self->msg)) {
325
+ return Message_getfield_frozen(self->msg, f, self->arena);
326
+ }
327
+ upb_Message* msg = Message_GetMutable(_self, NULL);
296
328
  upb_Arena* arena = Arena_get(self->arena);
297
329
  if (upb_FieldDef_IsMap(f)) {
298
330
  upb_Map* map = upb_Message_Mutable(msg, f, arena).map;
@@ -305,12 +337,12 @@ VALUE Message_getfield(VALUE _self, const upb_FieldDef* f) {
305
337
  upb_Array* arr = upb_Message_Mutable(msg, f, arena).array;
306
338
  return RepeatedField_GetRubyWrapper(arr, TypeInfo_get(f), self->arena);
307
339
  } else if (upb_FieldDef_IsSubMessage(f)) {
308
- if (!upb_Message_HasFieldByDef(self->msg, f)) return Qnil;
340
+ if (!upb_Message_HasFieldByDef(msg, f)) return Qnil;
309
341
  upb_Message* submsg = upb_Message_Mutable(msg, f, arena).msg;
310
342
  const upb_MessageDef* m = upb_FieldDef_MessageSubDef(f);
311
343
  return Message_GetRubyWrapper(submsg, m, self->arena);
312
344
  } else {
313
- upb_MessageValue msgval = upb_Message_GetFieldByDef(self->msg, f);
345
+ upb_MessageValue msgval = upb_Message_GetFieldByDef(msg, f);
314
346
  return Convert_UpbToRuby(msgval, TypeInfo_get(f), self->arena);
315
347
  }
316
348
  }
@@ -330,7 +362,8 @@ static VALUE Message_field_accessor(VALUE _self, const upb_FieldDef* f,
330
362
  if (!upb_FieldDef_HasPresence(f)) {
331
363
  rb_raise(rb_eRuntimeError, "Field does not have presence.");
332
364
  }
333
- return upb_Message_HasFieldByDef(Message_Get(_self, NULL), f);
365
+ return upb_Message_HasFieldByDef(Message_Get(_self, NULL), f) ? Qtrue
366
+ : Qfalse;
334
367
  case METHOD_WRAPPER_GETTER: {
335
368
  Message* self = ruby_to_Message(_self);
336
369
  if (upb_Message_HasFieldByDef(self->msg, f)) {
@@ -434,7 +467,6 @@ static VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
434
467
  if (argc != 2) {
435
468
  rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
436
469
  }
437
- rb_check_frozen(_self);
438
470
  break;
439
471
  default:
440
472
  if (argc != 1) {
@@ -661,29 +693,12 @@ static VALUE Message_dup(VALUE _self) {
661
693
  Message* self = ruby_to_Message(_self);
662
694
  VALUE new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
663
695
  Message* new_msg_self = ruby_to_Message(new_msg);
664
- size_t size = upb_MessageDef_MiniTable(self->msgdef)->size;
665
-
666
- // TODO
667
- // TODO
668
- memcpy((upb_Message*)new_msg_self->msg, self->msg, size);
696
+ const upb_MiniTable* m = upb_MessageDef_MiniTable(self->msgdef);
697
+ upb_Message_ShallowCopy((upb_Message*)new_msg_self->msg, self->msg, m);
669
698
  Arena_fuse(self->arena, Arena_get(new_msg_self->arena));
670
699
  return new_msg;
671
700
  }
672
701
 
673
- // Support function for Message_eq, and also used by other #eq functions.
674
- bool Message_Equal(const upb_Message* m1, const upb_Message* m2,
675
- const upb_MessageDef* m) {
676
- upb_Status status;
677
- upb_Status_Clear(&status);
678
- bool return_value = shared_Message_Equal(m1, m2, m, &status);
679
- if (upb_Status_IsOk(&status)) {
680
- return return_value;
681
- } else {
682
- rb_raise(cParseError, "Message_Equal(): %s",
683
- upb_Status_ErrorMessage(&status));
684
- }
685
- }
686
-
687
702
  /*
688
703
  * call-seq:
689
704
  * Message.==(other) => boolean
@@ -700,7 +715,10 @@ static VALUE Message_eq(VALUE _self, VALUE _other) {
700
715
  Message* other = ruby_to_Message(_other);
701
716
  assert(self->msgdef == other->msgdef);
702
717
 
703
- return Message_Equal(self->msg, other->msg, self->msgdef) ? Qtrue : Qfalse;
718
+ const upb_MiniTable* m = upb_MessageDef_MiniTable(self->msgdef);
719
+ const int options = 0;
720
+ return upb_Message_IsEqual(self->msg, other->msg, m, options) ? Qtrue
721
+ : Qfalse;
704
722
  }
705
723
 
706
724
  uint64_t Message_Hash(const upb_Message* msg, const upb_MessageDef* m,
@@ -769,58 +787,34 @@ static VALUE Message_CreateHash(const upb_Message* msg,
769
787
  if (!msg) return Qnil;
770
788
 
771
789
  VALUE hash = rb_hash_new();
772
- int n = upb_MessageDef_FieldCount(m);
773
- bool is_proto2;
774
-
775
- // We currently have a few behaviors that are specific to proto2.
776
- // This is unfortunate, we should key behaviors off field attributes (like
777
- // whether a field has presence), not proto2 vs. proto3. We should see if we
778
- // can change this without breaking users.
779
- is_proto2 = upb_MessageDef_Syntax(m) == kUpb_Syntax_Proto2;
780
-
781
- for (int i = 0; i < n; i++) {
782
- const upb_FieldDef* field = upb_MessageDef_Field(m, i);
783
- TypeInfo type_info = TypeInfo_get(field);
784
- upb_MessageValue msgval;
785
- VALUE msg_value;
786
- VALUE msg_key;
787
-
788
- if (!is_proto2 && upb_FieldDef_IsSubMessage(field) &&
789
- !upb_FieldDef_IsRepeated(field) &&
790
- !upb_Message_HasFieldByDef(msg, field)) {
791
- // TODO: Legacy behavior, remove when we fix the is_proto2 differences.
792
- msg_key = ID2SYM(rb_intern(upb_FieldDef_Name(field)));
793
- rb_hash_aset(hash, msg_key, Qnil);
794
- continue;
795
- }
790
+ size_t iter = kUpb_Message_Begin;
791
+ const upb_DefPool* pool = upb_FileDef_Pool(upb_MessageDef_File(m));
792
+ const upb_FieldDef* field;
793
+ upb_MessageValue val;
796
794
 
797
- // Do not include fields that are not present (oneof or optional fields).
798
- if (is_proto2 && upb_FieldDef_HasPresence(field) &&
799
- !upb_Message_HasFieldByDef(msg, field)) {
795
+ while (upb_Message_Next(msg, m, pool, &field, &val, &iter)) {
796
+ if (upb_FieldDef_IsExtension(field)) {
797
+ // TODO: allow extensions once we have decided what naming scheme the
798
+ // symbol should use. eg. :"[pkg.ext]"
800
799
  continue;
801
800
  }
802
801
 
803
- msg_key = ID2SYM(rb_intern(upb_FieldDef_Name(field)));
804
- msgval = upb_Message_GetFieldByDef(msg, field);
805
-
806
- // Proto2 omits empty map/repeated filds also.
802
+ TypeInfo type_info = TypeInfo_get(field);
803
+ VALUE msg_value;
807
804
 
808
805
  if (upb_FieldDef_IsMap(field)) {
809
806
  const upb_MessageDef* entry_m = upb_FieldDef_MessageSubDef(field);
810
807
  const upb_FieldDef* key_f = upb_MessageDef_FindFieldByNumber(entry_m, 1);
811
808
  const upb_FieldDef* val_f = upb_MessageDef_FindFieldByNumber(entry_m, 2);
812
809
  upb_CType key_type = upb_FieldDef_CType(key_f);
813
- msg_value = Map_CreateHash(msgval.map_val, key_type, TypeInfo_get(val_f));
810
+ msg_value = Map_CreateHash(val.map_val, key_type, TypeInfo_get(val_f));
814
811
  } else if (upb_FieldDef_IsRepeated(field)) {
815
- if (is_proto2 &&
816
- (!msgval.array_val || upb_Array_Size(msgval.array_val) == 0)) {
817
- continue;
818
- }
819
- msg_value = RepeatedField_CreateArray(msgval.array_val, type_info);
812
+ msg_value = RepeatedField_CreateArray(val.array_val, type_info);
820
813
  } else {
821
- msg_value = Scalar_CreateHash(msgval, type_info);
814
+ msg_value = Scalar_CreateHash(val, type_info);
822
815
  }
823
816
 
817
+ VALUE msg_key = ID2SYM(rb_intern(upb_FieldDef_Name(field)));
824
818
  rb_hash_aset(hash, msg_key, msg_value);
825
819
  }
826
820
 
@@ -848,43 +842,42 @@ static VALUE Message_to_h(VALUE _self) {
848
842
 
849
843
  /*
850
844
  * call-seq:
851
- * Message.freeze => self
845
+ * Message.frozen? => bool
852
846
  *
853
- * Freezes the message object. We have to intercept this so we can pin the
854
- * Ruby object into memory so we don't forget it's frozen.
847
+ * Returns true if the message is frozen in either Ruby or the underlying
848
+ * representation. Freezes the Ruby message object if it is not already frozen
849
+ * in Ruby but it is frozen in the underlying representation.
855
850
  */
856
- static VALUE Message_freeze(VALUE _self) {
851
+ VALUE Message_frozen(VALUE _self) {
857
852
  Message* self = ruby_to_Message(_self);
858
- if (!RB_OBJ_FROZEN(_self)) {
859
- Arena_Pin(self->arena, _self);
860
- RB_OBJ_FREEZE(_self);
853
+ if (!upb_Message_IsFrozen(self->msg)) {
854
+ PBRUBY_ASSERT(!RB_OBJ_FROZEN(_self));
855
+ return Qfalse;
861
856
  }
862
- return _self;
857
+
858
+ // Lazily freeze the Ruby wrapper.
859
+ if (!RB_OBJ_FROZEN(_self)) RB_OBJ_FREEZE(_self);
860
+ return Qtrue;
863
861
  }
864
862
 
865
863
  /*
866
- * Deep freezes the message object recursively.
867
- * Internal use only.
864
+ * call-seq:
865
+ * Message.freeze => self
866
+ *
867
+ * Freezes the message object. We have to intercept this so we can freeze the
868
+ * underlying representation, not just the Ruby wrapper.
868
869
  */
869
- VALUE Message_internal_deep_freeze(VALUE _self) {
870
+ VALUE Message_freeze(VALUE _self) {
870
871
  Message* self = ruby_to_Message(_self);
871
- Message_freeze(_self);
872
-
873
- int n = upb_MessageDef_FieldCount(self->msgdef);
874
- for (int i = 0; i < n; i++) {
875
- const upb_FieldDef* f = upb_MessageDef_Field(self->msgdef, i);
876
- VALUE field = Message_getfield(_self, f);
877
-
878
- if (field != Qnil) {
879
- if (upb_FieldDef_IsMap(f)) {
880
- Map_internal_deep_freeze(field);
881
- } else if (upb_FieldDef_IsRepeated(f)) {
882
- RepeatedField_internal_deep_freeze(field);
883
- } else if (upb_FieldDef_IsSubMessage(f)) {
884
- Message_internal_deep_freeze(field);
885
- }
886
- }
872
+ if (RB_OBJ_FROZEN(_self)) {
873
+ PBRUBY_ASSERT(upb_Message_IsFrozen(self->msg));
874
+ return _self;
887
875
  }
876
+ if (!upb_Message_IsFrozen(self->msg)) {
877
+ upb_Message_Freeze(Message_GetMutable(_self, NULL),
878
+ upb_MessageDef_MiniTable(self->msgdef));
879
+ }
880
+ RB_OBJ_FREEZE(_self);
888
881
  return _self;
889
882
  }
890
883
 
@@ -990,7 +983,7 @@ VALUE Message_decode_bytes(int size, const char* bytes, int options,
990
983
  rb_raise(cParseError, "Error occurred during parsing");
991
984
  }
992
985
  if (freeze) {
993
- Message_internal_deep_freeze(msg_rb);
986
+ Message_freeze(msg_rb);
994
987
  }
995
988
  return msg_rb;
996
989
  }
@@ -1012,9 +1005,6 @@ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
1012
1005
  int options = 0;
1013
1006
  upb_Status status;
1014
1007
 
1015
- // TODO: use this message's pool instead.
1016
- const upb_DefPool* symtab = DescriptorPool_GetSymtab(generated_pool);
1017
-
1018
1008
  if (argc < 1 || argc > 2) {
1019
1009
  rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1020
1010
  }
@@ -1048,11 +1038,19 @@ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
1048
1038
  }
1049
1039
 
1050
1040
  upb_Status_Clear(&status);
1051
- if (!upb_JsonDecode(RSTRING_PTR(data), RSTRING_LEN(data),
1052
- (upb_Message*)msg->msg, msg->msgdef, symtab, options,
1053
- Arena_get(msg->arena), &status)) {
1054
- rb_raise(cParseError, "Error occurred during parsing: %s",
1055
- upb_Status_ErrorMessage(&status));
1041
+ const upb_DefPool* pool = upb_FileDef_Pool(upb_MessageDef_File(msg->msgdef));
1042
+
1043
+ int result = upb_JsonDecodeDetectingNonconformance(
1044
+ RSTRING_PTR(data), RSTRING_LEN(data), (upb_Message*)msg->msg,
1045
+ msg->msgdef, pool, options, Arena_get(msg->arena), &status);
1046
+
1047
+ switch (result) {
1048
+ case kUpb_JsonDecodeResult_Ok:
1049
+ break;
1050
+ case kUpb_JsonDecodeResult_Error:
1051
+ rb_raise(cParseError, "Error occurred during parsing: %s",
1052
+ upb_Status_ErrorMessage(&status));
1053
+ break;
1056
1054
  }
1057
1055
 
1058
1056
  return msg_rb;
@@ -1128,9 +1126,6 @@ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1128
1126
  size_t size;
1129
1127
  upb_Status status;
1130
1128
 
1131
- // TODO: use this message's pool instead.
1132
- const upb_DefPool* symtab = DescriptorPool_GetSymtab(generated_pool);
1133
-
1134
1129
  if (argc < 1 || argc > 2) {
1135
1130
  rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1136
1131
  }
@@ -1165,8 +1160,9 @@ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1165
1160
  }
1166
1161
 
1167
1162
  upb_Status_Clear(&status);
1168
- size = upb_JsonEncode(msg->msg, msg->msgdef, symtab, options, buf,
1169
- sizeof(buf), &status);
1163
+ const upb_DefPool* pool = upb_FileDef_Pool(upb_MessageDef_File(msg->msgdef));
1164
+ size = upb_JsonEncode(msg->msg, msg->msgdef, pool, options, buf, sizeof(buf),
1165
+ &status);
1170
1166
 
1171
1167
  if (!upb_Status_IsOk(&status)) {
1172
1168
  rb_raise(cParseError, "Error occurred during encoding: %s",
@@ -1176,7 +1172,7 @@ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1176
1172
  VALUE ret;
1177
1173
  if (size >= sizeof(buf)) {
1178
1174
  char* buf2 = malloc(size + 1);
1179
- upb_JsonEncode(msg->msg, msg->msgdef, symtab, options, buf2, size + 1,
1175
+ upb_JsonEncode(msg->msg, msg->msgdef, pool, options, buf2, size + 1,
1180
1176
  &status);
1181
1177
  ret = rb_str_new(buf2, size);
1182
1178
  free(buf2);
@@ -1402,6 +1398,7 @@ static void Message_define_class(VALUE klass) {
1402
1398
  rb_define_method(klass, "==", Message_eq, 1);
1403
1399
  rb_define_method(klass, "eql?", Message_eq, 1);
1404
1400
  rb_define_method(klass, "freeze", Message_freeze, 0);
1401
+ rb_define_method(klass, "frozen?", Message_frozen, 0);
1405
1402
  rb_define_method(klass, "hash", Message_hash, 0);
1406
1403
  rb_define_method(klass, "to_h", Message_to_h, 0);
1407
1404
  rb_define_method(klass, "inspect", Message_inspect, 0);
@@ -36,7 +36,7 @@ const upb_Message* Message_GetUpbMessage(VALUE value, const upb_MessageDef* m,
36
36
 
37
37
  // Gets or constructs a Ruby wrapper object for the given message. The wrapper
38
38
  // object will reference |arena| and ensure that it outlives this object.
39
- VALUE Message_GetRubyWrapper(upb_Message* msg, const upb_MessageDef* m,
39
+ VALUE Message_GetRubyWrapper(const upb_Message* msg, const upb_MessageDef* m,
40
40
  VALUE arena);
41
41
 
42
42
  // Gets the given field from this message.
@@ -54,10 +54,6 @@ uint64_t Message_Hash(const upb_Message* msg, const upb_MessageDef* m,
54
54
  upb_Message* Message_deep_copy(const upb_Message* msg, const upb_MessageDef* m,
55
55
  upb_Arena* arena);
56
56
 
57
- // Returns true if these two messages are equal.
58
- bool Message_Equal(const upb_Message* m1, const upb_Message* m2,
59
- const upb_MessageDef* m);
60
-
61
57
  // Checks that this Ruby object is a message, and raises an exception if not.
62
58
  void Message_CheckClass(VALUE klass);
63
59
 
@@ -78,7 +74,7 @@ VALUE Message_decode_bytes(int size, const char* bytes, int options,
78
74
  VALUE klass, bool freeze);
79
75
 
80
76
  // Recursively freeze message
81
- VALUE Message_internal_deep_freeze(VALUE _self);
77
+ VALUE Message_freeze(VALUE _self);
82
78
 
83
79
  // Call at startup to register all types in this module.
84
80
  void Message_register(VALUE protobuf);
@@ -7,8 +7,6 @@
7
7
 
8
8
  #include "protobuf.h"
9
9
 
10
- #include <ruby/version.h>
11
-
12
10
  #include "defs.h"
13
11
  #include "map.h"
14
12
  #include "message.h"
@@ -164,11 +162,23 @@ static void Arena_free(void *data) {
164
162
  xfree(arena);
165
163
  }
166
164
 
165
+ static size_t Arena_memsize(const void *data) {
166
+ const Arena *arena = data;
167
+ size_t fused_count;
168
+ size_t memsize = upb_Arena_SpaceAllocated(arena->arena, &fused_count);
169
+ if (fused_count > 1) {
170
+ // If other arena were fused we attribute an equal
171
+ // share of memory usage to each one.
172
+ memsize /= fused_count;
173
+ }
174
+ return memsize + sizeof(Arena);
175
+ }
176
+
167
177
  static VALUE cArena;
168
178
 
169
179
  const rb_data_type_t Arena_type = {
170
180
  "Google::Protobuf::Internal::Arena",
171
- {Arena_mark, Arena_free, NULL},
181
+ {Arena_mark, Arena_free, Arena_memsize},
172
182
  .flags = RUBY_TYPED_FREE_IMMEDIATELY | RUBY_TYPED_WB_PROTECTED,
173
183
  };
174
184
 
@@ -209,15 +219,6 @@ void Arena_fuse(VALUE _arena, upb_Arena *other) {
209
219
 
210
220
  VALUE Arena_new() { return Arena_alloc(cArena); }
211
221
 
212
- void Arena_Pin(VALUE _arena, VALUE obj) {
213
- Arena *arena;
214
- TypedData_Get_Struct(_arena, Arena, &Arena_type, arena);
215
- if (arena->pinned_objs == Qnil) {
216
- RB_OBJ_WRITE(_arena, &arena->pinned_objs, rb_ary_new());
217
- }
218
- rb_ary_push(arena->pinned_objs, obj);
219
- }
220
-
221
222
  void Arena_register(VALUE module) {
222
223
  VALUE internal = rb_define_module_under(module, "Internal");
223
224
  VALUE klass = rb_define_class_under(internal, "Arena", rb_cObject);
@@ -241,16 +242,17 @@ static void ObjectCache_Init(VALUE protobuf) {
241
242
  item_try_add = rb_intern("try_add");
242
243
 
243
244
  rb_gc_register_address(&weak_obj_cache);
245
+ VALUE internal = rb_const_get(protobuf, rb_intern("Internal"));
244
246
  #if SIZEOF_LONG >= SIZEOF_VALUE
245
- VALUE cache_class = rb_const_get(protobuf, rb_intern("ObjectCache"));
247
+ VALUE cache_class = rb_const_get(internal, rb_intern("ObjectCache"));
246
248
  #else
247
- VALUE cache_class = rb_const_get(protobuf, rb_intern("LegacyObjectCache"));
249
+ VALUE cache_class = rb_const_get(internal, rb_intern("LegacyObjectCache"));
248
250
  #endif
249
251
 
250
252
  weak_obj_cache = rb_class_new_instance(0, NULL, cache_class);
251
- rb_const_set(protobuf, rb_intern("OBJECT_CACHE"), weak_obj_cache);
252
- rb_const_set(protobuf, rb_intern("SIZEOF_LONG"), INT2NUM(SIZEOF_LONG));
253
- rb_const_set(protobuf, rb_intern("SIZEOF_VALUE"), INT2NUM(SIZEOF_VALUE));
253
+ rb_const_set(internal, rb_intern("OBJECT_CACHE"), weak_obj_cache);
254
+ rb_const_set(internal, rb_intern("SIZEOF_LONG"), INT2NUM(SIZEOF_LONG));
255
+ rb_const_set(internal, rb_intern("SIZEOF_VALUE"), INT2NUM(SIZEOF_VALUE));
254
256
  }
255
257
 
256
258
  static VALUE ObjectCache_GetKey(const void *key) {
@@ -284,7 +286,8 @@ VALUE ObjectCache_Get(const void *key) {
284
286
  static VALUE Google_Protobuf_discard_unknown(VALUE self, VALUE msg_rb) {
285
287
  const upb_MessageDef *m;
286
288
  upb_Message *msg = Message_GetMutable(msg_rb, &m);
287
- if (!upb_Message_DiscardUnknown(msg, m, 128)) {
289
+ const upb_DefPool* ext_pool = upb_FileDef_Pool(upb_MessageDef_File(m));
290
+ if (!upb_Message_DiscardUnknown(msg, m, ext_pool, 128)) {
288
291
  rb_raise(rb_eRuntimeError, "Messages nested too deeply.");
289
292
  }
290
293
 
@@ -341,3 +344,14 @@ __attribute__((visibility("default"))) void Init_protobuf_c() {
341
344
  rb_define_singleton_method(protobuf, "deep_copy", Google_Protobuf_deep_copy,
342
345
  1);
343
346
  }
347
+
348
+ // -----------------------------------------------------------------------------
349
+ // Utilities
350
+ // -----------------------------------------------------------------------------
351
+
352
+ // Raises a Ruby error if val is frozen in Ruby or UPB.
353
+ void Protobuf_CheckNotFrozen(VALUE val, bool upb_frozen) {
354
+ if (RB_UNLIKELY(rb_obj_frozen_p(val)||upb_frozen)) {
355
+ rb_error_frozen_object(val);
356
+ }
357
+ }
@@ -50,13 +50,6 @@ upb_Arena* Arena_get(VALUE arena);
50
50
  // possible.
51
51
  void Arena_fuse(VALUE arena, upb_Arena* other);
52
52
 
53
- // Pins this Ruby object to the lifetime of this arena, so that as long as the
54
- // arena is alive this object will not be collected.
55
- //
56
- // We use this to guarantee that the "frozen" bit on the object will be
57
- // remembered, even if the user drops their reference to this precise object.
58
- void Arena_Pin(VALUE arena, VALUE obj);
59
-
60
53
  // -----------------------------------------------------------------------------
61
54
  // ObjectCache
62
55
  // -----------------------------------------------------------------------------
@@ -105,6 +98,9 @@ extern VALUE cTypeError;
105
98
  rb_bug("Assertion failed at %s:%d, expr: %s", __FILE__, __LINE__, #expr)
106
99
  #endif
107
100
 
101
+ // Raises a Ruby error if val is frozen in Ruby or upb_frozen is true.
102
+ void Protobuf_CheckNotFrozen(VALUE val, bool upb_frozen);
103
+
108
104
  #define PBRUBY_MAX(x, y) (((x) > (y)) ? (x) : (y))
109
105
 
110
106
  #define UPB_UNUSED(var) (void)var
@@ -44,8 +44,9 @@ static RepeatedField* ruby_to_RepeatedField(VALUE _self) {
44
44
  }
45
45
 
46
46
  static upb_Array* RepeatedField_GetMutable(VALUE _self) {
47
- rb_check_frozen(_self);
48
- return (upb_Array*)ruby_to_RepeatedField(_self)->array;
47
+ const upb_Array* array = ruby_to_RepeatedField(_self)->array;
48
+ Protobuf_CheckNotFrozen(_self, upb_Array_IsFrozen(array));
49
+ return (upb_Array*)array;
49
50
  }
50
51
 
51
52
  VALUE RepeatedField_alloc(VALUE klass) {
@@ -56,9 +57,32 @@ VALUE RepeatedField_alloc(VALUE klass) {
56
57
  return TypedData_Wrap_Struct(klass, &RepeatedField_type, self);
57
58
  }
58
59
 
59
- VALUE RepeatedField_GetRubyWrapper(upb_Array* array, TypeInfo type_info,
60
+ VALUE RepeatedField_EmptyFrozen(const upb_FieldDef* f) {
61
+ PBRUBY_ASSERT(upb_FieldDef_IsRepeated(f));
62
+ VALUE val = ObjectCache_Get(f);
63
+
64
+ if (val == Qnil) {
65
+ val = RepeatedField_alloc(cRepeatedField);
66
+ RepeatedField* self;
67
+ TypedData_Get_Struct(val, RepeatedField, &RepeatedField_type, self);
68
+ self->arena = Arena_new();
69
+ TypeInfo type_info = TypeInfo_get(f);
70
+ self->array = upb_Array_New(Arena_get(self->arena), type_info.type);
71
+ self->type_info = type_info;
72
+ if (self->type_info.type == kUpb_CType_Message) {
73
+ self->type_class = Descriptor_DefToClass(type_info.def.msgdef);
74
+ }
75
+ val = ObjectCache_TryAdd(f, RepeatedField_freeze(val));
76
+ }
77
+ PBRUBY_ASSERT(RB_OBJ_FROZEN(val));
78
+ PBRUBY_ASSERT(upb_Array_IsFrozen(ruby_to_RepeatedField(val)->array));
79
+ return val;
80
+ }
81
+
82
+ VALUE RepeatedField_GetRubyWrapper(const upb_Array* array, TypeInfo type_info,
60
83
  VALUE arena) {
61
84
  PBRUBY_ASSERT(array);
85
+ PBRUBY_ASSERT(arena != Qnil);
62
86
  VALUE val = ObjectCache_Get(array);
63
87
 
64
88
  if (val == Qnil) {
@@ -78,7 +102,6 @@ VALUE RepeatedField_GetRubyWrapper(upb_Array* array, TypeInfo type_info,
78
102
  PBRUBY_ASSERT(ruby_to_RepeatedField(val)->type_info.def.msgdef ==
79
103
  type_info.def.msgdef);
80
104
  PBRUBY_ASSERT(ruby_to_RepeatedField(val)->array == array);
81
-
82
105
  return val;
83
106
  }
84
107
 
@@ -473,36 +496,47 @@ VALUE RepeatedField_eq(VALUE _self, VALUE _other) {
473
496
 
474
497
  /*
475
498
  * call-seq:
476
- * RepeatedField.freeze => self
499
+ * RepeatedField.frozen? => bool
477
500
  *
478
- * Freezes the repeated field. We have to intercept this so we can pin the Ruby
479
- * object into memory so we don't forget it's frozen.
501
+ * Returns true if the repeated field is frozen in either Ruby or the underlying
502
+ * representation. Freezes the Ruby repeated field object if it is not already
503
+ * frozen in Ruby but it is frozen in the underlying representation.
480
504
  */
481
- static VALUE RepeatedField_freeze(VALUE _self) {
505
+ VALUE RepeatedField_frozen(VALUE _self) {
482
506
  RepeatedField* self = ruby_to_RepeatedField(_self);
483
- if (!RB_OBJ_FROZEN(_self)) {
484
- Arena_Pin(self->arena, _self);
485
- RB_OBJ_FREEZE(_self);
507
+ if (!upb_Array_IsFrozen(self->array)) {
508
+ PBRUBY_ASSERT(!RB_OBJ_FROZEN(_self));
509
+ return Qfalse;
486
510
  }
487
- return _self;
511
+
512
+ // Lazily freeze the Ruby wrapper.
513
+ if (!RB_OBJ_FROZEN(_self)) RB_OBJ_FREEZE(_self);
514
+ return Qtrue;
488
515
  }
489
516
 
490
517
  /*
491
- * Deep freezes the repeated field and values recursively.
492
- * Internal use only.
518
+ * call-seq:
519
+ * RepeatedField.freeze => self
520
+ *
521
+ * Freezes the repeated field object. We have to intercept this so we can freeze
522
+ * the underlying representation, not just the Ruby wrapper.
493
523
  */
494
- VALUE RepeatedField_internal_deep_freeze(VALUE _self) {
524
+ VALUE RepeatedField_freeze(VALUE _self) {
495
525
  RepeatedField* self = ruby_to_RepeatedField(_self);
496
- RepeatedField_freeze(_self);
497
- if (self->type_info.type == kUpb_CType_Message) {
498
- int size = upb_Array_Size(self->array);
499
- int i;
500
- for (i = 0; i < size; i++) {
501
- upb_MessageValue msgval = upb_Array_Get(self->array, i);
502
- VALUE val = Convert_UpbToRuby(msgval, self->type_info, self->arena);
503
- Message_internal_deep_freeze(val);
526
+ if (RB_OBJ_FROZEN(_self)) {
527
+ PBRUBY_ASSERT(upb_Array_IsFrozen(self->array));
528
+ return _self;
529
+ }
530
+
531
+ if (!upb_Array_IsFrozen(self->array)) {
532
+ if (self->type_info.type == kUpb_CType_Message) {
533
+ upb_Array_Freeze(RepeatedField_GetMutable(_self),
534
+ upb_MessageDef_MiniTable(self->type_info.def.msgdef));
535
+ } else {
536
+ upb_Array_Freeze(RepeatedField_GetMutable(_self), NULL);
504
537
  }
505
538
  }
539
+ RB_OBJ_FREEZE(_self);
506
540
  return _self;
507
541
  }
508
542
 
@@ -649,6 +683,7 @@ void RepeatedField_register(VALUE module) {
649
683
  rb_define_method(klass, "==", RepeatedField_eq, 1);
650
684
  rb_define_method(klass, "to_ary", RepeatedField_to_ary, 0);
651
685
  rb_define_method(klass, "freeze", RepeatedField_freeze, 0);
686
+ rb_define_method(klass, "frozen?", RepeatedField_frozen, 0);
652
687
  rb_define_method(klass, "hash", RepeatedField_hash, 0);
653
688
  rb_define_method(klass, "+", RepeatedField_plus, 1);
654
689
  rb_define_method(klass, "concat", RepeatedField_concat, 1);