google-protobuf 3.0.0 → 3.20.0

Sign up to get free protection for your applications and to get access to all the features.

Potentially problematic release.


This version of google-protobuf might be problematic. Click here for more details.

Files changed (46)
  1. checksums.yaml +5 -5
  2. data/ext/google/protobuf_c/convert.c +361 -0
  3. data/ext/google/protobuf_c/convert.h +75 -0
  4. data/ext/google/protobuf_c/defs.c +760 -1243
  5. data/ext/google/protobuf_c/defs.h +107 -0
  6. data/ext/google/protobuf_c/extconf.rb +22 -4
  7. data/ext/google/protobuf_c/map.c +342 -450
  8. data/ext/google/protobuf_c/map.h +66 -0
  9. data/ext/google/protobuf_c/message.c +1108 -284
  10. data/ext/google/protobuf_c/message.h +104 -0
  11. data/ext/google/protobuf_c/protobuf.c +416 -51
  12. data/ext/google/protobuf_c/protobuf.h +53 -472
  13. data/ext/google/protobuf_c/repeated_field.c +318 -317
  14. data/ext/google/protobuf_c/repeated_field.h +63 -0
  15. data/ext/google/protobuf_c/ruby-upb.c +11115 -0
  16. data/ext/google/protobuf_c/ruby-upb.h +5612 -0
  17. data/ext/google/protobuf_c/third_party/utf8_range/LICENSE +21 -0
  18. data/ext/google/protobuf_c/third_party/utf8_range/naive.c +92 -0
  19. data/ext/google/protobuf_c/third_party/utf8_range/range2-neon.c +157 -0
  20. data/ext/google/protobuf_c/third_party/utf8_range/range2-sse.c +170 -0
  21. data/ext/google/protobuf_c/third_party/utf8_range/utf8_range.h +9 -0
  22. data/ext/google/protobuf_c/wrap_memcpy.c +52 -0
  23. data/lib/google/protobuf/any_pb.rb +6 -4
  24. data/lib/google/protobuf/api_pb.rb +27 -24
  25. data/lib/google/protobuf/descriptor_dsl.rb +465 -0
  26. data/lib/google/protobuf/descriptor_pb.rb +269 -0
  27. data/lib/google/protobuf/duration_pb.rb +6 -4
  28. data/lib/google/protobuf/empty_pb.rb +4 -2
  29. data/lib/google/protobuf/field_mask_pb.rb +5 -3
  30. data/lib/google/protobuf/message_exts.rb +4 -4
  31. data/lib/google/protobuf/repeated_field.rb +4 -4
  32. data/lib/google/protobuf/source_context_pb.rb +5 -3
  33. data/lib/google/protobuf/struct_pb.rb +23 -21
  34. data/lib/google/protobuf/timestamp_pb.rb +6 -4
  35. data/lib/google/protobuf/type_pb.rb +77 -74
  36. data/lib/google/protobuf/well_known_types.rb +240 -0
  37. data/lib/google/protobuf/wrappers_pb.rb +37 -35
  38. data/lib/google/protobuf.rb +12 -9
  39. data/tests/basic.rb +489 -1001
  40. data/tests/generated_code_test.rb +6 -2
  41. data/tests/stress.rb +1 -1
  42. metadata +39 -34
  43. data/ext/google/protobuf_c/encode_decode.c +0 -1264
  44. data/ext/google/protobuf_c/storage.c +0 -893
  45. data/ext/google/protobuf_c/upb.c +0 -12812
  46. data/ext/google/protobuf_c/upb.h +0 -8569
@@ -28,90 +28,394 @@
28
28
  // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29
29
  // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
30
 
31
+ #include "message.h"
32
+
33
+ #include "convert.h"
34
+ #include "defs.h"
35
+ #include "map.h"
31
36
  #include "protobuf.h"
37
+ #include "repeated_field.h"
32
38
 
33
- // -----------------------------------------------------------------------------
34
- // Class/module creation from msgdefs and enumdefs, respectively.
35
- // -----------------------------------------------------------------------------
39
+ static VALUE cParseError = Qnil;
40
+ static ID descriptor_instancevar_interned;
36
41
 
37
- void* Message_data(void* msg) {
38
- return ((uint8_t *)msg) + sizeof(MessageHeader);
42
+ static VALUE initialize_rb_class_with_no_args(VALUE klass) {
43
+ return rb_funcall(klass, rb_intern("new"), 0);
39
44
  }
40
45
 
41
- void Message_mark(void* _self) {
42
- MessageHeader* self = (MessageHeader *)_self;
43
- layout_mark(self->descriptor->layout, Message_data(self));
46
+ VALUE MessageOrEnum_GetDescriptor(VALUE klass) {
47
+ return rb_ivar_get(klass, descriptor_instancevar_interned);
44
48
  }
45
49
 
46
- void Message_free(void* self) {
47
- xfree(self);
50
+ // -----------------------------------------------------------------------------
51
+ // Class/module creation from msgdefs and enumdefs, respectively.
52
+ // -----------------------------------------------------------------------------
53
+
54
+ typedef struct {
55
+ VALUE arena;
56
+ const upb_Message* msg; // Can get as mutable when non-frozen.
57
+ const upb_MessageDef*
58
+ msgdef; // kept alive by self.class.descriptor reference.
59
+ } Message;
60
+
61
+ static void Message_mark(void* _self) {
62
+ Message* self = (Message*)_self;
63
+ rb_gc_mark(self->arena);
48
64
  }
49
65
 
50
- rb_data_type_t Message_type = {
51
- "Message",
52
- { Message_mark, Message_free, NULL },
66
+ static rb_data_type_t Message_type = {
67
+ "Message",
68
+ {Message_mark, RUBY_DEFAULT_FREE, NULL},
69
+ .flags = RUBY_TYPED_FREE_IMMEDIATELY,
53
70
  };
54
71
 
55
- VALUE Message_alloc(VALUE klass) {
72
+ static Message* ruby_to_Message(VALUE msg_rb) {
73
+ Message* msg;
74
+ TypedData_Get_Struct(msg_rb, Message, &Message_type, msg);
75
+ return msg;
76
+ }
77
+
78
+ static VALUE Message_alloc(VALUE klass) {
56
79
  VALUE descriptor = rb_ivar_get(klass, descriptor_instancevar_interned);
57
- Descriptor* desc = ruby_to_Descriptor(descriptor);
58
- MessageHeader* msg = (MessageHeader*)ALLOC_N(
59
- uint8_t, sizeof(MessageHeader) + desc->layout->size);
80
+ Message* msg = ALLOC(Message);
60
81
  VALUE ret;
61
82
 
62
- memset(Message_data(msg), 0, desc->layout->size);
83
+ msg->msgdef = Descriptor_GetMsgDef(descriptor);
84
+ msg->arena = Qnil;
85
+ msg->msg = NULL;
63
86
 
64
- // We wrap first so that everything in the message object is GC-rooted in case
65
- // a collection happens during object creation in layout_init().
66
87
  ret = TypedData_Wrap_Struct(klass, &Message_type, msg);
67
- msg->descriptor = desc;
68
88
  rb_ivar_set(ret, descriptor_instancevar_interned, descriptor);
69
89
 
70
- layout_init(desc->layout, Message_data(msg));
71
-
72
90
  return ret;
73
91
  }
74
92
 
75
- static VALUE which_oneof_field(MessageHeader* self, const upb_oneofdef* o) {
76
- upb_oneof_iter it;
77
- size_t case_ofs;
78
- uint32_t oneof_case;
79
- const upb_fielddef* first_field;
80
- const upb_fielddef* f;
93
+ const upb_Message* Message_Get(VALUE msg_rb, const upb_MessageDef** m) {
94
+ Message* msg = ruby_to_Message(msg_rb);
95
+ if (m) *m = msg->msgdef;
96
+ return msg->msg;
97
+ }
81
98
 
82
- // If no fields in the oneof, always nil.
83
- if (upb_oneofdef_numfields(o) == 0) {
84
- return Qnil;
99
+ upb_Message* Message_GetMutable(VALUE msg_rb, const upb_MessageDef** m) {
100
+ rb_check_frozen(msg_rb);
101
+ return (upb_Message*)Message_Get(msg_rb, m);
102
+ }
103
+
104
+ void Message_InitPtr(VALUE self_, upb_Message* msg, VALUE arena) {
105
+ Message* self = ruby_to_Message(self_);
106
+ self->msg = msg;
107
+ self->arena = arena;
108
+ ObjectCache_Add(msg, self_);
109
+ }
110
+
111
+ VALUE Message_GetArena(VALUE msg_rb) {
112
+ Message* msg = ruby_to_Message(msg_rb);
113
+ return msg->arena;
114
+ }
115
+
116
+ void Message_CheckClass(VALUE klass) {
117
+ if (rb_get_alloc_func(klass) != &Message_alloc) {
118
+ rb_raise(rb_eArgError,
119
+ "Message class was not returned by the DescriptorPool.");
85
120
  }
86
- // Grab the first field in the oneof so we can get its layout info to find the
87
- // oneof_case field.
88
- upb_oneof_begin(&it, o);
89
- assert(!upb_oneof_done(&it));
90
- first_field = upb_oneof_iter_field(&it);
91
- assert(upb_fielddef_containingoneof(first_field) != NULL);
121
+ }
92
122
 
93
- case_ofs =
94
- self->descriptor->layout->
95
- fields[upb_fielddef_index(first_field)].case_offset;
96
- oneof_case = *((uint32_t*)((char*)Message_data(self) + case_ofs));
123
+ VALUE Message_GetRubyWrapper(upb_Message* msg, const upb_MessageDef* m,
124
+ VALUE arena) {
125
+ if (msg == NULL) return Qnil;
97
126
 
98
- if (oneof_case == ONEOF_CASE_NONE) {
99
- return Qnil;
127
+ VALUE val = ObjectCache_Get(msg);
128
+
129
+ if (val == Qnil) {
130
+ VALUE klass = Descriptor_DefToClass(m);
131
+ val = Message_alloc(klass);
132
+ Message_InitPtr(val, msg, arena);
133
+ }
134
+
135
+ return val;
136
+ }
137
+
138
+ void Message_PrintMessage(StringBuilder* b, const upb_Message* msg,
139
+ const upb_MessageDef* m) {
140
+ bool first = true;
141
+ int n = upb_MessageDef_FieldCount(m);
142
+ VALUE klass = Descriptor_DefToClass(m);
143
+ StringBuilder_Printf(b, "<%s: ", rb_class2name(klass));
144
+
145
+ for (int i = 0; i < n; i++) {
146
+ const upb_FieldDef* field = upb_MessageDef_Field(m, i);
147
+
148
+ if (upb_FieldDef_HasPresence(field) && !upb_Message_Has(msg, field)) {
149
+ continue;
150
+ }
151
+
152
+ if (!first) {
153
+ StringBuilder_Printf(b, ", ");
154
+ } else {
155
+ first = false;
156
+ }
157
+
158
+ upb_MessageValue msgval = upb_Message_Get(msg, field);
159
+
160
+ StringBuilder_Printf(b, "%s: ", upb_FieldDef_Name(field));
161
+
162
+ if (upb_FieldDef_IsMap(field)) {
163
+ const upb_MessageDef* entry_m = upb_FieldDef_MessageSubDef(field);
164
+ const upb_FieldDef* key_f = upb_MessageDef_FindFieldByNumber(entry_m, 1);
165
+ const upb_FieldDef* val_f = upb_MessageDef_FindFieldByNumber(entry_m, 2);
166
+ TypeInfo val_info = TypeInfo_get(val_f);
167
+ Map_Inspect(b, msgval.map_val, upb_FieldDef_CType(key_f), val_info);
168
+ } else if (upb_FieldDef_IsRepeated(field)) {
169
+ RepeatedField_Inspect(b, msgval.array_val, TypeInfo_get(field));
170
+ } else {
171
+ StringBuilder_PrintMsgval(b, msgval, TypeInfo_get(field));
172
+ }
100
173
  }
101
174
 
102
- // oneof_case is a field index, so find that field.
103
- f = upb_oneofdef_itof(o, oneof_case);
104
- assert(f != NULL);
175
+ StringBuilder_Printf(b, ">");
176
+ }
177
+
178
+ // Helper functions for #method_missing ////////////////////////////////////////
179
+
180
+ enum {
181
+ METHOD_UNKNOWN = 0,
182
+ METHOD_GETTER = 1,
183
+ METHOD_SETTER = 2,
184
+ METHOD_CLEAR = 3,
185
+ METHOD_PRESENCE = 4,
186
+ METHOD_ENUM_GETTER = 5,
187
+ METHOD_WRAPPER_GETTER = 6,
188
+ METHOD_WRAPPER_SETTER = 7
189
+ };
190
+
191
+ // Check if the field is a well known wrapper type
192
+ static bool IsWrapper(const upb_MessageDef* m) {
193
+ if (!m) return false;
194
+ switch (upb_MessageDef_WellKnownType(m)) {
195
+ case kUpb_WellKnown_DoubleValue:
196
+ case kUpb_WellKnown_FloatValue:
197
+ case kUpb_WellKnown_Int64Value:
198
+ case kUpb_WellKnown_UInt64Value:
199
+ case kUpb_WellKnown_Int32Value:
200
+ case kUpb_WellKnown_UInt32Value:
201
+ case kUpb_WellKnown_StringValue:
202
+ case kUpb_WellKnown_BytesValue:
203
+ case kUpb_WellKnown_BoolValue:
204
+ return true;
205
+ default:
206
+ return false;
207
+ }
208
+ }
209
+
210
+ static bool IsFieldWrapper(const upb_FieldDef* f) {
211
+ return IsWrapper(upb_FieldDef_MessageSubDef(f));
212
+ }
213
+
214
+ static bool Match(const upb_MessageDef* m, const char* name,
215
+ const upb_FieldDef** f, const upb_OneofDef** o,
216
+ const char* prefix, const char* suffix) {
217
+ size_t sp = strlen(prefix);
218
+ size_t ss = strlen(suffix);
219
+ size_t sn = strlen(name);
220
+
221
+ if (sn <= sp + ss) return false;
222
+
223
+ if (memcmp(name, prefix, sp) != 0 ||
224
+ memcmp(name + sn - ss, suffix, ss) != 0) {
225
+ return false;
226
+ }
227
+
228
+ return upb_MessageDef_FindByNameWithSize(m, name + sp, sn - sp - ss, f, o);
229
+ }
230
+
231
+ static int extract_method_call(VALUE method_name, Message* self,
232
+ const upb_FieldDef** f, const upb_OneofDef** o) {
233
+ const upb_MessageDef* m = self->msgdef;
234
+ const char* name;
235
+
236
+ Check_Type(method_name, T_SYMBOL);
237
+ name = rb_id2name(SYM2ID(method_name));
238
+
239
+ if (Match(m, name, f, o, "", "")) return METHOD_GETTER;
240
+ if (Match(m, name, f, o, "", "=")) return METHOD_SETTER;
241
+ if (Match(m, name, f, o, "clear_", "")) return METHOD_CLEAR;
242
+ if (Match(m, name, f, o, "has_", "?") &&
243
+ (*o || (*f && upb_FieldDef_HasPresence(*f)))) {
244
+ // Disallow oneof hazzers for proto3.
245
+ // TODO(haberman): remove this test when we are enabling oneof hazzers for
246
+ // proto3.
247
+ if (*f && !upb_FieldDef_IsSubMessage(*f) &&
248
+ upb_FieldDef_RealContainingOneof(*f) &&
249
+ upb_MessageDef_Syntax(upb_FieldDef_ContainingType(*f)) !=
250
+ kUpb_Syntax_Proto2) {
251
+ return METHOD_UNKNOWN;
252
+ }
253
+ return METHOD_PRESENCE;
254
+ }
255
+ if (Match(m, name, f, o, "", "_as_value") && *f &&
256
+ !upb_FieldDef_IsRepeated(*f) && IsFieldWrapper(*f)) {
257
+ return METHOD_WRAPPER_GETTER;
258
+ }
259
+ if (Match(m, name, f, o, "", "_as_value=") && *f &&
260
+ !upb_FieldDef_IsRepeated(*f) && IsFieldWrapper(*f)) {
261
+ return METHOD_WRAPPER_SETTER;
262
+ }
263
+ if (Match(m, name, f, o, "", "_const") && *f &&
264
+ upb_FieldDef_CType(*f) == kUpb_CType_Enum) {
265
+ return METHOD_ENUM_GETTER;
266
+ }
105
267
 
106
- return ID2SYM(rb_intern(upb_fielddef_name(f)));
268
+ return METHOD_UNKNOWN;
269
+ }
270
+
271
+ static VALUE Message_oneof_accessor(VALUE _self, const upb_OneofDef* o,
272
+ int accessor_type) {
273
+ Message* self = ruby_to_Message(_self);
274
+ const upb_FieldDef* oneof_field = upb_Message_WhichOneof(self->msg, o);
275
+
276
+ switch (accessor_type) {
277
+ case METHOD_PRESENCE:
278
+ return oneof_field == NULL ? Qfalse : Qtrue;
279
+ case METHOD_CLEAR:
280
+ if (oneof_field != NULL) {
281
+ upb_Message_ClearField(Message_GetMutable(_self, NULL), oneof_field);
282
+ }
283
+ return Qnil;
284
+ case METHOD_GETTER:
285
+ return oneof_field == NULL
286
+ ? Qnil
287
+ : ID2SYM(rb_intern(upb_FieldDef_Name(oneof_field)));
288
+ case METHOD_SETTER:
289
+ rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
290
+ }
291
+ rb_raise(rb_eRuntimeError, "Invalid access of oneof field.");
292
+ }
293
+
294
+ static void Message_setfield(upb_Message* msg, const upb_FieldDef* f, VALUE val,
295
+ upb_Arena* arena) {
296
+ upb_MessageValue msgval;
297
+ if (upb_FieldDef_IsMap(f)) {
298
+ msgval.map_val = Map_GetUpbMap(val, f, arena);
299
+ } else if (upb_FieldDef_IsRepeated(f)) {
300
+ msgval.array_val = RepeatedField_GetUpbArray(val, f, arena);
301
+ } else {
302
+ if (val == Qnil &&
303
+ (upb_FieldDef_IsSubMessage(f) || upb_FieldDef_RealContainingOneof(f))) {
304
+ upb_Message_ClearField(msg, f);
305
+ return;
306
+ }
307
+ msgval =
308
+ Convert_RubyToUpb(val, upb_FieldDef_Name(f), TypeInfo_get(f), arena);
309
+ }
310
+ upb_Message_Set(msg, f, msgval, arena);
311
+ }
312
+
313
+ VALUE Message_getfield(VALUE _self, const upb_FieldDef* f) {
314
+ Message* self = ruby_to_Message(_self);
315
+ // This is a special-case: upb_Message_Mutable() for map & array are logically
316
+ // const (they will not change what is serialized) but physically
317
+ // non-const, as they do allocate a repeated field or map. The logical
318
+ // constness means it's ok to do even if the message is frozen.
319
+ upb_Message* msg = (upb_Message*)self->msg;
320
+ upb_Arena* arena = Arena_get(self->arena);
321
+ if (upb_FieldDef_IsMap(f)) {
322
+ upb_Map* map = upb_Message_Mutable(msg, f, arena).map;
323
+ const upb_FieldDef* key_f = map_field_key(f);
324
+ const upb_FieldDef* val_f = map_field_value(f);
325
+ upb_CType key_type = upb_FieldDef_CType(key_f);
326
+ TypeInfo value_type_info = TypeInfo_get(val_f);
327
+ return Map_GetRubyWrapper(map, key_type, value_type_info, self->arena);
328
+ } else if (upb_FieldDef_IsRepeated(f)) {
329
+ upb_Array* arr = upb_Message_Mutable(msg, f, arena).array;
330
+ return RepeatedField_GetRubyWrapper(arr, TypeInfo_get(f), self->arena);
331
+ } else if (upb_FieldDef_IsSubMessage(f)) {
332
+ if (!upb_Message_Has(self->msg, f)) return Qnil;
333
+ upb_Message* submsg = upb_Message_Mutable(msg, f, arena).msg;
334
+ const upb_MessageDef* m = upb_FieldDef_MessageSubDef(f);
335
+ return Message_GetRubyWrapper(submsg, m, self->arena);
336
+ } else {
337
+ upb_MessageValue msgval = upb_Message_Get(self->msg, f);
338
+ return Convert_UpbToRuby(msgval, TypeInfo_get(f), self->arena);
339
+ }
340
+ }
341
+
342
+ static VALUE Message_field_accessor(VALUE _self, const upb_FieldDef* f,
343
+ int accessor_type, int argc, VALUE* argv) {
344
+ upb_Arena* arena = Arena_get(Message_GetArena(_self));
345
+
346
+ switch (accessor_type) {
347
+ case METHOD_SETTER:
348
+ Message_setfield(Message_GetMutable(_self, NULL), f, argv[1], arena);
349
+ return Qnil;
350
+ case METHOD_CLEAR:
351
+ upb_Message_ClearField(Message_GetMutable(_self, NULL), f);
352
+ return Qnil;
353
+ case METHOD_PRESENCE:
354
+ if (!upb_FieldDef_HasPresence(f)) {
355
+ rb_raise(rb_eRuntimeError, "Field does not have presence.");
356
+ }
357
+ return upb_Message_Has(Message_Get(_self, NULL), f);
358
+ case METHOD_WRAPPER_GETTER: {
359
+ Message* self = ruby_to_Message(_self);
360
+ if (upb_Message_Has(self->msg, f)) {
361
+ PBRUBY_ASSERT(upb_FieldDef_IsSubMessage(f) &&
362
+ !upb_FieldDef_IsRepeated(f));
363
+ upb_MessageValue wrapper = upb_Message_Get(self->msg, f);
364
+ const upb_MessageDef* wrapper_m = upb_FieldDef_MessageSubDef(f);
365
+ const upb_FieldDef* value_f =
366
+ upb_MessageDef_FindFieldByNumber(wrapper_m, 1);
367
+ upb_MessageValue value = upb_Message_Get(wrapper.msg_val, value_f);
368
+ return Convert_UpbToRuby(value, TypeInfo_get(value_f), self->arena);
369
+ } else {
370
+ return Qnil;
371
+ }
372
+ }
373
+ case METHOD_WRAPPER_SETTER: {
374
+ upb_Message* msg = Message_GetMutable(_self, NULL);
375
+ if (argv[1] == Qnil) {
376
+ upb_Message_ClearField(msg, f);
377
+ } else {
378
+ const upb_FieldDef* val_f =
379
+ upb_MessageDef_FindFieldByNumber(upb_FieldDef_MessageSubDef(f), 1);
380
+ upb_MessageValue msgval = Convert_RubyToUpb(
381
+ argv[1], upb_FieldDef_Name(f), TypeInfo_get(val_f), arena);
382
+ upb_Message* wrapper = upb_Message_Mutable(msg, f, arena).msg;
383
+ upb_Message_Set(wrapper, val_f, msgval, arena);
384
+ }
385
+ return Qnil;
386
+ }
387
+ case METHOD_ENUM_GETTER: {
388
+ upb_MessageValue msgval = upb_Message_Get(Message_Get(_self, NULL), f);
389
+
390
+ if (upb_FieldDef_Label(f) == kUpb_Label_Repeated) {
391
+ // Map repeated fields to a new type with ints
392
+ VALUE arr = rb_ary_new();
393
+ size_t i, n = upb_Array_Size(msgval.array_val);
394
+ for (i = 0; i < n; i++) {
395
+ upb_MessageValue elem = upb_Array_Get(msgval.array_val, i);
396
+ rb_ary_push(arr, INT2NUM(elem.int32_val));
397
+ }
398
+ return arr;
399
+ } else {
400
+ return INT2NUM(msgval.int32_val);
401
+ }
402
+ }
403
+ case METHOD_GETTER:
404
+ return Message_getfield(_self, f);
405
+ default:
406
+ rb_raise(rb_eRuntimeError, "Internal error, no such accessor: %d",
407
+ accessor_type);
408
+ }
107
409
  }
108
410
 
109
411
  /*
110
412
  * call-seq:
111
413
  * Message.method_missing(*args)
112
414
  *
113
- * Provides accessors and setters for message fields according to their field
114
- * names. For any field whose name does not conflict with a built-in method, an
415
+ * Provides accessors and setters and methods to clear and check for presence of
416
+ * message fields according to their field names.
417
+ *
418
+ * For any field whose name does not conflict with a built-in method, an
115
419
  * accessor is provided with the same name as the field, and a setter is
116
420
  * provided with the name of the field plus the '=' suffix. Thus, given a
117
421
  * message instance 'msg' with field 'foo', the following code is valid:
@@ -122,106 +426,218 @@ static VALUE which_oneof_field(MessageHeader* self, const upb_oneofdef* o) {
122
426
  * This method also provides read-only accessors for oneofs. If a oneof exists
123
427
  * with name 'my_oneof', then msg.my_oneof will return a Ruby symbol equal to
124
428
  * the name of the field in that oneof that is currently set, or nil if none.
429
+ *
430
+ * It also provides methods of the form 'clear_fieldname' to clear the value
431
+ * of the field 'fieldname'. For basic data types, this will set the default
432
+ * value of the field.
433
+ *
434
+ * Additionally, it provides methods of the form 'has_fieldname?', which return
435
+ * true if the field 'fieldname' is set in the message object, else false. For
436
+ * 'proto3' syntax, calling this for a basic type field will result in an error.
125
437
  */
126
- VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
127
- MessageHeader* self;
128
- VALUE method_name, method_str;
129
- char* name;
130
- size_t name_len;
131
- bool setter;
132
- const upb_oneofdef* o;
133
- const upb_fielddef* f;
134
-
135
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
438
+ static VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
439
+ Message* self = ruby_to_Message(_self);
440
+ const upb_OneofDef* o;
441
+ const upb_FieldDef* f;
442
+ int accessor_type;
443
+
136
444
  if (argc < 1) {
137
445
  rb_raise(rb_eArgError, "Expected method name as first argument.");
138
446
  }
139
- method_name = argv[0];
140
- if (!SYMBOL_P(method_name)) {
141
- rb_raise(rb_eArgError, "Expected symbol as method name.");
447
+
448
+ accessor_type = extract_method_call(argv[0], self, &f, &o);
449
+
450
+ if (accessor_type == METHOD_UNKNOWN) return rb_call_super(argc, argv);
451
+
452
+ // Validate argument count.
453
+ switch (accessor_type) {
454
+ case METHOD_SETTER:
455
+ case METHOD_WRAPPER_SETTER:
456
+ if (argc != 2) {
457
+ rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
458
+ }
459
+ rb_check_frozen(_self);
460
+ break;
461
+ default:
462
+ if (argc != 1) {
463
+ rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
464
+ }
465
+ break;
466
+ }
467
+
468
+ // Dispatch accessor.
469
+ if (o != NULL) {
470
+ return Message_oneof_accessor(_self, o, accessor_type);
471
+ } else {
472
+ return Message_field_accessor(_self, f, accessor_type, argc, argv);
142
473
  }
143
- method_str = rb_id2str(SYM2ID(method_name));
144
- name = RSTRING_PTR(method_str);
145
- name_len = RSTRING_LEN(method_str);
146
- setter = false;
474
+ }
147
475
 
148
- // Setters have names that end in '='.
149
- if (name[name_len - 1] == '=') {
150
- setter = true;
151
- name_len--;
476
+ static VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
477
+ Message* self = ruby_to_Message(_self);
478
+ const upb_OneofDef* o;
479
+ const upb_FieldDef* f;
480
+ int accessor_type;
481
+
482
+ if (argc < 1) {
483
+ rb_raise(rb_eArgError, "Expected method name as first argument.");
152
484
  }
153
485
 
154
- // See if this name corresponds to either a oneof or field in this message.
155
- if (!upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len, &f,
156
- &o)) {
486
+ accessor_type = extract_method_call(argv[0], self, &f, &o);
487
+
488
+ if (accessor_type == METHOD_UNKNOWN) {
157
489
  return rb_call_super(argc, argv);
490
+ } else if (o != NULL) {
491
+ return accessor_type == METHOD_SETTER ? Qfalse : Qtrue;
492
+ } else {
493
+ return Qtrue;
158
494
  }
495
+ }
159
496
 
160
- if (o != NULL) {
161
- // This is a oneof -- return which field inside the oneof is set.
162
- if (setter) {
163
- rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
164
- }
165
- return which_oneof_field(self, o);
497
+ void Message_InitFromValue(upb_Message* msg, const upb_MessageDef* m, VALUE val,
498
+ upb_Arena* arena);
499
+
500
+ typedef struct {
501
+ upb_Map* map;
502
+ TypeInfo key_type;
503
+ TypeInfo val_type;
504
+ upb_Arena* arena;
505
+ } MapInit;
506
+
507
+ static int Map_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
508
+ MapInit* map_init = (MapInit*)_self;
509
+ upb_MessageValue k, v;
510
+ k = Convert_RubyToUpb(key, "", map_init->key_type, NULL);
511
+
512
+ if (map_init->val_type.type == kUpb_CType_Message && TYPE(val) == T_HASH) {
513
+ upb_Message* msg =
514
+ upb_Message_New(map_init->val_type.def.msgdef, map_init->arena);
515
+ Message_InitFromValue(msg, map_init->val_type.def.msgdef, val,
516
+ map_init->arena);
517
+ v.msg_val = msg;
166
518
  } else {
167
- // This is a field -- get or set the field's value.
168
- assert(f);
169
- if (setter) {
170
- if (argc < 2) {
171
- rb_raise(rb_eArgError, "No value provided to setter.");
172
- }
173
- layout_set(self->descriptor->layout, Message_data(self), f, argv[1]);
174
- return Qnil;
519
+ v = Convert_RubyToUpb(val, "", map_init->val_type, map_init->arena);
520
+ }
521
+ upb_Map_Set(map_init->map, k, v, map_init->arena);
522
+ return ST_CONTINUE;
523
+ }
524
+
525
+ static void Map_InitFromValue(upb_Map* map, const upb_FieldDef* f, VALUE val,
526
+ upb_Arena* arena) {
527
+ const upb_MessageDef* entry_m = upb_FieldDef_MessageSubDef(f);
528
+ const upb_FieldDef* key_f = upb_MessageDef_FindFieldByNumber(entry_m, 1);
529
+ const upb_FieldDef* val_f = upb_MessageDef_FindFieldByNumber(entry_m, 2);
530
+ if (TYPE(val) != T_HASH) {
531
+ rb_raise(rb_eArgError,
532
+ "Expected Hash object as initializer value for map field '%s' "
533
+ "(given %s).",
534
+ upb_FieldDef_Name(f), rb_class2name(CLASS_OF(val)));
535
+ }
536
+ MapInit map_init = {map, TypeInfo_get(key_f), TypeInfo_get(val_f), arena};
537
+ rb_hash_foreach(val, Map_initialize_kwarg, (VALUE)&map_init);
538
+ }
539
+
540
+ static upb_MessageValue MessageValue_FromValue(VALUE val, TypeInfo info,
541
+ upb_Arena* arena) {
542
+ if (info.type == kUpb_CType_Message) {
543
+ upb_MessageValue msgval;
544
+ upb_Message* msg = upb_Message_New(info.def.msgdef, arena);
545
+ Message_InitFromValue(msg, info.def.msgdef, val, arena);
546
+ msgval.msg_val = msg;
547
+ return msgval;
548
+ } else {
549
+ return Convert_RubyToUpb(val, "", info, arena);
550
+ }
551
+ }
552
+
553
+ static void RepeatedField_InitFromValue(upb_Array* arr, const upb_FieldDef* f,
554
+ VALUE val, upb_Arena* arena) {
555
+ TypeInfo type_info = TypeInfo_get(f);
556
+
557
+ if (TYPE(val) != T_ARRAY) {
558
+ rb_raise(rb_eArgError,
559
+ "Expected array as initializer value for repeated field '%s' "
560
+ "(given %s).",
561
+ upb_FieldDef_Name(f), rb_class2name(CLASS_OF(val)));
562
+ }
563
+
564
+ for (int i = 0; i < RARRAY_LEN(val); i++) {
565
+ VALUE entry = rb_ary_entry(val, i);
566
+ upb_MessageValue msgval;
567
+ if (upb_FieldDef_IsSubMessage(f) && TYPE(entry) == T_HASH) {
568
+ msgval = MessageValue_FromValue(entry, type_info, arena);
569
+ } else {
570
+ msgval = Convert_RubyToUpb(entry, upb_FieldDef_Name(f), type_info, arena);
571
+ }
572
+ upb_Array_Append(arr, msgval, arena);
573
+ }
574
+ }
575
+
576
+ static void Message_InitFieldFromValue(upb_Message* msg, const upb_FieldDef* f,
577
+ VALUE val, upb_Arena* arena) {
578
+ if (TYPE(val) == T_NIL) return;
579
+
580
+ if (upb_FieldDef_IsMap(f)) {
581
+ upb_Map* map = upb_Message_Mutable(msg, f, arena).map;
582
+ Map_InitFromValue(map, f, val, arena);
583
+ } else if (upb_FieldDef_Label(f) == kUpb_Label_Repeated) {
584
+ upb_Array* arr = upb_Message_Mutable(msg, f, arena).array;
585
+ RepeatedField_InitFromValue(arr, f, val, arena);
586
+ } else if (upb_FieldDef_IsSubMessage(f)) {
587
+ if (TYPE(val) == T_HASH) {
588
+ upb_Message* submsg = upb_Message_Mutable(msg, f, arena).msg;
589
+ Message_InitFromValue(submsg, upb_FieldDef_MessageSubDef(f), val, arena);
175
590
  } else {
176
- return layout_get(self->descriptor->layout, Message_data(self), f);
591
+ Message_setfield(msg, f, val, arena);
177
592
  }
593
+ } else {
594
+ upb_MessageValue msgval =
595
+ Convert_RubyToUpb(val, upb_FieldDef_Name(f), TypeInfo_get(f), arena);
596
+ upb_Message_Set(msg, f, msgval, arena);
178
597
  }
179
598
  }
180
599
 
181
- int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
182
- MessageHeader* self;
183
- VALUE method_str;
184
- char* name;
185
- const upb_fielddef* f;
186
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
600
+ typedef struct {
601
+ upb_Message* msg;
602
+ const upb_MessageDef* msgdef;
603
+ upb_Arena* arena;
604
+ } MsgInit;
187
605
 
188
- if (!SYMBOL_P(key)) {
606
+ static int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
607
+ MsgInit* msg_init = (MsgInit*)_self;
608
+ const char* name;
609
+
610
+ if (TYPE(key) == T_STRING) {
611
+ name = RSTRING_PTR(key);
612
+ } else if (TYPE(key) == T_SYMBOL) {
613
+ name = RSTRING_PTR(rb_id2str(SYM2ID(key)));
614
+ } else {
189
615
  rb_raise(rb_eArgError,
190
- "Expected symbols as hash keys in initialization map.");
616
+ "Expected string or symbols as hash keys when initializing proto "
617
+ "from hash.");
191
618
  }
192
619
 
193
- method_str = rb_id2str(SYM2ID(key));
194
- name = RSTRING_PTR(method_str);
195
- f = upb_msgdef_ntofz(self->descriptor->msgdef, name);
620
+ const upb_FieldDef* f =
621
+ upb_MessageDef_FindFieldByName(msg_init->msgdef, name);
622
+
196
623
  if (f == NULL) {
197
624
  rb_raise(rb_eArgError,
198
625
  "Unknown field name '%s' in initialization map entry.", name);
199
626
  }
200
627
 
201
- if (is_map_field(f)) {
202
- VALUE map;
628
+ Message_InitFieldFromValue(msg_init->msg, f, val, msg_init->arena);
629
+ return ST_CONTINUE;
630
+ }
203
631
 
204
- if (TYPE(val) != T_HASH) {
205
- rb_raise(rb_eArgError,
206
- "Expected Hash object as initializer value for map field '%s'.", name);
207
- }
208
- map = layout_get(self->descriptor->layout, Message_data(self), f);
209
- Map_merge_into_self(map, val);
210
- } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
211
- VALUE ary;
212
-
213
- if (TYPE(val) != T_ARRAY) {
214
- rb_raise(rb_eArgError,
215
- "Expected array as initializer value for repeated field '%s'.", name);
216
- }
217
- ary = layout_get(self->descriptor->layout, Message_data(self), f);
218
- for (int i = 0; i < RARRAY_LEN(val); i++) {
219
- RepeatedField_push(ary, rb_ary_entry(val, i));
220
- }
632
+ void Message_InitFromValue(upb_Message* msg, const upb_MessageDef* m, VALUE val,
633
+ upb_Arena* arena) {
634
+ MsgInit msg_init = {msg, m, arena};
635
+ if (TYPE(val) == T_HASH) {
636
+ rb_hash_foreach(val, Message_initialize_kwarg, (VALUE)&msg_init);
221
637
  } else {
222
- layout_set(self->descriptor->layout, Message_data(self), f, val);
638
+ rb_raise(rb_eArgError, "Expected hash arguments or message, not %s",
639
+ rb_class2name(CLASS_OF(val)));
223
640
  }
224
- return 0;
225
641
  }
226
642
 
227
643
  /*
@@ -236,8 +652,13 @@ int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
236
652
  * have been added to a pool. The method definitions described here on the
237
653
  * Message class are provided on each concrete message class.
238
654
  */
239
- VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
240
- VALUE hash_args;
655
+ static VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
656
+ Message* self = ruby_to_Message(_self);
657
+ VALUE arena_rb = Arena_new();
658
+ upb_Arena* arena = Arena_get(arena_rb);
659
+ upb_Message* msg = upb_Message_New(self->msgdef, arena);
660
+
661
+ Message_InitPtr(_self, msg, arena_rb);
241
662
 
242
663
  if (argc == 0) {
243
664
  return Qnil;
@@ -245,12 +666,7 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
245
666
  if (argc != 1) {
246
667
  rb_raise(rb_eArgError, "Expected 0 or 1 arguments.");
247
668
  }
248
- hash_args = argv[0];
249
- if (TYPE(hash_args) != T_HASH) {
250
- rb_raise(rb_eArgError, "Expected hash arguments.");
251
- }
252
-
253
- rb_hash_foreach(hash_args, Message_initialize_kwarg, _self);
669
+ Message_InitFromValue((upb_Message*)self->msg, self->msgdef, argv[0], arena);
254
670
  return Qnil;
255
671
  }
256
672
 
@@ -260,37 +676,41 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
260
676
  *
261
677
  * Performs a shallow copy of this message and returns the new copy.
262
678
  */
263
- VALUE Message_dup(VALUE _self) {
264
- MessageHeader* self;
265
- VALUE new_msg;
266
- MessageHeader* new_msg_self;
267
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
268
-
269
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
270
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
271
-
272
- layout_dup(self->descriptor->layout,
273
- Message_data(new_msg_self),
274
- Message_data(self));
275
-
679
+ static VALUE Message_dup(VALUE _self) {
680
+ Message* self = ruby_to_Message(_self);
681
+ VALUE new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
682
+ Message* new_msg_self = ruby_to_Message(new_msg);
683
+ size_t size = upb_MessageDef_MiniTable(self->msgdef)->size;
684
+
685
+ // TODO(copy unknown fields?)
686
+ // TODO(use official upb msg copy function)
687
+ memcpy((upb_Message*)new_msg_self->msg, self->msg, size);
688
+ Arena_fuse(self->arena, Arena_get(new_msg_self->arena));
276
689
  return new_msg;
277
690
  }
278
691
 
279
- // Internal only; used by Google::Protobuf.deep_copy.
280
- VALUE Message_deep_copy(VALUE _self) {
281
- MessageHeader* self;
282
- MessageHeader* new_msg_self;
283
- VALUE new_msg;
284
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
692
+ // Support function for Message_eq, and also used by other #eq functions.
693
+ bool Message_Equal(const upb_Message* m1, const upb_Message* m2,
694
+ const upb_MessageDef* m) {
695
+ if (m1 == m2) return true;
285
696
 
286
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
287
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
697
+ size_t size1, size2;
698
+ int encode_opts = kUpb_Encode_SkipUnknown | kUpb_Encode_Deterministic;
699
+ upb_Arena* arena_tmp = upb_Arena_New();
700
+ const upb_MiniTable* layout = upb_MessageDef_MiniTable(m);
288
701
 
289
- layout_deep_copy(self->descriptor->layout,
290
- Message_data(new_msg_self),
291
- Message_data(self));
702
+ // Compare deterministically serialized payloads with no unknown fields.
703
+ char* data1 = upb_Encode(m1, layout, encode_opts, arena_tmp, &size1);
704
+ char* data2 = upb_Encode(m2, layout, encode_opts, arena_tmp, &size2);
292
705
 
293
- return new_msg;
706
+ if (data1 && data2) {
707
+ bool ret = (size1 == size2) && (memcmp(data1, data2, size1) == 0);
708
+ upb_Arena_Free(arena_tmp);
709
+ return ret;
710
+ } else {
711
+ upb_Arena_Free(arena_tmp);
712
+ rb_raise(cParseError, "Error comparing messages");
713
+ }
294
714
  }
295
715
 
296
716
  /*
@@ -302,19 +722,35 @@ VALUE Message_deep_copy(VALUE _self) {
302
722
  * method's semantics (a more efficient comparison may actually be done if the
303
723
  * field is of a primitive type).
304
724
  */
305
- VALUE Message_eq(VALUE _self, VALUE _other) {
306
- MessageHeader* self;
307
- MessageHeader* other;
308
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
309
- TypedData_Get_Struct(_other, MessageHeader, &Message_type, other);
725
+ static VALUE Message_eq(VALUE _self, VALUE _other) {
726
+ if (CLASS_OF(_self) != CLASS_OF(_other)) return Qfalse;
310
727
 
311
- if (self->descriptor != other->descriptor) {
312
- return Qfalse;
313
- }
728
+ Message* self = ruby_to_Message(_self);
729
+ Message* other = ruby_to_Message(_other);
730
+ assert(self->msgdef == other->msgdef);
731
+
732
+ return Message_Equal(self->msg, other->msg, self->msgdef) ? Qtrue : Qfalse;
733
+ }
314
734
 
315
- return layout_eq(self->descriptor->layout,
316
- Message_data(self),
317
- Message_data(other));
735
+ uint64_t Message_Hash(const upb_Message* msg, const upb_MessageDef* m,
736
+ uint64_t seed) {
737
+ upb_Arena* arena = upb_Arena_New();
738
+ const char* data;
739
+ size_t size;
740
+
741
+ // Hash a deterministically serialized payload with no unknown fields.
742
+ data = upb_Encode(msg, upb_MessageDef_MiniTable(m),
743
+ kUpb_Encode_SkipUnknown | kUpb_Encode_Deterministic, arena,
744
+ &size);
745
+
746
+ if (data) {
747
+ uint64_t ret = _upb_Hash(data, size, seed);
748
+ upb_Arena_Free(arena);
749
+ return ret;
750
+ } else {
751
+ upb_Arena_Free(arena);
752
+ rb_raise(cParseError, "Error calculating hash");
753
+ }
318
754
  }
319
755
 
320
756
  /*
@@ -323,11 +759,12 @@ VALUE Message_eq(VALUE _self, VALUE _other) {
323
759
  *
324
760
  * Returns a hash value that represents this message's field values.
325
761
  */
326
- VALUE Message_hash(VALUE _self) {
327
- MessageHeader* self;
328
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
329
-
330
- return layout_hash(self->descriptor->layout, Message_data(self));
762
+ static VALUE Message_hash(VALUE _self) {
763
+ Message* self = ruby_to_Message(_self);
764
+ uint64_t hash_value = Message_Hash(self->msg, self->msgdef, 0);
765
+ // RUBY_FIXNUM_MAX should be one less than a power of 2.
766
+ assert((RUBY_FIXNUM_MAX & (RUBY_FIXNUM_MAX + 1)) == 0);
767
+ return INT2FIX(hash_value & RUBY_FIXNUM_MAX);
331
768
  }
332
769
 
333
770
  /*
@@ -338,45 +775,128 @@ VALUE Message_hash(VALUE _self) {
338
775
  * formatted as "<MessageType: field1: value1, field2: value2, ...>". Each
339
776
  * field's value is represented according to its own #inspect method.
340
777
  */
341
- VALUE Message_inspect(VALUE _self) {
342
- MessageHeader* self;
343
- VALUE str;
344
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
345
-
346
- str = rb_str_new2("<");
347
- str = rb_str_append(str, rb_str_new2(rb_class2name(CLASS_OF(_self))));
348
- str = rb_str_cat2(str, ": ");
349
- str = rb_str_append(str, layout_inspect(
350
- self->descriptor->layout, Message_data(self)));
351
- str = rb_str_cat2(str, ">");
352
- return str;
353
- }
354
-
355
-
356
- VALUE Message_to_h(VALUE _self) {
357
- MessageHeader* self;
358
- VALUE hash;
359
- upb_msg_field_iter it;
360
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
361
-
362
- hash = rb_hash_new();
363
-
364
- for (upb_msg_field_begin(&it, self->descriptor->msgdef);
365
- !upb_msg_field_done(&it);
366
- upb_msg_field_next(&it)) {
367
- const upb_fielddef* field = upb_msg_iter_field(&it);
368
- VALUE msg_value = layout_get(self->descriptor->layout, Message_data(self),
369
- field);
370
- VALUE msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
371
- if (upb_fielddef_label(field) == UPB_LABEL_REPEATED) {
372
- msg_value = RepeatedField_to_ary(msg_value);
778
+ static VALUE Message_inspect(VALUE _self) {
779
+ Message* self = ruby_to_Message(_self);
780
+
781
+ StringBuilder* builder = StringBuilder_New();
782
+ Message_PrintMessage(builder, self->msg, self->msgdef);
783
+ VALUE ret = StringBuilder_ToRubyString(builder);
784
+ StringBuilder_Free(builder);
785
+ return ret;
786
+ }
787
+
788
+ // Support functions for Message_to_h //////////////////////////////////////////
789
+
790
+ static VALUE RepeatedField_CreateArray(const upb_Array* arr,
791
+ TypeInfo type_info) {
792
+ int size = arr ? upb_Array_Size(arr) : 0;
793
+ VALUE ary = rb_ary_new2(size);
794
+
795
+ for (int i = 0; i < size; i++) {
796
+ upb_MessageValue msgval = upb_Array_Get(arr, i);
797
+ VALUE val = Scalar_CreateHash(msgval, type_info);
798
+ rb_ary_push(ary, val);
799
+ }
800
+
801
+ return ary;
802
+ }
803
+
804
+ static VALUE Message_CreateHash(const upb_Message* msg,
805
+ const upb_MessageDef* m) {
806
+ if (!msg) return Qnil;
807
+
808
+ VALUE hash = rb_hash_new();
809
+ int n = upb_MessageDef_FieldCount(m);
810
+ bool is_proto2;
811
+
812
+ // We currently have a few behaviors that are specific to proto2.
813
+ // This is unfortunate, we should key behaviors off field attributes (like
814
+ // whether a field has presence), not proto2 vs. proto3. We should see if we
815
+ // can change this without breaking users.
816
+ is_proto2 = upb_MessageDef_Syntax(m) == kUpb_Syntax_Proto2;
817
+
818
+ for (int i = 0; i < n; i++) {
819
+ const upb_FieldDef* field = upb_MessageDef_Field(m, i);
820
+ TypeInfo type_info = TypeInfo_get(field);
821
+ upb_MessageValue msgval;
822
+ VALUE msg_value;
823
+ VALUE msg_key;
824
+
825
+ if (!is_proto2 && upb_FieldDef_IsSubMessage(field) &&
826
+ !upb_FieldDef_IsRepeated(field) && !upb_Message_Has(msg, field)) {
827
+ // TODO: Legacy behavior, remove when we fix the is_proto2 differences.
828
+ msg_key = ID2SYM(rb_intern(upb_FieldDef_Name(field)));
829
+ rb_hash_aset(hash, msg_key, Qnil);
830
+ continue;
831
+ }
832
+
833
+ // Do not include fields that are not present (oneof or optional fields).
834
+ if (is_proto2 && upb_FieldDef_HasPresence(field) &&
835
+ !upb_Message_Has(msg, field)) {
836
+ continue;
373
837
  }
838
+
839
+ msg_key = ID2SYM(rb_intern(upb_FieldDef_Name(field)));
840
+ msgval = upb_Message_Get(msg, field);
841
+
842
+ // Proto2 omits empty map/repeated fields also.
843
+
844
+ if (upb_FieldDef_IsMap(field)) {
845
+ const upb_MessageDef* entry_m = upb_FieldDef_MessageSubDef(field);
846
+ const upb_FieldDef* key_f = upb_MessageDef_FindFieldByNumber(entry_m, 1);
847
+ const upb_FieldDef* val_f = upb_MessageDef_FindFieldByNumber(entry_m, 2);
848
+ upb_CType key_type = upb_FieldDef_CType(key_f);
849
+ msg_value = Map_CreateHash(msgval.map_val, key_type, TypeInfo_get(val_f));
850
+ } else if (upb_FieldDef_IsRepeated(field)) {
851
+ if (is_proto2 &&
852
+ (!msgval.array_val || upb_Array_Size(msgval.array_val) == 0)) {
853
+ continue;
854
+ }
855
+ msg_value = RepeatedField_CreateArray(msgval.array_val, type_info);
856
+ } else {
857
+ msg_value = Scalar_CreateHash(msgval, type_info);
858
+ }
859
+
374
860
  rb_hash_aset(hash, msg_key, msg_value);
375
861
  }
862
+
376
863
  return hash;
377
864
  }
378
865
 
866
+ VALUE Scalar_CreateHash(upb_MessageValue msgval, TypeInfo type_info) {
867
+ if (type_info.type == kUpb_CType_Message) {
868
+ return Message_CreateHash(msgval.msg_val, type_info.def.msgdef);
869
+ } else {
870
+ return Convert_UpbToRuby(msgval, type_info, Qnil);
871
+ }
872
+ }
873
+
874
+ /*
875
+ * call-seq:
876
+ * Message.to_h => {}
877
+ *
878
+ * Returns the message as a Ruby Hash object, with keys as symbols.
879
+ */
880
+ static VALUE Message_to_h(VALUE _self) {
881
+ Message* self = ruby_to_Message(_self);
882
+ return Message_CreateHash(self->msg, self->msgdef);
883
+ }
379
884
 
885
+ /*
886
+ * call-seq:
887
+ * Message.freeze => self
888
+ *
889
+ * Freezes the message object. We have to intercept this so we can pin the
890
+ * Ruby object into memory so we don't forget it's frozen.
891
+ */
892
+ static VALUE Message_freeze(VALUE _self) {
893
+ Message* self = ruby_to_Message(_self);
894
+ if (!RB_OBJ_FROZEN(_self)) {
895
+ Arena_Pin(self->arena, _self);
896
+ RB_OBJ_FREEZE(_self);
897
+ }
898
+ return _self;
899
+ }
380
900
 
381
901
  /*
382
902
  * call-seq:
@@ -385,16 +905,18 @@ VALUE Message_to_h(VALUE _self) {
385
905
  * Accesses a field's value by field name. The provided field name should be a
386
906
  * string.
387
907
  */
388
- VALUE Message_index(VALUE _self, VALUE field_name) {
389
- MessageHeader* self;
390
- const upb_fielddef* field;
391
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
908
+ static VALUE Message_index(VALUE _self, VALUE field_name) {
909
+ Message* self = ruby_to_Message(_self);
910
+ const upb_FieldDef* field;
911
+
392
912
  Check_Type(field_name, T_STRING);
393
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
913
+ field = upb_MessageDef_FindFieldByName(self->msgdef, RSTRING_PTR(field_name));
914
+
394
915
  if (field == NULL) {
395
916
  return Qnil;
396
917
  }
397
- return layout_get(self->descriptor->layout, Message_data(self), field);
918
+
919
+ return Message_getfield(_self, field);
398
920
  }
399
921
 
400
922
  /*
@@ -404,19 +926,258 @@ VALUE Message_index(VALUE _self, VALUE field_name) {
404
926
  * Sets a field's value by field name. The provided field name should be a
405
927
  * string.
406
928
  */
407
- VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
408
- MessageHeader* self;
409
- const upb_fielddef* field;
410
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
929
+ static VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
930
+ Message* self = ruby_to_Message(_self);
931
+ const upb_FieldDef* f;
932
+ upb_MessageValue val;
933
+ upb_Arena* arena = Arena_get(self->arena);
934
+
411
935
  Check_Type(field_name, T_STRING);
412
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
413
- if (field == NULL) {
936
+ f = upb_MessageDef_FindFieldByName(self->msgdef, RSTRING_PTR(field_name));
937
+
938
+ if (f == NULL) {
414
939
  rb_raise(rb_eArgError, "Unknown field: %s", RSTRING_PTR(field_name));
415
940
  }
416
- layout_set(self->descriptor->layout, Message_data(self), field, value);
941
+
942
+ val = Convert_RubyToUpb(value, upb_FieldDef_Name(f), TypeInfo_get(f), arena);
943
+ upb_Message_Set(Message_GetMutable(_self, NULL), f, val, arena);
944
+
417
945
  return Qnil;
418
946
  }
419
947
 
948
+ /*
949
+ * call-seq:
950
+ * MessageClass.decode(data, options) => message
951
+ *
952
+ * Decodes the given data (as a string containing bytes in protocol buffers wire
953
+ * format) under the interpretation given by this message class's definition
954
+ * and returns a message object with the corresponding field values.
955
+ * @param options [Hash] options for the decoder
956
+ * recursion_limit: set to maximum decoding depth for message (default is 64)
957
+ */
958
+ static VALUE Message_decode(int argc, VALUE* argv, VALUE klass) {
959
+ VALUE data = argv[0];
960
+ int options = 0;
961
+
962
+ if (argc < 1 || argc > 2) {
963
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
964
+ }
965
+
966
+ if (argc == 2) {
967
+ VALUE hash_args = argv[1];
968
+ if (TYPE(hash_args) != T_HASH) {
969
+ rb_raise(rb_eArgError, "Expected hash arguments.");
970
+ }
971
+
972
+ VALUE depth = rb_hash_lookup(hash_args, ID2SYM(rb_intern("recursion_limit")));
973
+
974
+ if (depth != Qnil && TYPE(depth) == T_FIXNUM) {
975
+ options |= UPB_DECODE_MAXDEPTH(FIX2INT(depth));
976
+ }
977
+ }
978
+
979
+ if (TYPE(data) != T_STRING) {
980
+ rb_raise(rb_eArgError, "Expected string for binary protobuf data.");
981
+ }
982
+
983
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
984
+ Message* msg = ruby_to_Message(msg_rb);
985
+
986
+ upb_DecodeStatus status = upb_Decode(
987
+ RSTRING_PTR(data), RSTRING_LEN(data), (upb_Message*)msg->msg,
988
+ upb_MessageDef_MiniTable(msg->msgdef), NULL, options, Arena_get(msg->arena));
989
+
990
+ if (status != kUpb_DecodeStatus_Ok) {
991
+ rb_raise(cParseError, "Error occurred during parsing");
992
+ }
993
+
994
+ return msg_rb;
995
+ }
996
+
997
+ /*
998
+ * call-seq:
999
+ * MessageClass.decode_json(data, options = {}) => message
1000
+ *
1001
+ * Decodes the given data (as a string containing a JSON-encoded message)
1001
+ * under the interpretation given by this message class's definition
1003
+ * and returns a message object with the corresponding field values.
1004
+ *
1005
+ * @param options [Hash] options for the decoder
1006
+ * ignore_unknown_fields: set true to ignore unknown fields (default is to
1007
+ * raise an error)
1008
+ */
1009
+ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
1010
+ VALUE data = argv[0];
1011
+ int options = 0;
1012
+ upb_Status status;
1013
+
1014
+ // TODO(haberman): use this message's pool instead.
1015
+ const upb_DefPool* symtab = DescriptorPool_GetSymtab(generated_pool);
1016
+
1017
+ if (argc < 1 || argc > 2) {
1018
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1019
+ }
1020
+
1021
+ if (argc == 2) {
1022
+ VALUE hash_args = argv[1];
1023
+ if (TYPE(hash_args) != T_HASH) {
1024
+ rb_raise(rb_eArgError, "Expected hash arguments.");
1025
+ }
1026
+
1027
+ if (RTEST(rb_hash_lookup2(
1028
+ hash_args, ID2SYM(rb_intern("ignore_unknown_fields")), Qfalse))) {
1029
+ options |= upb_JsonDecode_IgnoreUnknown;
1030
+ }
1031
+ }
1032
+
1033
+ if (TYPE(data) != T_STRING) {
1034
+ rb_raise(rb_eArgError, "Expected string for JSON data.");
1035
+ }
1036
+
1037
+ // TODO(cfallin): Check and respect string encoding. If not UTF-8, we need to
1038
+ // convert, because string handlers pass data directly to message string
1039
+ // fields.
1040
+
1041
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
1042
+ Message* msg = ruby_to_Message(msg_rb);
1043
+
1044
+ // We don't allow users to decode a wrapper type directly.
1045
+ if (IsWrapper(msg->msgdef)) {
1046
+ rb_raise(rb_eRuntimeError, "Cannot parse a wrapper directly.");
1047
+ }
1048
+
1049
+ upb_Status_Clear(&status);
1050
+ if (!upb_JsonDecode(RSTRING_PTR(data), RSTRING_LEN(data),
1051
+ (upb_Message*)msg->msg, msg->msgdef, symtab, options,
1052
+ Arena_get(msg->arena), &status)) {
1053
+ rb_raise(cParseError, "Error occurred during parsing: %s",
1054
+ upb_Status_ErrorMessage(&status));
1055
+ }
1056
+
1057
+ return msg_rb;
1058
+ }
1059
+
1060
+ /*
1061
+ * call-seq:
1062
+ * MessageClass.encode(msg, options) => bytes
1063
+ *
1064
+ * Encodes the given message object to its serialized form in protocol buffers
1065
+ * wire format.
1066
+ * @param options [Hash] options for the encoder
1067
+ * recursion_limit: set to maximum encoding depth for message (default is 64)
1068
+ */
1069
+ static VALUE Message_encode(int argc, VALUE* argv, VALUE klass) {
1070
+ Message* msg = ruby_to_Message(argv[0]);
1071
+ int options = 0;
1072
+ const char* data;
1073
+ size_t size;
1074
+
1075
+ if (CLASS_OF(argv[0]) != klass) {
1076
+ rb_raise(rb_eArgError, "Message of wrong type.");
1077
+ }
1078
+
1079
+ if (argc < 1 || argc > 2) {
1080
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1081
+ }
1082
+
1083
+ if (argc == 2) {
1084
+ VALUE hash_args = argv[1];
1085
+ if (TYPE(hash_args) != T_HASH) {
1086
+ rb_raise(rb_eArgError, "Expected hash arguments.");
1087
+ }
1088
+ VALUE depth = rb_hash_lookup(hash_args, ID2SYM(rb_intern("recursion_limit")));
1089
+
1090
+ if (depth != Qnil && TYPE(depth) == T_FIXNUM) {
1091
+ options |= UPB_DECODE_MAXDEPTH(FIX2INT(depth));
1092
+ }
1093
+ }
1094
+
1095
+ upb_Arena *arena = upb_Arena_New();
1096
+
1097
+ data = upb_Encode(msg->msg, upb_MessageDef_MiniTable(msg->msgdef),
1098
+ options, arena, &size);
1099
+
1100
+ if (data) {
1101
+ VALUE ret = rb_str_new(data, size);
1102
+ rb_enc_associate(ret, rb_ascii8bit_encoding());
1103
+ upb_Arena_Free(arena);
1104
+ return ret;
1105
+ } else {
1106
+ upb_Arena_Free(arena);
1107
+ rb_raise(rb_eRuntimeError, "Exceeded maximum depth (possibly cycle)");
1108
+ }
1109
+ }
1110
+
1111
+ /*
1112
+ * call-seq:
1113
+ * MessageClass.encode_json(msg, options = {}) => json_string
1114
+ *
1115
+ * Encodes the given message object into its serialized JSON representation.
1116
+ * @param options [Hash] options for the encoder
1117
+ * preserve_proto_fieldnames: set true to use original fieldnames (default is
1118
+ * to camelCase)
1119
+ * emit_defaults: set true to emit 0/false values (default is to omit them)
1120
+ */
1121
+ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1122
+ Message* msg = ruby_to_Message(argv[0]);
1123
+ int options = 0;
1124
+ char buf[1024];
1125
+ size_t size;
1126
+ upb_Status status;
1127
+
1128
+ // TODO(haberman): use this message's pool instead.
1129
+ const upb_DefPool* symtab = DescriptorPool_GetSymtab(generated_pool);
1130
+
1131
+ if (argc < 1 || argc > 2) {
1132
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1133
+ }
1134
+
1135
+ if (argc == 2) {
1136
+ VALUE hash_args = argv[1];
1137
+ if (TYPE(hash_args) != T_HASH) {
1138
+ if (RTEST(rb_funcall(hash_args, rb_intern("respond_to?"), 1, rb_str_new2("to_h")))) {
1139
+ hash_args = rb_funcall(hash_args, rb_intern("to_h"), 0);
1140
+ } else {
1141
+ rb_raise(rb_eArgError, "Expected hash arguments.");
1142
+ }
1143
+ }
1144
+
1145
+ if (RTEST(rb_hash_lookup2(hash_args,
1146
+ ID2SYM(rb_intern("preserve_proto_fieldnames")),
1147
+ Qfalse))) {
1148
+ options |= upb_JsonEncode_UseProtoNames;
1149
+ }
1150
+
1151
+ if (RTEST(rb_hash_lookup2(hash_args, ID2SYM(rb_intern("emit_defaults")),
1152
+ Qfalse))) {
1153
+ options |= upb_JsonEncode_EmitDefaults;
1154
+ }
1155
+ }
1156
+
1157
+ upb_Status_Clear(&status);
1158
+ size = upb_JsonEncode(msg->msg, msg->msgdef, symtab, options, buf,
1159
+ sizeof(buf), &status);
1160
+
1161
+ if (!upb_Status_IsOk(&status)) {
1162
+ rb_raise(cParseError, "Error occurred during encoding: %s",
1163
+ upb_Status_ErrorMessage(&status));
1164
+ }
1165
+
1166
+ VALUE ret;
1167
+ if (size >= sizeof(buf)) {
1168
+ char* buf2 = malloc(size + 1);
1169
+ upb_JsonEncode(msg->msg, msg->msgdef, symtab, options, buf2, size + 1,
1170
+ &status);
1171
+ ret = rb_str_new(buf2, size);
1172
+ free(buf2);
1173
+ } else {
1174
+ ret = rb_str_new(buf, size);
1175
+ }
1176
+
1177
+ rb_enc_associate(ret, rb_utf8_encoding());
1178
+ return ret;
1179
+ }
1180
+
420
1181
  /*
421
1182
  * call-seq:
422
1183
  * Message.descriptor => descriptor
@@ -424,22 +1185,15 @@ VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
424
1185
  * Class method that returns the Descriptor instance corresponding to this
425
1186
  * message class's type.
426
1187
  */
427
- VALUE Message_descriptor(VALUE klass) {
1188
+ static VALUE Message_descriptor(VALUE klass) {
428
1189
  return rb_ivar_get(klass, descriptor_instancevar_interned);
429
1190
  }
430
1191
 
431
- VALUE build_class_from_descriptor(Descriptor* desc) {
432
- const char *name;
1192
+ VALUE build_class_from_descriptor(VALUE descriptor) {
1193
+ const char* name;
433
1194
  VALUE klass;
434
1195
 
435
- if (desc->layout == NULL) {
436
- desc->layout = create_layout(desc->msgdef);
437
- }
438
- if (desc->fill_method == NULL) {
439
- desc->fill_method = new_fillmsg_decodermethod(desc, &desc->fill_method);
440
- }
441
-
442
- name = upb_msgdef_fullname(desc->msgdef);
1196
+ name = upb_MessageDef_FullName(Descriptor_GetMsgDef(descriptor));
443
1197
  if (name == NULL) {
444
1198
  rb_raise(rb_eRuntimeError, "Descriptor does not have assigned name.");
445
1199
  }
@@ -447,32 +1201,33 @@ VALUE build_class_from_descriptor(Descriptor* desc) {
447
1201
  klass = rb_define_class_id(
448
1202
  // Docs say this parameter is ignored. User will assign return value to
449
1203
  // their own toplevel constant class name.
450
- rb_intern("Message"),
451
- rb_cObject);
452
- rb_ivar_set(klass, descriptor_instancevar_interned,
453
- get_def_obj(desc->msgdef));
1204
+ rb_intern("Message"), rb_cObject);
1205
+ rb_ivar_set(klass, descriptor_instancevar_interned, descriptor);
454
1206
  rb_define_alloc_func(klass, Message_alloc);
455
1207
  rb_require("google/protobuf/message_exts");
456
- rb_include_module(klass, rb_eval_string("Google::Protobuf::MessageExts"));
1208
+ rb_include_module(klass, rb_eval_string("::Google::Protobuf::MessageExts"));
457
1209
  rb_extend_object(
458
- klass, rb_eval_string("Google::Protobuf::MessageExts::ClassMethods"));
1210
+ klass, rb_eval_string("::Google::Protobuf::MessageExts::ClassMethods"));
459
1211
 
460
- rb_define_method(klass, "method_missing",
461
- Message_method_missing, -1);
1212
+ rb_define_method(klass, "method_missing", Message_method_missing, -1);
1213
+ rb_define_method(klass, "respond_to_missing?", Message_respond_to_missing,
1214
+ -1);
462
1215
  rb_define_method(klass, "initialize", Message_initialize, -1);
463
1216
  rb_define_method(klass, "dup", Message_dup, 0);
464
1217
  // Also define #clone so that we don't inherit Object#clone.
465
1218
  rb_define_method(klass, "clone", Message_dup, 0);
466
1219
  rb_define_method(klass, "==", Message_eq, 1);
1220
+ rb_define_method(klass, "eql?", Message_eq, 1);
1221
+ rb_define_method(klass, "freeze", Message_freeze, 0);
467
1222
  rb_define_method(klass, "hash", Message_hash, 0);
468
1223
  rb_define_method(klass, "to_h", Message_to_h, 0);
469
- rb_define_method(klass, "to_hash", Message_to_h, 0);
470
1224
  rb_define_method(klass, "inspect", Message_inspect, 0);
1225
+ rb_define_method(klass, "to_s", Message_inspect, 0);
471
1226
  rb_define_method(klass, "[]", Message_index, 1);
472
1227
  rb_define_method(klass, "[]=", Message_index_set, 2);
473
- rb_define_singleton_method(klass, "decode", Message_decode, 1);
474
- rb_define_singleton_method(klass, "encode", Message_encode, 1);
475
- rb_define_singleton_method(klass, "decode_json", Message_decode_json, 1);
1228
+ rb_define_singleton_method(klass, "decode", Message_decode, -1);
1229
+ rb_define_singleton_method(klass, "encode", Message_encode, -1);
1230
+ rb_define_singleton_method(klass, "decode_json", Message_decode_json, -1);
476
1231
  rb_define_singleton_method(klass, "encode_json", Message_encode_json, -1);
477
1232
  rb_define_singleton_method(klass, "descriptor", Message_descriptor, 0);
478
1233
 
@@ -486,16 +1241,15 @@ VALUE build_class_from_descriptor(Descriptor* desc) {
486
1241
  * This module method, provided on each generated enum module, looks up an enum
487
1242
  * value by number and returns its name as a Ruby symbol, or nil if not found.
488
1243
  */
489
- VALUE enum_lookup(VALUE self, VALUE number) {
1244
+ static VALUE enum_lookup(VALUE self, VALUE number) {
490
1245
  int32_t num = NUM2INT(number);
491
1246
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
492
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
493
-
494
- const char* name = upb_enumdef_iton(enumdesc->enumdef, num);
495
- if (name == NULL) {
496
- return Qnil;
1247
+ const upb_EnumDef* e = EnumDescriptor_GetEnumDef(desc);
1248
+ const upb_EnumValueDef* ev = upb_EnumDef_FindValueByNumber(e, num);
1249
+ if (ev) {
1250
+ return ID2SYM(rb_intern(upb_EnumValueDef_Name(ev)));
497
1251
  } else {
498
- return ID2SYM(rb_intern(name));
1252
+ return Qnil;
499
1253
  }
500
1254
  }
501
1255
 
@@ -506,17 +1260,15 @@ VALUE enum_lookup(VALUE self, VALUE number) {
506
1260
  * This module method, provided on each generated enum module, looks up an enum
507
1261
  * value by name (as a Ruby symbol) and returns its number, or nil if not found.
508
1262
  */
509
- VALUE enum_resolve(VALUE self, VALUE sym) {
1263
+ static VALUE enum_resolve(VALUE self, VALUE sym) {
510
1264
  const char* name = rb_id2name(SYM2ID(sym));
511
1265
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
512
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
513
-
514
- int32_t num = 0;
515
- bool found = upb_enumdef_ntoiz(enumdesc->enumdef, name, &num);
516
- if (!found) {
517
- return Qnil;
1266
+ const upb_EnumDef* e = EnumDescriptor_GetEnumDef(desc);
1267
+ const upb_EnumValueDef* ev = upb_EnumDef_FindValueByName(e, name);
1268
+ if (ev) {
1269
+ return INT2NUM(upb_EnumValueDef_Number(ev));
518
1270
  } else {
519
- return INT2NUM(num);
1271
+ return Qnil;
520
1272
  }
521
1273
  }
522
1274
 
@@ -527,25 +1279,24 @@ VALUE enum_resolve(VALUE self, VALUE sym) {
527
1279
  * This module method, provided on each generated enum module, returns the
528
1280
  * EnumDescriptor corresponding to this enum type.
529
1281
  */
530
- VALUE enum_descriptor(VALUE self) {
1282
+ static VALUE enum_descriptor(VALUE self) {
531
1283
  return rb_ivar_get(self, descriptor_instancevar_interned);
532
1284
  }
533
1285
 
534
- VALUE build_module_from_enumdesc(EnumDescriptor* enumdesc) {
535
- VALUE mod = rb_define_module_id(
536
- rb_intern(upb_enumdef_fullname(enumdesc->enumdef)));
1286
+ VALUE build_module_from_enumdesc(VALUE _enumdesc) {
1287
+ const upb_EnumDef* e = EnumDescriptor_GetEnumDef(_enumdesc);
1288
+ VALUE mod = rb_define_module_id(rb_intern(upb_EnumDef_FullName(e)));
537
1289
 
538
- upb_enum_iter it;
539
- for (upb_enum_begin(&it, enumdesc->enumdef);
540
- !upb_enum_done(&it);
541
- upb_enum_next(&it)) {
542
- const char* name = upb_enum_iter_name(&it);
543
- int32_t value = upb_enum_iter_number(&it);
1290
+ int n = upb_EnumDef_ValueCount(e);
1291
+ for (int i = 0; i < n; i++) {
1292
+ const upb_EnumValueDef* ev = upb_EnumDef_Value(e, i);
1293
+ const char* name = upb_EnumValueDef_Name(ev);
1294
+ int32_t value = upb_EnumValueDef_Number(ev);
544
1295
  if (name[0] < 'A' || name[0] > 'Z') {
545
- rb_raise(rb_eTypeError,
546
- "Enum value '%s' does not start with an uppercase letter "
547
- "as is required for Ruby constants.",
548
- name);
1296
+ rb_warn(
1297
+ "Enum value '%s' does not start with an uppercase letter "
1298
+ "as is required for Ruby constants.",
1299
+ name);
549
1300
  }
550
1301
  rb_define_const(mod, name, INT2NUM(value));
551
1302
  }
@@ -553,26 +1304,99 @@ VALUE build_module_from_enumdesc(EnumDescriptor* enumdesc) {
553
1304
  rb_define_singleton_method(mod, "lookup", enum_lookup, 1);
554
1305
  rb_define_singleton_method(mod, "resolve", enum_resolve, 1);
555
1306
  rb_define_singleton_method(mod, "descriptor", enum_descriptor, 0);
556
- rb_ivar_set(mod, descriptor_instancevar_interned,
557
- get_def_obj(enumdesc->enumdef));
1307
+ rb_ivar_set(mod, descriptor_instancevar_interned, _enumdesc);
558
1308
 
559
1309
  return mod;
560
1310
  }
561
1311
 
562
- /*
563
- * call-seq:
564
- * Google::Protobuf.deep_copy(obj) => copy_of_obj
565
- *
566
- * Performs a deep copy of a RepeatedField instance, a Map instance, or a
567
- * message object, recursively copying its members.
568
- */
569
- VALUE Google_Protobuf_deep_copy(VALUE self, VALUE obj) {
570
- VALUE klass = CLASS_OF(obj);
571
- if (klass == cRepeatedField) {
572
- return RepeatedField_deep_copy(obj);
573
- } else if (klass == cMap) {
574
- return Map_deep_copy(obj);
575
- } else {
576
- return Message_deep_copy(obj);
1312
+ // Internal only; used by Google::Protobuf.deep_copy.
1313
+ upb_Message* Message_deep_copy(const upb_Message* msg, const upb_MessageDef* m,
1314
+ upb_Arena* arena) {
1315
+ // Serialize and parse.
1316
+ upb_Arena* tmp_arena = upb_Arena_New();
1317
+ const upb_MiniTable* layout = upb_MessageDef_MiniTable(m);
1318
+ size_t size;
1319
+
1320
+ char* data = upb_Encode(msg, layout, 0, tmp_arena, &size);
1321
+ upb_Message* new_msg = upb_Message_New(m, arena);
1322
+
1323
+ if (!data || upb_Decode(data, size, new_msg, layout, NULL, 0, arena) !=
1324
+ kUpb_DecodeStatus_Ok) {
1325
+ upb_Arena_Free(tmp_arena);
1326
+ rb_raise(cParseError, "Error occurred copying proto");
1327
+ }
1328
+
1329
+ upb_Arena_Free(tmp_arena);
1330
+ return new_msg;
1331
+ }
1332
+
1333
+ const upb_Message* Message_GetUpbMessage(VALUE value, const upb_MessageDef* m,
1334
+ const char* name, upb_Arena* arena) {
1335
+ if (value == Qnil) {
1336
+ rb_raise(cTypeError, "nil message not allowed here.");
577
1337
  }
1338
+
1339
+ VALUE klass = CLASS_OF(value);
1340
+ VALUE desc_rb = rb_ivar_get(klass, descriptor_instancevar_interned);
1341
+ const upb_MessageDef* val_m =
1342
+ desc_rb == Qnil ? NULL : Descriptor_GetMsgDef(desc_rb);
1343
+
1344
+ if (val_m != m) {
1345
+ // Check for possible implicit conversions
1346
+ // TODO: hash conversion?
1347
+
1348
+ switch (upb_MessageDef_WellKnownType(m)) {
1349
+ case kUpb_WellKnown_Timestamp: {
1350
+ // Time -> Google::Protobuf::Timestamp
1351
+ upb_Message* msg = upb_Message_New(m, arena);
1352
+ upb_MessageValue sec, nsec;
1353
+ struct timespec time;
1354
+ const upb_FieldDef* sec_f = upb_MessageDef_FindFieldByNumber(m, 1);
1355
+ const upb_FieldDef* nsec_f = upb_MessageDef_FindFieldByNumber(m, 2);
1356
+
1357
+ if (!rb_obj_is_kind_of(value, rb_cTime)) goto badtype;
1358
+
1359
+ time = rb_time_timespec(value);
1360
+ sec.int64_val = time.tv_sec;
1361
+ nsec.int32_val = time.tv_nsec;
1362
+ upb_Message_Set(msg, sec_f, sec, arena);
1363
+ upb_Message_Set(msg, nsec_f, nsec, arena);
1364
+ return msg;
1365
+ }
1366
+ case kUpb_WellKnown_Duration: {
1367
+ // Numeric -> Google::Protobuf::Duration
1368
+ upb_Message* msg = upb_Message_New(m, arena);
1369
+ upb_MessageValue sec, nsec;
1370
+ const upb_FieldDef* sec_f = upb_MessageDef_FindFieldByNumber(m, 1);
1371
+ const upb_FieldDef* nsec_f = upb_MessageDef_FindFieldByNumber(m, 2);
1372
+
1373
+ if (!rb_obj_is_kind_of(value, rb_cNumeric)) goto badtype;
1374
+
1375
+ sec.int64_val = NUM2LL(value);
1376
+ nsec.int32_val = round((NUM2DBL(value) - NUM2LL(value)) * 1000000000);
1377
+ upb_Message_Set(msg, sec_f, sec, arena);
1378
+ upb_Message_Set(msg, nsec_f, nsec, arena);
1379
+ return msg;
1380
+ }
1381
+ default:
1382
+ badtype:
1383
+ rb_raise(cTypeError,
1384
+ "Invalid type %s to assign to submessage field '%s'.",
1385
+ rb_class2name(CLASS_OF(value)), name);
1386
+ }
1387
+ }
1388
+
1389
+ Message* self = ruby_to_Message(value);
1390
+ Arena_fuse(self->arena, arena);
1391
+
1392
+ return self->msg;
1393
+ }
1394
+
1395
+ void Message_register(VALUE protobuf) {
1396
+ cParseError = rb_const_get(protobuf, rb_intern("ParseError"));
1397
+
1398
+ // Ruby-interned string: "descriptor". We use this identifier to store an
1399
+ // instance variable on message classes we create in order to link them back
1400
+ // to their descriptors.
1401
+ descriptor_instancevar_interned = rb_intern("descriptor");
578
1402
  }