google-protobuf 3.11.3 → 3.19.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of google-protobuf might be problematic. Click here for more details.

@@ -28,49 +28,60 @@
28
28
  // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29
29
  // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
30
 
31
+ #include "message.h"
32
+
33
+ #include "convert.h"
34
+ #include "defs.h"
35
+ #include "map.h"
31
36
  #include "protobuf.h"
37
+ #include "repeated_field.h"
32
38
 
33
- // -----------------------------------------------------------------------------
34
- // Class/module creation from msgdefs and enumdefs, respectively.
35
- // -----------------------------------------------------------------------------
39
+ static VALUE cParseError = Qnil;
40
+ static ID descriptor_instancevar_interned;
36
41
 
37
- void* Message_data(void* msg) {
38
- return ((uint8_t *)msg) + sizeof(MessageHeader);
42
+ static VALUE initialize_rb_class_with_no_args(VALUE klass) {
43
+ return rb_funcall(klass, rb_intern("new"), 0);
39
44
  }
40
45
 
41
- void Message_mark(void* _self) {
42
- MessageHeader* self = (MessageHeader *)_self;
43
- layout_mark(self->descriptor->layout, Message_data(self));
46
+ VALUE MessageOrEnum_GetDescriptor(VALUE klass) {
47
+ return rb_ivar_get(klass, descriptor_instancevar_interned);
44
48
  }
45
49
 
46
- void Message_free(void* self) {
47
- stringsink* unknown = ((MessageHeader *)self)->unknown_fields;
48
- if (unknown != NULL) {
49
- stringsink_uninit(unknown);
50
- free(unknown);
51
- }
52
- xfree(self);
50
+ // -----------------------------------------------------------------------------
51
+ // Class/module creation from msgdefs and enumdefs, respectively.
52
+ // -----------------------------------------------------------------------------
53
+
54
+ typedef struct {
55
+ VALUE arena;
56
+ const upb_msg* msg; // Can get as mutable when non-frozen.
57
+ const upb_msgdef* msgdef; // kept alive by self.class.descriptor reference.
58
+ } Message;
59
+
60
+ static void Message_mark(void* _self) {
61
+ Message* self = (Message *)_self;
62
+ rb_gc_mark(self->arena);
53
63
  }
54
64
 
55
- rb_data_type_t Message_type = {
65
+ static rb_data_type_t Message_type = {
56
66
  "Message",
57
- { Message_mark, Message_free, NULL },
67
+ { Message_mark, RUBY_DEFAULT_FREE, NULL },
68
+ .flags = RUBY_TYPED_FREE_IMMEDIATELY,
58
69
  };
59
70
 
60
- VALUE Message_alloc(VALUE klass) {
71
+ static Message* ruby_to_Message(VALUE msg_rb) {
72
+ Message* msg;
73
+ TypedData_Get_Struct(msg_rb, Message, &Message_type, msg);
74
+ return msg;
75
+ }
76
+
77
+ static VALUE Message_alloc(VALUE klass) {
61
78
  VALUE descriptor = rb_ivar_get(klass, descriptor_instancevar_interned);
62
- Descriptor* desc = ruby_to_Descriptor(descriptor);
63
- MessageHeader* msg;
79
+ Message* msg = ALLOC(Message);
64
80
  VALUE ret;
65
81
 
66
- if (desc->layout == NULL) {
67
- create_layout(desc);
68
- }
69
-
70
- msg = (void*)ALLOC_N(uint8_t, sizeof(MessageHeader) + desc->layout->size);
71
- msg->descriptor = desc;
72
- msg->unknown_fields = NULL;
73
- memcpy(Message_data(msg), desc->layout->empty_template, desc->layout->size);
82
+ msg->msgdef = Descriptor_GetMsgDef(descriptor);
83
+ msg->arena = Qnil;
84
+ msg->msg = NULL;
74
85
 
75
86
  ret = TypedData_Wrap_Struct(klass, &Message_type, msg);
76
87
  rb_ivar_set(ret, descriptor_instancevar_interned, descriptor);
@@ -78,24 +89,92 @@ VALUE Message_alloc(VALUE klass) {
78
89
  return ret;
79
90
  }
80
91
 
81
- static const upb_fielddef* which_oneof_field(MessageHeader* self, const upb_oneofdef* o) {
82
- uint32_t oneof_case;
83
- const upb_fielddef* f;
92
+ const upb_msg *Message_Get(VALUE msg_rb, const upb_msgdef **m) {
93
+ Message* msg = ruby_to_Message(msg_rb);
94
+ if (m) *m = msg->msgdef;
95
+ return msg->msg;
96
+ }
84
97
 
85
- oneof_case =
86
- slot_read_oneof_case(self->descriptor->layout, Message_data(self), o);
98
+ upb_msg *Message_GetMutable(VALUE msg_rb, const upb_msgdef **m) {
99
+ rb_check_frozen(msg_rb);
100
+ return (upb_msg*)Message_Get(msg_rb, m);
101
+ }
87
102
 
88
- if (oneof_case == ONEOF_CASE_NONE) {
89
- return NULL;
103
+ void Message_InitPtr(VALUE self_, upb_msg *msg, VALUE arena) {
104
+ Message* self = ruby_to_Message(self_);
105
+ self->msg = msg;
106
+ self->arena = arena;
107
+ ObjectCache_Add(msg, self_);
108
+ }
109
+
110
+ VALUE Message_GetArena(VALUE msg_rb) {
111
+ Message* msg = ruby_to_Message(msg_rb);
112
+ return msg->arena;
113
+ }
114
+
115
+ void Message_CheckClass(VALUE klass) {
116
+ if (rb_get_alloc_func(klass) != &Message_alloc) {
117
+ rb_raise(rb_eArgError,
118
+ "Message class was not returned by the DescriptorPool.");
119
+ }
120
+ }
121
+
122
+ VALUE Message_GetRubyWrapper(upb_msg* msg, const upb_msgdef* m, VALUE arena) {
123
+ if (msg == NULL) return Qnil;
124
+
125
+ VALUE val = ObjectCache_Get(msg);
126
+
127
+ if (val == Qnil) {
128
+ VALUE klass = Descriptor_DefToClass(m);
129
+ val = Message_alloc(klass);
130
+ Message_InitPtr(val, msg, arena);
90
131
  }
91
132
 
92
- // oneof_case is a field index, so find that field.
93
- f = upb_oneofdef_itof(o, oneof_case);
94
- assert(f != NULL);
133
+ return val;
134
+ }
135
+
136
+ void Message_PrintMessage(StringBuilder* b, const upb_msg* msg,
137
+ const upb_msgdef* m) {
138
+ bool first = true;
139
+ int n = upb_msgdef_fieldcount(m);
140
+ VALUE klass = Descriptor_DefToClass(m);
141
+ StringBuilder_Printf(b, "<%s: ", rb_class2name(klass));
142
+
143
+ for (int i = 0; i < n; i++) {
144
+ const upb_fielddef* field = upb_msgdef_field(m, i);
145
+
146
+ if (upb_fielddef_haspresence(field) && !upb_msg_has(msg, field)) {
147
+ continue;
148
+ }
149
+
150
+ if (!first) {
151
+ StringBuilder_Printf(b, ", ");
152
+ } else {
153
+ first = false;
154
+ }
155
+
156
+ upb_msgval msgval = upb_msg_get(msg, field);
157
+
158
+ StringBuilder_Printf(b, "%s: ", upb_fielddef_name(field));
159
+
160
+ if (upb_fielddef_ismap(field)) {
161
+ const upb_msgdef* entry_m = upb_fielddef_msgsubdef(field);
162
+ const upb_fielddef* key_f = upb_msgdef_itof(entry_m, 1);
163
+ const upb_fielddef* val_f = upb_msgdef_itof(entry_m, 2);
164
+ TypeInfo val_info = TypeInfo_get(val_f);
165
+ Map_Inspect(b, msgval.map_val, upb_fielddef_type(key_f), val_info);
166
+ } else if (upb_fielddef_isseq(field)) {
167
+ RepeatedField_Inspect(b, msgval.array_val, TypeInfo_get(field));
168
+ } else {
169
+ StringBuilder_PrintMsgval(b, msgval, TypeInfo_get(field));
170
+ }
171
+ }
95
172
 
96
- return f;
173
+ StringBuilder_Printf(b, ">");
97
174
  }
98
175
 
176
+ // Helper functions for #method_missing ////////////////////////////////////////
177
+
99
178
  enum {
100
179
  METHOD_UNKNOWN = 0,
101
180
  METHOD_GETTER = 1,
@@ -108,148 +187,203 @@ enum {
108
187
  };
109
188
 
110
189
  // Check if the field is a well known wrapper type
111
- bool is_wrapper_type_field(const upb_fielddef* field) {
112
- const upb_msgdef *m;
113
- if (upb_fielddef_type(field) != UPB_TYPE_MESSAGE) {
190
+ static bool IsWrapper(const upb_fielddef* f) {
191
+ return upb_fielddef_issubmsg(f) &&
192
+ upb_msgdef_iswrapper(upb_fielddef_msgsubdef(f));
193
+ }
194
+
195
+ static bool Match(const upb_msgdef* m, const char* name, const upb_fielddef** f,
196
+ const upb_oneofdef** o, const char* prefix,
197
+ const char* suffix) {
198
+ size_t sp = strlen(prefix);
199
+ size_t ss = strlen(suffix);
200
+ size_t sn = strlen(name);
201
+
202
+ if (sn <= sp + ss) return false;
203
+
204
+ if (memcmp(name, prefix, sp) != 0 ||
205
+ memcmp(name + sn - ss, suffix, ss) != 0) {
114
206
  return false;
115
207
  }
116
- m = upb_fielddef_msgsubdef(field);
117
- switch (upb_msgdef_wellknowntype(m)) {
118
- case UPB_WELLKNOWN_DOUBLEVALUE:
119
- case UPB_WELLKNOWN_FLOATVALUE:
120
- case UPB_WELLKNOWN_INT64VALUE:
121
- case UPB_WELLKNOWN_UINT64VALUE:
122
- case UPB_WELLKNOWN_INT32VALUE:
123
- case UPB_WELLKNOWN_UINT32VALUE:
124
- case UPB_WELLKNOWN_STRINGVALUE:
125
- case UPB_WELLKNOWN_BYTESVALUE:
126
- case UPB_WELLKNOWN_BOOLVALUE:
127
- return true;
128
- default:
129
- return false;
130
- }
208
+
209
+ return upb_msgdef_lookupname(m, name + sp, sn - sp - ss, f, o);
131
210
  }
132
211
 
133
- // Get a new Ruby wrapper type and set the initial value
134
- VALUE ruby_wrapper_type(VALUE type_class, VALUE value) {
135
- if (value != Qnil) {
136
- VALUE hash = rb_hash_new();
137
- rb_hash_aset(hash, rb_str_new2("value"), value);
138
- {
139
- VALUE args[1] = {hash};
140
- return rb_class_new_instance(1, args, type_class);
212
+ static int extract_method_call(VALUE method_name, Message* self,
213
+ const upb_fielddef** f, const upb_oneofdef** o) {
214
+ const upb_msgdef* m = self->msgdef;
215
+ const char* name;
216
+
217
+ Check_Type(method_name, T_SYMBOL);
218
+ name = rb_id2name(SYM2ID(method_name));
219
+
220
+ if (Match(m, name, f, o, "", "")) return METHOD_GETTER;
221
+ if (Match(m, name, f, o, "", "=")) return METHOD_SETTER;
222
+ if (Match(m, name, f, o, "clear_", "")) return METHOD_CLEAR;
223
+ if (Match(m, name, f, o, "has_", "?") &&
224
+ (*o || (*f && upb_fielddef_haspresence(*f)))) {
225
+ // Disallow oneof hazzers for proto3.
226
+ // TODO(haberman): remove this test when we are enabling oneof hazzers for
227
+ // proto3.
228
+ if (*f && !upb_fielddef_issubmsg(*f) &&
229
+ upb_fielddef_realcontainingoneof(*f) &&
230
+ upb_msgdef_syntax(upb_fielddef_containingtype(*f)) !=
231
+ UPB_SYNTAX_PROTO2) {
232
+ return METHOD_UNKNOWN;
141
233
  }
234
+ return METHOD_PRESENCE;
235
+ }
236
+ if (Match(m, name, f, o, "", "_as_value") && *f && !upb_fielddef_isseq(*f) &&
237
+ IsWrapper(*f)) {
238
+ return METHOD_WRAPPER_GETTER;
239
+ }
240
+ if (Match(m, name, f, o, "", "_as_value=") && *f && !upb_fielddef_isseq(*f) &&
241
+ IsWrapper(*f)) {
242
+ return METHOD_WRAPPER_SETTER;
243
+ }
244
+ if (Match(m, name, f, o, "", "_const") && *f &&
245
+ upb_fielddef_type(*f) == UPB_TYPE_ENUM) {
246
+ return METHOD_ENUM_GETTER;
142
247
  }
143
- return Qnil;
144
- }
145
248
 
146
- static int extract_method_call(VALUE method_name, MessageHeader* self,
147
- const upb_fielddef **f, const upb_oneofdef **o) {
148
- VALUE method_str;
149
- char* name;
150
- size_t name_len;
151
- int accessor_type;
152
- const upb_oneofdef* test_o;
153
- const upb_fielddef* test_f;
154
- bool has_field;
249
+ return METHOD_UNKNOWN;
250
+ }
155
251
 
156
- Check_Type(method_name, T_SYMBOL);
252
+ static VALUE Message_oneof_accessor(VALUE _self, const upb_oneofdef* o,
253
+ int accessor_type) {
254
+ Message* self = ruby_to_Message(_self);
255
+ const upb_fielddef* oneof_field = upb_msg_whichoneof(self->msg, o);
157
256
 
158
- method_str = rb_id2str(SYM2ID(method_name));
159
- name = RSTRING_PTR(method_str);
160
- name_len = RSTRING_LEN(method_str);
161
-
162
- if (name[name_len - 1] == '=') {
163
- accessor_type = METHOD_SETTER;
164
- name_len--;
165
- // We want to ensure if the proto has something named clear_foo or has_foo?,
166
- // we don't strip the prefix.
167
- } else if (strncmp("clear_", name, 6) == 0 &&
168
- !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
169
- &test_f, &test_o)) {
170
- accessor_type = METHOD_CLEAR;
171
- name = name + 6;
172
- name_len = name_len - 6;
173
- } else if (strncmp("has_", name, 4) == 0 && name[name_len - 1] == '?' &&
174
- !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
175
- &test_f, &test_o)) {
176
- accessor_type = METHOD_PRESENCE;
177
- name = name + 4;
178
- name_len = name_len - 5;
179
- } else {
180
- accessor_type = METHOD_GETTER;
181
- }
182
-
183
- has_field = upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
184
- &test_f, &test_o);
185
-
186
- // Look for wrapper type accessor of the form <field_name>_as_value
187
- if (!has_field &&
188
- (accessor_type == METHOD_GETTER || accessor_type == METHOD_SETTER) &&
189
- name_len > 9 && strncmp(name + name_len - 9, "_as_value", 9) == 0) {
190
- const upb_oneofdef* test_o_wrapper;
191
- const upb_fielddef* test_f_wrapper;
192
- char wrapper_field_name[name_len - 8];
193
-
194
- // Find the field name
195
- strncpy(wrapper_field_name, name, name_len - 9);
196
- wrapper_field_name[name_len - 9] = '\0';
197
-
198
- // Check if field exists and is a wrapper type
199
- if (upb_msgdef_lookupname(self->descriptor->msgdef, wrapper_field_name,
200
- name_len - 9, &test_f_wrapper, &test_o_wrapper) &&
201
- is_wrapper_type_field(test_f_wrapper)) {
202
- // It does exist!
203
- has_field = true;
204
- if (accessor_type == METHOD_SETTER) {
205
- accessor_type = METHOD_WRAPPER_SETTER;
206
- } else {
207
- accessor_type = METHOD_WRAPPER_GETTER;
257
+ switch (accessor_type) {
258
+ case METHOD_PRESENCE:
259
+ return oneof_field == NULL ? Qfalse : Qtrue;
260
+ case METHOD_CLEAR:
261
+ if (oneof_field != NULL) {
262
+ upb_msg_clearfield(Message_GetMutable(_self, NULL), oneof_field);
208
263
  }
209
- test_o = test_o_wrapper;
210
- test_f = test_f_wrapper;
211
- }
264
+ return Qnil;
265
+ case METHOD_GETTER:
266
+ return oneof_field == NULL
267
+ ? Qnil
268
+ : ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
269
+ case METHOD_SETTER:
270
+ rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
212
271
  }
272
+ rb_raise(rb_eRuntimeError, "Invalid access of oneof field.");
273
+ }
213
274
 
214
- // Look for enum accessor of the form <enum_name>_const
215
- if (!has_field && accessor_type == METHOD_GETTER &&
216
- name_len > 6 && strncmp(name + name_len - 6, "_const", 6) == 0) {
217
- const upb_oneofdef* test_o_enum;
218
- const upb_fielddef* test_f_enum;
219
- char enum_name[name_len - 5];
220
-
221
- // Find enum field name
222
- strncpy(enum_name, name, name_len - 6);
223
- enum_name[name_len - 6] = '\0';
224
-
225
- // Check if enum field exists
226
- if (upb_msgdef_lookupname(self->descriptor->msgdef, enum_name, name_len - 6,
227
- &test_f_enum, &test_o_enum) &&
228
- upb_fielddef_type(test_f_enum) == UPB_TYPE_ENUM) {
229
- // It does exist!
230
- has_field = true;
231
- accessor_type = METHOD_ENUM_GETTER;
232
- test_o = test_o_enum;
233
- test_f = test_f_enum;
275
+ static void Message_setfield(upb_msg* msg, const upb_fielddef* f, VALUE val,
276
+ upb_arena* arena) {
277
+ upb_msgval msgval;
278
+ if (upb_fielddef_ismap(f)) {
279
+ msgval.map_val = Map_GetUpbMap(val, f, arena);
280
+ } else if (upb_fielddef_isseq(f)) {
281
+ msgval.array_val = RepeatedField_GetUpbArray(val, f, arena);
282
+ } else {
283
+ if (val == Qnil &&
284
+ (upb_fielddef_issubmsg(f) || upb_fielddef_realcontainingoneof(f))) {
285
+ upb_msg_clearfield(msg, f);
286
+ return;
234
287
  }
288
+ msgval =
289
+ Convert_RubyToUpb(val, upb_fielddef_name(f), TypeInfo_get(f), arena);
235
290
  }
291
+ upb_msg_set(msg, f, msgval, arena);
292
+ }
236
293
 
237
- // Verify the name corresponds to a oneof or field in this message.
238
- if (!has_field) {
239
- return METHOD_UNKNOWN;
294
+ VALUE Message_getfield(VALUE _self, const upb_fielddef* f) {
295
+ Message* self = ruby_to_Message(_self);
296
+ // This is a special-case: upb_msg_mutable() for map & array are logically
297
+ // const (they will not change what is serialized) but physically
298
+ // non-const, as they do allocate a repeated field or map. The logical
299
+ // constness means it's ok to do even if the message is frozen.
300
+ upb_msg *msg = (upb_msg*)self->msg;
301
+ upb_arena *arena = Arena_get(self->arena);
302
+ if (upb_fielddef_ismap(f)) {
303
+ upb_map *map = upb_msg_mutable(msg, f, arena).map;
304
+ const upb_fielddef *key_f = map_field_key(f);
305
+ const upb_fielddef *val_f = map_field_value(f);
306
+ upb_fieldtype_t key_type = upb_fielddef_type(key_f);
307
+ TypeInfo value_type_info = TypeInfo_get(val_f);
308
+ return Map_GetRubyWrapper(map, key_type, value_type_info, self->arena);
309
+ } else if (upb_fielddef_isseq(f)) {
310
+ upb_array *arr = upb_msg_mutable(msg, f, arena).array;
311
+ return RepeatedField_GetRubyWrapper(arr, TypeInfo_get(f), self->arena);
312
+ } else if (upb_fielddef_issubmsg(f)) {
313
+ if (!upb_msg_has(self->msg, f)) return Qnil;
314
+ upb_msg *submsg = upb_msg_mutable(msg, f, arena).msg;
315
+ const upb_msgdef *m = upb_fielddef_msgsubdef(f);
316
+ return Message_GetRubyWrapper(submsg, m, self->arena);
317
+ } else {
318
+ upb_msgval msgval = upb_msg_get(self->msg, f);
319
+ return Convert_UpbToRuby(msgval, TypeInfo_get(f), self->arena);
240
320
  }
321
+ }
241
322
 
242
- // Method calls like 'has_foo?' are not allowed if field "foo" does not have
243
- // a hasbit (e.g. repeated fields or non-message type fields for proto3
244
- // syntax).
245
- if (accessor_type == METHOD_PRESENCE && test_f != NULL &&
246
- !upb_fielddef_haspresence(test_f)) {
247
- return METHOD_UNKNOWN;
248
- }
323
+ static VALUE Message_field_accessor(VALUE _self, const upb_fielddef* f,
324
+ int accessor_type, int argc, VALUE* argv) {
325
+ upb_arena *arena = Arena_get(Message_GetArena(_self));
249
326
 
250
- *o = test_o;
251
- *f = test_f;
252
- return accessor_type;
327
+ switch (accessor_type) {
328
+ case METHOD_SETTER:
329
+ Message_setfield(Message_GetMutable(_self, NULL), f, argv[1], arena);
330
+ return Qnil;
331
+ case METHOD_CLEAR:
332
+ upb_msg_clearfield(Message_GetMutable(_self, NULL), f);
333
+ return Qnil;
334
+ case METHOD_PRESENCE:
335
+ if (!upb_fielddef_haspresence(f)) {
336
+ rb_raise(rb_eRuntimeError, "Field does not have presence.");
337
+ }
338
+ return upb_msg_has(Message_Get(_self, NULL), f);
339
+ case METHOD_WRAPPER_GETTER: {
340
+ Message* self = ruby_to_Message(_self);
341
+ if (upb_msg_has(self->msg, f)) {
342
+ PBRUBY_ASSERT(upb_fielddef_issubmsg(f) && !upb_fielddef_isseq(f));
343
+ upb_msgval wrapper = upb_msg_get(self->msg, f);
344
+ const upb_msgdef *wrapper_m = upb_fielddef_msgsubdef(f);
345
+ const upb_fielddef *value_f = upb_msgdef_itof(wrapper_m, 1);
346
+ upb_msgval value = upb_msg_get(wrapper.msg_val, value_f);
347
+ return Convert_UpbToRuby(value, TypeInfo_get(value_f), self->arena);
348
+ } else {
349
+ return Qnil;
350
+ }
351
+ }
352
+ case METHOD_WRAPPER_SETTER: {
353
+ upb_msg *msg = Message_GetMutable(_self, NULL);
354
+ if (argv[1] == Qnil) {
355
+ upb_msg_clearfield(msg, f);
356
+ } else {
357
+ const upb_fielddef *val_f = upb_msgdef_itof(upb_fielddef_msgsubdef(f), 1);
358
+ upb_msgval msgval = Convert_RubyToUpb(argv[1], upb_fielddef_name(f),
359
+ TypeInfo_get(val_f), arena);
360
+ upb_msg *wrapper = upb_msg_mutable(msg, f, arena).msg;
361
+ upb_msg_set(wrapper, val_f, msgval, arena);
362
+ }
363
+ return Qnil;
364
+ }
365
+ case METHOD_ENUM_GETTER: {
366
+ upb_msgval msgval = upb_msg_get(Message_Get(_self, NULL), f);
367
+
368
+ if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
369
+ // Map repeated fields to a new type with ints
370
+ VALUE arr = rb_ary_new();
371
+ size_t i, n = upb_array_size(msgval.array_val);
372
+ for (i = 0; i < n; i++) {
373
+ upb_msgval elem = upb_array_get(msgval.array_val, i);
374
+ rb_ary_push(arr, INT2NUM(elem.int32_val));
375
+ }
376
+ return arr;
377
+ } else {
378
+ return INT2NUM(msgval.int32_val);
379
+ }
380
+ }
381
+ case METHOD_GETTER:
382
+ return Message_getfield(_self, f);
383
+ default:
384
+ rb_raise(rb_eRuntimeError, "Internal error, no such accessor: %d",
385
+ accessor_type);
386
+ }
253
387
  }
254
388
 
255
389
  /*
@@ -279,111 +413,56 @@ static int extract_method_call(VALUE method_name, MessageHeader* self,
279
413
  * true if the field 'fieldname' is set in the message object, else false. For
280
414
  * 'proto3' syntax, calling this for a basic type field will result in an error.
281
415
  */
282
- VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
283
- MessageHeader* self;
416
+ static VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
417
+ Message* self = ruby_to_Message(_self);
284
418
  const upb_oneofdef* o;
285
419
  const upb_fielddef* f;
286
420
  int accessor_type;
287
421
 
288
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
289
422
  if (argc < 1) {
290
423
  rb_raise(rb_eArgError, "Expected method name as first argument.");
291
424
  }
292
425
 
293
426
  accessor_type = extract_method_call(argv[0], self, &f, &o);
294
- if (accessor_type == METHOD_UNKNOWN || (o == NULL && f == NULL) ) {
295
- return rb_call_super(argc, argv);
296
- } else if (accessor_type == METHOD_SETTER || accessor_type == METHOD_WRAPPER_SETTER) {
297
- if (argc != 2) {
298
- rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
299
- }
300
- rb_check_frozen(_self);
301
- } else if (argc != 1) {
302
- rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
303
- }
304
-
305
- // Return which of the oneof fields are set
306
- if (o != NULL) {
307
- const upb_fielddef* oneof_field = which_oneof_field(self, o);
308
427
 
309
- if (accessor_type == METHOD_SETTER) {
310
- rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
311
- }
428
+ if (accessor_type == METHOD_UNKNOWN) return rb_call_super(argc, argv);
312
429
 
313
- if (accessor_type == METHOD_PRESENCE) {
314
- return oneof_field == NULL ? Qfalse : Qtrue;
315
- } else if (accessor_type == METHOD_CLEAR) {
316
- if (oneof_field != NULL) {
317
- layout_clear(self->descriptor->layout, Message_data(self), oneof_field);
430
+ // Validate argument count.
431
+ switch (accessor_type) {
432
+ case METHOD_SETTER:
433
+ case METHOD_WRAPPER_SETTER:
434
+ if (argc != 2) {
435
+ rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
318
436
  }
319
- return Qnil;
320
- } else {
321
- // METHOD_ACCESSOR
322
- return oneof_field == NULL ? Qnil :
323
- ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
324
- }
325
- // Otherwise we're operating on a single proto field
326
- } else if (accessor_type == METHOD_SETTER) {
327
- layout_set(self->descriptor->layout, Message_data(self), f, argv[1]);
328
- return Qnil;
329
- } else if (accessor_type == METHOD_CLEAR) {
330
- layout_clear(self->descriptor->layout, Message_data(self), f);
331
- return Qnil;
332
- } else if (accessor_type == METHOD_PRESENCE) {
333
- return layout_has(self->descriptor->layout, Message_data(self), f);
334
- } else if (accessor_type == METHOD_WRAPPER_GETTER) {
335
- VALUE value = layout_get(self->descriptor->layout, Message_data(self), f);
336
- switch (TYPE(value)) {
337
- case T_DATA:
338
- return rb_funcall(value, rb_intern("value"), 0);
339
- case T_NIL:
340
- return Qnil;
341
- default:
342
- return value;
343
- }
344
- } else if (accessor_type == METHOD_WRAPPER_SETTER) {
345
- VALUE wrapper = ruby_wrapper_type(
346
- field_type_class(self->descriptor->layout, f), argv[1]);
347
- layout_set(self->descriptor->layout, Message_data(self), f, wrapper);
348
- return Qnil;
349
- } else if (accessor_type == METHOD_ENUM_GETTER) {
350
- VALUE enum_type = field_type_class(self->descriptor->layout, f);
351
- VALUE method = rb_intern("const_get");
352
- VALUE raw_value = layout_get(self->descriptor->layout, Message_data(self), f);
353
-
354
- // Map repeated fields to a new type with ints
355
- if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
356
- int array_size = FIX2INT(rb_funcall(raw_value, rb_intern("length"), 0));
357
- int i;
358
- VALUE array_args[1] = { ID2SYM(rb_intern("int64")) };
359
- VALUE array = rb_class_new_instance(1, array_args, CLASS_OF(raw_value));
360
- for (i = 0; i < array_size; i++) {
361
- VALUE entry = rb_funcall(enum_type, method, 1, rb_funcall(raw_value,
362
- rb_intern("at"), 1, INT2NUM(i)));
363
- rb_funcall(array, rb_intern("push"), 1, entry);
437
+ rb_check_frozen(_self);
438
+ break;
439
+ default:
440
+ if (argc != 1) {
441
+ rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
364
442
  }
365
- return array;
366
- }
367
- // Convert the value for singular fields
368
- return rb_funcall(enum_type, method, 1, raw_value);
443
+ break;
444
+ }
445
+
446
+ // Dispatch accessor.
447
+ if (o != NULL) {
448
+ return Message_oneof_accessor(_self, o, accessor_type);
369
449
  } else {
370
- return layout_get(self->descriptor->layout, Message_data(self), f);
450
+ return Message_field_accessor(_self, f, accessor_type, argc, argv);
371
451
  }
372
452
  }
373
453
 
374
-
375
- VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
376
- MessageHeader* self;
454
+ static VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
455
+ Message* self = ruby_to_Message(_self);
377
456
  const upb_oneofdef* o;
378
457
  const upb_fielddef* f;
379
458
  int accessor_type;
380
459
 
381
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
382
460
  if (argc < 1) {
383
461
  rb_raise(rb_eArgError, "Expected method name as first argument.");
384
462
  }
385
463
 
386
464
  accessor_type = extract_method_call(argv[0], self, &f, &o);
465
+
387
466
  if (accessor_type == METHOD_UNKNOWN) {
388
467
  return rb_call_super(argc, argv);
389
468
  } else if (o != NULL) {
@@ -393,17 +472,116 @@ VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
393
472
  }
394
473
  }
395
474
 
396
- VALUE create_submsg_from_hash(const MessageLayout* layout,
397
- const upb_fielddef* f, VALUE hash) {
398
- VALUE args[1] = { hash };
399
- return rb_class_new_instance(1, args, field_type_class(layout, f));
475
+ void Message_InitFromValue(upb_msg* msg, const upb_msgdef* m, VALUE val,
476
+ upb_arena* arena);
477
+
478
+ typedef struct {
479
+ upb_map *map;
480
+ TypeInfo key_type;
481
+ TypeInfo val_type;
482
+ upb_arena *arena;
483
+ } MapInit;
484
+
485
+ static int Map_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
486
+ MapInit *map_init = (MapInit*)_self;
487
+ upb_msgval k, v;
488
+ k = Convert_RubyToUpb(key, "", map_init->key_type, NULL);
489
+
490
+ if (map_init->val_type.type == UPB_TYPE_MESSAGE && TYPE(val) == T_HASH) {
491
+ upb_msg *msg = upb_msg_new(map_init->val_type.def.msgdef, map_init->arena);
492
+ Message_InitFromValue(msg, map_init->val_type.def.msgdef, val,
493
+ map_init->arena);
494
+ v.msg_val = msg;
495
+ } else {
496
+ v = Convert_RubyToUpb(val, "", map_init->val_type, map_init->arena);
497
+ }
498
+ upb_map_set(map_init->map, k, v, map_init->arena);
499
+ return ST_CONTINUE;
400
500
  }
401
501
 
402
- int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
403
- MessageHeader* self;
404
- char *name;
405
- const upb_fielddef* f;
406
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
502
+ static void Map_InitFromValue(upb_map* map, const upb_fielddef* f, VALUE val,
503
+ upb_arena* arena) {
504
+ const upb_msgdef* entry_m = upb_fielddef_msgsubdef(f);
505
+ const upb_fielddef* key_f = upb_msgdef_itof(entry_m, 1);
506
+ const upb_fielddef* val_f = upb_msgdef_itof(entry_m, 2);
507
+ if (TYPE(val) != T_HASH) {
508
+ rb_raise(rb_eArgError,
509
+ "Expected Hash object as initializer value for map field '%s' "
510
+ "(given %s).",
511
+ upb_fielddef_name(f), rb_class2name(CLASS_OF(val)));
512
+ }
513
+ MapInit map_init = {map, TypeInfo_get(key_f), TypeInfo_get(val_f), arena};
514
+ rb_hash_foreach(val, Map_initialize_kwarg, (VALUE)&map_init);
515
+ }
516
+
517
+ static upb_msgval MessageValue_FromValue(VALUE val, TypeInfo info,
518
+ upb_arena* arena) {
519
+ if (info.type == UPB_TYPE_MESSAGE) {
520
+ upb_msgval msgval;
521
+ upb_msg* msg = upb_msg_new(info.def.msgdef, arena);
522
+ Message_InitFromValue(msg, info.def.msgdef, val, arena);
523
+ msgval.msg_val = msg;
524
+ return msgval;
525
+ } else {
526
+ return Convert_RubyToUpb(val, "", info, arena);
527
+ }
528
+ }
529
+
530
+ static void RepeatedField_InitFromValue(upb_array* arr, const upb_fielddef* f,
531
+ VALUE val, upb_arena* arena) {
532
+ TypeInfo type_info = TypeInfo_get(f);
533
+
534
+ if (TYPE(val) != T_ARRAY) {
535
+ rb_raise(rb_eArgError,
536
+ "Expected array as initializer value for repeated field '%s' (given %s).",
537
+ upb_fielddef_name(f), rb_class2name(CLASS_OF(val)));
538
+ }
539
+
540
+ for (int i = 0; i < RARRAY_LEN(val); i++) {
541
+ VALUE entry = rb_ary_entry(val, i);
542
+ upb_msgval msgval;
543
+ if (upb_fielddef_issubmsg(f) && TYPE(entry) == T_HASH) {
544
+ msgval = MessageValue_FromValue(entry, type_info, arena);
545
+ } else {
546
+ msgval = Convert_RubyToUpb(entry, upb_fielddef_name(f), type_info, arena);
547
+ }
548
+ upb_array_append(arr, msgval, arena);
549
+ }
550
+ }
551
+
552
+ static void Message_InitFieldFromValue(upb_msg* msg, const upb_fielddef* f,
553
+ VALUE val, upb_arena* arena) {
554
+ if (TYPE(val) == T_NIL) return;
555
+
556
+ if (upb_fielddef_ismap(f)) {
557
+ upb_map *map = upb_msg_mutable(msg, f, arena).map;
558
+ Map_InitFromValue(map, f, val, arena);
559
+ } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
560
+ upb_array *arr = upb_msg_mutable(msg, f, arena).array;
561
+ RepeatedField_InitFromValue(arr, f, val, arena);
562
+ } else if (upb_fielddef_issubmsg(f)) {
563
+ if (TYPE(val) == T_HASH) {
564
+ upb_msg *submsg = upb_msg_mutable(msg, f, arena).msg;
565
+ Message_InitFromValue(submsg, upb_fielddef_msgsubdef(f), val, arena);
566
+ } else {
567
+ Message_setfield(msg, f, val, arena);
568
+ }
569
+ } else {
570
+ upb_msgval msgval =
571
+ Convert_RubyToUpb(val, upb_fielddef_name(f), TypeInfo_get(f), arena);
572
+ upb_msg_set(msg, f, msgval, arena);
573
+ }
574
+ }
575
+
576
+ typedef struct {
577
+ upb_msg *msg;
578
+ const upb_msgdef *msgdef;
579
+ upb_arena *arena;
580
+ } MsgInit;
581
+
582
+ static int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
583
+ MsgInit *msg_init = (MsgInit*)_self;
584
+ const char *name;
407
585
 
408
586
  if (TYPE(key) == T_STRING) {
409
587
  name = RSTRING_PTR(key);
@@ -414,52 +592,26 @@ int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
414
592
  "Expected string or symbols as hash keys when initializing proto from hash.");
415
593
  }
416
594
 
417
- f = upb_msgdef_ntofz(self->descriptor->msgdef, name);
595
+ const upb_fielddef* f = upb_msgdef_ntofz(msg_init->msgdef, name);
596
+
418
597
  if (f == NULL) {
419
598
  rb_raise(rb_eArgError,
420
599
  "Unknown field name '%s' in initialization map entry.", name);
421
600
  }
422
601
 
423
- if (TYPE(val) == T_NIL) {
424
- return 0;
425
- }
426
-
427
- if (is_map_field(f)) {
428
- VALUE map;
429
-
430
- if (TYPE(val) != T_HASH) {
431
- rb_raise(rb_eArgError,
432
- "Expected Hash object as initializer value for map field '%s' (given %s).",
433
- name, rb_class2name(CLASS_OF(val)));
434
- }
435
- map = layout_get(self->descriptor->layout, Message_data(self), f);
436
- Map_merge_into_self(map, val);
437
- } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
438
- VALUE ary;
439
- int i;
440
-
441
- if (TYPE(val) != T_ARRAY) {
442
- rb_raise(rb_eArgError,
443
- "Expected array as initializer value for repeated field '%s' (given %s).",
444
- name, rb_class2name(CLASS_OF(val)));
445
- }
446
- ary = layout_get(self->descriptor->layout, Message_data(self), f);
447
- for (i = 0; i < RARRAY_LEN(val); i++) {
448
- VALUE entry = rb_ary_entry(val, i);
449
- if (TYPE(entry) == T_HASH && upb_fielddef_issubmsg(f)) {
450
- entry = create_submsg_from_hash(self->descriptor->layout, f, entry);
451
- }
602
+ Message_InitFieldFromValue(msg_init->msg, f, val, msg_init->arena);
603
+ return ST_CONTINUE;
604
+ }
452
605
 
453
- RepeatedField_push(ary, entry);
454
- }
606
+ void Message_InitFromValue(upb_msg* msg, const upb_msgdef* m, VALUE val,
607
+ upb_arena* arena) {
608
+ MsgInit msg_init = {msg, m, arena};
609
+ if (TYPE(val) == T_HASH) {
610
+ rb_hash_foreach(val, Message_initialize_kwarg, (VALUE)&msg_init);
455
611
  } else {
456
- if (TYPE(val) == T_HASH && upb_fielddef_issubmsg(f)) {
457
- val = create_submsg_from_hash(self->descriptor->layout, f, val);
458
- }
459
-
460
- layout_set(self->descriptor->layout, Message_data(self), f, val);
612
+ rb_raise(rb_eArgError, "Expected hash arguments or message, not %s",
613
+ rb_class2name(CLASS_OF(val)));
461
614
  }
462
- return 0;
463
615
  }
464
616
 
465
617
  /*
@@ -474,12 +626,13 @@ int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
474
626
  * have been added to a pool. The method definitions described here on the
475
627
  * Message class are provided on each concrete message class.
476
628
  */
477
- VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
478
- MessageHeader* self;
479
- VALUE hash_args;
480
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
629
+ static VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
630
+ Message* self = ruby_to_Message(_self);
631
+ VALUE arena_rb = Arena_new();
632
+ upb_arena *arena = Arena_get(arena_rb);
633
+ upb_msg *msg = upb_msg_new(self->msgdef, arena);
481
634
 
482
- layout_init(self->descriptor->layout, Message_data(self));
635
+ Message_InitPtr(_self, msg, arena_rb);
483
636
 
484
637
  if (argc == 0) {
485
638
  return Qnil;
@@ -487,12 +640,7 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
487
640
  if (argc != 1) {
488
641
  rb_raise(rb_eArgError, "Expected 0 or 1 arguments.");
489
642
  }
490
- hash_args = argv[0];
491
- if (TYPE(hash_args) != T_HASH) {
492
- rb_raise(rb_eArgError, "Expected hash arguments.");
493
- }
494
-
495
- rb_hash_foreach(hash_args, Message_initialize_kwarg, _self);
643
+ Message_InitFromValue((upb_msg*)self->msg, self->msgdef, argv[0], arena);
496
644
  return Qnil;
497
645
  }
498
646
 
@@ -502,37 +650,40 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
502
650
  *
503
651
  * Performs a shallow copy of this message and returns the new copy.
504
652
  */
505
- VALUE Message_dup(VALUE _self) {
506
- MessageHeader* self;
507
- VALUE new_msg;
508
- MessageHeader* new_msg_self;
509
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
510
-
511
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
512
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
513
-
514
- layout_dup(self->descriptor->layout,
515
- Message_data(new_msg_self),
516
- Message_data(self));
517
-
653
+ static VALUE Message_dup(VALUE _self) {
654
+ Message* self = ruby_to_Message(_self);
655
+ VALUE new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
656
+ Message* new_msg_self = ruby_to_Message(new_msg);
657
+ size_t size = upb_msgdef_layout(self->msgdef)->size;
658
+
659
+ // TODO(copy unknown fields?)
660
+ // TODO(use official upb msg copy function)
661
+ memcpy((upb_msg*)new_msg_self->msg, self->msg, size);
662
+ Arena_fuse(self->arena, Arena_get(new_msg_self->arena));
518
663
  return new_msg;
519
664
  }
520
665
 
521
- // Internal only; used by Google::Protobuf.deep_copy.
522
- VALUE Message_deep_copy(VALUE _self) {
523
- MessageHeader* self;
524
- MessageHeader* new_msg_self;
525
- VALUE new_msg;
526
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
666
+ // Support function for Message_eq, and also used by other #eq functions.
667
+ bool Message_Equal(const upb_msg *m1, const upb_msg *m2, const upb_msgdef *m) {
668
+ if (m1 == m2) return true;
527
669
 
528
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
529
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
670
+ size_t size1, size2;
671
+ int encode_opts = UPB_ENCODE_SKIPUNKNOWN | UPB_ENCODE_DETERMINISTIC;
672
+ upb_arena *arena_tmp = upb_arena_new();
673
+ const upb_msglayout *layout = upb_msgdef_layout(m);
530
674
 
531
- layout_deep_copy(self->descriptor->layout,
532
- Message_data(new_msg_self),
533
- Message_data(self));
675
+ // Compare deterministically serialized payloads with no unknown fields.
676
+ char *data1 = upb_encode_ex(m1, layout, encode_opts, arena_tmp, &size1);
677
+ char *data2 = upb_encode_ex(m2, layout, encode_opts, arena_tmp, &size2);
534
678
 
535
- return new_msg;
679
+ if (data1 && data2) {
680
+ bool ret = (size1 == size2) && (memcmp(data1, data2, size1) == 0);
681
+ upb_arena_free(arena_tmp);
682
+ return ret;
683
+ } else {
684
+ upb_arena_free(arena_tmp);
685
+ rb_raise(cParseError, "Error comparing messages");
686
+ }
536
687
  }
537
688
 
538
689
  /*
@@ -544,22 +695,34 @@ VALUE Message_deep_copy(VALUE _self) {
544
695
  * method's semantics (a more efficient comparison may actually be done if the
545
696
  * field is of a primitive type).
546
697
  */
547
- VALUE Message_eq(VALUE _self, VALUE _other) {
548
- MessageHeader* self;
549
- MessageHeader* other;
550
- if (TYPE(_self) != TYPE(_other)) {
551
- return Qfalse;
552
- }
553
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
554
- TypedData_Get_Struct(_other, MessageHeader, &Message_type, other);
698
+ static VALUE Message_eq(VALUE _self, VALUE _other) {
699
+ if (CLASS_OF(_self) != CLASS_OF(_other)) return Qfalse;
555
700
 
556
- if (self->descriptor != other->descriptor) {
557
- return Qfalse;
558
- }
701
+ Message* self = ruby_to_Message(_self);
702
+ Message* other = ruby_to_Message(_other);
703
+ assert(self->msgdef == other->msgdef);
559
704
 
560
- return layout_eq(self->descriptor->layout,
561
- Message_data(self),
562
- Message_data(other));
705
+ return Message_Equal(self->msg, other->msg, self->msgdef) ? Qtrue : Qfalse;
706
+ }
707
+
708
+ uint64_t Message_Hash(const upb_msg* msg, const upb_msgdef* m, uint64_t seed) {
709
+ upb_arena *arena = upb_arena_new();
710
+ const char *data;
711
+ size_t size;
712
+
713
+ // Hash a deterministically serialized payload with no unknown fields.
714
+ data = upb_encode_ex(msg, upb_msgdef_layout(m),
715
+ UPB_ENCODE_SKIPUNKNOWN | UPB_ENCODE_DETERMINISTIC, arena,
716
+ &size);
717
+
718
+ if (data) {
719
+ uint64_t ret = Wyhash(data, size, seed, kWyhashSalt);
720
+ upb_arena_free(arena);
721
+ return ret;
722
+ } else {
723
+ upb_arena_free(arena);
724
+ rb_raise(cParseError, "Error calculating hash");
725
+ }
563
726
  }
564
727
 
565
728
  /*
@@ -568,11 +731,12 @@ VALUE Message_eq(VALUE _self, VALUE _other) {
568
731
  *
569
732
  * Returns a hash value that represents this message's field values.
570
733
  */
571
- VALUE Message_hash(VALUE _self) {
572
- MessageHeader* self;
573
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
574
-
575
- return layout_hash(self->descriptor->layout, Message_data(self));
734
+ static VALUE Message_hash(VALUE _self) {
735
+ Message* self = ruby_to_Message(_self);
736
+ uint64_t hash_value = Message_Hash(self->msg, self->msgdef, 0);
737
+ // RUBY_FIXNUM_MAX should be one less than a power of 2.
738
+ assert((RUBY_FIXNUM_MAX & (RUBY_FIXNUM_MAX + 1)) == 0);
739
+ return INT2FIX(hash_value & RUBY_FIXNUM_MAX);
576
740
  }
577
741
 
578
742
  /*
@@ -583,77 +747,127 @@ VALUE Message_hash(VALUE _self) {
583
747
  * formatted as "<MessageType: field1: value1, field2: value2, ...>". Each
584
748
  * field's value is represented according to its own #inspect method.
585
749
  */
586
- VALUE Message_inspect(VALUE _self) {
587
- MessageHeader* self;
588
- VALUE str;
589
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
750
+ static VALUE Message_inspect(VALUE _self) {
751
+ Message* self = ruby_to_Message(_self);
590
752
 
591
- str = rb_str_new2("<");
592
- str = rb_str_append(str, rb_str_new2(rb_class2name(CLASS_OF(_self))));
593
- str = rb_str_cat2(str, ": ");
594
- str = rb_str_append(str, layout_inspect(
595
- self->descriptor->layout, Message_data(self)));
596
- str = rb_str_cat2(str, ">");
597
- return str;
753
+ StringBuilder* builder = StringBuilder_New();
754
+ Message_PrintMessage(builder, self->msg, self->msgdef);
755
+ VALUE ret = StringBuilder_ToRubyString(builder);
756
+ StringBuilder_Free(builder);
757
+ return ret;
598
758
  }
599
759
 
600
- /*
601
- * call-seq:
602
- * Message.to_h => {}
603
- *
604
- * Returns the message as a Ruby Hash object, with keys as symbols.
605
- */
606
- VALUE Message_to_h(VALUE _self) {
607
- MessageHeader* self;
608
- VALUE hash;
609
- upb_msg_field_iter it;
610
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
611
-
612
- hash = rb_hash_new();
613
-
614
- for (upb_msg_field_begin(&it, self->descriptor->msgdef);
615
- !upb_msg_field_done(&it);
616
- upb_msg_field_next(&it)) {
617
- const upb_fielddef* field = upb_msg_iter_field(&it);
760
+ // Support functions for Message_to_h //////////////////////////////////////////
761
+
762
+ static VALUE RepeatedField_CreateArray(const upb_array* arr,
763
+ TypeInfo type_info) {
764
+ int size = arr ? upb_array_size(arr) : 0;
765
+ VALUE ary = rb_ary_new2(size);
766
+
767
+ for (int i = 0; i < size; i++) {
768
+ upb_msgval msgval = upb_array_get(arr, i);
769
+ VALUE val = Scalar_CreateHash(msgval, type_info);
770
+ rb_ary_push(ary, val);
771
+ }
772
+
773
+ return ary;
774
+ }
775
+
776
+ static VALUE Message_CreateHash(const upb_msg *msg, const upb_msgdef *m) {
777
+ if (!msg) return Qnil;
778
+
779
+ VALUE hash = rb_hash_new();
780
+ int n = upb_msgdef_fieldcount(m);
781
+ bool is_proto2;
782
+
783
+ // We currently have a few behaviors that are specific to proto2.
784
+ // This is unfortunate, we should key behaviors off field attributes (like
785
+ // whether a field has presence), not proto2 vs. proto3. We should see if we
786
+ // can change this without breaking users.
787
+ is_proto2 = upb_msgdef_syntax(m) == UPB_SYNTAX_PROTO2;
788
+
789
+ for (int i = 0; i < n; i++) {
790
+ const upb_fielddef* field = upb_msgdef_field(m, i);
791
+ TypeInfo type_info = TypeInfo_get(field);
792
+ upb_msgval msgval;
618
793
  VALUE msg_value;
619
794
  VALUE msg_key;
620
795
 
621
- // For proto2, do not include fields which are not set.
622
- if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
623
- field_contains_hasbit(self->descriptor->layout, field) &&
624
- !layout_has(self->descriptor->layout, Message_data(self), field)) {
796
+ if (!is_proto2 && upb_fielddef_issubmsg(field) &&
797
+ !upb_fielddef_isseq(field) && !upb_msg_has(msg, field)) {
798
+ // TODO: Legacy behavior, remove when we fix the is_proto2 differences.
799
+ msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
800
+ rb_hash_aset(hash, msg_key, Qnil);
801
+ continue;
802
+ }
803
+
804
+ // Do not include fields that are not present (oneof or optional fields).
805
+ if (is_proto2 && upb_fielddef_haspresence(field) &&
806
+ !upb_msg_has(msg, field)) {
625
807
  continue;
626
808
  }
627
809
 
628
- msg_value = layout_get(self->descriptor->layout, Message_data(self), field);
629
810
  msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
630
- if (is_map_field(field)) {
631
- msg_value = Map_to_h(msg_value);
632
- } else if (upb_fielddef_label(field) == UPB_LABEL_REPEATED) {
633
- msg_value = RepeatedField_to_ary(msg_value);
634
- if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
635
- RARRAY_LEN(msg_value) == 0) {
811
+ msgval = upb_msg_get(msg, field);
812
+
813
+ // Proto2 omits empty map/repeated fields also.
814
+
815
+ if (upb_fielddef_ismap(field)) {
816
+ const upb_msgdef *entry_m = upb_fielddef_msgsubdef(field);
817
+ const upb_fielddef *key_f = upb_msgdef_itof(entry_m, 1);
818
+ const upb_fielddef *val_f = upb_msgdef_itof(entry_m, 2);
819
+ upb_fieldtype_t key_type = upb_fielddef_type(key_f);
820
+ msg_value = Map_CreateHash(msgval.map_val, key_type, TypeInfo_get(val_f));
821
+ } else if (upb_fielddef_isseq(field)) {
822
+ if (is_proto2 &&
823
+ (!msgval.array_val || upb_array_size(msgval.array_val) == 0)) {
636
824
  continue;
637
825
  }
638
-
639
- if (upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
640
- int i;
641
- for (i = 0; i < RARRAY_LEN(msg_value); i++) {
642
- VALUE elem = rb_ary_entry(msg_value, i);
643
- rb_ary_store(msg_value, i, Message_to_h(elem));
644
- }
645
- }
646
-
647
- } else if (msg_value != Qnil &&
648
- upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
649
- msg_value = Message_to_h(msg_value);
826
+ msg_value = RepeatedField_CreateArray(msgval.array_val, type_info);
827
+ } else {
828
+ msg_value = Scalar_CreateHash(msgval, type_info);
650
829
  }
830
+
651
831
  rb_hash_aset(hash, msg_key, msg_value);
652
832
  }
833
+
653
834
  return hash;
654
835
  }
655
836
 
837
+ VALUE Scalar_CreateHash(upb_msgval msgval, TypeInfo type_info) {
838
+ if (type_info.type == UPB_TYPE_MESSAGE) {
839
+ return Message_CreateHash(msgval.msg_val, type_info.def.msgdef);
840
+ } else {
841
+ return Convert_UpbToRuby(msgval, type_info, Qnil);
842
+ }
843
+ }
844
+
845
+ /*
846
+ * call-seq:
847
+ * Message.to_h => {}
848
+ *
849
+ * Returns the message as a Ruby Hash object, with keys as symbols.
850
+ */
851
+ static VALUE Message_to_h(VALUE _self) {
852
+ Message* self = ruby_to_Message(_self);
853
+ return Message_CreateHash(self->msg, self->msgdef);
854
+ }
656
855
 
856
+ /*
857
+ * call-seq:
858
+ * Message.freeze => self
859
+ *
860
+ * Freezes the message object. We have to intercept this so we can pin the
861
+ * Ruby object into memory so we don't forget it's frozen.
862
+ */
863
+ static VALUE Message_freeze(VALUE _self) {
864
+ Message* self = ruby_to_Message(_self);
865
+ if (!RB_OBJ_FROZEN(_self)) {
866
+ Arena_Pin(self->arena, _self);
867
+ RB_OBJ_FREEZE(_self);
868
+ }
869
+ return _self;
870
+ }
657
871
 
658
872
  /*
659
873
  * call-seq:
@@ -662,16 +876,18 @@ VALUE Message_to_h(VALUE _self) {
662
876
  * Accesses a field's value by field name. The provided field name should be a
663
877
  * string.
664
878
  */
665
- VALUE Message_index(VALUE _self, VALUE field_name) {
666
- MessageHeader* self;
879
+ static VALUE Message_index(VALUE _self, VALUE field_name) {
880
+ Message* self = ruby_to_Message(_self);
667
881
  const upb_fielddef* field;
668
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
882
+
669
883
  Check_Type(field_name, T_STRING);
670
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
884
+ field = upb_msgdef_ntofz(self->msgdef, RSTRING_PTR(field_name));
885
+
671
886
  if (field == NULL) {
672
887
  return Qnil;
673
888
  }
674
- return layout_get(self->descriptor->layout, Message_data(self), field);
889
+
890
+ return Message_getfield(_self, field);
675
891
  }
676
892
 
677
893
  /*
@@ -681,19 +897,209 @@ VALUE Message_index(VALUE _self, VALUE field_name) {
681
897
  * Sets a field's value by field name. The provided field name should be a
682
898
  * string.
683
899
  */
684
- VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
685
- MessageHeader* self;
686
- const upb_fielddef* field;
687
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
900
+ static VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
901
+ Message* self = ruby_to_Message(_self);
902
+ const upb_fielddef* f;
903
+ upb_msgval val;
904
+ upb_arena *arena = Arena_get(self->arena);
905
+
688
906
  Check_Type(field_name, T_STRING);
689
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
690
- if (field == NULL) {
907
+ f = upb_msgdef_ntofz(self->msgdef, RSTRING_PTR(field_name));
908
+
909
+ if (f == NULL) {
691
910
  rb_raise(rb_eArgError, "Unknown field: %s", RSTRING_PTR(field_name));
692
911
  }
693
- layout_set(self->descriptor->layout, Message_data(self), field, value);
912
+
913
+ val = Convert_RubyToUpb(value, upb_fielddef_name(f), TypeInfo_get(f), arena);
914
+ upb_msg_set(Message_GetMutable(_self, NULL), f, val, arena);
915
+
694
916
  return Qnil;
695
917
  }
696
918
 
919
+ /*
920
+ * call-seq:
921
+ * MessageClass.decode(data) => message
922
+ *
923
+ * Decodes the given data (as a string containing bytes in protocol buffers wire
924
+ * format) under the interpretation given by this message class's definition
925
+ * and returns a message object with the corresponding field values.
926
+ */
927
+ static VALUE Message_decode(VALUE klass, VALUE data) {
928
+ if (TYPE(data) != T_STRING) {
929
+ rb_raise(rb_eArgError, "Expected string for binary protobuf data.");
930
+ }
931
+
932
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
933
+ Message* msg = ruby_to_Message(msg_rb);
934
+
935
+ if (!upb_decode(RSTRING_PTR(data), RSTRING_LEN(data), (upb_msg*)msg->msg,
936
+ upb_msgdef_layout(msg->msgdef),
937
+ Arena_get(msg->arena))) {
938
+ rb_raise(cParseError, "Error occurred during parsing");
939
+ }
940
+
941
+ return msg_rb;
942
+ }
943
+
944
+ /*
945
+ * call-seq:
946
+ * MessageClass.decode_json(data, options = {}) => message
947
+ *
948
+ * Decodes the given data (as a string containing the message's JSON
948
+ * representation) under the interpretation given by this message class's definition
950
+ * and returns a message object with the corresponding field values.
951
+ *
952
+ * @param options [Hash] options for the decoder
953
+ * ignore_unknown_fields: set true to ignore unknown fields (default is to
954
+ * raise an error)
955
+ */
956
+ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
957
+ VALUE data = argv[0];
958
+ int options = 0;
959
+ upb_status status;
960
+
961
+ // TODO(haberman): use this message's pool instead.
962
+ const upb_symtab *symtab = DescriptorPool_GetSymtab(generated_pool);
963
+
964
+ if (argc < 1 || argc > 2) {
965
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
966
+ }
967
+
968
+ if (argc == 2) {
969
+ VALUE hash_args = argv[1];
970
+ if (TYPE(hash_args) != T_HASH) {
971
+ rb_raise(rb_eArgError, "Expected hash arguments.");
972
+ }
973
+
974
+ if (RTEST(rb_hash_lookup2( hash_args, ID2SYM(rb_intern("ignore_unknown_fields")), Qfalse))) {
975
+ options |= UPB_JSONDEC_IGNOREUNKNOWN;
976
+ }
977
+ }
978
+
979
+ if (TYPE(data) != T_STRING) {
980
+ rb_raise(rb_eArgError, "Expected string for JSON data.");
981
+ }
982
+
983
+ // TODO(cfallin): Check and respect string encoding. If not UTF-8, we need to
984
+ // convert, because string handlers pass data directly to message string
985
+ // fields.
986
+
987
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
988
+ Message* msg = ruby_to_Message(msg_rb);
989
+
990
+ // We don't allow users to decode a wrapper type directly.
991
+ if (upb_msgdef_iswrapper(msg->msgdef)) {
992
+ rb_raise(rb_eRuntimeError, "Cannot parse a wrapper directly.");
993
+ }
994
+
995
+ upb_status_clear(&status);
996
+ if (!upb_json_decode(RSTRING_PTR(data), RSTRING_LEN(data), (upb_msg*)msg->msg,
997
+ msg->msgdef, symtab, options,
998
+ Arena_get(msg->arena), &status)) {
999
+ rb_raise(cParseError, "Error occurred during parsing: %s",
1000
+ upb_status_errmsg(&status));
1001
+ }
1002
+
1003
+ return msg_rb;
1004
+ }
1005
+
1006
+ /*
1007
+ * call-seq:
1008
+ * MessageClass.encode(msg) => bytes
1009
+ *
1010
+ * Encodes the given message object to its serialized form in protocol buffers
1011
+ * wire format.
1012
+ */
1013
+ static VALUE Message_encode(VALUE klass, VALUE msg_rb) {
1014
+ Message* msg = ruby_to_Message(msg_rb);
1015
+ const char *data;
1016
+ size_t size;
1017
+
1018
+ if (CLASS_OF(msg_rb) != klass) {
1019
+ rb_raise(rb_eArgError, "Message of wrong type.");
1020
+ }
1021
+
1022
+ upb_arena *arena = upb_arena_new();
1023
+
1024
+ data = upb_encode(msg->msg, upb_msgdef_layout(msg->msgdef), arena,
1025
+ &size);
1026
+
1027
+ if (data) {
1028
+ VALUE ret = rb_str_new(data, size);
1029
+ rb_enc_associate(ret, rb_ascii8bit_encoding());
1030
+ upb_arena_free(arena);
1031
+ return ret;
1032
+ } else {
1033
+ upb_arena_free(arena);
1034
+ rb_raise(rb_eRuntimeError, "Exceeded maximum depth (possibly cycle)");
1035
+ }
1036
+ }
1037
+
1038
+ /*
1039
+ * call-seq:
1040
+ * MessageClass.encode_json(msg, options = {}) => json_string
1041
+ *
1042
+ * Encodes the given message object into its serialized JSON representation.
1043
+ * @param options [Hash] options for the encoder
1044
+ * preserve_proto_fieldnames: set true to use original fieldnames (default is to camelCase)
1045
+ * emit_defaults: set true to emit 0/false values (default is to omit them)
1046
+ */
1047
+ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1048
+ Message* msg = ruby_to_Message(argv[0]);
1049
+ int options = 0;
1050
+ char buf[1024];
1051
+ size_t size;
1052
+ upb_status status;
1053
+
1054
+ // TODO(haberman): use this message's pool instead.
1055
+ const upb_symtab *symtab = DescriptorPool_GetSymtab(generated_pool);
1056
+
1057
+ if (argc < 1 || argc > 2) {
1058
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1059
+ }
1060
+
1061
+ if (argc == 2) {
1062
+ VALUE hash_args = argv[1];
1063
+ if (TYPE(hash_args) != T_HASH) {
1064
+ rb_raise(rb_eArgError, "Expected hash arguments.");
1065
+ }
1066
+
1067
+ if (RTEST(rb_hash_lookup2(hash_args,
1068
+ ID2SYM(rb_intern("preserve_proto_fieldnames")),
1069
+ Qfalse))) {
1070
+ options |= UPB_JSONENC_PROTONAMES;
1071
+ }
1072
+
1073
+ if (RTEST(rb_hash_lookup2(hash_args, ID2SYM(rb_intern("emit_defaults")),
1074
+ Qfalse))) {
1075
+ options |= UPB_JSONENC_EMITDEFAULTS;
1076
+ }
1077
+ }
1078
+
1079
+ upb_status_clear(&status);
1080
+ size = upb_json_encode(msg->msg, msg->msgdef, symtab, options, buf,
1081
+ sizeof(buf), &status);
1082
+
1083
+ if (!upb_ok(&status)) {
1084
+ rb_raise(cParseError, "Error occurred during encoding: %s",
1085
+ upb_status_errmsg(&status));
1086
+ }
1087
+
1088
+ VALUE ret;
1089
+ if (size >= sizeof(buf)) {
1090
+ char* buf2 = malloc(size + 1);
1091
+ upb_json_encode(msg->msg, msg->msgdef, symtab, options, buf2, size + 1,
1092
+ &status);
1093
+ ret = rb_str_new(buf2, size);
1094
+ free(buf2);
1095
+ } else {
1096
+ ret = rb_str_new(buf, size);
1097
+ }
1098
+
1099
+ rb_enc_associate(ret, rb_utf8_encoding());
1100
+ return ret;
1101
+ }
1102
+
697
1103
  /*
698
1104
  * call-seq:
699
1105
  * Message.descriptor => descriptor
@@ -701,16 +1107,15 @@ VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
701
1107
  * Class method that returns the Descriptor instance corresponding to this
702
1108
  * message class's type.
703
1109
  */
704
- VALUE Message_descriptor(VALUE klass) {
1110
+ static VALUE Message_descriptor(VALUE klass) {
705
1111
  return rb_ivar_get(klass, descriptor_instancevar_interned);
706
1112
  }
707
1113
 
708
1114
  VALUE build_class_from_descriptor(VALUE descriptor) {
709
- Descriptor* desc = ruby_to_Descriptor(descriptor);
710
1115
  const char *name;
711
1116
  VALUE klass;
712
1117
 
713
- name = upb_msgdef_fullname(desc->msgdef);
1118
+ name = upb_msgdef_fullname(Descriptor_GetMsgDef(descriptor));
714
1119
  if (name == NULL) {
715
1120
  rb_raise(rb_eRuntimeError, "Descriptor does not have assigned name.");
716
1121
  }
@@ -737,6 +1142,7 @@ VALUE build_class_from_descriptor(VALUE descriptor) {
737
1142
  rb_define_method(klass, "clone", Message_dup, 0);
738
1143
  rb_define_method(klass, "==", Message_eq, 1);
739
1144
  rb_define_method(klass, "eql?", Message_eq, 1);
1145
+ rb_define_method(klass, "freeze", Message_freeze, 0);
740
1146
  rb_define_method(klass, "hash", Message_hash, 0);
741
1147
  rb_define_method(klass, "to_h", Message_to_h, 0);
742
1148
  rb_define_method(klass, "inspect", Message_inspect, 0);
@@ -759,12 +1165,12 @@ VALUE build_class_from_descriptor(VALUE descriptor) {
759
1165
  * This module method, provided on each generated enum module, looks up an enum
760
1166
  * value by number and returns its name as a Ruby symbol, or nil if not found.
761
1167
  */
762
- VALUE enum_lookup(VALUE self, VALUE number) {
1168
+ static VALUE enum_lookup(VALUE self, VALUE number) {
763
1169
  int32_t num = NUM2INT(number);
764
1170
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
765
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
1171
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(desc);
766
1172
 
767
- const char* name = upb_enumdef_iton(enumdesc->enumdef, num);
1173
+ const char* name = upb_enumdef_iton(e, num);
768
1174
  if (name == NULL) {
769
1175
  return Qnil;
770
1176
  } else {
@@ -779,13 +1185,13 @@ VALUE enum_lookup(VALUE self, VALUE number) {
779
1185
  * This module method, provided on each generated enum module, looks up an enum
780
1186
  * value by name (as a Ruby symbol) and returns its name, or nil if not found.
781
1187
  */
782
- VALUE enum_resolve(VALUE self, VALUE sym) {
1188
+ static VALUE enum_resolve(VALUE self, VALUE sym) {
783
1189
  const char* name = rb_id2name(SYM2ID(sym));
784
1190
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
785
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
1191
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(desc);
786
1192
 
787
1193
  int32_t num = 0;
788
- bool found = upb_enumdef_ntoiz(enumdesc->enumdef, name, &num);
1194
+ bool found = upb_enumdef_ntoiz(e, name, &num);
789
1195
  if (!found) {
790
1196
  return Qnil;
791
1197
  } else {
@@ -800,17 +1206,16 @@ VALUE enum_resolve(VALUE self, VALUE sym) {
800
1206
  * This module method, provided on each generated enum module, returns the
801
1207
  * EnumDescriptor corresponding to this enum type.
802
1208
  */
803
- VALUE enum_descriptor(VALUE self) {
1209
+ static VALUE enum_descriptor(VALUE self) {
804
1210
  return rb_ivar_get(self, descriptor_instancevar_interned);
805
1211
  }
806
1212
 
807
1213
  VALUE build_module_from_enumdesc(VALUE _enumdesc) {
808
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(_enumdesc);
809
- VALUE mod = rb_define_module_id(
810
- rb_intern(upb_enumdef_fullname(enumdesc->enumdef)));
1214
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(_enumdesc);
1215
+ VALUE mod = rb_define_module_id(rb_intern(upb_enumdef_fullname(e)));
811
1216
 
812
1217
  upb_enum_iter it;
813
- for (upb_enum_begin(&it, enumdesc->enumdef);
1218
+ for (upb_enum_begin(&it, e);
814
1219
  !upb_enum_done(&it);
815
1220
  upb_enum_next(&it)) {
816
1221
  const char* name = upb_enum_iter_name(&it);
@@ -831,20 +1236,94 @@ VALUE build_module_from_enumdesc(VALUE _enumdesc) {
831
1236
  return mod;
832
1237
  }
833
1238
 
834
- /*
835
- * call-seq:
836
- * Google::Protobuf.deep_copy(obj) => copy_of_obj
837
- *
838
- * Performs a deep copy of a RepeatedField instance, a Map instance, or a
839
- * message object, recursively copying its members.
840
- */
841
- VALUE Google_Protobuf_deep_copy(VALUE self, VALUE obj) {
842
- VALUE klass = CLASS_OF(obj);
843
- if (klass == cRepeatedField) {
844
- return RepeatedField_deep_copy(obj);
845
- } else if (klass == cMap) {
846
- return Map_deep_copy(obj);
847
- } else {
848
- return Message_deep_copy(obj);
1239
+ // Internal only; used by Google::Protobuf.deep_copy.
1240
+ upb_msg* Message_deep_copy(const upb_msg* msg, const upb_msgdef* m,
1241
+ upb_arena *arena) {
1242
+ // Serialize and parse.
1243
+ upb_arena *tmp_arena = upb_arena_new();
1244
+ const upb_msglayout *layout = upb_msgdef_layout(m);
1245
+ size_t size;
1246
+
1247
+ char* data = upb_encode_ex(msg, layout, 0, tmp_arena, &size);
1248
+ upb_msg* new_msg = upb_msg_new(m, arena);
1249
+
1250
+ if (!data || !upb_decode(data, size, new_msg, layout, arena)) {
1251
+ upb_arena_free(tmp_arena);
1252
+ rb_raise(cParseError, "Error occurred copying proto");
1253
+ }
1254
+
1255
+ upb_arena_free(tmp_arena);
1256
+ return new_msg;
1257
+ }
1258
+
1259
+ const upb_msg* Message_GetUpbMessage(VALUE value, const upb_msgdef* m,
1260
+ const char* name, upb_arena* arena) {
1261
+ if (value == Qnil) {
1262
+ rb_raise(cTypeError, "nil message not allowed here.");
1263
+ }
1264
+
1265
+ VALUE klass = CLASS_OF(value);
1266
+ VALUE desc_rb = rb_ivar_get(klass, descriptor_instancevar_interned);
1267
+ const upb_msgdef* val_m =
1268
+ desc_rb == Qnil ? NULL : Descriptor_GetMsgDef(desc_rb);
1269
+
1270
+ if (val_m != m) {
1271
+ // Check for possible implicit conversions
1272
+ // TODO: hash conversion?
1273
+
1274
+ switch (upb_msgdef_wellknowntype(m)) {
1275
+ case UPB_WELLKNOWN_TIMESTAMP: {
1276
+ // Time -> Google::Protobuf::Timestamp
1277
+ upb_msg *msg = upb_msg_new(m, arena);
1278
+ upb_msgval sec, nsec;
1279
+ struct timespec time;
1280
+ const upb_fielddef *sec_f = upb_msgdef_itof(m, 1);
1281
+ const upb_fielddef *nsec_f = upb_msgdef_itof(m, 2);
1282
+
1283
+ if (!rb_obj_is_kind_of(value, rb_cTime)) goto badtype;
1284
+
1285
+ time = rb_time_timespec(value);
1286
+ sec.int64_val = time.tv_sec;
1287
+ nsec.int32_val = time.tv_nsec;
1288
+ upb_msg_set(msg, sec_f, sec, arena);
1289
+ upb_msg_set(msg, nsec_f, nsec, arena);
1290
+ return msg;
1291
+ }
1292
+ case UPB_WELLKNOWN_DURATION: {
1293
+ // Numeric -> Google::Protobuf::Duration
1294
+ upb_msg *msg = upb_msg_new(m, arena);
1295
+ upb_msgval sec, nsec;
1296
+ const upb_fielddef *sec_f = upb_msgdef_itof(m, 1);
1297
+ const upb_fielddef *nsec_f = upb_msgdef_itof(m, 2);
1298
+
1299
+ if (!rb_obj_is_kind_of(value, rb_cNumeric)) goto badtype;
1300
+
1301
+ sec.int64_val = NUM2LL(value);
1302
+ nsec.int32_val = round((NUM2DBL(value) - NUM2LL(value)) * 1000000000);
1303
+ upb_msg_set(msg, sec_f, sec, arena);
1304
+ upb_msg_set(msg, nsec_f, nsec, arena);
1305
+ return msg;
1306
+ }
1307
+ default:
1308
+ badtype:
1309
+ rb_raise(cTypeError,
1310
+ "Invalid type %s to assign to submessage field '%s'.",
1311
+ rb_class2name(CLASS_OF(value)), name);
1312
+ }
1313
+
849
1314
  }
1315
+
1316
+ Message* self = ruby_to_Message(value);
1317
+ Arena_fuse(self->arena, arena);
1318
+
1319
+ return self->msg;
1320
+ }
1321
+
1322
+ void Message_register(VALUE protobuf) {
1323
+ cParseError = rb_const_get(protobuf, rb_intern("ParseError"));
1324
+
1325
+ // Ruby-interned string: "descriptor". We use this identifier to store an
1326
+ // instance variable on message classes we create in order to link them back
1327
+ // to their descriptors.
1328
+ descriptor_instancevar_interned = rb_intern("descriptor");
850
1329
  }