google-protobuf 3.11.3 → 3.15.5

Sign up to get free protection for your applications and to get access to all the features.

Potentially problematic release.


This version of google-protobuf might be problematic. Click here for more details.

@@ -0,0 +1,66 @@
1
+ // Protocol Buffers - Google's data interchange format
2
+ // Copyright 2008 Google Inc. All rights reserved.
3
+ // https://developers.google.com/protocol-buffers/
4
+ //
5
+ // Redistribution and use in source and binary forms, with or without
6
+ // modification, are permitted provided that the following conditions are
7
+ // met:
8
+ //
9
+ // * Redistributions of source code must retain the above copyright
10
+ // notice, this list of conditions and the following disclaimer.
11
+ // * Redistributions in binary form must reproduce the above
12
+ // copyright notice, this list of conditions and the following disclaimer
13
+ // in the documentation and/or other materials provided with the
14
+ // distribution.
15
+ // * Neither the name of Google Inc. nor the names of its
16
+ // contributors may be used to endorse or promote products derived from
17
+ // this software without specific prior written permission.
18
+ //
19
+ // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20
+ // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21
+ // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22
+ // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
23
+ // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24
+ // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
25
+ // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26
+ // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27
+ // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28
+ // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29
+ // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
+
31
+ #ifndef RUBY_PROTOBUF_MAP_H_
32
+ #define RUBY_PROTOBUF_MAP_H_
33
+
34
+ #include <ruby/ruby.h>
35
+
36
+ #include "protobuf.h"
37
+ #include "ruby-upb.h"
38
+
39
+ // Returns a Ruby wrapper object for the given map, which will be created if
40
+ // one does not exist already.
41
+ VALUE Map_GetRubyWrapper(upb_map *map, upb_fieldtype_t key_type,
42
+ TypeInfo value_type, VALUE arena);
43
+
44
+ // Gets the underlying upb_map for this Ruby map object, which must have
45
+ // key/value types that match |field|. If this is not a map or the types don't
46
+ // match, raises an exception.
47
+ const upb_map *Map_GetUpbMap(VALUE val, const upb_fielddef *field);
48
+
49
+ // Implements #inspect for this map by appending its contents to |b|.
50
+ void Map_Inspect(StringBuilder *b, const upb_map *map, upb_fieldtype_t key_type,
51
+ TypeInfo val_type);
52
+
53
+ // Returns a new Hash object containing the contents of this Map.
54
+ VALUE Map_CreateHash(const upb_map* map, upb_fieldtype_t key_type,
55
+ TypeInfo val_info);
56
+
57
+ // Returns a deep copy of this Map object.
58
+ VALUE Map_deep_copy(VALUE obj);
59
+
60
+ // Ruby class of Google::Protobuf::Map.
61
+ extern VALUE cMap;
62
+
63
+ // Call at startup to register all types in this module.
64
+ void Map_register(VALUE module);
65
+
66
+ #endif // RUBY_PROTOBUF_MAP_H_
@@ -28,49 +28,61 @@
28
28
  // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29
29
  // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
30
 
31
+ #include "message.h"
32
+
33
+ #include "convert.h"
34
+ #include "defs.h"
35
+ #include "map.h"
31
36
  #include "protobuf.h"
37
+ #include "repeated_field.h"
38
+ #include "third_party/wyhash/wyhash.h"
32
39
 
33
- // -----------------------------------------------------------------------------
34
- // Class/module creation from msgdefs and enumdefs, respectively.
35
- // -----------------------------------------------------------------------------
40
+ static VALUE cParseError = Qnil;
41
+ static ID descriptor_instancevar_interned;
36
42
 
37
- void* Message_data(void* msg) {
38
- return ((uint8_t *)msg) + sizeof(MessageHeader);
43
+ static VALUE initialize_rb_class_with_no_args(VALUE klass) {
44
+ return rb_funcall(klass, rb_intern("new"), 0);
39
45
  }
40
46
 
41
- void Message_mark(void* _self) {
42
- MessageHeader* self = (MessageHeader *)_self;
43
- layout_mark(self->descriptor->layout, Message_data(self));
47
+ VALUE MessageOrEnum_GetDescriptor(VALUE klass) {
48
+ return rb_ivar_get(klass, descriptor_instancevar_interned);
44
49
  }
45
50
 
46
- void Message_free(void* self) {
47
- stringsink* unknown = ((MessageHeader *)self)->unknown_fields;
48
- if (unknown != NULL) {
49
- stringsink_uninit(unknown);
50
- free(unknown);
51
- }
52
- xfree(self);
51
+ // -----------------------------------------------------------------------------
52
+ // Class/module creation from msgdefs and enumdefs, respectively.
53
+ // -----------------------------------------------------------------------------
54
+
55
+ typedef struct {
56
+ VALUE arena;
57
+ const upb_msg* msg; // Can get as mutable when non-frozen.
58
+ const upb_msgdef* msgdef; // kept alive by self.class.descriptor reference.
59
+ } Message;
60
+
61
+ static void Message_mark(void* _self) {
62
+ Message* self = (Message *)_self;
63
+ rb_gc_mark(self->arena);
53
64
  }
54
65
 
55
- rb_data_type_t Message_type = {
66
+ static rb_data_type_t Message_type = {
56
67
  "Message",
57
- { Message_mark, Message_free, NULL },
68
+ { Message_mark, RUBY_DEFAULT_FREE, NULL },
69
+ .flags = RUBY_TYPED_FREE_IMMEDIATELY,
58
70
  };
59
71
 
60
- VALUE Message_alloc(VALUE klass) {
72
+ static Message* ruby_to_Message(VALUE msg_rb) {
73
+ Message* msg;
74
+ TypedData_Get_Struct(msg_rb, Message, &Message_type, msg);
75
+ return msg;
76
+ }
77
+
78
+ static VALUE Message_alloc(VALUE klass) {
61
79
  VALUE descriptor = rb_ivar_get(klass, descriptor_instancevar_interned);
62
- Descriptor* desc = ruby_to_Descriptor(descriptor);
63
- MessageHeader* msg;
80
+ Message* msg = ALLOC(Message);
64
81
  VALUE ret;
65
82
 
66
- if (desc->layout == NULL) {
67
- create_layout(desc);
68
- }
69
-
70
- msg = (void*)ALLOC_N(uint8_t, sizeof(MessageHeader) + desc->layout->size);
71
- msg->descriptor = desc;
72
- msg->unknown_fields = NULL;
73
- memcpy(Message_data(msg), desc->layout->empty_template, desc->layout->size);
83
+ msg->msgdef = Descriptor_GetMsgDef(descriptor);
84
+ msg->arena = Qnil;
85
+ msg->msg = NULL;
74
86
 
75
87
  ret = TypedData_Wrap_Struct(klass, &Message_type, msg);
76
88
  rb_ivar_set(ret, descriptor_instancevar_interned, descriptor);
@@ -78,24 +90,92 @@ VALUE Message_alloc(VALUE klass) {
78
90
  return ret;
79
91
  }
80
92
 
81
- static const upb_fielddef* which_oneof_field(MessageHeader* self, const upb_oneofdef* o) {
82
- uint32_t oneof_case;
83
- const upb_fielddef* f;
93
+ const upb_msg *Message_Get(VALUE msg_rb, const upb_msgdef **m) {
94
+ Message* msg = ruby_to_Message(msg_rb);
95
+ if (m) *m = msg->msgdef;
96
+ return msg->msg;
97
+ }
98
+
99
+ upb_msg *Message_GetMutable(VALUE msg_rb, const upb_msgdef **m) {
100
+ rb_check_frozen(msg_rb);
101
+ return (upb_msg*)Message_Get(msg_rb, m);
102
+ }
103
+
104
+ void Message_InitPtr(VALUE self_, upb_msg *msg, VALUE arena) {
105
+ Message* self = ruby_to_Message(self_);
106
+ self->msg = msg;
107
+ self->arena = arena;
108
+ ObjectCache_Add(msg, self_);
109
+ }
110
+
111
+ VALUE Message_GetArena(VALUE msg_rb) {
112
+ Message* msg = ruby_to_Message(msg_rb);
113
+ return msg->arena;
114
+ }
115
+
116
+ void Message_CheckClass(VALUE klass) {
117
+ if (rb_get_alloc_func(klass) != &Message_alloc) {
118
+ rb_raise(rb_eArgError,
119
+ "Message class was not returned by the DescriptorPool.");
120
+ }
121
+ }
122
+
123
+ VALUE Message_GetRubyWrapper(upb_msg* msg, const upb_msgdef* m, VALUE arena) {
124
+ if (msg == NULL) return Qnil;
84
125
 
85
- oneof_case =
86
- slot_read_oneof_case(self->descriptor->layout, Message_data(self), o);
126
+ VALUE val = ObjectCache_Get(msg);
87
127
 
88
- if (oneof_case == ONEOF_CASE_NONE) {
89
- return NULL;
128
+ if (val == Qnil) {
129
+ VALUE klass = Descriptor_DefToClass(m);
130
+ val = Message_alloc(klass);
131
+ Message_InitPtr(val, msg, arena);
90
132
  }
91
133
 
92
- // oneof_case is a field index, so find that field.
93
- f = upb_oneofdef_itof(o, oneof_case);
94
- assert(f != NULL);
134
+ return val;
135
+ }
136
+
137
+ void Message_PrintMessage(StringBuilder* b, const upb_msg* msg,
138
+ const upb_msgdef* m) {
139
+ bool first = true;
140
+ int n = upb_msgdef_fieldcount(m);
141
+ VALUE klass = Descriptor_DefToClass(m);
142
+ StringBuilder_Printf(b, "<%s: ", rb_class2name(klass));
143
+
144
+ for (int i = 0; i < n; i++) {
145
+ const upb_fielddef* field = upb_msgdef_field(m, i);
146
+
147
+ if (upb_fielddef_haspresence(field) && !upb_msg_has(msg, field)) {
148
+ continue;
149
+ }
150
+
151
+ if (!first) {
152
+ StringBuilder_Printf(b, ", ");
153
+ } else {
154
+ first = false;
155
+ }
156
+
157
+ upb_msgval msgval = upb_msg_get(msg, field);
158
+
159
+ StringBuilder_Printf(b, "%s: ", upb_fielddef_name(field));
160
+
161
+ if (upb_fielddef_ismap(field)) {
162
+ const upb_msgdef* entry_m = upb_fielddef_msgsubdef(field);
163
+ const upb_fielddef* key_f = upb_msgdef_itof(entry_m, 1);
164
+ const upb_fielddef* val_f = upb_msgdef_itof(entry_m, 2);
165
+ TypeInfo val_info = TypeInfo_get(val_f);
166
+ Map_Inspect(b, msgval.map_val, upb_fielddef_type(key_f), val_info);
167
+ } else if (upb_fielddef_isseq(field)) {
168
+ RepeatedField_Inspect(b, msgval.array_val, TypeInfo_get(field));
169
+ } else {
170
+ StringBuilder_PrintMsgval(b, msgval, TypeInfo_get(field));
171
+ }
172
+ }
95
173
 
96
- return f;
174
+ StringBuilder_Printf(b, ">");
97
175
  }
98
176
 
177
+ // Helper functions for #method_missing ////////////////////////////////////////
178
+
99
179
  enum {
100
180
  METHOD_UNKNOWN = 0,
101
181
  METHOD_GETTER = 1,
@@ -108,148 +188,203 @@ enum {
108
188
  };
109
189
 
110
190
  // Check if the field is a well-known wrapper type.
111
- bool is_wrapper_type_field(const upb_fielddef* field) {
112
- const upb_msgdef *m;
113
- if (upb_fielddef_type(field) != UPB_TYPE_MESSAGE) {
191
+ static bool IsWrapper(const upb_fielddef* f) {
192
+ return upb_fielddef_issubmsg(f) &&
193
+ upb_msgdef_iswrapper(upb_fielddef_msgsubdef(f));
194
+ }
195
+
196
+ static bool Match(const upb_msgdef* m, const char* name, const upb_fielddef** f,
197
+ const upb_oneofdef** o, const char* prefix,
198
+ const char* suffix) {
199
+ size_t sp = strlen(prefix);
200
+ size_t ss = strlen(suffix);
201
+ size_t sn = strlen(name);
202
+
203
+ if (sn <= sp + ss) return false;
204
+
205
+ if (memcmp(name, prefix, sp) != 0 ||
206
+ memcmp(name + sn - ss, suffix, ss) != 0) {
114
207
  return false;
115
208
  }
116
- m = upb_fielddef_msgsubdef(field);
117
- switch (upb_msgdef_wellknowntype(m)) {
118
- case UPB_WELLKNOWN_DOUBLEVALUE:
119
- case UPB_WELLKNOWN_FLOATVALUE:
120
- case UPB_WELLKNOWN_INT64VALUE:
121
- case UPB_WELLKNOWN_UINT64VALUE:
122
- case UPB_WELLKNOWN_INT32VALUE:
123
- case UPB_WELLKNOWN_UINT32VALUE:
124
- case UPB_WELLKNOWN_STRINGVALUE:
125
- case UPB_WELLKNOWN_BYTESVALUE:
126
- case UPB_WELLKNOWN_BOOLVALUE:
127
- return true;
128
- default:
129
- return false;
130
- }
209
+
210
+ return upb_msgdef_lookupname(m, name + sp, sn - sp - ss, f, o);
131
211
  }
132
212
 
133
- // Get a new Ruby wrapper type and set the initial value
134
- VALUE ruby_wrapper_type(VALUE type_class, VALUE value) {
135
- if (value != Qnil) {
136
- VALUE hash = rb_hash_new();
137
- rb_hash_aset(hash, rb_str_new2("value"), value);
138
- {
139
- VALUE args[1] = {hash};
140
- return rb_class_new_instance(1, args, type_class);
213
+ static int extract_method_call(VALUE method_name, Message* self,
214
+ const upb_fielddef** f, const upb_oneofdef** o) {
215
+ const upb_msgdef* m = self->msgdef;
216
+ const char* name;
217
+
218
+ Check_Type(method_name, T_SYMBOL);
219
+ name = rb_id2name(SYM2ID(method_name));
220
+
221
+ if (Match(m, name, f, o, "", "")) return METHOD_GETTER;
222
+ if (Match(m, name, f, o, "", "=")) return METHOD_SETTER;
223
+ if (Match(m, name, f, o, "clear_", "")) return METHOD_CLEAR;
224
+ if (Match(m, name, f, o, "has_", "?") &&
225
+ (*o || (*f && upb_fielddef_haspresence(*f)))) {
226
+ // Disallow oneof hazzers for proto3.
227
+ // TODO(haberman): remove this test when we are enabling oneof hazzers for
228
+ // proto3.
229
+ if (*f && !upb_fielddef_issubmsg(*f) &&
230
+ upb_fielddef_realcontainingoneof(*f) &&
231
+ upb_msgdef_syntax(upb_fielddef_containingtype(*f)) !=
232
+ UPB_SYNTAX_PROTO2) {
233
+ return METHOD_UNKNOWN;
141
234
  }
235
+ return METHOD_PRESENCE;
236
+ }
237
+ if (Match(m, name, f, o, "", "_as_value") && *f && !upb_fielddef_isseq(*f) &&
238
+ IsWrapper(*f)) {
239
+ return METHOD_WRAPPER_GETTER;
240
+ }
241
+ if (Match(m, name, f, o, "", "_as_value=") && *f && !upb_fielddef_isseq(*f) &&
242
+ IsWrapper(*f)) {
243
+ return METHOD_WRAPPER_SETTER;
244
+ }
245
+ if (Match(m, name, f, o, "", "_const") && *f &&
246
+ upb_fielddef_type(*f) == UPB_TYPE_ENUM) {
247
+ return METHOD_ENUM_GETTER;
142
248
  }
143
- return Qnil;
144
- }
145
249
 
146
- static int extract_method_call(VALUE method_name, MessageHeader* self,
147
- const upb_fielddef **f, const upb_oneofdef **o) {
148
- VALUE method_str;
149
- char* name;
150
- size_t name_len;
151
- int accessor_type;
152
- const upb_oneofdef* test_o;
153
- const upb_fielddef* test_f;
154
- bool has_field;
250
+ return METHOD_UNKNOWN;
251
+ }
155
252
 
156
- Check_Type(method_name, T_SYMBOL);
253
+ static VALUE Message_oneof_accessor(VALUE _self, const upb_oneofdef* o,
254
+ int accessor_type) {
255
+ Message* self = ruby_to_Message(_self);
256
+ const upb_fielddef* oneof_field = upb_msg_whichoneof(self->msg, o);
157
257
 
158
- method_str = rb_id2str(SYM2ID(method_name));
159
- name = RSTRING_PTR(method_str);
160
- name_len = RSTRING_LEN(method_str);
161
-
162
- if (name[name_len - 1] == '=') {
163
- accessor_type = METHOD_SETTER;
164
- name_len--;
165
- // We want to ensure if the proto has something named clear_foo or has_foo?,
166
- // we don't strip the prefix.
167
- } else if (strncmp("clear_", name, 6) == 0 &&
168
- !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
169
- &test_f, &test_o)) {
170
- accessor_type = METHOD_CLEAR;
171
- name = name + 6;
172
- name_len = name_len - 6;
173
- } else if (strncmp("has_", name, 4) == 0 && name[name_len - 1] == '?' &&
174
- !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
175
- &test_f, &test_o)) {
176
- accessor_type = METHOD_PRESENCE;
177
- name = name + 4;
178
- name_len = name_len - 5;
179
- } else {
180
- accessor_type = METHOD_GETTER;
181
- }
182
-
183
- has_field = upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
184
- &test_f, &test_o);
185
-
186
- // Look for wrapper type accessor of the form <field_name>_as_value
187
- if (!has_field &&
188
- (accessor_type == METHOD_GETTER || accessor_type == METHOD_SETTER) &&
189
- name_len > 9 && strncmp(name + name_len - 9, "_as_value", 9) == 0) {
190
- const upb_oneofdef* test_o_wrapper;
191
- const upb_fielddef* test_f_wrapper;
192
- char wrapper_field_name[name_len - 8];
193
-
194
- // Find the field name
195
- strncpy(wrapper_field_name, name, name_len - 9);
196
- wrapper_field_name[name_len - 9] = '\0';
197
-
198
- // Check if field exists and is a wrapper type
199
- if (upb_msgdef_lookupname(self->descriptor->msgdef, wrapper_field_name,
200
- name_len - 9, &test_f_wrapper, &test_o_wrapper) &&
201
- is_wrapper_type_field(test_f_wrapper)) {
202
- // It does exist!
203
- has_field = true;
204
- if (accessor_type == METHOD_SETTER) {
205
- accessor_type = METHOD_WRAPPER_SETTER;
206
- } else {
207
- accessor_type = METHOD_WRAPPER_GETTER;
258
+ switch (accessor_type) {
259
+ case METHOD_PRESENCE:
260
+ return oneof_field == NULL ? Qfalse : Qtrue;
261
+ case METHOD_CLEAR:
262
+ if (oneof_field != NULL) {
263
+ upb_msg_clearfield(Message_GetMutable(_self, NULL), oneof_field);
208
264
  }
209
- test_o = test_o_wrapper;
210
- test_f = test_f_wrapper;
211
- }
265
+ return Qnil;
266
+ case METHOD_GETTER:
267
+ return oneof_field == NULL
268
+ ? Qnil
269
+ : ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
270
+ case METHOD_SETTER:
271
+ rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
212
272
  }
273
+ rb_raise(rb_eRuntimeError, "Invalid access of oneof field.");
274
+ }
213
275
 
214
- // Look for enum accessor of the form <enum_name>_const
215
- if (!has_field && accessor_type == METHOD_GETTER &&
216
- name_len > 6 && strncmp(name + name_len - 6, "_const", 6) == 0) {
217
- const upb_oneofdef* test_o_enum;
218
- const upb_fielddef* test_f_enum;
219
- char enum_name[name_len - 5];
220
-
221
- // Find enum field name
222
- strncpy(enum_name, name, name_len - 6);
223
- enum_name[name_len - 6] = '\0';
224
-
225
- // Check if enum field exists
226
- if (upb_msgdef_lookupname(self->descriptor->msgdef, enum_name, name_len - 6,
227
- &test_f_enum, &test_o_enum) &&
228
- upb_fielddef_type(test_f_enum) == UPB_TYPE_ENUM) {
229
- // It does exist!
230
- has_field = true;
231
- accessor_type = METHOD_ENUM_GETTER;
232
- test_o = test_o_enum;
233
- test_f = test_f_enum;
276
+ static void Message_setfield(upb_msg* msg, const upb_fielddef* f, VALUE val,
277
+ upb_arena* arena) {
278
+ upb_msgval msgval;
279
+ if (upb_fielddef_ismap(f)) {
280
+ msgval.map_val = Map_GetUpbMap(val, f);
281
+ } else if (upb_fielddef_isseq(f)) {
282
+ msgval.array_val = RepeatedField_GetUpbArray(val, f);
283
+ } else {
284
+ if (val == Qnil &&
285
+ (upb_fielddef_issubmsg(f) || upb_fielddef_realcontainingoneof(f))) {
286
+ upb_msg_clearfield(msg, f);
287
+ return;
234
288
  }
289
+ msgval =
290
+ Convert_RubyToUpb(val, upb_fielddef_name(f), TypeInfo_get(f), arena);
235
291
  }
292
+ upb_msg_set(msg, f, msgval, arena);
293
+ }
236
294
 
237
- // Verify the name corresponds to a oneof or field in this message.
238
- if (!has_field) {
239
- return METHOD_UNKNOWN;
295
+ VALUE Message_getfield(VALUE _self, const upb_fielddef* f) {
296
+ Message* self = ruby_to_Message(_self);
297
+ // This is a special case: upb_msg_mutable() calls for map & array are logically
298
+ // const (they will not change what is serialized) but physically
299
+ // non-const, as they do allocate a repeated field or map. The logical
300
+ // constness means it's ok to do even if the message is frozen.
301
+ upb_msg *msg = (upb_msg*)self->msg;
302
+ upb_arena *arena = Arena_get(self->arena);
303
+ if (upb_fielddef_ismap(f)) {
304
+ upb_map *map = upb_msg_mutable(msg, f, arena).map;
305
+ const upb_fielddef *key_f = map_field_key(f);
306
+ const upb_fielddef *val_f = map_field_value(f);
307
+ upb_fieldtype_t key_type = upb_fielddef_type(key_f);
308
+ TypeInfo value_type_info = TypeInfo_get(val_f);
309
+ return Map_GetRubyWrapper(map, key_type, value_type_info, self->arena);
310
+ } else if (upb_fielddef_isseq(f)) {
311
+ upb_array *arr = upb_msg_mutable(msg, f, arena).array;
312
+ return RepeatedField_GetRubyWrapper(arr, TypeInfo_get(f), self->arena);
313
+ } else if (upb_fielddef_issubmsg(f)) {
314
+ if (!upb_msg_has(self->msg, f)) return Qnil;
315
+ upb_msg *submsg = upb_msg_mutable(msg, f, arena).msg;
316
+ const upb_msgdef *m = upb_fielddef_msgsubdef(f);
317
+ return Message_GetRubyWrapper(submsg, m, self->arena);
318
+ } else {
319
+ upb_msgval msgval = upb_msg_get(self->msg, f);
320
+ return Convert_UpbToRuby(msgval, TypeInfo_get(f), self->arena);
240
321
  }
322
+ }
241
323
 
242
- // Method calls like 'has_foo?' are not allowed if field "foo" does not have
243
- // a hasbit (e.g. repeated fields or non-message type fields for proto3
244
- // syntax).
245
- if (accessor_type == METHOD_PRESENCE && test_f != NULL &&
246
- !upb_fielddef_haspresence(test_f)) {
247
- return METHOD_UNKNOWN;
248
- }
324
+ static VALUE Message_field_accessor(VALUE _self, const upb_fielddef* f,
325
+ int accessor_type, int argc, VALUE* argv) {
326
+ upb_arena *arena = Arena_get(Message_GetArena(_self));
249
327
 
250
- *o = test_o;
251
- *f = test_f;
252
- return accessor_type;
328
+ switch (accessor_type) {
329
+ case METHOD_SETTER:
330
+ Message_setfield(Message_GetMutable(_self, NULL), f, argv[1], arena);
331
+ return Qnil;
332
+ case METHOD_CLEAR:
333
+ upb_msg_clearfield(Message_GetMutable(_self, NULL), f);
334
+ return Qnil;
335
+ case METHOD_PRESENCE:
336
+ if (!upb_fielddef_haspresence(f)) {
337
+ rb_raise(rb_eRuntimeError, "Field does not have presence.");
338
+ }
339
+ return upb_msg_has(Message_Get(_self, NULL), f);
340
+ case METHOD_WRAPPER_GETTER: {
341
+ Message* self = ruby_to_Message(_self);
342
+ if (upb_msg_has(self->msg, f)) {
343
+ PBRUBY_ASSERT(upb_fielddef_issubmsg(f) && !upb_fielddef_isseq(f));
344
+ upb_msgval wrapper = upb_msg_get(self->msg, f);
345
+ const upb_msgdef *wrapper_m = upb_fielddef_msgsubdef(f);
346
+ const upb_fielddef *value_f = upb_msgdef_itof(wrapper_m, 1);
347
+ upb_msgval value = upb_msg_get(wrapper.msg_val, value_f);
348
+ return Convert_UpbToRuby(value, TypeInfo_get(value_f), self->arena);
349
+ } else {
350
+ return Qnil;
351
+ }
352
+ }
353
+ case METHOD_WRAPPER_SETTER: {
354
+ upb_msg *msg = Message_GetMutable(_self, NULL);
355
+ if (argv[1] == Qnil) {
356
+ upb_msg_clearfield(msg, f);
357
+ } else {
358
+ const upb_fielddef *val_f = upb_msgdef_itof(upb_fielddef_msgsubdef(f), 1);
359
+ upb_msgval msgval = Convert_RubyToUpb(argv[1], upb_fielddef_name(f),
360
+ TypeInfo_get(val_f), arena);
361
+ upb_msg *wrapper = upb_msg_mutable(msg, f, arena).msg;
362
+ upb_msg_set(wrapper, val_f, msgval, arena);
363
+ }
364
+ return Qnil;
365
+ }
366
+ case METHOD_ENUM_GETTER: {
367
+ upb_msgval msgval = upb_msg_get(Message_Get(_self, NULL), f);
368
+
369
+ if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
370
+ // Map repeated fields to a new type with ints
371
+ VALUE arr = rb_ary_new();
372
+ size_t i, n = upb_array_size(msgval.array_val);
373
+ for (i = 0; i < n; i++) {
374
+ upb_msgval elem = upb_array_get(msgval.array_val, i);
375
+ rb_ary_push(arr, INT2NUM(elem.int32_val));
376
+ }
377
+ return arr;
378
+ } else {
379
+ return INT2NUM(msgval.int32_val);
380
+ }
381
+ }
382
+ case METHOD_GETTER:
383
+ return Message_getfield(_self, f);
384
+ default:
385
+ rb_raise(rb_eRuntimeError, "Internal error, no such accessor: %d",
386
+ accessor_type);
387
+ }
253
388
  }
254
389
 
255
390
  /*
@@ -279,111 +414,56 @@ static int extract_method_call(VALUE method_name, MessageHeader* self,
279
414
  * true if the field 'fieldname' is set in the message object, else false. For
280
415
  * 'proto3' syntax, calling this for a basic type field will result in an error.
281
416
  */
282
- VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
283
- MessageHeader* self;
417
+ static VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
418
+ Message* self = ruby_to_Message(_self);
284
419
  const upb_oneofdef* o;
285
420
  const upb_fielddef* f;
286
421
  int accessor_type;
287
422
 
288
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
289
423
  if (argc < 1) {
290
424
  rb_raise(rb_eArgError, "Expected method name as first argument.");
291
425
  }
292
426
 
293
427
  accessor_type = extract_method_call(argv[0], self, &f, &o);
294
- if (accessor_type == METHOD_UNKNOWN || (o == NULL && f == NULL) ) {
295
- return rb_call_super(argc, argv);
296
- } else if (accessor_type == METHOD_SETTER || accessor_type == METHOD_WRAPPER_SETTER) {
297
- if (argc != 2) {
298
- rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
299
- }
300
- rb_check_frozen(_self);
301
- } else if (argc != 1) {
302
- rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
303
- }
304
-
305
- // Return which of the oneof fields are set
306
- if (o != NULL) {
307
- const upb_fielddef* oneof_field = which_oneof_field(self, o);
308
428
 
309
- if (accessor_type == METHOD_SETTER) {
310
- rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
311
- }
429
+ if (accessor_type == METHOD_UNKNOWN) return rb_call_super(argc, argv);
312
430
 
313
- if (accessor_type == METHOD_PRESENCE) {
314
- return oneof_field == NULL ? Qfalse : Qtrue;
315
- } else if (accessor_type == METHOD_CLEAR) {
316
- if (oneof_field != NULL) {
317
- layout_clear(self->descriptor->layout, Message_data(self), oneof_field);
431
+ // Validate argument count.
432
+ switch (accessor_type) {
433
+ case METHOD_SETTER:
434
+ case METHOD_WRAPPER_SETTER:
435
+ if (argc != 2) {
436
+ rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
318
437
  }
319
- return Qnil;
320
- } else {
321
- // METHOD_ACCESSOR
322
- return oneof_field == NULL ? Qnil :
323
- ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
324
- }
325
- // Otherwise we're operating on a single proto field
326
- } else if (accessor_type == METHOD_SETTER) {
327
- layout_set(self->descriptor->layout, Message_data(self), f, argv[1]);
328
- return Qnil;
329
- } else if (accessor_type == METHOD_CLEAR) {
330
- layout_clear(self->descriptor->layout, Message_data(self), f);
331
- return Qnil;
332
- } else if (accessor_type == METHOD_PRESENCE) {
333
- return layout_has(self->descriptor->layout, Message_data(self), f);
334
- } else if (accessor_type == METHOD_WRAPPER_GETTER) {
335
- VALUE value = layout_get(self->descriptor->layout, Message_data(self), f);
336
- switch (TYPE(value)) {
337
- case T_DATA:
338
- return rb_funcall(value, rb_intern("value"), 0);
339
- case T_NIL:
340
- return Qnil;
341
- default:
342
- return value;
343
- }
344
- } else if (accessor_type == METHOD_WRAPPER_SETTER) {
345
- VALUE wrapper = ruby_wrapper_type(
346
- field_type_class(self->descriptor->layout, f), argv[1]);
347
- layout_set(self->descriptor->layout, Message_data(self), f, wrapper);
348
- return Qnil;
349
- } else if (accessor_type == METHOD_ENUM_GETTER) {
350
- VALUE enum_type = field_type_class(self->descriptor->layout, f);
351
- VALUE method = rb_intern("const_get");
352
- VALUE raw_value = layout_get(self->descriptor->layout, Message_data(self), f);
353
-
354
- // Map repeated fields to a new type with ints
355
- if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
356
- int array_size = FIX2INT(rb_funcall(raw_value, rb_intern("length"), 0));
357
- int i;
358
- VALUE array_args[1] = { ID2SYM(rb_intern("int64")) };
359
- VALUE array = rb_class_new_instance(1, array_args, CLASS_OF(raw_value));
360
- for (i = 0; i < array_size; i++) {
361
- VALUE entry = rb_funcall(enum_type, method, 1, rb_funcall(raw_value,
362
- rb_intern("at"), 1, INT2NUM(i)));
363
- rb_funcall(array, rb_intern("push"), 1, entry);
438
+ rb_check_frozen(_self);
439
+ break;
440
+ default:
441
+ if (argc != 1) {
442
+ rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
364
443
  }
365
- return array;
366
- }
367
- // Convert the value for singular fields
368
- return rb_funcall(enum_type, method, 1, raw_value);
444
+ break;
445
+ }
446
+
447
+ // Dispatch accessor.
448
+ if (o != NULL) {
449
+ return Message_oneof_accessor(_self, o, accessor_type);
369
450
  } else {
370
- return layout_get(self->descriptor->layout, Message_data(self), f);
451
+ return Message_field_accessor(_self, f, accessor_type, argc, argv);
371
452
  }
372
453
  }
373
454
 
374
-
375
- VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
376
- MessageHeader* self;
455
+ static VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
456
+ Message* self = ruby_to_Message(_self);
377
457
  const upb_oneofdef* o;
378
458
  const upb_fielddef* f;
379
459
  int accessor_type;
380
460
 
381
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
382
461
  if (argc < 1) {
383
462
  rb_raise(rb_eArgError, "Expected method name as first argument.");
384
463
  }
385
464
 
386
465
  accessor_type = extract_method_call(argv[0], self, &f, &o);
466
+
387
467
  if (accessor_type == METHOD_UNKNOWN) {
388
468
  return rb_call_super(argc, argv);
389
469
  } else if (o != NULL) {
@@ -393,17 +473,116 @@ VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
393
473
  }
394
474
  }
395
475
 
396
- VALUE create_submsg_from_hash(const MessageLayout* layout,
397
- const upb_fielddef* f, VALUE hash) {
398
- VALUE args[1] = { hash };
399
- return rb_class_new_instance(1, args, field_type_class(layout, f));
476
+ void Message_InitFromValue(upb_msg* msg, const upb_msgdef* m, VALUE val,
477
+ upb_arena* arena);
478
+
479
+ typedef struct {
480
+ upb_map *map;
481
+ TypeInfo key_type;
482
+ TypeInfo val_type;
483
+ upb_arena *arena;
484
+ } MapInit;
485
+
486
+ static int Map_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
487
+ MapInit *map_init = (MapInit*)_self;
488
+ upb_msgval k, v;
489
+ k = Convert_RubyToUpb(key, "", map_init->key_type, NULL);
490
+
491
+ if (map_init->val_type.type == UPB_TYPE_MESSAGE && TYPE(val) == T_HASH) {
492
+ upb_msg *msg = upb_msg_new(map_init->val_type.def.msgdef, map_init->arena);
493
+ Message_InitFromValue(msg, map_init->val_type.def.msgdef, val,
494
+ map_init->arena);
495
+ v.msg_val = msg;
496
+ } else {
497
+ v = Convert_RubyToUpb(val, "", map_init->val_type, map_init->arena);
498
+ }
499
+ upb_map_set(map_init->map, k, v, map_init->arena);
500
+ return ST_CONTINUE;
400
501
  }
401
502
 
402
- int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
403
- MessageHeader* self;
404
- char *name;
405
- const upb_fielddef* f;
406
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
503
+ static void Map_InitFromValue(upb_map* map, const upb_fielddef* f, VALUE val,
504
+ upb_arena* arena) {
505
+ const upb_msgdef* entry_m = upb_fielddef_msgsubdef(f);
506
+ const upb_fielddef* key_f = upb_msgdef_itof(entry_m, 1);
507
+ const upb_fielddef* val_f = upb_msgdef_itof(entry_m, 2);
508
+ if (TYPE(val) != T_HASH) {
509
+ rb_raise(rb_eArgError,
510
+ "Expected Hash object as initializer value for map field '%s' "
511
+ "(given %s).",
512
+ upb_fielddef_name(f), rb_class2name(CLASS_OF(val)));
513
+ }
514
+ MapInit map_init = {map, TypeInfo_get(key_f), TypeInfo_get(val_f), arena};
515
+ rb_hash_foreach(val, Map_initialize_kwarg, (VALUE)&map_init);
516
+ }
517
+
518
+ static upb_msgval MessageValue_FromValue(VALUE val, TypeInfo info,
519
+ upb_arena* arena) {
520
+ if (info.type == UPB_TYPE_MESSAGE) {
521
+ upb_msgval msgval;
522
+ upb_msg* msg = upb_msg_new(info.def.msgdef, arena);
523
+ Message_InitFromValue(msg, info.def.msgdef, val, arena);
524
+ msgval.msg_val = msg;
525
+ return msgval;
526
+ } else {
527
+ return Convert_RubyToUpb(val, "", info, arena);
528
+ }
529
+ }
530
+
531
+ static void RepeatedField_InitFromValue(upb_array* arr, const upb_fielddef* f,
532
+ VALUE val, upb_arena* arena) {
533
+ TypeInfo type_info = TypeInfo_get(f);
534
+
535
+ if (TYPE(val) != T_ARRAY) {
536
+ rb_raise(rb_eArgError,
537
+ "Expected array as initializer value for repeated field '%s' (given %s).",
538
+ upb_fielddef_name(f), rb_class2name(CLASS_OF(val)));
539
+ }
540
+
541
+ for (int i = 0; i < RARRAY_LEN(val); i++) {
542
+ VALUE entry = rb_ary_entry(val, i);
543
+ upb_msgval msgval;
544
+ if (upb_fielddef_issubmsg(f) && TYPE(entry) == T_HASH) {
545
+ msgval = MessageValue_FromValue(entry, type_info, arena);
546
+ } else {
547
+ msgval = Convert_RubyToUpb(entry, upb_fielddef_name(f), type_info, arena);
548
+ }
549
+ upb_array_append(arr, msgval, arena);
550
+ }
551
+ }
552
+
553
+ static void Message_InitFieldFromValue(upb_msg* msg, const upb_fielddef* f,
554
+ VALUE val, upb_arena* arena) {
555
+ if (TYPE(val) == T_NIL) return;
556
+
557
+ if (upb_fielddef_ismap(f)) {
558
+ upb_map *map = upb_msg_mutable(msg, f, arena).map;
559
+ Map_InitFromValue(map, f, val, arena);
560
+ } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
561
+ upb_array *arr = upb_msg_mutable(msg, f, arena).array;
562
+ RepeatedField_InitFromValue(arr, f, val, arena);
563
+ } else if (upb_fielddef_issubmsg(f)) {
564
+ if (TYPE(val) == T_HASH) {
565
+ upb_msg *submsg = upb_msg_mutable(msg, f, arena).msg;
566
+ Message_InitFromValue(submsg, upb_fielddef_msgsubdef(f), val, arena);
567
+ } else {
568
+ Message_setfield(msg, f, val, arena);
569
+ }
570
+ } else {
571
+ upb_msgval msgval =
572
+ Convert_RubyToUpb(val, upb_fielddef_name(f), TypeInfo_get(f), arena);
573
+ upb_msg_set(msg, f, msgval, arena);
574
+ }
575
+ }
576
+
577
+ typedef struct {
578
+ upb_msg *msg;
579
+ const upb_msgdef *msgdef;
580
+ upb_arena *arena;
581
+ } MsgInit;
582
+
583
+ static int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
584
+ MsgInit *msg_init = (MsgInit*)_self;
585
+ const char *name;
407
586
 
408
587
  if (TYPE(key) == T_STRING) {
409
588
  name = RSTRING_PTR(key);
@@ -414,52 +593,26 @@ int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
414
593
  "Expected string or symbols as hash keys when initializing proto from hash.");
415
594
  }
416
595
 
417
- f = upb_msgdef_ntofz(self->descriptor->msgdef, name);
596
+ const upb_fielddef* f = upb_msgdef_ntofz(msg_init->msgdef, name);
597
+
418
598
  if (f == NULL) {
419
599
  rb_raise(rb_eArgError,
420
600
  "Unknown field name '%s' in initialization map entry.", name);
421
601
  }
422
602
 
423
- if (TYPE(val) == T_NIL) {
424
- return 0;
425
- }
426
-
427
- if (is_map_field(f)) {
428
- VALUE map;
429
-
430
- if (TYPE(val) != T_HASH) {
431
- rb_raise(rb_eArgError,
432
- "Expected Hash object as initializer value for map field '%s' (given %s).",
433
- name, rb_class2name(CLASS_OF(val)));
434
- }
435
- map = layout_get(self->descriptor->layout, Message_data(self), f);
436
- Map_merge_into_self(map, val);
437
- } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
438
- VALUE ary;
439
- int i;
440
-
441
- if (TYPE(val) != T_ARRAY) {
442
- rb_raise(rb_eArgError,
443
- "Expected array as initializer value for repeated field '%s' (given %s).",
444
- name, rb_class2name(CLASS_OF(val)));
445
- }
446
- ary = layout_get(self->descriptor->layout, Message_data(self), f);
447
- for (i = 0; i < RARRAY_LEN(val); i++) {
448
- VALUE entry = rb_ary_entry(val, i);
449
- if (TYPE(entry) == T_HASH && upb_fielddef_issubmsg(f)) {
450
- entry = create_submsg_from_hash(self->descriptor->layout, f, entry);
451
- }
603
+ Message_InitFieldFromValue(msg_init->msg, f, val, msg_init->arena);
604
+ return ST_CONTINUE;
605
+ }
452
606
 
453
- RepeatedField_push(ary, entry);
454
- }
607
+ void Message_InitFromValue(upb_msg* msg, const upb_msgdef* m, VALUE val,
608
+ upb_arena* arena) {
609
+ MsgInit msg_init = {msg, m, arena};
610
+ if (TYPE(val) == T_HASH) {
611
+ rb_hash_foreach(val, Message_initialize_kwarg, (VALUE)&msg_init);
455
612
  } else {
456
- if (TYPE(val) == T_HASH && upb_fielddef_issubmsg(f)) {
457
- val = create_submsg_from_hash(self->descriptor->layout, f, val);
458
- }
459
-
460
- layout_set(self->descriptor->layout, Message_data(self), f, val);
613
+ rb_raise(rb_eArgError, "Expected hash arguments or message, not %s",
614
+ rb_class2name(CLASS_OF(val)));
461
615
  }
462
- return 0;
463
616
  }
464
617
 
465
618
  /*
@@ -474,12 +627,13 @@ int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
474
627
  * have been added to a pool. The method definitions described here on the
475
628
  * Message class are provided on each concrete message class.
476
629
  */
477
- VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
478
- MessageHeader* self;
479
- VALUE hash_args;
480
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
630
+ static VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
631
+ Message* self = ruby_to_Message(_self);
632
+ VALUE arena_rb = Arena_new();
633
+ upb_arena *arena = Arena_get(arena_rb);
634
+ upb_msg *msg = upb_msg_new(self->msgdef, arena);
481
635
 
482
- layout_init(self->descriptor->layout, Message_data(self));
636
+ Message_InitPtr(_self, msg, arena_rb);
483
637
 
484
638
  if (argc == 0) {
485
639
  return Qnil;
@@ -487,12 +641,7 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
487
641
  if (argc != 1) {
488
642
  rb_raise(rb_eArgError, "Expected 0 or 1 arguments.");
489
643
  }
490
- hash_args = argv[0];
491
- if (TYPE(hash_args) != T_HASH) {
492
- rb_raise(rb_eArgError, "Expected hash arguments.");
493
- }
494
-
495
- rb_hash_foreach(hash_args, Message_initialize_kwarg, _self);
644
+ Message_InitFromValue((upb_msg*)self->msg, self->msgdef, argv[0], arena);
496
645
  return Qnil;
497
646
  }
498
647
 
@@ -502,37 +651,40 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
502
651
  *
503
652
  * Performs a shallow copy of this message and returns the new copy.
504
653
  */
505
- VALUE Message_dup(VALUE _self) {
506
- MessageHeader* self;
507
- VALUE new_msg;
508
- MessageHeader* new_msg_self;
509
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
510
-
511
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
512
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
513
-
514
- layout_dup(self->descriptor->layout,
515
- Message_data(new_msg_self),
516
- Message_data(self));
517
-
654
+ static VALUE Message_dup(VALUE _self) {
655
+ Message* self = ruby_to_Message(_self);
656
+ VALUE new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
657
+ Message* new_msg_self = ruby_to_Message(new_msg);
658
+ size_t size = upb_msgdef_layout(self->msgdef)->size;
659
+
660
+ // TODO(copy unknown fields?)
661
+ // TODO(use official upb msg copy function)
662
+ memcpy((upb_msg*)new_msg_self->msg, self->msg, size);
663
+ upb_arena_fuse(Arena_get(new_msg_self->arena), Arena_get(self->arena));
518
664
  return new_msg;
519
665
  }
520
666
 
521
- // Internal only; used by Google::Protobuf.deep_copy.
522
- VALUE Message_deep_copy(VALUE _self) {
523
- MessageHeader* self;
524
- MessageHeader* new_msg_self;
525
- VALUE new_msg;
526
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
667
+ // Support function for Message_eq, and also used by other #eq functions.
668
+ bool Message_Equal(const upb_msg *m1, const upb_msg *m2, const upb_msgdef *m) {
669
+ if (m1 == m2) return true;
527
670
 
528
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
529
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
671
+ size_t size1, size2;
672
+ int encode_opts = UPB_ENCODE_SKIPUNKNOWN | UPB_ENCODE_DETERMINISTIC;
673
+ upb_arena *arena_tmp = upb_arena_new();
674
+ const upb_msglayout *layout = upb_msgdef_layout(m);
530
675
 
531
- layout_deep_copy(self->descriptor->layout,
532
- Message_data(new_msg_self),
533
- Message_data(self));
676
+ // Compare deterministically serialized payloads with no unknown fields.
677
+ char *data1 = upb_encode_ex(m1, layout, encode_opts, arena_tmp, &size1);
678
+ char *data2 = upb_encode_ex(m2, layout, encode_opts, arena_tmp, &size2);
534
679
 
535
- return new_msg;
680
+ if (data1 && data2) {
681
+ bool ret = (size1 == size2) && (memcmp(data1, data2, size1) == 0);
682
+ upb_arena_free(arena_tmp);
683
+ return ret;
684
+ } else {
685
+ upb_arena_free(arena_tmp);
686
+ rb_raise(cParseError, "Error comparing messages");
687
+ }
536
688
  }
537
689
 
538
690
  /*
@@ -544,22 +696,37 @@ VALUE Message_deep_copy(VALUE _self) {
544
696
  * method's semantics (a more efficient comparison may actually be done if the
545
697
  * field is of a primitive type).
546
698
  */
547
- VALUE Message_eq(VALUE _self, VALUE _other) {
548
- MessageHeader* self;
549
- MessageHeader* other;
699
+ static VALUE Message_eq(VALUE _self, VALUE _other) {
550
700
  if (TYPE(_self) != TYPE(_other)) {
551
701
  return Qfalse;
552
702
  }
553
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
554
- TypedData_Get_Struct(_other, MessageHeader, &Message_type, other);
555
703
 
556
- if (self->descriptor != other->descriptor) {
557
- return Qfalse;
558
- }
704
+ Message* self = ruby_to_Message(_self);
705
+ Message* other = ruby_to_Message(_other);
559
706
 
560
- return layout_eq(self->descriptor->layout,
561
- Message_data(self),
562
- Message_data(other));
707
+ return Message_Equal(self->msg, other->msg, self->msgdef)
708
+ ? Qtrue
709
+ : Qfalse;
710
+ }
711
+
712
+ uint64_t Message_Hash(const upb_msg* msg, const upb_msgdef* m, uint64_t seed) {
713
+ upb_arena *arena = upb_arena_new();
714
+ const char *data;
715
+ size_t size;
716
+
717
+ // Hash a deterministically serialized payload with no unknown fields.
718
+ data = upb_encode_ex(msg, upb_msgdef_layout(m),
719
+ UPB_ENCODE_SKIPUNKNOWN | UPB_ENCODE_DETERMINISTIC, arena,
720
+ &size);
721
+
722
+ if (data) {
723
+ uint64_t ret = wyhash(data, size, seed, _wyp);
724
+ upb_arena_free(arena);
725
+ return ret;
726
+ } else {
727
+ upb_arena_free(arena);
728
+ rb_raise(cParseError, "Error calculating hash");
729
+ }
563
730
  }
564
731
 
565
732
  /*
@@ -568,11 +735,9 @@ VALUE Message_eq(VALUE _self, VALUE _other) {
568
735
  *
569
736
  * Returns a hash value that represents this message's field values.
570
737
  */
571
- VALUE Message_hash(VALUE _self) {
572
- MessageHeader* self;
573
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
574
-
575
- return layout_hash(self->descriptor->layout, Message_data(self));
738
+ static VALUE Message_hash(VALUE _self) {
739
+ Message* self = ruby_to_Message(_self);
740
+ return INT2FIX(Message_Hash(self->msg, self->msgdef, 0));
576
741
  }
577
742
 
578
743
  /*
@@ -583,77 +748,119 @@ VALUE Message_hash(VALUE _self) {
583
748
  * formatted as "<MessageType: field1: value1, field2: value2, ...>". Each
584
749
  * field's value is represented according to its own #inspect method.
585
750
  */
586
- VALUE Message_inspect(VALUE _self) {
587
- MessageHeader* self;
588
- VALUE str;
589
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
751
+ static VALUE Message_inspect(VALUE _self) {
752
+ Message* self = ruby_to_Message(_self);
590
753
 
591
- str = rb_str_new2("<");
592
- str = rb_str_append(str, rb_str_new2(rb_class2name(CLASS_OF(_self))));
593
- str = rb_str_cat2(str, ": ");
594
- str = rb_str_append(str, layout_inspect(
595
- self->descriptor->layout, Message_data(self)));
596
- str = rb_str_cat2(str, ">");
597
- return str;
754
+ StringBuilder* builder = StringBuilder_New();
755
+ Message_PrintMessage(builder, self->msg, self->msgdef);
756
+ VALUE ret = StringBuilder_ToRubyString(builder);
757
+ StringBuilder_Free(builder);
758
+ return ret;
598
759
  }
599
760
 
600
- /*
601
- * call-seq:
602
- * Message.to_h => {}
603
- *
604
- * Returns the message as a Ruby Hash object, with keys as symbols.
605
- */
606
- VALUE Message_to_h(VALUE _self) {
607
- MessageHeader* self;
608
- VALUE hash;
609
- upb_msg_field_iter it;
610
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
611
-
612
- hash = rb_hash_new();
613
-
614
- for (upb_msg_field_begin(&it, self->descriptor->msgdef);
615
- !upb_msg_field_done(&it);
616
- upb_msg_field_next(&it)) {
617
- const upb_fielddef* field = upb_msg_iter_field(&it);
761
+ // Support functions for Message_to_h //////////////////////////////////////////
762
+
763
+ static VALUE RepeatedField_CreateArray(const upb_array* arr,
764
+ TypeInfo type_info) {
765
+ int size = arr ? upb_array_size(arr) : 0;
766
+ VALUE ary = rb_ary_new2(size);
767
+
768
+ for (int i = 0; i < size; i++) {
769
+ upb_msgval msgval = upb_array_get(arr, i);
770
+ VALUE val = Scalar_CreateHash(msgval, type_info);
771
+ rb_ary_push(ary, val);
772
+ }
773
+
774
+ return ary;
775
+ }
776
+
777
+ static VALUE Message_CreateHash(const upb_msg *msg, const upb_msgdef *m) {
778
+ if (!msg) return Qnil;
779
+
780
+ VALUE hash = rb_hash_new();
781
+ int n = upb_msgdef_fieldcount(m);
782
+ bool is_proto2;
783
+
784
+ // We currently have a few behaviors that are specific to proto2.
785
+ // This is unfortunate, we should key behaviors off field attributes (like
786
+ // whether a field has presence), not proto2 vs. proto3. We should see if we
787
+ // can change this without breaking users.
788
+ is_proto2 = upb_msgdef_syntax(m) == UPB_SYNTAX_PROTO2;
789
+
790
+ for (int i = 0; i < n; i++) {
791
+ const upb_fielddef* field = upb_msgdef_field(m, i);
792
+ TypeInfo type_info = TypeInfo_get(field);
793
+ upb_msgval msgval;
618
794
  VALUE msg_value;
619
795
  VALUE msg_key;
620
796
 
621
- // For proto2, do not include fields which are not set.
622
- if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
623
- field_contains_hasbit(self->descriptor->layout, field) &&
624
- !layout_has(self->descriptor->layout, Message_data(self), field)) {
797
+ // Do not include fields that are not present (oneof or optional fields).
798
+ if (is_proto2 && upb_fielddef_haspresence(field) &&
799
+ !upb_msg_has(msg, field)) {
625
800
  continue;
626
801
  }
627
802
 
628
- msg_value = layout_get(self->descriptor->layout, Message_data(self), field);
629
803
  msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
630
- if (is_map_field(field)) {
631
- msg_value = Map_to_h(msg_value);
632
- } else if (upb_fielddef_label(field) == UPB_LABEL_REPEATED) {
633
- msg_value = RepeatedField_to_ary(msg_value);
634
- if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
635
- RARRAY_LEN(msg_value) == 0) {
804
+ msgval = upb_msg_get(msg, field);
805
+
806
+ // Proto2 omits empty map/repeated fields also.
807
+
808
+ if (upb_fielddef_ismap(field)) {
809
+ const upb_msgdef *entry_m = upb_fielddef_msgsubdef(field);
810
+ const upb_fielddef *key_f = upb_msgdef_itof(entry_m, 1);
811
+ const upb_fielddef *val_f = upb_msgdef_itof(entry_m, 2);
812
+ upb_fieldtype_t key_type = upb_fielddef_type(key_f);
813
+ msg_value = Map_CreateHash(msgval.map_val, key_type, TypeInfo_get(val_f));
814
+ } else if (upb_fielddef_isseq(field)) {
815
+ if (is_proto2 &&
816
+ (!msgval.array_val || upb_array_size(msgval.array_val) == 0)) {
636
817
  continue;
637
818
  }
638
-
639
- if (upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
640
- int i;
641
- for (i = 0; i < RARRAY_LEN(msg_value); i++) {
642
- VALUE elem = rb_ary_entry(msg_value, i);
643
- rb_ary_store(msg_value, i, Message_to_h(elem));
644
- }
645
- }
646
-
647
- } else if (msg_value != Qnil &&
648
- upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
649
- msg_value = Message_to_h(msg_value);
819
+ msg_value = RepeatedField_CreateArray(msgval.array_val, type_info);
820
+ } else {
821
+ msg_value = Scalar_CreateHash(msgval, type_info);
650
822
  }
823
+
651
824
  rb_hash_aset(hash, msg_key, msg_value);
652
825
  }
826
+
653
827
  return hash;
654
828
  }
655
829
 
830
+ VALUE Scalar_CreateHash(upb_msgval msgval, TypeInfo type_info) {
831
+ if (type_info.type == UPB_TYPE_MESSAGE) {
832
+ return Message_CreateHash(msgval.msg_val, type_info.def.msgdef);
833
+ } else {
834
+ return Convert_UpbToRuby(msgval, type_info, Qnil);
835
+ }
836
+ }
837
+
838
+ /*
839
+ * call-seq:
840
+ * Message.to_h => {}
841
+ *
842
+ * Returns the message as a Ruby Hash object, with keys as symbols.
843
+ */
844
+ static VALUE Message_to_h(VALUE _self) {
845
+ Message* self = ruby_to_Message(_self);
846
+ return Message_CreateHash(self->msg, self->msgdef);
847
+ }
656
848
 
849
+ /*
850
+ * call-seq:
851
+ * Message.freeze => self
852
+ *
853
+ * Freezes the message object. We have to intercept this so we can pin the
854
+ * Ruby object into memory so we don't forget it's frozen.
855
+ */
856
+ static VALUE Message_freeze(VALUE _self) {
857
+ Message* self = ruby_to_Message(_self);
858
+ if (!RB_OBJ_FROZEN(_self)) {
859
+ Arena_Pin(self->arena, _self);
860
+ RB_OBJ_FREEZE(_self);
861
+ }
862
+ return _self;
863
+ }
657
864
 
658
865
  /*
659
866
  * call-seq:
@@ -662,16 +869,18 @@ VALUE Message_to_h(VALUE _self) {
662
869
  * Accesses a field's value by field name. The provided field name should be a
663
870
  * string.
664
871
  */
665
- VALUE Message_index(VALUE _self, VALUE field_name) {
666
- MessageHeader* self;
872
+ static VALUE Message_index(VALUE _self, VALUE field_name) {
873
+ Message* self = ruby_to_Message(_self);
667
874
  const upb_fielddef* field;
668
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
875
+
669
876
  Check_Type(field_name, T_STRING);
670
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
877
+ field = upb_msgdef_ntofz(self->msgdef, RSTRING_PTR(field_name));
878
+
671
879
  if (field == NULL) {
672
880
  return Qnil;
673
881
  }
674
- return layout_get(self->descriptor->layout, Message_data(self), field);
882
+
883
+ return Message_getfield(_self, field);
675
884
  }
676
885
 
677
886
  /*
@@ -681,19 +890,208 @@ VALUE Message_index(VALUE _self, VALUE field_name) {
681
890
  * Sets a field's value by field name. The provided field name should be a
682
891
  * string.
683
892
  */
684
- VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
685
- MessageHeader* self;
686
- const upb_fielddef* field;
687
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
893
+ static VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
894
+ Message* self = ruby_to_Message(_self);
895
+ const upb_fielddef* f;
896
+ upb_msgval val;
897
+ upb_arena *arena = Arena_get(self->arena);
898
+
688
899
  Check_Type(field_name, T_STRING);
689
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
690
- if (field == NULL) {
900
+ f = upb_msgdef_ntofz(self->msgdef, RSTRING_PTR(field_name));
901
+
902
+ if (f == NULL) {
691
903
  rb_raise(rb_eArgError, "Unknown field: %s", RSTRING_PTR(field_name));
692
904
  }
693
- layout_set(self->descriptor->layout, Message_data(self), field, value);
905
+
906
+ val = Convert_RubyToUpb(value, upb_fielddef_name(f), TypeInfo_get(f), arena);
907
+ upb_msg_set(Message_GetMutable(_self, NULL), f, val, arena);
908
+
694
909
  return Qnil;
695
910
  }
696
911
 
912
+ /*
913
+ * call-seq:
914
+ * MessageClass.decode(data) => message
915
+ *
916
+ * Decodes the given data (as a string containing bytes in protocol buffers wire
917
+ * format) under the interpretation given by this message class's definition
918
+ * and returns a message object with the corresponding field values.
919
+ */
920
+ static VALUE Message_decode(VALUE klass, VALUE data) {
921
+ if (TYPE(data) != T_STRING) {
922
+ rb_raise(rb_eArgError, "Expected string for binary protobuf data.");
923
+ }
924
+
925
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
926
+ Message* msg = ruby_to_Message(msg_rb);
927
+
928
+ if (!upb_decode(RSTRING_PTR(data), RSTRING_LEN(data), (upb_msg*)msg->msg,
929
+ upb_msgdef_layout(msg->msgdef),
930
+ Arena_get(msg->arena))) {
931
+ rb_raise(cParseError, "Error occurred during parsing");
932
+ }
933
+
934
+ return msg_rb;
935
+ }
936
+
937
+ /*
938
+ * call-seq:
939
+ * MessageClass.decode_json(data, options = {}) => message
940
+ *
941
+ * Decodes the given data (as a string containing a JSON-encoded message)
942
+ * under the interpretation given by this message class's definition
943
+ * and returns a message object with the corresponding field values.
944
+ *
945
+ * @param options [Hash] options for the decoder
946
+ * ignore_unknown_fields: set true to ignore unknown fields (default is to
947
+ * raise an error)
948
+ */
949
+ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
950
+ VALUE data = argv[0];
951
+ int options = 0;
952
+ upb_status status;
953
+
954
+ // TODO(haberman): use this message's pool instead.
955
+ const upb_symtab *symtab = DescriptorPool_GetSymtab(generated_pool);
956
+
957
+ if (argc < 1 || argc > 2) {
958
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
959
+ }
960
+
961
+ if (argc == 2) {
962
+ VALUE hash_args = argv[1];
963
+ if (TYPE(hash_args) != T_HASH) {
964
+ rb_raise(rb_eArgError, "Expected hash arguments.");
965
+ }
966
+
967
+ if (RTEST(rb_hash_lookup2( hash_args, ID2SYM(rb_intern("ignore_unknown_fields")), Qfalse))) {
968
+ options |= UPB_JSONDEC_IGNOREUNKNOWN;
969
+ }
970
+ }
971
+
972
+ if (TYPE(data) != T_STRING) {
973
+ rb_raise(rb_eArgError, "Expected string for JSON data.");
974
+ }
975
+
976
+ // TODO(cfallin): Check and respect string encoding. If not UTF-8, we need to
977
+ // convert, because string handlers pass data directly to message string
978
+ // fields.
979
+
980
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
981
+ Message* msg = ruby_to_Message(msg_rb);
982
+
983
+ // We don't allow users to decode a wrapper type directly.
984
+ if (upb_msgdef_iswrapper(msg->msgdef)) {
985
+ rb_raise(rb_eRuntimeError, "Cannot parse a wrapper directly.");
986
+ }
987
+
988
+ upb_status_clear(&status);
989
+ if (!upb_json_decode(RSTRING_PTR(data), RSTRING_LEN(data), (upb_msg*)msg->msg,
990
+ msg->msgdef, symtab, options,
991
+ Arena_get(msg->arena), &status)) {
992
+ rb_raise(cParseError, "Error occurred during parsing: %s",
993
+ upb_status_errmsg(&status));
994
+ }
995
+
996
+ return msg_rb;
997
+ }
998
+
999
+ /*
1000
+ * call-seq:
1001
+ * MessageClass.encode(msg) => bytes
1002
+ *
1003
+ * Encodes the given message object to its serialized form in protocol buffers
1004
+ * wire format.
1005
+ */
1006
+ static VALUE Message_encode(VALUE klass, VALUE msg_rb) {
1007
+ Message* msg = ruby_to_Message(msg_rb);
1008
+ upb_arena *arena = upb_arena_new();
1009
+ const char *data;
1010
+ size_t size;
1011
+
1012
+ if (CLASS_OF(msg_rb) != klass) {
1013
+ rb_raise(rb_eArgError, "Message of wrong type.");
1014
+ }
1015
+
1016
+ data = upb_encode(msg->msg, upb_msgdef_layout(msg->msgdef), arena,
1017
+ &size);
1018
+
1019
+ if (data) {
1020
+ VALUE ret = rb_str_new(data, size);
1021
+ rb_enc_associate(ret, rb_ascii8bit_encoding());
1022
+ upb_arena_free(arena);
1023
+ return ret;
1024
+ } else {
1025
+ upb_arena_free(arena);
1026
+ rb_raise(rb_eRuntimeError, "Exceeded maximum depth (possibly cycle)");
1027
+ }
1028
+ }
1029
+
1030
+ /*
1031
+ * call-seq:
1032
+ * MessageClass.encode_json(msg, options = {}) => json_string
1033
+ *
1034
+ * Encodes the given message object into its serialized JSON representation.
1035
+ * @param options [Hash] options for the encoder
1036
+ * preserve_proto_fieldnames: set true to use original fieldnames (default is to camelCase)
1037
+ * emit_defaults: set true to emit 0/false values (default is to omit them)
1038
+ */
1039
+ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1040
+ Message* msg = ruby_to_Message(argv[0]);
1041
+ int options = 0;
1042
+ char buf[1024];
1043
+ size_t size;
1044
+ upb_status status;
1045
+
1046
+ // TODO(haberman): use this message's pool instead.
1047
+ const upb_symtab *symtab = DescriptorPool_GetSymtab(generated_pool);
1048
+
1049
+ if (argc < 1 || argc > 2) {
1050
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1051
+ }
1052
+
1053
+ if (argc == 2) {
1054
+ VALUE hash_args = argv[1];
1055
+ if (TYPE(hash_args) != T_HASH) {
1056
+ rb_raise(rb_eArgError, "Expected hash arguments.");
1057
+ }
1058
+
1059
+ if (RTEST(rb_hash_lookup2(hash_args,
1060
+ ID2SYM(rb_intern("preserve_proto_fieldnames")),
1061
+ Qfalse))) {
1062
+ options |= UPB_JSONENC_PROTONAMES;
1063
+ }
1064
+
1065
+ if (RTEST(rb_hash_lookup2(hash_args, ID2SYM(rb_intern("emit_defaults")),
1066
+ Qfalse))) {
1067
+ options |= UPB_JSONENC_EMITDEFAULTS;
1068
+ }
1069
+ }
1070
+
1071
+ upb_status_clear(&status);
1072
+ size = upb_json_encode(msg->msg, msg->msgdef, symtab, options, buf,
1073
+ sizeof(buf), &status);
1074
+
1075
+ if (!upb_ok(&status)) {
1076
+ rb_raise(cParseError, "Error occurred during encoding: %s",
1077
+ upb_status_errmsg(&status));
1078
+ }
1079
+
1080
+ VALUE ret;
1081
+ if (size >= sizeof(buf)) {
1082
+ char* buf2 = malloc(size + 1);
1083
+ upb_json_encode(msg->msg, msg->msgdef, symtab, options, buf2, size + 1,
1084
+ &status);
1085
+ ret = rb_str_new(buf2, size);
1086
+ free(buf2);
1087
+ } else {
1088
+ ret = rb_str_new(buf, size);
1089
+ }
1090
+
1091
+ rb_enc_associate(ret, rb_utf8_encoding());
1092
+ return ret;
1093
+ }
1094
+
697
1095
  /*
698
1096
  * call-seq:
699
1097
  * Message.descriptor => descriptor
@@ -701,16 +1099,15 @@ VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
701
1099
  * Class method that returns the Descriptor instance corresponding to this
702
1100
  * message class's type.
703
1101
  */
704
- VALUE Message_descriptor(VALUE klass) {
1102
+ static VALUE Message_descriptor(VALUE klass) {
705
1103
  return rb_ivar_get(klass, descriptor_instancevar_interned);
706
1104
  }
707
1105
 
708
1106
  VALUE build_class_from_descriptor(VALUE descriptor) {
709
- Descriptor* desc = ruby_to_Descriptor(descriptor);
710
1107
  const char *name;
711
1108
  VALUE klass;
712
1109
 
713
- name = upb_msgdef_fullname(desc->msgdef);
1110
+ name = upb_msgdef_fullname(Descriptor_GetMsgDef(descriptor));
714
1111
  if (name == NULL) {
715
1112
  rb_raise(rb_eRuntimeError, "Descriptor does not have assigned name.");
716
1113
  }
@@ -737,6 +1134,7 @@ VALUE build_class_from_descriptor(VALUE descriptor) {
737
1134
  rb_define_method(klass, "clone", Message_dup, 0);
738
1135
  rb_define_method(klass, "==", Message_eq, 1);
739
1136
  rb_define_method(klass, "eql?", Message_eq, 1);
1137
+ rb_define_method(klass, "freeze", Message_freeze, 0);
740
1138
  rb_define_method(klass, "hash", Message_hash, 0);
741
1139
  rb_define_method(klass, "to_h", Message_to_h, 0);
742
1140
  rb_define_method(klass, "inspect", Message_inspect, 0);
@@ -759,12 +1157,12 @@ VALUE build_class_from_descriptor(VALUE descriptor) {
759
1157
  * This module method, provided on each generated enum module, looks up an enum
760
1158
  * value by number and returns its name as a Ruby symbol, or nil if not found.
761
1159
  */
762
- VALUE enum_lookup(VALUE self, VALUE number) {
1160
+ static VALUE enum_lookup(VALUE self, VALUE number) {
763
1161
  int32_t num = NUM2INT(number);
764
1162
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
765
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
1163
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(desc);
766
1164
 
767
- const char* name = upb_enumdef_iton(enumdesc->enumdef, num);
1165
+ const char* name = upb_enumdef_iton(e, num);
768
1166
  if (name == NULL) {
769
1167
  return Qnil;
770
1168
  } else {
@@ -779,13 +1177,13 @@ VALUE enum_lookup(VALUE self, VALUE number) {
779
1177
  * This module method, provided on each generated enum module, looks up an enum
780
1178
  * value by name (as a Ruby symbol) and returns its name, or nil if not found.
781
1179
  */
782
- VALUE enum_resolve(VALUE self, VALUE sym) {
1180
+ static VALUE enum_resolve(VALUE self, VALUE sym) {
783
1181
  const char* name = rb_id2name(SYM2ID(sym));
784
1182
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
785
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
1183
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(desc);
786
1184
 
787
1185
  int32_t num = 0;
788
- bool found = upb_enumdef_ntoiz(enumdesc->enumdef, name, &num);
1186
+ bool found = upb_enumdef_ntoiz(e, name, &num);
789
1187
  if (!found) {
790
1188
  return Qnil;
791
1189
  } else {
@@ -800,17 +1198,16 @@ VALUE enum_resolve(VALUE self, VALUE sym) {
800
1198
  * This module method, provided on each generated enum module, returns the
801
1199
  * EnumDescriptor corresponding to this enum type.
802
1200
  */
803
- VALUE enum_descriptor(VALUE self) {
1201
+ static VALUE enum_descriptor(VALUE self) {
804
1202
  return rb_ivar_get(self, descriptor_instancevar_interned);
805
1203
  }
806
1204
 
807
1205
  VALUE build_module_from_enumdesc(VALUE _enumdesc) {
808
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(_enumdesc);
809
- VALUE mod = rb_define_module_id(
810
- rb_intern(upb_enumdef_fullname(enumdesc->enumdef)));
1206
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(_enumdesc);
1207
+ VALUE mod = rb_define_module_id(rb_intern(upb_enumdef_fullname(e)));
811
1208
 
812
1209
  upb_enum_iter it;
813
- for (upb_enum_begin(&it, enumdesc->enumdef);
1210
+ for (upb_enum_begin(&it, e);
814
1211
  !upb_enum_done(&it);
815
1212
  upb_enum_next(&it)) {
816
1213
  const char* name = upb_enum_iter_name(&it);
@@ -831,20 +1228,94 @@ VALUE build_module_from_enumdesc(VALUE _enumdesc) {
831
1228
  return mod;
832
1229
  }
833
1230
 
834
- /*
835
- * call-seq:
836
- * Google::Protobuf.deep_copy(obj) => copy_of_obj
837
- *
838
- * Performs a deep copy of a RepeatedField instance, a Map instance, or a
839
- * message object, recursively copying its members.
840
- */
841
- VALUE Google_Protobuf_deep_copy(VALUE self, VALUE obj) {
842
- VALUE klass = CLASS_OF(obj);
843
- if (klass == cRepeatedField) {
844
- return RepeatedField_deep_copy(obj);
845
- } else if (klass == cMap) {
846
- return Map_deep_copy(obj);
847
- } else {
848
- return Message_deep_copy(obj);
1231
+ // Internal only; used by Google::Protobuf.deep_copy.
1232
+ upb_msg* Message_deep_copy(const upb_msg* msg, const upb_msgdef* m,
1233
+ upb_arena *arena) {
1234
+ // Serialize and parse.
1235
+ upb_arena *tmp_arena = upb_arena_new();
1236
+ const upb_msglayout *layout = upb_msgdef_layout(m);
1237
+ size_t size;
1238
+
1239
+ char* data = upb_encode_ex(msg, layout, 0, tmp_arena, &size);
1240
+ upb_msg* new_msg = upb_msg_new(m, arena);
1241
+
1242
+ if (!data || !upb_decode(data, size, new_msg, layout, arena)) {
1243
+ upb_arena_free(tmp_arena);
1244
+ rb_raise(cParseError, "Error occurred copying proto");
1245
+ }
1246
+
1247
+ upb_arena_free(tmp_arena);
1248
+ return new_msg;
1249
+ }
1250
+
1251
+ const upb_msg* Message_GetUpbMessage(VALUE value, const upb_msgdef* m,
1252
+ const char* name, upb_arena* arena) {
1253
+ if (value == Qnil) {
1254
+ rb_raise(cTypeError, "nil message not allowed here.");
1255
+ }
1256
+
1257
+ VALUE klass = CLASS_OF(value);
1258
+ VALUE desc_rb = rb_ivar_get(klass, descriptor_instancevar_interned);
1259
+ const upb_msgdef* val_m =
1260
+ desc_rb == Qnil ? NULL : Descriptor_GetMsgDef(desc_rb);
1261
+
1262
+ if (val_m != m) {
1263
+ // Check for possible implicit conversions
1264
+ // TODO: hash conversion?
1265
+
1266
+ switch (upb_msgdef_wellknowntype(m)) {
1267
+ case UPB_WELLKNOWN_TIMESTAMP: {
1268
+ // Time -> Google::Protobuf::Timestamp
1269
+ upb_msg *msg = upb_msg_new(m, arena);
1270
+ upb_msgval sec, nsec;
1271
+ struct timespec time;
1272
+ const upb_fielddef *sec_f = upb_msgdef_itof(m, 1);
1273
+ const upb_fielddef *nsec_f = upb_msgdef_itof(m, 2);
1274
+
1275
+ if (!rb_obj_is_kind_of(value, rb_cTime)) goto badtype;
1276
+
1277
+ time = rb_time_timespec(value);
1278
+ sec.int64_val = time.tv_sec;
1279
+ nsec.int32_val = time.tv_nsec;
1280
+ upb_msg_set(msg, sec_f, sec, arena);
1281
+ upb_msg_set(msg, nsec_f, nsec, arena);
1282
+ return msg;
1283
+ }
1284
+ case UPB_WELLKNOWN_DURATION: {
1285
+ // Numeric -> Google::Protobuf::Duration
1286
+ upb_msg *msg = upb_msg_new(m, arena);
1287
+ upb_msgval sec, nsec;
1288
+ const upb_fielddef *sec_f = upb_msgdef_itof(m, 1);
1289
+ const upb_fielddef *nsec_f = upb_msgdef_itof(m, 2);
1290
+
1291
+ if (!rb_obj_is_kind_of(value, rb_cNumeric)) goto badtype;
1292
+
1293
+ sec.int64_val = NUM2LL(value);
1294
+ nsec.int32_val = round((NUM2DBL(value) - NUM2LL(value)) * 1000000000);
1295
+ upb_msg_set(msg, sec_f, sec, arena);
1296
+ upb_msg_set(msg, nsec_f, nsec, arena);
1297
+ return msg;
1298
+ }
1299
+ default:
1300
+ badtype:
1301
+ rb_raise(cTypeError,
1302
+ "Invalid type %s to assign to submessage field '%s'.",
1303
+ rb_class2name(CLASS_OF(value)), name);
1304
+ }
1305
+
849
1306
  }
1307
+
1308
+ Message* self = ruby_to_Message(value);
1309
+ upb_arena_fuse(arena, Arena_get(self->arena));
1310
+
1311
+ return self->msg;
1312
+ }
1313
+
1314
+ void Message_register(VALUE protobuf) {
1315
+ cParseError = rb_const_get(protobuf, rb_intern("ParseError"));
1316
+
1317
+ // Ruby-interned string: "descriptor". We use this identifier to store an
1318
+ // instance variable on message classes we create in order to link them back
1319
+ // to their descriptors.
1320
+ descriptor_instancevar_interned = rb_intern("descriptor");
850
1321
  }