google-protobuf 3.7.1 → 3.17.3

Sign up to get free protection for your applications and to get access to all the features.

Potentially problematic release.


This version of google-protobuf might be problematic. Click here for more details.

Files changed (37) hide show
  1. checksums.yaml +4 -4
  2. data/ext/google/protobuf_c/convert.c +349 -0
  3. data/ext/google/protobuf_c/convert.h +72 -0
  4. data/ext/google/protobuf_c/defs.c +1555 -1228
  5. data/ext/google/protobuf_c/defs.h +107 -0
  6. data/ext/google/protobuf_c/extconf.rb +5 -7
  7. data/ext/google/protobuf_c/map.c +312 -470
  8. data/ext/google/protobuf_c/map.h +67 -0
  9. data/ext/google/protobuf_c/message.c +942 -348
  10. data/ext/google/protobuf_c/message.h +101 -0
  11. data/ext/google/protobuf_c/protobuf.c +400 -51
  12. data/ext/google/protobuf_c/protobuf.h +47 -545
  13. data/ext/google/protobuf_c/repeated_field.c +313 -308
  14. data/ext/google/protobuf_c/repeated_field.h +63 -0
  15. data/ext/google/protobuf_c/ruby-upb.c +8858 -0
  16. data/ext/google/protobuf_c/ruby-upb.h +4411 -0
  17. data/ext/google/protobuf_c/third_party/wyhash/wyhash.h +145 -0
  18. data/lib/google/protobuf.rb +70 -0
  19. data/lib/google/protobuf/any_pb.rb +1 -1
  20. data/lib/google/protobuf/api_pb.rb +3 -3
  21. data/lib/google/protobuf/duration_pb.rb +1 -1
  22. data/lib/google/protobuf/empty_pb.rb +1 -1
  23. data/lib/google/protobuf/field_mask_pb.rb +1 -1
  24. data/lib/google/protobuf/source_context_pb.rb +1 -1
  25. data/lib/google/protobuf/struct_pb.rb +4 -4
  26. data/lib/google/protobuf/timestamp_pb.rb +1 -1
  27. data/lib/google/protobuf/type_pb.rb +8 -8
  28. data/lib/google/protobuf/well_known_types.rb +8 -2
  29. data/lib/google/protobuf/wrappers_pb.rb +9 -9
  30. data/tests/basic.rb +320 -70
  31. data/tests/generated_code_test.rb +0 -0
  32. data/tests/stress.rb +0 -0
  33. metadata +27 -15
  34. data/ext/google/protobuf_c/encode_decode.c +0 -1614
  35. data/ext/google/protobuf_c/storage.c +0 -1032
  36. data/ext/google/protobuf_c/upb.c +0 -17480
  37. data/ext/google/protobuf_c/upb.h +0 -10642
@@ -0,0 +1,67 @@
1
+ // Protocol Buffers - Google's data interchange format
2
+ // Copyright 2008 Google Inc. All rights reserved.
3
+ // https://developers.google.com/protocol-buffers/
4
+ //
5
+ // Redistribution and use in source and binary forms, with or without
6
+ // modification, are permitted provided that the following conditions are
7
+ // met:
8
+ //
9
+ // * Redistributions of source code must retain the above copyright
10
+ // notice, this list of conditions and the following disclaimer.
11
+ // * Redistributions in binary form must reproduce the above
12
+ // copyright notice, this list of conditions and the following disclaimer
13
+ // in the documentation and/or other materials provided with the
14
+ // distribution.
15
+ // * Neither the name of Google Inc. nor the names of its
16
+ // contributors may be used to endorse or promote products derived from
17
+ // this software without specific prior written permission.
18
+ //
19
+ // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20
+ // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21
+ // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22
+ // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
23
+ // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24
+ // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
25
+ // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26
+ // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27
+ // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28
+ // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29
+ // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
+
31
+ #ifndef RUBY_PROTOBUF_MAP_H_
32
+ #define RUBY_PROTOBUF_MAP_H_
33
+
34
+ #include <ruby/ruby.h>
35
+
36
+ #include "protobuf.h"
37
+ #include "ruby-upb.h"
38
+
39
+ // Returns a Ruby wrapper object for the given map, which will be created if
40
+ // one does not exist already.
41
+ VALUE Map_GetRubyWrapper(upb_map *map, upb_fieldtype_t key_type,
42
+ TypeInfo value_type, VALUE arena);
43
+
44
+ // Gets the underlying upb_map for this Ruby map object, which must have
45
+ // key/value types that match |field|. If this is not a map or the types don't
46
+ // match, raises an exception.
47
+ const upb_map *Map_GetUpbMap(VALUE val, const upb_fielddef *field,
48
+ upb_arena *arena);
49
+
50
+ // Implements #inspect for this map by appending its contents to |b|.
51
+ void Map_Inspect(StringBuilder *b, const upb_map *map, upb_fieldtype_t key_type,
52
+ TypeInfo val_type);
53
+
54
+ // Returns a new Hash object containing the contents of this Map.
55
+ VALUE Map_CreateHash(const upb_map* map, upb_fieldtype_t key_type,
56
+ TypeInfo val_info);
57
+
58
+ // Returns a deep copy of this Map object.
59
+ VALUE Map_deep_copy(VALUE obj);
60
+
61
+ // Ruby class of Google::Protobuf::Map.
62
+ extern VALUE cMap;
63
+
64
+ // Call at startup to register all types in this module.
65
+ void Map_register(VALUE module);
66
+
67
+ #endif // RUBY_PROTOBUF_MAP_H_
@@ -28,148 +28,363 @@
28
28
  // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29
29
  // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
30
 
31
+ #include "message.h"
32
+
33
+ #include "convert.h"
34
+ #include "defs.h"
35
+ #include "map.h"
31
36
  #include "protobuf.h"
37
+ #include "repeated_field.h"
38
+ #include "third_party/wyhash/wyhash.h"
32
39
 
33
- // -----------------------------------------------------------------------------
34
- // Class/module creation from msgdefs and enumdefs, respectively.
35
- // -----------------------------------------------------------------------------
40
+ static VALUE cParseError = Qnil;
41
+ static ID descriptor_instancevar_interned;
36
42
 
37
- void* Message_data(void* msg) {
38
- return ((uint8_t *)msg) + sizeof(MessageHeader);
43
+ static VALUE initialize_rb_class_with_no_args(VALUE klass) {
44
+ return rb_funcall(klass, rb_intern("new"), 0);
39
45
  }
40
46
 
41
- void Message_mark(void* _self) {
42
- MessageHeader* self = (MessageHeader *)_self;
43
- layout_mark(self->descriptor->layout, Message_data(self));
47
+ VALUE MessageOrEnum_GetDescriptor(VALUE klass) {
48
+ return rb_ivar_get(klass, descriptor_instancevar_interned);
44
49
  }
45
50
 
46
- void Message_free(void* self) {
47
- stringsink* unknown = ((MessageHeader *)self)->unknown_fields;
48
- if (unknown != NULL) {
49
- stringsink_uninit(unknown);
50
- free(unknown);
51
- }
52
- xfree(self);
51
+ // -----------------------------------------------------------------------------
52
+ // Class/module creation from msgdefs and enumdefs, respectively.
53
+ // -----------------------------------------------------------------------------
54
+
55
+ typedef struct {
56
+ VALUE arena;
57
+ const upb_msg* msg; // Can get as mutable when non-frozen.
58
+ const upb_msgdef* msgdef; // kept alive by self.class.descriptor reference.
59
+ } Message;
60
+
61
+ static void Message_mark(void* _self) {
62
+ Message* self = (Message *)_self;
63
+ rb_gc_mark(self->arena);
53
64
  }
54
65
 
55
- rb_data_type_t Message_type = {
66
+ static rb_data_type_t Message_type = {
56
67
  "Message",
57
- { Message_mark, Message_free, NULL },
68
+ { Message_mark, RUBY_DEFAULT_FREE, NULL },
69
+ .flags = RUBY_TYPED_FREE_IMMEDIATELY,
58
70
  };
59
71
 
60
- VALUE Message_alloc(VALUE klass) {
72
+ static Message* ruby_to_Message(VALUE msg_rb) {
73
+ Message* msg;
74
+ TypedData_Get_Struct(msg_rb, Message, &Message_type, msg);
75
+ return msg;
76
+ }
77
+
78
+ static VALUE Message_alloc(VALUE klass) {
61
79
  VALUE descriptor = rb_ivar_get(klass, descriptor_instancevar_interned);
62
- Descriptor* desc = ruby_to_Descriptor(descriptor);
63
- MessageHeader* msg = (MessageHeader*)ALLOC_N(
64
- uint8_t, sizeof(MessageHeader) + desc->layout->size);
80
+ Message* msg = ALLOC(Message);
65
81
  VALUE ret;
66
82
 
67
- memset(Message_data(msg), 0, desc->layout->size);
83
+ msg->msgdef = Descriptor_GetMsgDef(descriptor);
84
+ msg->arena = Qnil;
85
+ msg->msg = NULL;
68
86
 
69
- // We wrap first so that everything in the message object is GC-rooted in case
70
- // a collection happens during object creation in layout_init().
71
87
  ret = TypedData_Wrap_Struct(klass, &Message_type, msg);
72
- msg->descriptor = desc;
73
88
  rb_ivar_set(ret, descriptor_instancevar_interned, descriptor);
74
89
 
75
- msg->unknown_fields = NULL;
90
+ return ret;
91
+ }
76
92
 
77
- layout_init(desc->layout, Message_data(msg));
93
+ const upb_msg *Message_Get(VALUE msg_rb, const upb_msgdef **m) {
94
+ Message* msg = ruby_to_Message(msg_rb);
95
+ if (m) *m = msg->msgdef;
96
+ return msg->msg;
97
+ }
78
98
 
79
- return ret;
99
+ upb_msg *Message_GetMutable(VALUE msg_rb, const upb_msgdef **m) {
100
+ rb_check_frozen(msg_rb);
101
+ return (upb_msg*)Message_Get(msg_rb, m);
80
102
  }
81
103
 
82
- static const upb_fielddef* which_oneof_field(MessageHeader* self, const upb_oneofdef* o) {
83
- upb_oneof_iter it;
84
- size_t case_ofs;
85
- uint32_t oneof_case;
86
- const upb_fielddef* first_field;
87
- const upb_fielddef* f;
104
+ void Message_InitPtr(VALUE self_, upb_msg *msg, VALUE arena) {
105
+ Message* self = ruby_to_Message(self_);
106
+ self->msg = msg;
107
+ self->arena = arena;
108
+ ObjectCache_Add(msg, self_);
109
+ }
88
110
 
89
- // If no fields in the oneof, always nil.
90
- if (upb_oneofdef_numfields(o) == 0) {
91
- return NULL;
111
+ VALUE Message_GetArena(VALUE msg_rb) {
112
+ Message* msg = ruby_to_Message(msg_rb);
113
+ return msg->arena;
114
+ }
115
+
116
+ void Message_CheckClass(VALUE klass) {
117
+ if (rb_get_alloc_func(klass) != &Message_alloc) {
118
+ rb_raise(rb_eArgError,
119
+ "Message class was not returned by the DescriptorPool.");
92
120
  }
93
- // Grab the first field in the oneof so we can get its layout info to find the
94
- // oneof_case field.
95
- upb_oneof_begin(&it, o);
96
- assert(!upb_oneof_done(&it));
97
- first_field = upb_oneof_iter_field(&it);
98
- assert(upb_fielddef_containingoneof(first_field) != NULL);
121
+ }
99
122
 
100
- case_ofs =
101
- self->descriptor->layout->
102
- fields[upb_fielddef_index(first_field)].case_offset;
103
- oneof_case = *((uint32_t*)((char*)Message_data(self) + case_ofs));
123
+ VALUE Message_GetRubyWrapper(upb_msg* msg, const upb_msgdef* m, VALUE arena) {
124
+ if (msg == NULL) return Qnil;
104
125
 
105
- if (oneof_case == ONEOF_CASE_NONE) {
106
- return NULL;
126
+ VALUE val = ObjectCache_Get(msg);
127
+
128
+ if (val == Qnil) {
129
+ VALUE klass = Descriptor_DefToClass(m);
130
+ val = Message_alloc(klass);
131
+ Message_InitPtr(val, msg, arena);
107
132
  }
108
133
 
109
- // oneof_case is a field index, so find that field.
110
- f = upb_oneofdef_itof(o, oneof_case);
111
- assert(f != NULL);
134
+ return val;
135
+ }
136
+
137
+ void Message_PrintMessage(StringBuilder* b, const upb_msg* msg,
138
+ const upb_msgdef* m) {
139
+ bool first = true;
140
+ int n = upb_msgdef_fieldcount(m);
141
+ VALUE klass = Descriptor_DefToClass(m);
142
+ StringBuilder_Printf(b, "<%s: ", rb_class2name(klass));
143
+
144
+ for (int i = 0; i < n; i++) {
145
+ const upb_fielddef* field = upb_msgdef_field(m, i);
146
+
147
+ if (upb_fielddef_haspresence(field) && !upb_msg_has(msg, field)) {
148
+ continue;
149
+ }
150
+
151
+ if (!first) {
152
+ StringBuilder_Printf(b, ", ");
153
+ } else {
154
+ first = false;
155
+ }
156
+
157
+ upb_msgval msgval = upb_msg_get(msg, field);
158
+
159
+ StringBuilder_Printf(b, "%s: ", upb_fielddef_name(field));
160
+
161
+ if (upb_fielddef_ismap(field)) {
162
+ const upb_msgdef* entry_m = upb_fielddef_msgsubdef(field);
163
+ const upb_fielddef* key_f = upb_msgdef_itof(entry_m, 1);
164
+ const upb_fielddef* val_f = upb_msgdef_itof(entry_m, 2);
165
+ TypeInfo val_info = TypeInfo_get(val_f);
166
+ Map_Inspect(b, msgval.map_val, upb_fielddef_type(key_f), val_info);
167
+ } else if (upb_fielddef_isseq(field)) {
168
+ RepeatedField_Inspect(b, msgval.array_val, TypeInfo_get(field));
169
+ } else {
170
+ StringBuilder_PrintMsgval(b, msgval, TypeInfo_get(field));
171
+ }
172
+ }
112
173
 
113
- return f;
174
+ StringBuilder_Printf(b, ">");
114
175
  }
115
176
 
177
+ // Helper functions for #method_missing ////////////////////////////////////////
178
+
116
179
  enum {
117
180
  METHOD_UNKNOWN = 0,
118
181
  METHOD_GETTER = 1,
119
182
  METHOD_SETTER = 2,
120
183
  METHOD_CLEAR = 3,
121
- METHOD_PRESENCE = 4
184
+ METHOD_PRESENCE = 4,
185
+ METHOD_ENUM_GETTER = 5,
186
+ METHOD_WRAPPER_GETTER = 6,
187
+ METHOD_WRAPPER_SETTER = 7
122
188
  };
123
189
 
124
- static int extract_method_call(VALUE method_name, MessageHeader* self,
125
- const upb_fielddef **f, const upb_oneofdef **o) {
190
+ // Returns true if the field is a submessage whose type is a well-known wrapper.
191
+ static bool IsWrapper(const upb_fielddef* f) {
192
+ return upb_fielddef_issubmsg(f) &&
193
+ upb_msgdef_iswrapper(upb_fielddef_msgsubdef(f));
194
+ }
195
+
196
+ static bool Match(const upb_msgdef* m, const char* name, const upb_fielddef** f,
197
+ const upb_oneofdef** o, const char* prefix,
198
+ const char* suffix) {
199
+ size_t sp = strlen(prefix);
200
+ size_t ss = strlen(suffix);
201
+ size_t sn = strlen(name);
202
+
203
+ if (sn <= sp + ss) return false;
204
+
205
+ if (memcmp(name, prefix, sp) != 0 ||
206
+ memcmp(name + sn - ss, suffix, ss) != 0) {
207
+ return false;
208
+ }
209
+
210
+ return upb_msgdef_lookupname(m, name + sp, sn - sp - ss, f, o);
211
+ }
212
+
213
+ static int extract_method_call(VALUE method_name, Message* self,
214
+ const upb_fielddef** f, const upb_oneofdef** o) {
215
+ const upb_msgdef* m = self->msgdef;
216
+ const char* name;
217
+
126
218
  Check_Type(method_name, T_SYMBOL);
219
+ name = rb_id2name(SYM2ID(method_name));
220
+
221
+ if (Match(m, name, f, o, "", "")) return METHOD_GETTER;
222
+ if (Match(m, name, f, o, "", "=")) return METHOD_SETTER;
223
+ if (Match(m, name, f, o, "clear_", "")) return METHOD_CLEAR;
224
+ if (Match(m, name, f, o, "has_", "?") &&
225
+ (*o || (*f && upb_fielddef_haspresence(*f)))) {
226
+ // Disallow hazzers (has_foo?) on non-message oneof members unless proto2.
227
+ // TODO(haberman): remove this test when we are enabling oneof hazzers for
228
+ // proto3.
229
+ if (*f && !upb_fielddef_issubmsg(*f) &&
230
+ upb_fielddef_realcontainingoneof(*f) &&
231
+ upb_msgdef_syntax(upb_fielddef_containingtype(*f)) !=
232
+ UPB_SYNTAX_PROTO2) {
233
+ return METHOD_UNKNOWN;
234
+ }
235
+ return METHOD_PRESENCE;
236
+ }
237
+ if (Match(m, name, f, o, "", "_as_value") && *f && !upb_fielddef_isseq(*f) &&
238
+ IsWrapper(*f)) {
239
+ return METHOD_WRAPPER_GETTER;
240
+ }
241
+ if (Match(m, name, f, o, "", "_as_value=") && *f && !upb_fielddef_isseq(*f) &&
242
+ IsWrapper(*f)) {
243
+ return METHOD_WRAPPER_SETTER;
244
+ }
245
+ if (Match(m, name, f, o, "", "_const") && *f &&
246
+ upb_fielddef_type(*f) == UPB_TYPE_ENUM) {
247
+ return METHOD_ENUM_GETTER;
248
+ }
127
249
 
128
- VALUE method_str = rb_id2str(SYM2ID(method_name));
129
- char* name = RSTRING_PTR(method_str);
130
- size_t name_len = RSTRING_LEN(method_str);
131
- int accessor_type;
132
- const upb_oneofdef* test_o;
133
- const upb_fielddef* test_f;
134
-
135
- if (name[name_len - 1] == '=') {
136
- accessor_type = METHOD_SETTER;
137
- name_len--;
138
- // We want to ensure if the proto has something named clear_foo or has_foo?,
139
- // we don't strip the prefix.
140
- } else if (strncmp("clear_", name, 6) == 0 &&
141
- !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
142
- &test_f, &test_o)) {
143
- accessor_type = METHOD_CLEAR;
144
- name = name + 6;
145
- name_len = name_len - 6;
146
- } else if (strncmp("has_", name, 4) == 0 && name[name_len - 1] == '?' &&
147
- !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
148
- &test_f, &test_o)) {
149
- accessor_type = METHOD_PRESENCE;
150
- name = name + 4;
151
- name_len = name_len - 5;
152
- } else {
153
- accessor_type = METHOD_GETTER;
250
+ return METHOD_UNKNOWN;
251
+ }
252
+
253
+ static VALUE Message_oneof_accessor(VALUE _self, const upb_oneofdef* o,
254
+ int accessor_type) {
255
+ Message* self = ruby_to_Message(_self);
256
+ const upb_fielddef* oneof_field = upb_msg_whichoneof(self->msg, o);
257
+
258
+ switch (accessor_type) {
259
+ case METHOD_PRESENCE:
260
+ return oneof_field == NULL ? Qfalse : Qtrue;
261
+ case METHOD_CLEAR:
262
+ if (oneof_field != NULL) {
263
+ upb_msg_clearfield(Message_GetMutable(_self, NULL), oneof_field);
264
+ }
265
+ return Qnil;
266
+ case METHOD_GETTER:
267
+ return oneof_field == NULL
268
+ ? Qnil
269
+ : ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
270
+ case METHOD_SETTER:
271
+ rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
154
272
  }
273
+ rb_raise(rb_eRuntimeError, "Invalid access of oneof field.");
274
+ }
155
275
 
156
- // Verify the name corresponds to a oneof or field in this message.
157
- if (!upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
158
- &test_f, &test_o)) {
159
- return METHOD_UNKNOWN;
276
+ static void Message_setfield(upb_msg* msg, const upb_fielddef* f, VALUE val,
277
+ upb_arena* arena) {
278
+ upb_msgval msgval;
279
+ if (upb_fielddef_ismap(f)) {
280
+ msgval.map_val = Map_GetUpbMap(val, f, arena);
281
+ } else if (upb_fielddef_isseq(f)) {
282
+ msgval.array_val = RepeatedField_GetUpbArray(val, f, arena);
283
+ } else {
284
+ if (val == Qnil &&
285
+ (upb_fielddef_issubmsg(f) || upb_fielddef_realcontainingoneof(f))) {
286
+ upb_msg_clearfield(msg, f);
287
+ return;
288
+ }
289
+ msgval =
290
+ Convert_RubyToUpb(val, upb_fielddef_name(f), TypeInfo_get(f), arena);
160
291
  }
292
+ upb_msg_set(msg, f, msgval, arena);
293
+ }
161
294
 
162
- // Method calls like 'has_foo?' are not allowed if field "foo" does not have
163
- // a hasbit (e.g. repeated fields or non-message type fields for proto3
164
- // syntax).
165
- if (accessor_type == METHOD_PRESENCE && test_f != NULL &&
166
- !upb_fielddef_haspresence(test_f)) {
167
- return METHOD_UNKNOWN;
295
+ VALUE Message_getfield(VALUE _self, const upb_fielddef* f) {
296
+ Message* self = ruby_to_Message(_self);
297
+ // This is a special case: upb_msg_mutable() calls for map & array are logically
298
+ // const (they will not change what is serialized) but physically
299
+ // non-const, as they do allocate a repeated field or map. The logical
300
+ // constness means it's ok to do even if the message is frozen.
301
+ upb_msg *msg = (upb_msg*)self->msg;
302
+ upb_arena *arena = Arena_get(self->arena);
303
+ if (upb_fielddef_ismap(f)) {
304
+ upb_map *map = upb_msg_mutable(msg, f, arena).map;
305
+ const upb_fielddef *key_f = map_field_key(f);
306
+ const upb_fielddef *val_f = map_field_value(f);
307
+ upb_fieldtype_t key_type = upb_fielddef_type(key_f);
308
+ TypeInfo value_type_info = TypeInfo_get(val_f);
309
+ return Map_GetRubyWrapper(map, key_type, value_type_info, self->arena);
310
+ } else if (upb_fielddef_isseq(f)) {
311
+ upb_array *arr = upb_msg_mutable(msg, f, arena).array;
312
+ return RepeatedField_GetRubyWrapper(arr, TypeInfo_get(f), self->arena);
313
+ } else if (upb_fielddef_issubmsg(f)) {
314
+ if (!upb_msg_has(self->msg, f)) return Qnil;
315
+ upb_msg *submsg = upb_msg_mutable(msg, f, arena).msg;
316
+ const upb_msgdef *m = upb_fielddef_msgsubdef(f);
317
+ return Message_GetRubyWrapper(submsg, m, self->arena);
318
+ } else {
319
+ upb_msgval msgval = upb_msg_get(self->msg, f);
320
+ return Convert_UpbToRuby(msgval, TypeInfo_get(f), self->arena);
168
321
  }
322
+ }
323
+
324
+ static VALUE Message_field_accessor(VALUE _self, const upb_fielddef* f,
325
+ int accessor_type, int argc, VALUE* argv) {
326
+ upb_arena *arena = Arena_get(Message_GetArena(_self));
169
327
 
170
- *o = test_o;
171
- *f = test_f;
172
- return accessor_type;
328
+ switch (accessor_type) {
329
+ case METHOD_SETTER:
330
+ Message_setfield(Message_GetMutable(_self, NULL), f, argv[1], arena);
331
+ return Qnil;
332
+ case METHOD_CLEAR:
333
+ upb_msg_clearfield(Message_GetMutable(_self, NULL), f);
334
+ return Qnil;
335
+ case METHOD_PRESENCE:
336
+ if (!upb_fielddef_haspresence(f)) {
337
+ rb_raise(rb_eRuntimeError, "Field does not have presence.");
338
+ }
339
+ return upb_msg_has(Message_Get(_self, NULL), f);
340
+ case METHOD_WRAPPER_GETTER: {
341
+ Message* self = ruby_to_Message(_self);
342
+ if (upb_msg_has(self->msg, f)) {
343
+ PBRUBY_ASSERT(upb_fielddef_issubmsg(f) && !upb_fielddef_isseq(f));
344
+ upb_msgval wrapper = upb_msg_get(self->msg, f);
345
+ const upb_msgdef *wrapper_m = upb_fielddef_msgsubdef(f);
346
+ const upb_fielddef *value_f = upb_msgdef_itof(wrapper_m, 1);
347
+ upb_msgval value = upb_msg_get(wrapper.msg_val, value_f);
348
+ return Convert_UpbToRuby(value, TypeInfo_get(value_f), self->arena);
349
+ } else {
350
+ return Qnil;
351
+ }
352
+ }
353
+ case METHOD_WRAPPER_SETTER: {
354
+ upb_msg *msg = Message_GetMutable(_self, NULL);
355
+ if (argv[1] == Qnil) {
356
+ upb_msg_clearfield(msg, f);
357
+ } else {
358
+ const upb_fielddef *val_f = upb_msgdef_itof(upb_fielddef_msgsubdef(f), 1);
359
+ upb_msgval msgval = Convert_RubyToUpb(argv[1], upb_fielddef_name(f),
360
+ TypeInfo_get(val_f), arena);
361
+ upb_msg *wrapper = upb_msg_mutable(msg, f, arena).msg;
362
+ upb_msg_set(wrapper, val_f, msgval, arena);
363
+ }
364
+ return Qnil;
365
+ }
366
+ case METHOD_ENUM_GETTER: {
367
+ upb_msgval msgval = upb_msg_get(Message_Get(_self, NULL), f);
368
+
369
+ if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
370
+ // Convert the repeated enum field to a new Ruby array of integer values.
371
+ VALUE arr = rb_ary_new();
372
+ size_t i, n = upb_array_size(msgval.array_val);
373
+ for (i = 0; i < n; i++) {
374
+ upb_msgval elem = upb_array_get(msgval.array_val, i);
375
+ rb_ary_push(arr, INT2NUM(elem.int32_val));
376
+ }
377
+ return arr;
378
+ } else {
379
+ return INT2NUM(msgval.int32_val);
380
+ }
381
+ }
382
+ case METHOD_GETTER:
383
+ return Message_getfield(_self, f);
384
+ default:
385
+ rb_raise(rb_eRuntimeError, "Internal error, no such accessor: %d",
386
+ accessor_type);
387
+ }
173
388
  }
174
389
 
175
390
  /*
@@ -199,72 +414,56 @@ static int extract_method_call(VALUE method_name, MessageHeader* self,
199
414
  * true if the field 'fieldname' is set in the message object, else false. For
200
415
  * 'proto3' syntax, calling this for a basic type field will result in an error.
201
416
  */
202
- VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
203
- MessageHeader* self;
417
+ static VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
418
+ Message* self = ruby_to_Message(_self);
204
419
  const upb_oneofdef* o;
205
420
  const upb_fielddef* f;
421
+ int accessor_type;
206
422
 
207
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
208
423
  if (argc < 1) {
209
424
  rb_raise(rb_eArgError, "Expected method name as first argument.");
210
425
  }
211
426
 
212
- int accessor_type = extract_method_call(argv[0], self, &f, &o);
213
- if (accessor_type == METHOD_UNKNOWN || (o == NULL && f == NULL) ) {
214
- return rb_call_super(argc, argv);
215
- } else if (accessor_type == METHOD_SETTER) {
216
- if (argc != 2) {
217
- rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
218
- }
219
- } else if (argc != 1) {
220
- rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
221
- }
427
+ accessor_type = extract_method_call(argv[0], self, &f, &o);
222
428
 
223
- // Return which of the oneof fields are set
224
- if (o != NULL) {
225
- if (accessor_type == METHOD_SETTER) {
226
- rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
227
- }
429
+ if (accessor_type == METHOD_UNKNOWN) return rb_call_super(argc, argv);
228
430
 
229
- const upb_fielddef* oneof_field = which_oneof_field(self, o);
230
- if (accessor_type == METHOD_PRESENCE) {
231
- return oneof_field == NULL ? Qfalse : Qtrue;
232
- } else if (accessor_type == METHOD_CLEAR) {
233
- if (oneof_field != NULL) {
234
- layout_clear(self->descriptor->layout, Message_data(self), oneof_field);
431
+ // Validate argument count.
432
+ switch (accessor_type) {
433
+ case METHOD_SETTER:
434
+ case METHOD_WRAPPER_SETTER:
435
+ if (argc != 2) {
436
+ rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
235
437
  }
236
- return Qnil;
237
- } else {
238
- // METHOD_ACCESSOR
239
- return oneof_field == NULL ? Qnil :
240
- ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
241
- }
242
- // Otherwise we're operating on a single proto field
243
- } else if (accessor_type == METHOD_SETTER) {
244
- layout_set(self->descriptor->layout, Message_data(self), f, argv[1]);
245
- return Qnil;
246
- } else if (accessor_type == METHOD_CLEAR) {
247
- layout_clear(self->descriptor->layout, Message_data(self), f);
248
- return Qnil;
249
- } else if (accessor_type == METHOD_PRESENCE) {
250
- return layout_has(self->descriptor->layout, Message_data(self), f);
438
+ rb_check_frozen(_self);
439
+ break;
440
+ default:
441
+ if (argc != 1) {
442
+ rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
443
+ }
444
+ break;
445
+ }
446
+
447
+ // Dispatch accessor.
448
+ if (o != NULL) {
449
+ return Message_oneof_accessor(_self, o, accessor_type);
251
450
  } else {
252
- return layout_get(self->descriptor->layout, Message_data(self), f);
451
+ return Message_field_accessor(_self, f, accessor_type, argc, argv);
253
452
  }
254
453
  }
255
454
 
256
-
257
- VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
258
- MessageHeader* self;
455
+ static VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
456
+ Message* self = ruby_to_Message(_self);
259
457
  const upb_oneofdef* o;
260
458
  const upb_fielddef* f;
459
+ int accessor_type;
261
460
 
262
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
263
461
  if (argc < 1) {
264
462
  rb_raise(rb_eArgError, "Expected method name as first argument.");
265
463
  }
266
464
 
267
- int accessor_type = extract_method_call(argv[0], self, &f, &o);
465
+ accessor_type = extract_method_call(argv[0], self, &f, &o);
466
+
268
467
  if (accessor_type == METHOD_UNKNOWN) {
269
468
  return rb_call_super(argc, argv);
270
469
  } else if (o != NULL) {
@@ -274,22 +473,116 @@ VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
274
473
  }
275
474
  }
276
475
 
277
- VALUE create_submsg_from_hash(const upb_fielddef *f, VALUE hash) {
278
- const upb_def *d = upb_fielddef_subdef(f);
279
- assert(d != NULL);
476
+ void Message_InitFromValue(upb_msg* msg, const upb_msgdef* m, VALUE val,
477
+ upb_arena* arena);
478
+
479
+ typedef struct {
480
+ upb_map *map;
481
+ TypeInfo key_type;
482
+ TypeInfo val_type;
483
+ upb_arena *arena;
484
+ } MapInit;
485
+
486
+ static int Map_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
487
+ MapInit *map_init = (MapInit*)_self;
488
+ upb_msgval k, v;
489
+ k = Convert_RubyToUpb(key, "", map_init->key_type, NULL);
490
+
491
+ if (map_init->val_type.type == UPB_TYPE_MESSAGE && TYPE(val) == T_HASH) {
492
+ upb_msg *msg = upb_msg_new(map_init->val_type.def.msgdef, map_init->arena);
493
+ Message_InitFromValue(msg, map_init->val_type.def.msgdef, val,
494
+ map_init->arena);
495
+ v.msg_val = msg;
496
+ } else {
497
+ v = Convert_RubyToUpb(val, "", map_init->val_type, map_init->arena);
498
+ }
499
+ upb_map_set(map_init->map, k, v, map_init->arena);
500
+ return ST_CONTINUE;
501
+ }
280
502
 
281
- VALUE descriptor = get_def_obj(d);
282
- VALUE msgclass = rb_funcall(descriptor, rb_intern("msgclass"), 0, NULL);
503
+ static void Map_InitFromValue(upb_map* map, const upb_fielddef* f, VALUE val,
504
+ upb_arena* arena) {
505
+ const upb_msgdef* entry_m = upb_fielddef_msgsubdef(f);
506
+ const upb_fielddef* key_f = upb_msgdef_itof(entry_m, 1);
507
+ const upb_fielddef* val_f = upb_msgdef_itof(entry_m, 2);
508
+ if (TYPE(val) != T_HASH) {
509
+ rb_raise(rb_eArgError,
510
+ "Expected Hash object as initializer value for map field '%s' "
511
+ "(given %s).",
512
+ upb_fielddef_name(f), rb_class2name(CLASS_OF(val)));
513
+ }
514
+ MapInit map_init = {map, TypeInfo_get(key_f), TypeInfo_get(val_f), arena};
515
+ rb_hash_foreach(val, Map_initialize_kwarg, (VALUE)&map_init);
516
+ }
283
517
 
284
- VALUE args[1] = { hash };
285
- return rb_class_new_instance(1, args, msgclass);
518
+ static upb_msgval MessageValue_FromValue(VALUE val, TypeInfo info,
519
+ upb_arena* arena) {
520
+ if (info.type == UPB_TYPE_MESSAGE) {
521
+ upb_msgval msgval;
522
+ upb_msg* msg = upb_msg_new(info.def.msgdef, arena);
523
+ Message_InitFromValue(msg, info.def.msgdef, val, arena);
524
+ msgval.msg_val = msg;
525
+ return msgval;
526
+ } else {
527
+ return Convert_RubyToUpb(val, "", info, arena);
528
+ }
286
529
  }
287
530
 
288
- int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
289
- MessageHeader* self;
290
- char *name;
291
- const upb_fielddef* f;
292
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
531
+ static void RepeatedField_InitFromValue(upb_array* arr, const upb_fielddef* f,
532
+ VALUE val, upb_arena* arena) {
533
+ TypeInfo type_info = TypeInfo_get(f);
534
+
535
+ if (TYPE(val) != T_ARRAY) {
536
+ rb_raise(rb_eArgError,
537
+ "Expected array as initializer value for repeated field '%s' (given %s).",
538
+ upb_fielddef_name(f), rb_class2name(CLASS_OF(val)));
539
+ }
540
+
541
+ for (int i = 0; i < RARRAY_LEN(val); i++) {
542
+ VALUE entry = rb_ary_entry(val, i);
543
+ upb_msgval msgval;
544
+ if (upb_fielddef_issubmsg(f) && TYPE(entry) == T_HASH) {
545
+ msgval = MessageValue_FromValue(entry, type_info, arena);
546
+ } else {
547
+ msgval = Convert_RubyToUpb(entry, upb_fielddef_name(f), type_info, arena);
548
+ }
549
+ upb_array_append(arr, msgval, arena);
550
+ }
551
+ }
552
+
553
+ static void Message_InitFieldFromValue(upb_msg* msg, const upb_fielddef* f,
554
+ VALUE val, upb_arena* arena) {
555
+ if (TYPE(val) == T_NIL) return;
556
+
557
+ if (upb_fielddef_ismap(f)) {
558
+ upb_map *map = upb_msg_mutable(msg, f, arena).map;
559
+ Map_InitFromValue(map, f, val, arena);
560
+ } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
561
+ upb_array *arr = upb_msg_mutable(msg, f, arena).array;
562
+ RepeatedField_InitFromValue(arr, f, val, arena);
563
+ } else if (upb_fielddef_issubmsg(f)) {
564
+ if (TYPE(val) == T_HASH) {
565
+ upb_msg *submsg = upb_msg_mutable(msg, f, arena).msg;
566
+ Message_InitFromValue(submsg, upb_fielddef_msgsubdef(f), val, arena);
567
+ } else {
568
+ Message_setfield(msg, f, val, arena);
569
+ }
570
+ } else {
571
+ upb_msgval msgval =
572
+ Convert_RubyToUpb(val, upb_fielddef_name(f), TypeInfo_get(f), arena);
573
+ upb_msg_set(msg, f, msgval, arena);
574
+ }
575
+ }
576
+
577
+ typedef struct {
578
+ upb_msg *msg;
579
+ const upb_msgdef *msgdef;
580
+ upb_arena *arena;
581
+ } MsgInit;
582
+
583
+ static int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
584
+ MsgInit *msg_init = (MsgInit*)_self;
585
+ const char *name;
293
586
 
294
587
  if (TYPE(key) == T_STRING) {
295
588
  name = RSTRING_PTR(key);
@@ -300,51 +593,26 @@ int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
300
593
  "Expected string or symbols as hash keys when initializing proto from hash.");
301
594
  }
302
595
 
303
- f = upb_msgdef_ntofz(self->descriptor->msgdef, name);
596
+ const upb_fielddef* f = upb_msgdef_ntofz(msg_init->msgdef, name);
597
+
304
598
  if (f == NULL) {
305
599
  rb_raise(rb_eArgError,
306
600
  "Unknown field name '%s' in initialization map entry.", name);
307
601
  }
308
602
 
309
- if (TYPE(val) == T_NIL) {
310
- return 0;
311
- }
312
-
313
- if (is_map_field(f)) {
314
- VALUE map;
315
-
316
- if (TYPE(val) != T_HASH) {
317
- rb_raise(rb_eArgError,
318
- "Expected Hash object as initializer value for map field '%s' (given %s).",
319
- name, rb_class2name(CLASS_OF(val)));
320
- }
321
- map = layout_get(self->descriptor->layout, Message_data(self), f);
322
- Map_merge_into_self(map, val);
323
- } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
324
- VALUE ary;
325
-
326
- if (TYPE(val) != T_ARRAY) {
327
- rb_raise(rb_eArgError,
328
- "Expected array as initializer value for repeated field '%s' (given %s).",
329
- name, rb_class2name(CLASS_OF(val)));
330
- }
331
- ary = layout_get(self->descriptor->layout, Message_data(self), f);
332
- for (int i = 0; i < RARRAY_LEN(val); i++) {
333
- VALUE entry = rb_ary_entry(val, i);
334
- if (TYPE(entry) == T_HASH && upb_fielddef_issubmsg(f)) {
335
- entry = create_submsg_from_hash(f, entry);
336
- }
603
+ Message_InitFieldFromValue(msg_init->msg, f, val, msg_init->arena);
604
+ return ST_CONTINUE;
605
+ }
337
606
 
338
- RepeatedField_push(ary, entry);
339
- }
607
+ void Message_InitFromValue(upb_msg* msg, const upb_msgdef* m, VALUE val,
608
+ upb_arena* arena) {
609
+ MsgInit msg_init = {msg, m, arena};
610
+ if (TYPE(val) == T_HASH) {
611
+ rb_hash_foreach(val, Message_initialize_kwarg, (VALUE)&msg_init);
340
612
  } else {
341
- if (TYPE(val) == T_HASH && upb_fielddef_issubmsg(f)) {
342
- val = create_submsg_from_hash(f, val);
343
- }
344
-
345
- layout_set(self->descriptor->layout, Message_data(self), f, val);
613
+ rb_raise(rb_eArgError, "Expected hash arguments or message, not %s",
614
+ rb_class2name(CLASS_OF(val)));
346
615
  }
347
- return 0;
348
616
  }
349
617
 
350
618
  /*
@@ -359,8 +627,13 @@ int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
359
627
  * have been added to a pool. The method definitions described here on the
360
628
  * Message class are provided on each concrete message class.
361
629
  */
362
- VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
363
- VALUE hash_args;
630
+ static VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
631
+ Message* self = ruby_to_Message(_self);
632
+ VALUE arena_rb = Arena_new();
633
+ upb_arena *arena = Arena_get(arena_rb);
634
+ upb_msg *msg = upb_msg_new(self->msgdef, arena);
635
+
636
+ Message_InitPtr(_self, msg, arena_rb);
364
637
 
365
638
  if (argc == 0) {
366
639
  return Qnil;
@@ -368,12 +641,7 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
368
641
  if (argc != 1) {
369
642
  rb_raise(rb_eArgError, "Expected 0 or 1 arguments.");
370
643
  }
371
- hash_args = argv[0];
372
- if (TYPE(hash_args) != T_HASH) {
373
- rb_raise(rb_eArgError, "Expected hash arguments.");
374
- }
375
-
376
- rb_hash_foreach(hash_args, Message_initialize_kwarg, _self);
644
+ Message_InitFromValue((upb_msg*)self->msg, self->msgdef, argv[0], arena);
377
645
  return Qnil;
378
646
  }
379
647
 
@@ -383,37 +651,40 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
383
651
  *
384
652
  * Performs a shallow copy of this message and returns the new copy.
385
653
  */
386
- VALUE Message_dup(VALUE _self) {
387
- MessageHeader* self;
388
- VALUE new_msg;
389
- MessageHeader* new_msg_self;
390
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
391
-
392
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
393
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
394
-
395
- layout_dup(self->descriptor->layout,
396
- Message_data(new_msg_self),
397
- Message_data(self));
398
-
654
+ static VALUE Message_dup(VALUE _self) {
655
+ Message* self = ruby_to_Message(_self);
656
+ VALUE new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
657
+ Message* new_msg_self = ruby_to_Message(new_msg);
658
+ size_t size = upb_msgdef_layout(self->msgdef)->size;
659
+
660
+ // TODO(copy unknown fields?)
661
+ // TODO(use official upb msg copy function)
662
+ memcpy((upb_msg*)new_msg_self->msg, self->msg, size);
663
+ Arena_fuse(self->arena, Arena_get(new_msg_self->arena));
399
664
  return new_msg;
400
665
  }
401
666
 
402
- // Internal only; used by Google::Protobuf.deep_copy.
403
- VALUE Message_deep_copy(VALUE _self) {
404
- MessageHeader* self;
405
- MessageHeader* new_msg_self;
406
- VALUE new_msg;
407
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
667
+ // Support function for Message_eq, and also used by other #eq functions.
668
+ bool Message_Equal(const upb_msg *m1, const upb_msg *m2, const upb_msgdef *m) {
669
+ if (m1 == m2) return true;
408
670
 
409
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
410
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
671
+ size_t size1, size2;
672
+ int encode_opts = UPB_ENCODE_SKIPUNKNOWN | UPB_ENCODE_DETERMINISTIC;
673
+ upb_arena *arena_tmp = upb_arena_new();
674
+ const upb_msglayout *layout = upb_msgdef_layout(m);
411
675
 
412
- layout_deep_copy(self->descriptor->layout,
413
- Message_data(new_msg_self),
414
- Message_data(self));
676
+ // Compare deterministically serialized payloads with no unknown fields.
677
+ char *data1 = upb_encode_ex(m1, layout, encode_opts, arena_tmp, &size1);
678
+ char *data2 = upb_encode_ex(m2, layout, encode_opts, arena_tmp, &size2);
415
679
 
416
- return new_msg;
680
+ if (data1 && data2) {
681
+ bool ret = (size1 == size2) && (memcmp(data1, data2, size1) == 0);
682
+ upb_arena_free(arena_tmp);
683
+ return ret;
684
+ } else {
685
+ upb_arena_free(arena_tmp);
686
+ rb_raise(cParseError, "Error comparing messages");
687
+ }
417
688
  }
418
689
 
419
690
  /*
@@ -425,22 +696,34 @@ VALUE Message_deep_copy(VALUE _self) {
425
696
  * method's semantics (a more efficient comparison may actually be done if the
426
697
  * field is of a primitive type).
427
698
  */
428
- VALUE Message_eq(VALUE _self, VALUE _other) {
429
- MessageHeader* self;
430
- MessageHeader* other;
431
- if (TYPE(_self) != TYPE(_other)) {
432
- return Qfalse;
433
- }
434
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
435
- TypedData_Get_Struct(_other, MessageHeader, &Message_type, other);
699
+ static VALUE Message_eq(VALUE _self, VALUE _other) {
700
+ if (CLASS_OF(_self) != CLASS_OF(_other)) return Qfalse;
436
701
 
437
- if (self->descriptor != other->descriptor) {
438
- return Qfalse;
439
- }
702
+ Message* self = ruby_to_Message(_self);
703
+ Message* other = ruby_to_Message(_other);
704
+ assert(self->msgdef == other->msgdef);
705
+
706
+ return Message_Equal(self->msg, other->msg, self->msgdef) ? Qtrue : Qfalse;
707
+ }
708
+
709
+ uint64_t Message_Hash(const upb_msg* msg, const upb_msgdef* m, uint64_t seed) {
710
+ upb_arena *arena = upb_arena_new();
711
+ const char *data;
712
+ size_t size;
713
+
714
+ // Hash a deterministically serialized payload with no unknown fields.
715
+ data = upb_encode_ex(msg, upb_msgdef_layout(m),
716
+ UPB_ENCODE_SKIPUNKNOWN | UPB_ENCODE_DETERMINISTIC, arena,
717
+ &size);
440
718
 
441
- return layout_eq(self->descriptor->layout,
442
- Message_data(self),
443
- Message_data(other));
719
+ if (data) {
720
+ uint64_t ret = wyhash(data, size, seed, _wyp);
721
+ upb_arena_free(arena);
722
+ return ret;
723
+ } else {
724
+ upb_arena_free(arena);
725
+ rb_raise(cParseError, "Error calculating hash");
726
+ }
444
727
  }
445
728
 
446
729
  /*
@@ -449,11 +732,12 @@ VALUE Message_eq(VALUE _self, VALUE _other) {
449
732
  *
450
733
  * Returns a hash value that represents this message's field values.
451
734
  */
452
- VALUE Message_hash(VALUE _self) {
453
- MessageHeader* self;
454
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
455
-
456
- return layout_hash(self->descriptor->layout, Message_data(self));
735
+ static VALUE Message_hash(VALUE _self) {
736
+ Message* self = ruby_to_Message(_self);
737
+ uint64_t hash_value = Message_Hash(self->msg, self->msgdef, 0);
738
+ // RUBY_FIXNUM_MAX should be one less than a power of 2.
739
+ assert((RUBY_FIXNUM_MAX & (RUBY_FIXNUM_MAX + 1)) == 0);
740
+ return INT2FIX(hash_value & RUBY_FIXNUM_MAX);
457
741
  }
458
742
 
459
743
  /*
@@ -464,75 +748,127 @@ VALUE Message_hash(VALUE _self) {
464
748
  * formatted as "<MessageType: field1: value1, field2: value2, ...>". Each
465
749
  * field's value is represented according to its own #inspect method.
466
750
  */
467
- VALUE Message_inspect(VALUE _self) {
468
- MessageHeader* self;
469
- VALUE str;
470
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
751
+ static VALUE Message_inspect(VALUE _self) {
752
+ Message* self = ruby_to_Message(_self);
471
753
 
472
- str = rb_str_new2("<");
473
- str = rb_str_append(str, rb_str_new2(rb_class2name(CLASS_OF(_self))));
474
- str = rb_str_cat2(str, ": ");
475
- str = rb_str_append(str, layout_inspect(
476
- self->descriptor->layout, Message_data(self)));
477
- str = rb_str_cat2(str, ">");
478
- return str;
754
+ StringBuilder* builder = StringBuilder_New();
755
+ Message_PrintMessage(builder, self->msg, self->msgdef);
756
+ VALUE ret = StringBuilder_ToRubyString(builder);
757
+ StringBuilder_Free(builder);
758
+ return ret;
479
759
  }
480
760
 
481
- /*
482
- * call-seq:
483
- * Message.to_h => {}
484
- *
485
- * Returns the message as a Ruby Hash object, with keys as symbols.
486
- */
487
- VALUE Message_to_h(VALUE _self) {
488
- MessageHeader* self;
489
- VALUE hash;
490
- upb_msg_field_iter it;
491
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
492
-
493
- hash = rb_hash_new();
494
-
495
- for (upb_msg_field_begin(&it, self->descriptor->msgdef);
496
- !upb_msg_field_done(&it);
497
- upb_msg_field_next(&it)) {
498
- const upb_fielddef* field = upb_msg_iter_field(&it);
499
-
500
- // For proto2, do not include fields which are not set.
501
- if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
502
- field_contains_hasbit(self->descriptor->layout, field) &&
503
- !layout_has(self->descriptor->layout, Message_data(self), field)) {
761
+ // Support functions for Message_to_h //////////////////////////////////////////
762
+
763
+ static VALUE RepeatedField_CreateArray(const upb_array* arr,
764
+ TypeInfo type_info) {
765
+ int size = arr ? upb_array_size(arr) : 0;
766
+ VALUE ary = rb_ary_new2(size);
767
+
768
+ for (int i = 0; i < size; i++) {
769
+ upb_msgval msgval = upb_array_get(arr, i);
770
+ VALUE val = Scalar_CreateHash(msgval, type_info);
771
+ rb_ary_push(ary, val);
772
+ }
773
+
774
+ return ary;
775
+ }
776
+
777
+ static VALUE Message_CreateHash(const upb_msg *msg, const upb_msgdef *m) {
778
+ if (!msg) return Qnil;
779
+
780
+ VALUE hash = rb_hash_new();
781
+ int n = upb_msgdef_fieldcount(m);
782
+ bool is_proto2;
783
+
784
+ // We currently have a few behaviors that are specific to proto2.
785
+ // This is unfortunate, we should key behaviors off field attributes (like
786
+ // whether a field has presence), not proto2 vs. proto3. We should see if we
787
+ // can change this without breaking users.
788
+ is_proto2 = upb_msgdef_syntax(m) == UPB_SYNTAX_PROTO2;
789
+
790
+ for (int i = 0; i < n; i++) {
791
+ const upb_fielddef* field = upb_msgdef_field(m, i);
792
+ TypeInfo type_info = TypeInfo_get(field);
793
+ upb_msgval msgval;
794
+ VALUE msg_value;
795
+ VALUE msg_key;
796
+
797
+ if (!is_proto2 && upb_fielddef_issubmsg(field) &&
798
+ !upb_fielddef_isseq(field) && !upb_msg_has(msg, field)) {
799
+ // TODO: Legacy behavior, remove when we fix the is_proto2 differences.
800
+ msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
801
+ rb_hash_aset(hash, msg_key, Qnil);
504
802
  continue;
505
803
  }
506
804
 
507
- VALUE msg_value = layout_get(self->descriptor->layout, Message_data(self),
508
- field);
509
- VALUE msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
510
- if (is_map_field(field)) {
511
- msg_value = Map_to_h(msg_value);
512
- } else if (upb_fielddef_label(field) == UPB_LABEL_REPEATED) {
513
- msg_value = RepeatedField_to_ary(msg_value);
514
- if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
515
- RARRAY_LEN(msg_value) == 0) {
516
- continue;
517
- }
805
+ // Do not include fields that are not present (oneof or optional fields).
806
+ if (is_proto2 && upb_fielddef_haspresence(field) &&
807
+ !upb_msg_has(msg, field)) {
808
+ continue;
809
+ }
518
810
 
519
- if (upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
520
- for (int i = 0; i < RARRAY_LEN(msg_value); i++) {
521
- VALUE elem = rb_ary_entry(msg_value, i);
522
- rb_ary_store(msg_value, i, Message_to_h(elem));
523
- }
524
- }
811
+ msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
812
+ msgval = upb_msg_get(msg, field);
813
+
814
+ // Proto2 omits empty map/repeated fields also.
525
815
 
526
- } else if (msg_value != Qnil &&
527
- upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
528
- msg_value = Message_to_h(msg_value);
816
+ if (upb_fielddef_ismap(field)) {
817
+ const upb_msgdef *entry_m = upb_fielddef_msgsubdef(field);
818
+ const upb_fielddef *key_f = upb_msgdef_itof(entry_m, 1);
819
+ const upb_fielddef *val_f = upb_msgdef_itof(entry_m, 2);
820
+ upb_fieldtype_t key_type = upb_fielddef_type(key_f);
821
+ msg_value = Map_CreateHash(msgval.map_val, key_type, TypeInfo_get(val_f));
822
+ } else if (upb_fielddef_isseq(field)) {
823
+ if (is_proto2 &&
824
+ (!msgval.array_val || upb_array_size(msgval.array_val) == 0)) {
825
+ continue;
826
+ }
827
+ msg_value = RepeatedField_CreateArray(msgval.array_val, type_info);
828
+ } else {
829
+ msg_value = Scalar_CreateHash(msgval, type_info);
529
830
  }
831
+
530
832
  rb_hash_aset(hash, msg_key, msg_value);
531
833
  }
834
+
532
835
  return hash;
533
836
  }
534
837
 
838
+ VALUE Scalar_CreateHash(upb_msgval msgval, TypeInfo type_info) {
839
+ if (type_info.type == UPB_TYPE_MESSAGE) {
840
+ return Message_CreateHash(msgval.msg_val, type_info.def.msgdef);
841
+ } else {
842
+ return Convert_UpbToRuby(msgval, type_info, Qnil);
843
+ }
844
+ }
845
+
846
+ /*
847
+ * call-seq:
848
+ * Message.to_h => {}
849
+ *
850
+ * Returns the message as a Ruby Hash object, with keys as symbols.
851
+ */
852
+ static VALUE Message_to_h(VALUE _self) {
853
+ Message* self = ruby_to_Message(_self);
854
+ return Message_CreateHash(self->msg, self->msgdef);
855
+ }
535
856
 
857
+ /*
858
+ * call-seq:
859
+ * Message.freeze => self
860
+ *
861
+ * Freezes the message object. We have to intercept this so we can pin the
862
+ * Ruby object into memory so we don't forget it's frozen.
863
+ */
864
+ static VALUE Message_freeze(VALUE _self) {
865
+ Message* self = ruby_to_Message(_self);
866
+ if (!RB_OBJ_FROZEN(_self)) {
867
+ Arena_Pin(self->arena, _self);
868
+ RB_OBJ_FREEZE(_self);
869
+ }
870
+ return _self;
871
+ }
536
872
 
537
873
  /*
538
874
  * call-seq:
@@ -541,16 +877,18 @@ VALUE Message_to_h(VALUE _self) {
541
877
  * Accesses a field's value by field name. The provided field name should be a
542
878
  * string.
543
879
  */
544
- VALUE Message_index(VALUE _self, VALUE field_name) {
545
- MessageHeader* self;
880
+ static VALUE Message_index(VALUE _self, VALUE field_name) {
881
+ Message* self = ruby_to_Message(_self);
546
882
  const upb_fielddef* field;
547
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
883
+
548
884
  Check_Type(field_name, T_STRING);
549
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
885
+ field = upb_msgdef_ntofz(self->msgdef, RSTRING_PTR(field_name));
886
+
550
887
  if (field == NULL) {
551
888
  return Qnil;
552
889
  }
553
- return layout_get(self->descriptor->layout, Message_data(self), field);
890
+
891
+ return Message_getfield(_self, field);
554
892
  }
555
893
 
556
894
  /*
@@ -560,19 +898,208 @@ VALUE Message_index(VALUE _self, VALUE field_name) {
560
898
  * Sets a field's value by field name. The provided field name should be a
561
899
  * string.
562
900
  */
563
- VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
564
- MessageHeader* self;
565
- const upb_fielddef* field;
566
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
901
+ static VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
902
+ Message* self = ruby_to_Message(_self);
903
+ const upb_fielddef* f;
904
+ upb_msgval val;
905
+ upb_arena *arena = Arena_get(self->arena);
906
+
567
907
  Check_Type(field_name, T_STRING);
568
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
569
- if (field == NULL) {
908
+ f = upb_msgdef_ntofz(self->msgdef, RSTRING_PTR(field_name));
909
+
910
+ if (f == NULL) {
570
911
  rb_raise(rb_eArgError, "Unknown field: %s", RSTRING_PTR(field_name));
571
912
  }
572
- layout_set(self->descriptor->layout, Message_data(self), field, value);
913
+
914
+ val = Convert_RubyToUpb(value, upb_fielddef_name(f), TypeInfo_get(f), arena);
915
+ upb_msg_set(Message_GetMutable(_self, NULL), f, val, arena);
916
+
573
917
  return Qnil;
574
918
  }
575
919
 
920
+ /*
921
+ * call-seq:
922
+ * MessageClass.decode(data) => message
923
+ *
924
+ * Decodes the given data (as a string containing bytes in protocol buffers wire
925
+ * format) under the interpretation given by this message class's definition
926
+ * and returns a message object with the corresponding field values.
927
+ */
928
+ static VALUE Message_decode(VALUE klass, VALUE data) {
929
+ if (TYPE(data) != T_STRING) {
930
+ rb_raise(rb_eArgError, "Expected string for binary protobuf data.");
931
+ }
932
+
933
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
934
+ Message* msg = ruby_to_Message(msg_rb);
935
+
936
+ if (!upb_decode(RSTRING_PTR(data), RSTRING_LEN(data), (upb_msg*)msg->msg,
937
+ upb_msgdef_layout(msg->msgdef),
938
+ Arena_get(msg->arena))) {
939
+ rb_raise(cParseError, "Error occurred during parsing");
940
+ }
941
+
942
+ return msg_rb;
943
+ }
944
+
945
+ /*
946
+ * call-seq:
947
+ * MessageClass.decode_json(data, options = {}) => message
948
+ *
949
+ * Decodes the given data (as a string containing the message's JSON
949
+ * representation) under the interpretation given by this message class's definition
951
+ * and returns a message object with the corresponding field values.
952
+ *
953
+ * @param options [Hash] options for the decoder
954
+ * ignore_unknown_fields: set true to ignore unknown fields (default is to
955
+ * raise an error)
956
+ */
957
+ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
958
+ VALUE data = argv[0];
959
+ int options = 0;
960
+ upb_status status;
961
+
962
+ // TODO(haberman): use this message's pool instead.
963
+ const upb_symtab *symtab = DescriptorPool_GetSymtab(generated_pool);
964
+
965
+ if (argc < 1 || argc > 2) {
966
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
967
+ }
968
+
969
+ if (argc == 2) {
970
+ VALUE hash_args = argv[1];
971
+ if (TYPE(hash_args) != T_HASH) {
972
+ rb_raise(rb_eArgError, "Expected hash arguments.");
973
+ }
974
+
975
+ if (RTEST(rb_hash_lookup2( hash_args, ID2SYM(rb_intern("ignore_unknown_fields")), Qfalse))) {
976
+ options |= UPB_JSONDEC_IGNOREUNKNOWN;
977
+ }
978
+ }
979
+
980
+ if (TYPE(data) != T_STRING) {
981
+ rb_raise(rb_eArgError, "Expected string for JSON data.");
982
+ }
983
+
984
+ // TODO(cfallin): Check and respect string encoding. If not UTF-8, we need to
985
+ // convert, because string handlers pass data directly to message string
986
+ // fields.
987
+
988
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
989
+ Message* msg = ruby_to_Message(msg_rb);
990
+
991
+ // We don't allow users to decode a wrapper type directly.
992
+ if (upb_msgdef_iswrapper(msg->msgdef)) {
993
+ rb_raise(rb_eRuntimeError, "Cannot parse a wrapper directly.");
994
+ }
995
+
996
+ upb_status_clear(&status);
997
+ if (!upb_json_decode(RSTRING_PTR(data), RSTRING_LEN(data), (upb_msg*)msg->msg,
998
+ msg->msgdef, symtab, options,
999
+ Arena_get(msg->arena), &status)) {
1000
+ rb_raise(cParseError, "Error occurred during parsing: %s",
1001
+ upb_status_errmsg(&status));
1002
+ }
1003
+
1004
+ return msg_rb;
1005
+ }
1006
+
1007
+ /*
1008
+ * call-seq:
1009
+ * MessageClass.encode(msg) => bytes
1010
+ *
1011
+ * Encodes the given message object to its serialized form in protocol buffers
1012
+ * wire format.
1013
+ */
1014
+ static VALUE Message_encode(VALUE klass, VALUE msg_rb) {
1015
+ Message* msg = ruby_to_Message(msg_rb);
1016
+ upb_arena *arena = upb_arena_new();
1017
+ const char *data;
1018
+ size_t size;
1019
+
1020
+ if (CLASS_OF(msg_rb) != klass) {
1021
+ rb_raise(rb_eArgError, "Message of wrong type.");
1022
+ }
1023
+
1024
+ data = upb_encode(msg->msg, upb_msgdef_layout(msg->msgdef), arena,
1025
+ &size);
1026
+
1027
+ if (data) {
1028
+ VALUE ret = rb_str_new(data, size);
1029
+ rb_enc_associate(ret, rb_ascii8bit_encoding());
1030
+ upb_arena_free(arena);
1031
+ return ret;
1032
+ } else {
1033
+ upb_arena_free(arena);
1034
+ rb_raise(rb_eRuntimeError, "Exceeded maximum depth (possibly cycle)");
1035
+ }
1036
+ }
1037
+
1038
+ /*
1039
+ * call-seq:
1040
+ * MessageClass.encode_json(msg, options = {}) => json_string
1041
+ *
1042
+ * Encodes the given message object into its serialized JSON representation.
1043
+ * @param options [Hash] options for the encoder
1044
+ * preserve_proto_fieldnames: set true to use original fieldnames (default is to camelCase)
1045
+ * emit_defaults: set true to emit 0/false values (default is to omit them)
1046
+ */
1047
+ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1048
+ Message* msg = ruby_to_Message(argv[0]);
1049
+ int options = 0;
1050
+ char buf[1024];
1051
+ size_t size;
1052
+ upb_status status;
1053
+
1054
+ // TODO(haberman): use this message's pool instead.
1055
+ const upb_symtab *symtab = DescriptorPool_GetSymtab(generated_pool);
1056
+
1057
+ if (argc < 1 || argc > 2) {
1058
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1059
+ }
1060
+
1061
+ if (argc == 2) {
1062
+ VALUE hash_args = argv[1];
1063
+ if (TYPE(hash_args) != T_HASH) {
1064
+ rb_raise(rb_eArgError, "Expected hash arguments.");
1065
+ }
1066
+
1067
+ if (RTEST(rb_hash_lookup2(hash_args,
1068
+ ID2SYM(rb_intern("preserve_proto_fieldnames")),
1069
+ Qfalse))) {
1070
+ options |= UPB_JSONENC_PROTONAMES;
1071
+ }
1072
+
1073
+ if (RTEST(rb_hash_lookup2(hash_args, ID2SYM(rb_intern("emit_defaults")),
1074
+ Qfalse))) {
1075
+ options |= UPB_JSONENC_EMITDEFAULTS;
1076
+ }
1077
+ }
1078
+
1079
+ upb_status_clear(&status);
1080
+ size = upb_json_encode(msg->msg, msg->msgdef, symtab, options, buf,
1081
+ sizeof(buf), &status);
1082
+
1083
+ if (!upb_ok(&status)) {
1084
+ rb_raise(cParseError, "Error occurred during encoding: %s",
1085
+ upb_status_errmsg(&status));
1086
+ }
1087
+
1088
+ VALUE ret;
1089
+ if (size >= sizeof(buf)) {
1090
+ char* buf2 = malloc(size + 1);
1091
+ upb_json_encode(msg->msg, msg->msgdef, symtab, options, buf2, size + 1,
1092
+ &status);
1093
+ ret = rb_str_new(buf2, size);
1094
+ free(buf2);
1095
+ } else {
1096
+ ret = rb_str_new(buf, size);
1097
+ }
1098
+
1099
+ rb_enc_associate(ret, rb_utf8_encoding());
1100
+ return ret;
1101
+ }
1102
+
576
1103
  /*
577
1104
  * call-seq:
578
1105
  * Message.descriptor => descriptor
@@ -580,22 +1107,15 @@ VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
580
1107
  * Class method that returns the Descriptor instance corresponding to this
581
1108
  * message class's type.
582
1109
  */
583
- VALUE Message_descriptor(VALUE klass) {
1110
+ static VALUE Message_descriptor(VALUE klass) {
584
1111
  return rb_ivar_get(klass, descriptor_instancevar_interned);
585
1112
  }
586
1113
 
587
- VALUE build_class_from_descriptor(Descriptor* desc) {
1114
+ VALUE build_class_from_descriptor(VALUE descriptor) {
588
1115
  const char *name;
589
1116
  VALUE klass;
590
1117
 
591
- if (desc->layout == NULL) {
592
- desc->layout = create_layout(desc->msgdef);
593
- }
594
- if (desc->fill_method == NULL) {
595
- desc->fill_method = new_fillmsg_decodermethod(desc, &desc->fill_method);
596
- }
597
-
598
- name = upb_msgdef_fullname(desc->msgdef);
1118
+ name = upb_msgdef_fullname(Descriptor_GetMsgDef(descriptor));
599
1119
  if (name == NULL) {
600
1120
  rb_raise(rb_eRuntimeError, "Descriptor does not have assigned name.");
601
1121
  }
@@ -605,8 +1125,7 @@ VALUE build_class_from_descriptor(Descriptor* desc) {
605
1125
  // their own toplevel constant class name.
606
1126
  rb_intern("Message"),
607
1127
  rb_cObject);
608
- rb_ivar_set(klass, descriptor_instancevar_interned,
609
- get_def_obj(desc->msgdef));
1128
+ rb_ivar_set(klass, descriptor_instancevar_interned, descriptor);
610
1129
  rb_define_alloc_func(klass, Message_alloc);
611
1130
  rb_require("google/protobuf/message_exts");
612
1131
  rb_include_module(klass, rb_eval_string("::Google::Protobuf::MessageExts"));
@@ -622,10 +1141,12 @@ VALUE build_class_from_descriptor(Descriptor* desc) {
622
1141
  // Also define #clone so that we don't inherit Object#clone.
623
1142
  rb_define_method(klass, "clone", Message_dup, 0);
624
1143
  rb_define_method(klass, "==", Message_eq, 1);
1144
+ rb_define_method(klass, "eql?", Message_eq, 1);
1145
+ rb_define_method(klass, "freeze", Message_freeze, 0);
625
1146
  rb_define_method(klass, "hash", Message_hash, 0);
626
1147
  rb_define_method(klass, "to_h", Message_to_h, 0);
627
- rb_define_method(klass, "to_hash", Message_to_h, 0);
628
1148
  rb_define_method(klass, "inspect", Message_inspect, 0);
1149
+ rb_define_method(klass, "to_s", Message_inspect, 0);
629
1150
  rb_define_method(klass, "[]", Message_index, 1);
630
1151
  rb_define_method(klass, "[]=", Message_index_set, 2);
631
1152
  rb_define_singleton_method(klass, "decode", Message_decode, 1);
@@ -644,12 +1165,12 @@ VALUE build_class_from_descriptor(Descriptor* desc) {
644
1165
  * This module method, provided on each generated enum module, looks up an enum
645
1166
  * value by number and returns its name as a Ruby symbol, or nil if not found.
646
1167
  */
647
- VALUE enum_lookup(VALUE self, VALUE number) {
1168
+ static VALUE enum_lookup(VALUE self, VALUE number) {
648
1169
  int32_t num = NUM2INT(number);
649
1170
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
650
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
1171
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(desc);
651
1172
 
652
- const char* name = upb_enumdef_iton(enumdesc->enumdef, num);
1173
+ const char* name = upb_enumdef_iton(e, num);
653
1174
  if (name == NULL) {
654
1175
  return Qnil;
655
1176
  } else {
@@ -664,13 +1185,13 @@ VALUE enum_lookup(VALUE self, VALUE number) {
664
1185
  * This module method, provided on each generated enum module, looks up an enum
665
1186
  * value by name (as a Ruby symbol) and returns its number, or nil if not found.
666
1187
  */
667
- VALUE enum_resolve(VALUE self, VALUE sym) {
1188
+ static VALUE enum_resolve(VALUE self, VALUE sym) {
668
1189
  const char* name = rb_id2name(SYM2ID(sym));
669
1190
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
670
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
1191
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(desc);
671
1192
 
672
1193
  int32_t num = 0;
673
- bool found = upb_enumdef_ntoiz(enumdesc->enumdef, name, &num);
1194
+ bool found = upb_enumdef_ntoiz(e, name, &num);
674
1195
  if (!found) {
675
1196
  return Qnil;
676
1197
  } else {
@@ -685,16 +1206,16 @@ VALUE enum_resolve(VALUE self, VALUE sym) {
685
1206
  * This module method, provided on each generated enum module, returns the
686
1207
  * EnumDescriptor corresponding to this enum type.
687
1208
  */
688
- VALUE enum_descriptor(VALUE self) {
1209
+ static VALUE enum_descriptor(VALUE self) {
689
1210
  return rb_ivar_get(self, descriptor_instancevar_interned);
690
1211
  }
691
1212
 
692
- VALUE build_module_from_enumdesc(EnumDescriptor* enumdesc) {
693
- VALUE mod = rb_define_module_id(
694
- rb_intern(upb_enumdef_fullname(enumdesc->enumdef)));
1213
+ VALUE build_module_from_enumdesc(VALUE _enumdesc) {
1214
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(_enumdesc);
1215
+ VALUE mod = rb_define_module_id(rb_intern(upb_enumdef_fullname(e)));
695
1216
 
696
1217
  upb_enum_iter it;
697
- for (upb_enum_begin(&it, enumdesc->enumdef);
1218
+ for (upb_enum_begin(&it, e);
698
1219
  !upb_enum_done(&it);
699
1220
  upb_enum_next(&it)) {
700
1221
  const char* name = upb_enum_iter_name(&it);
@@ -710,26 +1231,99 @@ VALUE build_module_from_enumdesc(EnumDescriptor* enumdesc) {
710
1231
  rb_define_singleton_method(mod, "lookup", enum_lookup, 1);
711
1232
  rb_define_singleton_method(mod, "resolve", enum_resolve, 1);
712
1233
  rb_define_singleton_method(mod, "descriptor", enum_descriptor, 0);
713
- rb_ivar_set(mod, descriptor_instancevar_interned,
714
- get_def_obj(enumdesc->enumdef));
1234
+ rb_ivar_set(mod, descriptor_instancevar_interned, _enumdesc);
715
1235
 
716
1236
  return mod;
717
1237
  }
718
1238
 
719
- /*
720
- * call-seq:
721
- * Google::Protobuf.deep_copy(obj) => copy_of_obj
722
- *
723
- * Performs a deep copy of a RepeatedField instance, a Map instance, or a
724
- * message object, recursively copying its members.
725
- */
726
- VALUE Google_Protobuf_deep_copy(VALUE self, VALUE obj) {
727
- VALUE klass = CLASS_OF(obj);
728
- if (klass == cRepeatedField) {
729
- return RepeatedField_deep_copy(obj);
730
- } else if (klass == cMap) {
731
- return Map_deep_copy(obj);
732
- } else {
733
- return Message_deep_copy(obj);
1239
+ // Internal only; used by Google::Protobuf.deep_copy.
1240
+ upb_msg* Message_deep_copy(const upb_msg* msg, const upb_msgdef* m,
1241
+ upb_arena *arena) {
1242
+ // Serialize and parse.
1243
+ upb_arena *tmp_arena = upb_arena_new();
1244
+ const upb_msglayout *layout = upb_msgdef_layout(m);
1245
+ size_t size;
1246
+
1247
+ char* data = upb_encode_ex(msg, layout, 0, tmp_arena, &size);
1248
+ upb_msg* new_msg = upb_msg_new(m, arena);
1249
+
1250
+ if (!data || !upb_decode(data, size, new_msg, layout, arena)) {
1251
+ upb_arena_free(tmp_arena);
1252
+ rb_raise(cParseError, "Error occurred copying proto");
1253
+ }
1254
+
1255
+ upb_arena_free(tmp_arena);
1256
+ return new_msg;
1257
+ }
1258
+
1259
+ const upb_msg* Message_GetUpbMessage(VALUE value, const upb_msgdef* m,
1260
+ const char* name, upb_arena* arena) {
1261
+ if (value == Qnil) {
1262
+ rb_raise(cTypeError, "nil message not allowed here.");
734
1263
  }
1264
+
1265
+ VALUE klass = CLASS_OF(value);
1266
+ VALUE desc_rb = rb_ivar_get(klass, descriptor_instancevar_interned);
1267
+ const upb_msgdef* val_m =
1268
+ desc_rb == Qnil ? NULL : Descriptor_GetMsgDef(desc_rb);
1269
+
1270
+ if (val_m != m) {
1271
+ // Check for possible implicit conversions
1272
+ // TODO: hash conversion?
1273
+
1274
+ switch (upb_msgdef_wellknowntype(m)) {
1275
+ case UPB_WELLKNOWN_TIMESTAMP: {
1276
+ // Time -> Google::Protobuf::Timestamp
1277
+ upb_msg *msg = upb_msg_new(m, arena);
1278
+ upb_msgval sec, nsec;
1279
+ struct timespec time;
1280
+ const upb_fielddef *sec_f = upb_msgdef_itof(m, 1);
1281
+ const upb_fielddef *nsec_f = upb_msgdef_itof(m, 2);
1282
+
1283
+ if (!rb_obj_is_kind_of(value, rb_cTime)) goto badtype;
1284
+
1285
+ time = rb_time_timespec(value);
1286
+ sec.int64_val = time.tv_sec;
1287
+ nsec.int32_val = time.tv_nsec;
1288
+ upb_msg_set(msg, sec_f, sec, arena);
1289
+ upb_msg_set(msg, nsec_f, nsec, arena);
1290
+ return msg;
1291
+ }
1292
+ case UPB_WELLKNOWN_DURATION: {
1293
+ // Numeric -> Google::Protobuf::Duration
1294
+ upb_msg *msg = upb_msg_new(m, arena);
1295
+ upb_msgval sec, nsec;
1296
+ const upb_fielddef *sec_f = upb_msgdef_itof(m, 1);
1297
+ const upb_fielddef *nsec_f = upb_msgdef_itof(m, 2);
1298
+
1299
+ if (!rb_obj_is_kind_of(value, rb_cNumeric)) goto badtype;
1300
+
1301
+ sec.int64_val = NUM2LL(value);
1302
+ nsec.int32_val = round((NUM2DBL(value) - NUM2LL(value)) * 1000000000);
1303
+ upb_msg_set(msg, sec_f, sec, arena);
1304
+ upb_msg_set(msg, nsec_f, nsec, arena);
1305
+ return msg;
1306
+ }
1307
+ default:
1308
+ badtype:
1309
+ rb_raise(cTypeError,
1310
+ "Invalid type %s to assign to submessage field '%s'.",
1311
+ rb_class2name(CLASS_OF(value)), name);
1312
+ }
1313
+
1314
+ }
1315
+
1316
+ Message* self = ruby_to_Message(value);
1317
+ Arena_fuse(self->arena, arena);
1318
+
1319
+ return self->msg;
1320
+ }
1321
+
1322
+ void Message_register(VALUE protobuf) {
1323
+ cParseError = rb_const_get(protobuf, rb_intern("ParseError"));
1324
+
1325
+ // Ruby-interned string: "descriptor". We use this identifier to store an
1326
+ // instance variable on message classes we create in order to link them back
1327
+ // to their descriptors.
1328
+ descriptor_instancevar_interned = rb_intern("descriptor");
735
1329
  }