google-protobuf 3.8.0 → 3.19.6

Sign up to get free protection for your applications and to get access to all the features.

Potentially problematic release.


This version of google-protobuf might be problematic. Click here for more details.

Files changed (38) hide show
  1. checksums.yaml +4 -4
  2. data/ext/google/protobuf_c/convert.c +348 -0
  3. data/ext/google/protobuf_c/convert.h +72 -0
  4. data/ext/google/protobuf_c/defs.c +610 -1583
  5. data/ext/google/protobuf_c/defs.h +107 -0
  6. data/ext/google/protobuf_c/extconf.rb +4 -7
  7. data/ext/google/protobuf_c/map.c +315 -476
  8. data/ext/google/protobuf_c/map.h +67 -0
  9. data/ext/google/protobuf_c/message.c +928 -448
  10. data/ext/google/protobuf_c/message.h +101 -0
  11. data/ext/google/protobuf_c/protobuf.c +400 -51
  12. data/ext/google/protobuf_c/protobuf.h +47 -545
  13. data/ext/google/protobuf_c/repeated_field.c +311 -312
  14. data/ext/google/protobuf_c/repeated_field.h +63 -0
  15. data/ext/google/protobuf_c/ruby-upb.c +9171 -0
  16. data/ext/google/protobuf_c/ruby-upb.h +4704 -0
  17. data/lib/google/protobuf/any_pb.rb +1 -1
  18. data/lib/google/protobuf/api_pb.rb +4 -3
  19. data/lib/google/protobuf/descriptor_dsl.rb +458 -0
  20. data/lib/google/protobuf/descriptor_pb.rb +268 -0
  21. data/lib/google/protobuf/duration_pb.rb +1 -1
  22. data/lib/google/protobuf/empty_pb.rb +1 -1
  23. data/lib/google/protobuf/field_mask_pb.rb +1 -1
  24. data/lib/google/protobuf/source_context_pb.rb +1 -1
  25. data/lib/google/protobuf/struct_pb.rb +4 -4
  26. data/lib/google/protobuf/timestamp_pb.rb +1 -1
  27. data/lib/google/protobuf/type_pb.rb +9 -8
  28. data/lib/google/protobuf/well_known_types.rb +13 -2
  29. data/lib/google/protobuf/wrappers_pb.rb +9 -9
  30. data/lib/google/protobuf.rb +2 -0
  31. data/tests/basic.rb +337 -70
  32. data/tests/generated_code_test.rb +0 -0
  33. data/tests/stress.rb +1 -1
  34. metadata +21 -28
  35. data/ext/google/protobuf_c/encode_decode.c +0 -1614
  36. data/ext/google/protobuf_c/storage.c +0 -1062
  37. data/ext/google/protobuf_c/upb.c +0 -17480
  38. data/ext/google/protobuf_c/upb.h +0 -10641
@@ -28,91 +28,153 @@
28
28
  // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29
29
  // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
30
 
31
+ #include "message.h"
32
+
33
+ #include "convert.h"
34
+ #include "defs.h"
35
+ #include "map.h"
31
36
  #include "protobuf.h"
37
+ #include "repeated_field.h"
32
38
 
33
- // -----------------------------------------------------------------------------
34
- // Class/module creation from msgdefs and enumdefs, respectively.
35
- // -----------------------------------------------------------------------------
39
+ static VALUE cParseError = Qnil;
40
+ static ID descriptor_instancevar_interned;
36
41
 
37
- void* Message_data(void* msg) {
38
- return ((uint8_t *)msg) + sizeof(MessageHeader);
42
+ static VALUE initialize_rb_class_with_no_args(VALUE klass) {
43
+ return rb_funcall(klass, rb_intern("new"), 0);
39
44
  }
40
45
 
41
- void Message_mark(void* _self) {
42
- MessageHeader* self = (MessageHeader *)_self;
43
- layout_mark(self->descriptor->layout, Message_data(self));
46
+ VALUE MessageOrEnum_GetDescriptor(VALUE klass) {
47
+ return rb_ivar_get(klass, descriptor_instancevar_interned);
44
48
  }
45
49
 
46
- void Message_free(void* self) {
47
- stringsink* unknown = ((MessageHeader *)self)->unknown_fields;
48
- if (unknown != NULL) {
49
- stringsink_uninit(unknown);
50
- free(unknown);
51
- }
52
- xfree(self);
50
+ // -----------------------------------------------------------------------------
51
+ // Class/module creation from msgdefs and enumdefs, respectively.
52
+ // -----------------------------------------------------------------------------
53
+
54
+ typedef struct {
55
+ VALUE arena;
56
+ const upb_msg* msg; // Can get as mutable when non-frozen.
57
+ const upb_msgdef* msgdef; // kept alive by self.class.descriptor reference.
58
+ } Message;
59
+
60
+ static void Message_mark(void* _self) {
61
+ Message* self = (Message *)_self;
62
+ rb_gc_mark(self->arena);
53
63
  }
54
64
 
55
- rb_data_type_t Message_type = {
65
+ static rb_data_type_t Message_type = {
56
66
  "Message",
57
- { Message_mark, Message_free, NULL },
67
+ { Message_mark, RUBY_DEFAULT_FREE, NULL },
68
+ .flags = RUBY_TYPED_FREE_IMMEDIATELY,
58
69
  };
59
70
 
60
- VALUE Message_alloc(VALUE klass) {
71
+ static Message* ruby_to_Message(VALUE msg_rb) {
72
+ Message* msg;
73
+ TypedData_Get_Struct(msg_rb, Message, &Message_type, msg);
74
+ return msg;
75
+ }
76
+
77
+ static VALUE Message_alloc(VALUE klass) {
61
78
  VALUE descriptor = rb_ivar_get(klass, descriptor_instancevar_interned);
62
- Descriptor* desc = ruby_to_Descriptor(descriptor);
63
- MessageHeader* msg = (MessageHeader*)ALLOC_N(
64
- uint8_t, sizeof(MessageHeader) + desc->layout->size);
79
+ Message* msg = ALLOC(Message);
65
80
  VALUE ret;
66
81
 
67
- memset(Message_data(msg), 0, desc->layout->size);
82
+ msg->msgdef = Descriptor_GetMsgDef(descriptor);
83
+ msg->arena = Qnil;
84
+ msg->msg = NULL;
68
85
 
69
- // We wrap first so that everything in the message object is GC-rooted in case
70
- // a collection happens during object creation in layout_init().
71
86
  ret = TypedData_Wrap_Struct(klass, &Message_type, msg);
72
- msg->descriptor = desc;
73
87
  rb_ivar_set(ret, descriptor_instancevar_interned, descriptor);
74
88
 
75
- msg->unknown_fields = NULL;
89
+ return ret;
90
+ }
91
+
92
+ const upb_msg *Message_Get(VALUE msg_rb, const upb_msgdef **m) {
93
+ Message* msg = ruby_to_Message(msg_rb);
94
+ if (m) *m = msg->msgdef;
95
+ return msg->msg;
96
+ }
76
97
 
77
- layout_init(desc->layout, Message_data(msg));
98
+ upb_msg *Message_GetMutable(VALUE msg_rb, const upb_msgdef **m) {
99
+ rb_check_frozen(msg_rb);
100
+ return (upb_msg*)Message_Get(msg_rb, m);
101
+ }
78
102
 
79
- return ret;
103
+ void Message_InitPtr(VALUE self_, upb_msg *msg, VALUE arena) {
104
+ Message* self = ruby_to_Message(self_);
105
+ self->msg = msg;
106
+ self->arena = arena;
107
+ ObjectCache_Add(msg, self_);
80
108
  }
81
109
 
82
- static const upb_fielddef* which_oneof_field(MessageHeader* self, const upb_oneofdef* o) {
83
- upb_oneof_iter it;
84
- size_t case_ofs;
85
- uint32_t oneof_case;
86
- const upb_fielddef* first_field;
87
- const upb_fielddef* f;
110
+ VALUE Message_GetArena(VALUE msg_rb) {
111
+ Message* msg = ruby_to_Message(msg_rb);
112
+ return msg->arena;
113
+ }
88
114
 
89
- // If no fields in the oneof, always nil.
90
- if (upb_oneofdef_numfields(o) == 0) {
91
- return NULL;
115
+ void Message_CheckClass(VALUE klass) {
116
+ if (rb_get_alloc_func(klass) != &Message_alloc) {
117
+ rb_raise(rb_eArgError,
118
+ "Message class was not returned by the DescriptorPool.");
92
119
  }
93
- // Grab the first field in the oneof so we can get its layout info to find the
94
- // oneof_case field.
95
- upb_oneof_begin(&it, o);
96
- assert(!upb_oneof_done(&it));
97
- first_field = upb_oneof_iter_field(&it);
98
- assert(upb_fielddef_containingoneof(first_field) != NULL);
120
+ }
99
121
 
100
- case_ofs =
101
- self->descriptor->layout->
102
- fields[upb_fielddef_index(first_field)].case_offset;
103
- oneof_case = *((uint32_t*)((char*)Message_data(self) + case_ofs));
122
+ VALUE Message_GetRubyWrapper(upb_msg* msg, const upb_msgdef* m, VALUE arena) {
123
+ if (msg == NULL) return Qnil;
104
124
 
105
- if (oneof_case == ONEOF_CASE_NONE) {
106
- return NULL;
125
+ VALUE val = ObjectCache_Get(msg);
126
+
127
+ if (val == Qnil) {
128
+ VALUE klass = Descriptor_DefToClass(m);
129
+ val = Message_alloc(klass);
130
+ Message_InitPtr(val, msg, arena);
107
131
  }
108
132
 
109
- // oneof_case is a field index, so find that field.
110
- f = upb_oneofdef_itof(o, oneof_case);
111
- assert(f != NULL);
133
+ return val;
134
+ }
135
+
136
+ void Message_PrintMessage(StringBuilder* b, const upb_msg* msg,
137
+ const upb_msgdef* m) {
138
+ bool first = true;
139
+ int n = upb_msgdef_fieldcount(m);
140
+ VALUE klass = Descriptor_DefToClass(m);
141
+ StringBuilder_Printf(b, "<%s: ", rb_class2name(klass));
142
+
143
+ for (int i = 0; i < n; i++) {
144
+ const upb_fielddef* field = upb_msgdef_field(m, i);
145
+
146
+ if (upb_fielddef_haspresence(field) && !upb_msg_has(msg, field)) {
147
+ continue;
148
+ }
149
+
150
+ if (!first) {
151
+ StringBuilder_Printf(b, ", ");
152
+ } else {
153
+ first = false;
154
+ }
155
+
156
+ upb_msgval msgval = upb_msg_get(msg, field);
157
+
158
+ StringBuilder_Printf(b, "%s: ", upb_fielddef_name(field));
112
159
 
113
- return f;
160
+ if (upb_fielddef_ismap(field)) {
161
+ const upb_msgdef* entry_m = upb_fielddef_msgsubdef(field);
162
+ const upb_fielddef* key_f = upb_msgdef_itof(entry_m, 1);
163
+ const upb_fielddef* val_f = upb_msgdef_itof(entry_m, 2);
164
+ TypeInfo val_info = TypeInfo_get(val_f);
165
+ Map_Inspect(b, msgval.map_val, upb_fielddef_type(key_f), val_info);
166
+ } else if (upb_fielddef_isseq(field)) {
167
+ RepeatedField_Inspect(b, msgval.array_val, TypeInfo_get(field));
168
+ } else {
169
+ StringBuilder_PrintMsgval(b, msgval, TypeInfo_get(field));
170
+ }
171
+ }
172
+
173
+ StringBuilder_Printf(b, ">");
114
174
  }
115
175
 
176
+ // Helper functions for #method_missing ////////////////////////////////////////
177
+
116
178
  enum {
117
179
  METHOD_UNKNOWN = 0,
118
180
  METHOD_GETTER = 1,
@@ -125,133 +187,203 @@ enum {
125
187
  };
126
188
 
127
189
  // Check if the field is a well known wrapper type
128
- static bool is_wrapper_type_field(const upb_fielddef* field) {
129
- char* field_type_name = rb_class2name(field_type_class(field));
130
-
131
- return strcmp(field_type_name, "Google::Protobuf::DoubleValue") == 0 ||
132
- strcmp(field_type_name, "Google::Protobuf::FloatValue") == 0 ||
133
- strcmp(field_type_name, "Google::Protobuf::Int32Value") == 0 ||
134
- strcmp(field_type_name, "Google::Protobuf::Int64Value") == 0 ||
135
- strcmp(field_type_name, "Google::Protobuf::UInt32Value") == 0 ||
136
- strcmp(field_type_name, "Google::Protobuf::UInt64Value") == 0 ||
137
- strcmp(field_type_name, "Google::Protobuf::BoolValue") == 0 ||
138
- strcmp(field_type_name, "Google::Protobuf::StringValue") == 0 ||
139
- strcmp(field_type_name, "Google::Protobuf::BytesValue") == 0;
140
- }
141
-
142
- // Get a new Ruby wrapper type and set the initial value
143
- static VALUE ruby_wrapper_type(const upb_fielddef* field, const VALUE* value) {
144
- if (is_wrapper_type_field(field) && value != Qnil) {
145
- VALUE hash = rb_hash_new();
146
- rb_hash_aset(hash, rb_str_new2("value"), value);
147
- VALUE args[1] = { hash };
148
- return rb_class_new_instance(1, args, field_type_class(field));
190
+ static bool IsWrapper(const upb_fielddef* f) {
191
+ return upb_fielddef_issubmsg(f) &&
192
+ upb_msgdef_iswrapper(upb_fielddef_msgsubdef(f));
193
+ }
194
+
195
+ static bool Match(const upb_msgdef* m, const char* name, const upb_fielddef** f,
196
+ const upb_oneofdef** o, const char* prefix,
197
+ const char* suffix) {
198
+ size_t sp = strlen(prefix);
199
+ size_t ss = strlen(suffix);
200
+ size_t sn = strlen(name);
201
+
202
+ if (sn <= sp + ss) return false;
203
+
204
+ if (memcmp(name, prefix, sp) != 0 ||
205
+ memcmp(name + sn - ss, suffix, ss) != 0) {
206
+ return false;
149
207
  }
150
- return Qnil;
208
+
209
+ return upb_msgdef_lookupname(m, name + sp, sn - sp - ss, f, o);
151
210
  }
152
211
 
153
- static int extract_method_call(VALUE method_name, MessageHeader* self,
154
- const upb_fielddef **f, const upb_oneofdef **o) {
212
+ static int extract_method_call(VALUE method_name, Message* self,
213
+ const upb_fielddef** f, const upb_oneofdef** o) {
214
+ const upb_msgdef* m = self->msgdef;
215
+ const char* name;
216
+
155
217
  Check_Type(method_name, T_SYMBOL);
218
+ name = rb_id2name(SYM2ID(method_name));
219
+
220
+ if (Match(m, name, f, o, "", "")) return METHOD_GETTER;
221
+ if (Match(m, name, f, o, "", "=")) return METHOD_SETTER;
222
+ if (Match(m, name, f, o, "clear_", "")) return METHOD_CLEAR;
223
+ if (Match(m, name, f, o, "has_", "?") &&
224
+ (*o || (*f && upb_fielddef_haspresence(*f)))) {
225
+ // Disallow oneof hazzers for proto3.
226
+ // TODO(haberman): remove this test when we are enabling oneof hazzers for
227
+ // proto3.
228
+ if (*f && !upb_fielddef_issubmsg(*f) &&
229
+ upb_fielddef_realcontainingoneof(*f) &&
230
+ upb_msgdef_syntax(upb_fielddef_containingtype(*f)) !=
231
+ UPB_SYNTAX_PROTO2) {
232
+ return METHOD_UNKNOWN;
233
+ }
234
+ return METHOD_PRESENCE;
235
+ }
236
+ if (Match(m, name, f, o, "", "_as_value") && *f && !upb_fielddef_isseq(*f) &&
237
+ IsWrapper(*f)) {
238
+ return METHOD_WRAPPER_GETTER;
239
+ }
240
+ if (Match(m, name, f, o, "", "_as_value=") && *f && !upb_fielddef_isseq(*f) &&
241
+ IsWrapper(*f)) {
242
+ return METHOD_WRAPPER_SETTER;
243
+ }
244
+ if (Match(m, name, f, o, "", "_const") && *f &&
245
+ upb_fielddef_type(*f) == UPB_TYPE_ENUM) {
246
+ return METHOD_ENUM_GETTER;
247
+ }
156
248
 
157
- VALUE method_str = rb_id2str(SYM2ID(method_name));
158
- char* name = RSTRING_PTR(method_str);
159
- size_t name_len = RSTRING_LEN(method_str);
160
- int accessor_type;
161
- const upb_oneofdef* test_o;
162
- const upb_fielddef* test_f;
163
-
164
- if (name[name_len - 1] == '=') {
165
- accessor_type = METHOD_SETTER;
166
- name_len--;
167
- // We want to ensure if the proto has something named clear_foo or has_foo?,
168
- // we don't strip the prefix.
169
- } else if (strncmp("clear_", name, 6) == 0 &&
170
- !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
171
- &test_f, &test_o)) {
172
- accessor_type = METHOD_CLEAR;
173
- name = name + 6;
174
- name_len = name_len - 6;
175
- } else if (strncmp("has_", name, 4) == 0 && name[name_len - 1] == '?' &&
176
- !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
177
- &test_f, &test_o)) {
178
- accessor_type = METHOD_PRESENCE;
179
- name = name + 4;
180
- name_len = name_len - 5;
181
- } else {
182
- accessor_type = METHOD_GETTER;
183
- }
184
-
185
- bool has_field = upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
186
- &test_f, &test_o);
187
-
188
- // Look for wrapper type accessor of the form <field_name>_as_value
189
- if (!has_field &&
190
- (accessor_type == METHOD_GETTER || accessor_type == METHOD_SETTER) &&
191
- name_len > 9 && strncmp(name + name_len - 9, "_as_value", 9) == 0) {
192
- // Find the field name
193
- char wrapper_field_name[name_len - 8];
194
- strncpy(wrapper_field_name, name, name_len - 9);
195
- wrapper_field_name[name_len - 7] = '\0';
196
-
197
- // Check if field exists and is a wrapper type
198
- const upb_oneofdef* test_o_wrapper;
199
- const upb_fielddef* test_f_wrapper;
200
- if (upb_msgdef_lookupname(self->descriptor->msgdef, wrapper_field_name, name_len - 9,
201
- &test_f_wrapper, &test_o_wrapper) &&
202
- upb_fielddef_type(test_f_wrapper) == UPB_TYPE_MESSAGE &&
203
- is_wrapper_type_field(test_f_wrapper)) {
204
- // It does exist!
205
- has_field = true;
206
- if (accessor_type == METHOD_SETTER) {
207
- accessor_type = METHOD_WRAPPER_SETTER;
208
- } else {
209
- accessor_type = METHOD_WRAPPER_GETTER;
249
+ return METHOD_UNKNOWN;
250
+ }
251
+
252
+ static VALUE Message_oneof_accessor(VALUE _self, const upb_oneofdef* o,
253
+ int accessor_type) {
254
+ Message* self = ruby_to_Message(_self);
255
+ const upb_fielddef* oneof_field = upb_msg_whichoneof(self->msg, o);
256
+
257
+ switch (accessor_type) {
258
+ case METHOD_PRESENCE:
259
+ return oneof_field == NULL ? Qfalse : Qtrue;
260
+ case METHOD_CLEAR:
261
+ if (oneof_field != NULL) {
262
+ upb_msg_clearfield(Message_GetMutable(_self, NULL), oneof_field);
210
263
  }
211
- test_o = test_o_wrapper;
212
- test_f = test_f_wrapper;
213
- }
264
+ return Qnil;
265
+ case METHOD_GETTER:
266
+ return oneof_field == NULL
267
+ ? Qnil
268
+ : ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
269
+ case METHOD_SETTER:
270
+ rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
214
271
  }
272
+ rb_raise(rb_eRuntimeError, "Invalid access of oneof field.");
273
+ }
215
274
 
216
- // Look for enum accessor of the form <enum_name>_const
217
- if (!has_field && accessor_type == METHOD_GETTER &&
218
- name_len > 6 && strncmp(name + name_len - 6, "_const", 6) == 0) {
219
-
220
- // Find enum field name
221
- char enum_name[name_len - 5];
222
- strncpy(enum_name, name, name_len - 6);
223
- enum_name[name_len - 4] = '\0';
224
-
225
- // Check if enum field exists
226
- const upb_oneofdef* test_o_enum;
227
- const upb_fielddef* test_f_enum;
228
- if (upb_msgdef_lookupname(self->descriptor->msgdef, enum_name, name_len - 6,
229
- &test_f_enum, &test_o_enum) &&
230
- upb_fielddef_type(test_f_enum) == UPB_TYPE_ENUM) {
231
- // It does exist!
232
- has_field = true;
233
- accessor_type = METHOD_ENUM_GETTER;
234
- test_o = test_o_enum;
235
- test_f = test_f_enum;
275
+ static void Message_setfield(upb_msg* msg, const upb_fielddef* f, VALUE val,
276
+ upb_arena* arena) {
277
+ upb_msgval msgval;
278
+ if (upb_fielddef_ismap(f)) {
279
+ msgval.map_val = Map_GetUpbMap(val, f, arena);
280
+ } else if (upb_fielddef_isseq(f)) {
281
+ msgval.array_val = RepeatedField_GetUpbArray(val, f, arena);
282
+ } else {
283
+ if (val == Qnil &&
284
+ (upb_fielddef_issubmsg(f) || upb_fielddef_realcontainingoneof(f))) {
285
+ upb_msg_clearfield(msg, f);
286
+ return;
236
287
  }
288
+ msgval =
289
+ Convert_RubyToUpb(val, upb_fielddef_name(f), TypeInfo_get(f), arena);
237
290
  }
291
+ upb_msg_set(msg, f, msgval, arena);
292
+ }
238
293
 
239
- // Verify the name corresponds to a oneof or field in this message.
240
- if (!has_field) {
241
- return METHOD_UNKNOWN;
294
+ VALUE Message_getfield(VALUE _self, const upb_fielddef* f) {
295
+ Message* self = ruby_to_Message(_self);
296
+ // This is a special-case: upb_msg_mutable() for map & array are logically
297
+ // const (they will not change what is serialized) but physically
298
+ // non-const, as they do allocate a repeated field or map. The logical
299
+ // constness means it's ok to do even if the message is frozen.
300
+ upb_msg *msg = (upb_msg*)self->msg;
301
+ upb_arena *arena = Arena_get(self->arena);
302
+ if (upb_fielddef_ismap(f)) {
303
+ upb_map *map = upb_msg_mutable(msg, f, arena).map;
304
+ const upb_fielddef *key_f = map_field_key(f);
305
+ const upb_fielddef *val_f = map_field_value(f);
306
+ upb_fieldtype_t key_type = upb_fielddef_type(key_f);
307
+ TypeInfo value_type_info = TypeInfo_get(val_f);
308
+ return Map_GetRubyWrapper(map, key_type, value_type_info, self->arena);
309
+ } else if (upb_fielddef_isseq(f)) {
310
+ upb_array *arr = upb_msg_mutable(msg, f, arena).array;
311
+ return RepeatedField_GetRubyWrapper(arr, TypeInfo_get(f), self->arena);
312
+ } else if (upb_fielddef_issubmsg(f)) {
313
+ if (!upb_msg_has(self->msg, f)) return Qnil;
314
+ upb_msg *submsg = upb_msg_mutable(msg, f, arena).msg;
315
+ const upb_msgdef *m = upb_fielddef_msgsubdef(f);
316
+ return Message_GetRubyWrapper(submsg, m, self->arena);
317
+ } else {
318
+ upb_msgval msgval = upb_msg_get(self->msg, f);
319
+ return Convert_UpbToRuby(msgval, TypeInfo_get(f), self->arena);
242
320
  }
321
+ }
243
322
 
244
- // Method calls like 'has_foo?' are not allowed if field "foo" does not have
245
- // a hasbit (e.g. repeated fields or non-message type fields for proto3
246
- // syntax).
247
- if (accessor_type == METHOD_PRESENCE && test_f != NULL &&
248
- !upb_fielddef_haspresence(test_f)) {
249
- return METHOD_UNKNOWN;
250
- }
323
+ static VALUE Message_field_accessor(VALUE _self, const upb_fielddef* f,
324
+ int accessor_type, int argc, VALUE* argv) {
325
+ upb_arena *arena = Arena_get(Message_GetArena(_self));
251
326
 
252
- *o = test_o;
253
- *f = test_f;
254
- return accessor_type;
327
+ switch (accessor_type) {
328
+ case METHOD_SETTER:
329
+ Message_setfield(Message_GetMutable(_self, NULL), f, argv[1], arena);
330
+ return Qnil;
331
+ case METHOD_CLEAR:
332
+ upb_msg_clearfield(Message_GetMutable(_self, NULL), f);
333
+ return Qnil;
334
+ case METHOD_PRESENCE:
335
+ if (!upb_fielddef_haspresence(f)) {
336
+ rb_raise(rb_eRuntimeError, "Field does not have presence.");
337
+ }
338
+ return upb_msg_has(Message_Get(_self, NULL), f);
339
+ case METHOD_WRAPPER_GETTER: {
340
+ Message* self = ruby_to_Message(_self);
341
+ if (upb_msg_has(self->msg, f)) {
342
+ PBRUBY_ASSERT(upb_fielddef_issubmsg(f) && !upb_fielddef_isseq(f));
343
+ upb_msgval wrapper = upb_msg_get(self->msg, f);
344
+ const upb_msgdef *wrapper_m = upb_fielddef_msgsubdef(f);
345
+ const upb_fielddef *value_f = upb_msgdef_itof(wrapper_m, 1);
346
+ upb_msgval value = upb_msg_get(wrapper.msg_val, value_f);
347
+ return Convert_UpbToRuby(value, TypeInfo_get(value_f), self->arena);
348
+ } else {
349
+ return Qnil;
350
+ }
351
+ }
352
+ case METHOD_WRAPPER_SETTER: {
353
+ upb_msg *msg = Message_GetMutable(_self, NULL);
354
+ if (argv[1] == Qnil) {
355
+ upb_msg_clearfield(msg, f);
356
+ } else {
357
+ const upb_fielddef *val_f = upb_msgdef_itof(upb_fielddef_msgsubdef(f), 1);
358
+ upb_msgval msgval = Convert_RubyToUpb(argv[1], upb_fielddef_name(f),
359
+ TypeInfo_get(val_f), arena);
360
+ upb_msg *wrapper = upb_msg_mutable(msg, f, arena).msg;
361
+ upb_msg_set(wrapper, val_f, msgval, arena);
362
+ }
363
+ return Qnil;
364
+ }
365
+ case METHOD_ENUM_GETTER: {
366
+ upb_msgval msgval = upb_msg_get(Message_Get(_self, NULL), f);
367
+
368
+ if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
369
+ // Map repeated fields to a new type with ints
370
+ VALUE arr = rb_ary_new();
371
+ size_t i, n = upb_array_size(msgval.array_val);
372
+ for (i = 0; i < n; i++) {
373
+ upb_msgval elem = upb_array_get(msgval.array_val, i);
374
+ rb_ary_push(arr, INT2NUM(elem.int32_val));
375
+ }
376
+ return arr;
377
+ } else {
378
+ return INT2NUM(msgval.int32_val);
379
+ }
380
+ }
381
+ case METHOD_GETTER:
382
+ return Message_getfield(_self, f);
383
+ default:
384
+ rb_raise(rb_eRuntimeError, "Internal error, no such accessor: %d",
385
+ accessor_type);
386
+ }
255
387
  }
256
388
 
257
389
  /*
@@ -281,102 +413,56 @@ static int extract_method_call(VALUE method_name, MessageHeader* self,
281
413
  * true if the field 'fieldname' is set in the message object, else false. For
282
414
  * 'proto3' syntax, calling this for a basic type field will result in an error.
283
415
  */
284
- VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
285
- MessageHeader* self;
416
+ static VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
417
+ Message* self = ruby_to_Message(_self);
286
418
  const upb_oneofdef* o;
287
419
  const upb_fielddef* f;
420
+ int accessor_type;
288
421
 
289
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
290
422
  if (argc < 1) {
291
423
  rb_raise(rb_eArgError, "Expected method name as first argument.");
292
424
  }
293
425
 
294
- int accessor_type = extract_method_call(argv[0], self, &f, &o);
295
- if (accessor_type == METHOD_UNKNOWN || (o == NULL && f == NULL) ) {
296
- return rb_call_super(argc, argv);
297
- } else if (accessor_type == METHOD_SETTER || accessor_type == METHOD_WRAPPER_SETTER) {
298
- if (argc != 2) {
299
- rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
300
- }
301
- rb_check_frozen(_self);
302
- } else if (argc != 1) {
303
- rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
304
- }
426
+ accessor_type = extract_method_call(argv[0], self, &f, &o);
305
427
 
306
- // Return which of the oneof fields are set
307
- if (o != NULL) {
308
- if (accessor_type == METHOD_SETTER) {
309
- rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
310
- }
428
+ if (accessor_type == METHOD_UNKNOWN) return rb_call_super(argc, argv);
311
429
 
312
- const upb_fielddef* oneof_field = which_oneof_field(self, o);
313
- if (accessor_type == METHOD_PRESENCE) {
314
- return oneof_field == NULL ? Qfalse : Qtrue;
315
- } else if (accessor_type == METHOD_CLEAR) {
316
- if (oneof_field != NULL) {
317
- layout_clear(self->descriptor->layout, Message_data(self), oneof_field);
430
+ // Validate argument count.
431
+ switch (accessor_type) {
432
+ case METHOD_SETTER:
433
+ case METHOD_WRAPPER_SETTER:
434
+ if (argc != 2) {
435
+ rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
318
436
  }
319
- return Qnil;
320
- } else {
321
- // METHOD_ACCESSOR
322
- return oneof_field == NULL ? Qnil :
323
- ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
324
- }
325
- // Otherwise we're operating on a single proto field
326
- } else if (accessor_type == METHOD_SETTER) {
327
- layout_set(self->descriptor->layout, Message_data(self), f, argv[1]);
328
- return Qnil;
329
- } else if (accessor_type == METHOD_CLEAR) {
330
- layout_clear(self->descriptor->layout, Message_data(self), f);
331
- return Qnil;
332
- } else if (accessor_type == METHOD_PRESENCE) {
333
- return layout_has(self->descriptor->layout, Message_data(self), f);
334
- } else if (accessor_type == METHOD_WRAPPER_GETTER) {
335
- VALUE value = layout_get(self->descriptor->layout, Message_data(self), f);
336
- if (value != Qnil) {
337
- value = rb_funcall(value, rb_intern("value"), 0);
338
- }
339
- return value;
340
- } else if (accessor_type == METHOD_WRAPPER_SETTER) {
341
- VALUE wrapper = ruby_wrapper_type(f, argv[1]);
342
- layout_set(self->descriptor->layout, Message_data(self), f, wrapper);
343
- return Qnil;
344
- } else if (accessor_type == METHOD_ENUM_GETTER) {
345
- VALUE enum_type = field_type_class(f);
346
- VALUE method = rb_intern("const_get");
347
- VALUE raw_value = layout_get(self->descriptor->layout, Message_data(self), f);
348
-
349
- // Map repeated fields to a new type with ints
350
- if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
351
- int array_size = FIX2INT(rb_funcall(raw_value, rb_intern("length"), 0));
352
- VALUE array_args[1] = { ID2SYM(rb_intern("int64")) };
353
- VALUE array = rb_class_new_instance(1, array_args, CLASS_OF(raw_value));
354
- for (int i = 0; i < array_size; i++) {
355
- VALUE entry = rb_funcall(enum_type, method, 1, rb_funcall(raw_value,
356
- rb_intern("at"), 1, INT2NUM(i)));
357
- rb_funcall(array, rb_intern("push"), 1, entry);
437
+ rb_check_frozen(_self);
438
+ break;
439
+ default:
440
+ if (argc != 1) {
441
+ rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
358
442
  }
359
- return array;
360
- }
361
- // Convert the value for singular fields
362
- return rb_funcall(enum_type, method, 1, raw_value);
443
+ break;
444
+ }
445
+
446
+ // Dispatch accessor.
447
+ if (o != NULL) {
448
+ return Message_oneof_accessor(_self, o, accessor_type);
363
449
  } else {
364
- return layout_get(self->descriptor->layout, Message_data(self), f);
450
+ return Message_field_accessor(_self, f, accessor_type, argc, argv);
365
451
  }
366
452
  }
367
453
 
368
-
369
- VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
370
- MessageHeader* self;
454
+ static VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
455
+ Message* self = ruby_to_Message(_self);
371
456
  const upb_oneofdef* o;
372
457
  const upb_fielddef* f;
458
+ int accessor_type;
373
459
 
374
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
375
460
  if (argc < 1) {
376
461
  rb_raise(rb_eArgError, "Expected method name as first argument.");
377
462
  }
378
463
 
379
- int accessor_type = extract_method_call(argv[0], self, &f, &o);
464
+ accessor_type = extract_method_call(argv[0], self, &f, &o);
465
+
380
466
  if (accessor_type == METHOD_UNKNOWN) {
381
467
  return rb_call_super(argc, argv);
382
468
  } else if (o != NULL) {
@@ -386,22 +472,116 @@ VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
386
472
  }
387
473
  }
388
474
 
389
- VALUE create_submsg_from_hash(const upb_fielddef *f, VALUE hash) {
390
- const upb_def *d = upb_fielddef_subdef(f);
391
- assert(d != NULL);
475
+ void Message_InitFromValue(upb_msg* msg, const upb_msgdef* m, VALUE val,
476
+ upb_arena* arena);
477
+
478
+ typedef struct {
479
+ upb_map *map;
480
+ TypeInfo key_type;
481
+ TypeInfo val_type;
482
+ upb_arena *arena;
483
+ } MapInit;
484
+
485
+ static int Map_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
486
+ MapInit *map_init = (MapInit*)_self;
487
+ upb_msgval k, v;
488
+ k = Convert_RubyToUpb(key, "", map_init->key_type, NULL);
489
+
490
+ if (map_init->val_type.type == UPB_TYPE_MESSAGE && TYPE(val) == T_HASH) {
491
+ upb_msg *msg = upb_msg_new(map_init->val_type.def.msgdef, map_init->arena);
492
+ Message_InitFromValue(msg, map_init->val_type.def.msgdef, val,
493
+ map_init->arena);
494
+ v.msg_val = msg;
495
+ } else {
496
+ v = Convert_RubyToUpb(val, "", map_init->val_type, map_init->arena);
497
+ }
498
+ upb_map_set(map_init->map, k, v, map_init->arena);
499
+ return ST_CONTINUE;
500
+ }
392
501
 
393
- VALUE descriptor = get_def_obj(d);
394
- VALUE msgclass = rb_funcall(descriptor, rb_intern("msgclass"), 0, NULL);
502
+ static void Map_InitFromValue(upb_map* map, const upb_fielddef* f, VALUE val,
503
+ upb_arena* arena) {
504
+ const upb_msgdef* entry_m = upb_fielddef_msgsubdef(f);
505
+ const upb_fielddef* key_f = upb_msgdef_itof(entry_m, 1);
506
+ const upb_fielddef* val_f = upb_msgdef_itof(entry_m, 2);
507
+ if (TYPE(val) != T_HASH) {
508
+ rb_raise(rb_eArgError,
509
+ "Expected Hash object as initializer value for map field '%s' "
510
+ "(given %s).",
511
+ upb_fielddef_name(f), rb_class2name(CLASS_OF(val)));
512
+ }
513
+ MapInit map_init = {map, TypeInfo_get(key_f), TypeInfo_get(val_f), arena};
514
+ rb_hash_foreach(val, Map_initialize_kwarg, (VALUE)&map_init);
515
+ }
395
516
 
396
- VALUE args[1] = { hash };
397
- return rb_class_new_instance(1, args, msgclass);
517
+ static upb_msgval MessageValue_FromValue(VALUE val, TypeInfo info,
518
+ upb_arena* arena) {
519
+ if (info.type == UPB_TYPE_MESSAGE) {
520
+ upb_msgval msgval;
521
+ upb_msg* msg = upb_msg_new(info.def.msgdef, arena);
522
+ Message_InitFromValue(msg, info.def.msgdef, val, arena);
523
+ msgval.msg_val = msg;
524
+ return msgval;
525
+ } else {
526
+ return Convert_RubyToUpb(val, "", info, arena);
527
+ }
398
528
  }
399
529
 
400
- int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
401
- MessageHeader* self;
402
- char *name;
403
- const upb_fielddef* f;
404
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
530
+ static void RepeatedField_InitFromValue(upb_array* arr, const upb_fielddef* f,
531
+ VALUE val, upb_arena* arena) {
532
+ TypeInfo type_info = TypeInfo_get(f);
533
+
534
+ if (TYPE(val) != T_ARRAY) {
535
+ rb_raise(rb_eArgError,
536
+ "Expected array as initializer value for repeated field '%s' (given %s).",
537
+ upb_fielddef_name(f), rb_class2name(CLASS_OF(val)));
538
+ }
539
+
540
+ for (int i = 0; i < RARRAY_LEN(val); i++) {
541
+ VALUE entry = rb_ary_entry(val, i);
542
+ upb_msgval msgval;
543
+ if (upb_fielddef_issubmsg(f) && TYPE(entry) == T_HASH) {
544
+ msgval = MessageValue_FromValue(entry, type_info, arena);
545
+ } else {
546
+ msgval = Convert_RubyToUpb(entry, upb_fielddef_name(f), type_info, arena);
547
+ }
548
+ upb_array_append(arr, msgval, arena);
549
+ }
550
+ }
551
+
552
+ static void Message_InitFieldFromValue(upb_msg* msg, const upb_fielddef* f,
553
+ VALUE val, upb_arena* arena) {
554
+ if (TYPE(val) == T_NIL) return;
555
+
556
+ if (upb_fielddef_ismap(f)) {
557
+ upb_map *map = upb_msg_mutable(msg, f, arena).map;
558
+ Map_InitFromValue(map, f, val, arena);
559
+ } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
560
+ upb_array *arr = upb_msg_mutable(msg, f, arena).array;
561
+ RepeatedField_InitFromValue(arr, f, val, arena);
562
+ } else if (upb_fielddef_issubmsg(f)) {
563
+ if (TYPE(val) == T_HASH) {
564
+ upb_msg *submsg = upb_msg_mutable(msg, f, arena).msg;
565
+ Message_InitFromValue(submsg, upb_fielddef_msgsubdef(f), val, arena);
566
+ } else {
567
+ Message_setfield(msg, f, val, arena);
568
+ }
569
+ } else {
570
+ upb_msgval msgval =
571
+ Convert_RubyToUpb(val, upb_fielddef_name(f), TypeInfo_get(f), arena);
572
+ upb_msg_set(msg, f, msgval, arena);
573
+ }
574
+ }
575
+
576
+ typedef struct {
577
+ upb_msg *msg;
578
+ const upb_msgdef *msgdef;
579
+ upb_arena *arena;
580
+ } MsgInit;
581
+
582
+ static int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
583
+ MsgInit *msg_init = (MsgInit*)_self;
584
+ const char *name;
405
585
 
406
586
  if (TYPE(key) == T_STRING) {
407
587
  name = RSTRING_PTR(key);
@@ -412,51 +592,26 @@ int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
412
592
  "Expected string or symbols as hash keys when initializing proto from hash.");
413
593
  }
414
594
 
415
- f = upb_msgdef_ntofz(self->descriptor->msgdef, name);
595
+ const upb_fielddef* f = upb_msgdef_ntofz(msg_init->msgdef, name);
596
+
416
597
  if (f == NULL) {
417
598
  rb_raise(rb_eArgError,
418
599
  "Unknown field name '%s' in initialization map entry.", name);
419
600
  }
420
601
 
421
- if (TYPE(val) == T_NIL) {
422
- return 0;
423
- }
424
-
425
- if (is_map_field(f)) {
426
- VALUE map;
427
-
428
- if (TYPE(val) != T_HASH) {
429
- rb_raise(rb_eArgError,
430
- "Expected Hash object as initializer value for map field '%s' (given %s).",
431
- name, rb_class2name(CLASS_OF(val)));
432
- }
433
- map = layout_get(self->descriptor->layout, Message_data(self), f);
434
- Map_merge_into_self(map, val);
435
- } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
436
- VALUE ary;
437
-
438
- if (TYPE(val) != T_ARRAY) {
439
- rb_raise(rb_eArgError,
440
- "Expected array as initializer value for repeated field '%s' (given %s).",
441
- name, rb_class2name(CLASS_OF(val)));
442
- }
443
- ary = layout_get(self->descriptor->layout, Message_data(self), f);
444
- for (int i = 0; i < RARRAY_LEN(val); i++) {
445
- VALUE entry = rb_ary_entry(val, i);
446
- if (TYPE(entry) == T_HASH && upb_fielddef_issubmsg(f)) {
447
- entry = create_submsg_from_hash(f, entry);
448
- }
602
+ Message_InitFieldFromValue(msg_init->msg, f, val, msg_init->arena);
603
+ return ST_CONTINUE;
604
+ }
449
605
 
450
- RepeatedField_push(ary, entry);
451
- }
606
+ void Message_InitFromValue(upb_msg* msg, const upb_msgdef* m, VALUE val,
607
+ upb_arena* arena) {
608
+ MsgInit msg_init = {msg, m, arena};
609
+ if (TYPE(val) == T_HASH) {
610
+ rb_hash_foreach(val, Message_initialize_kwarg, (VALUE)&msg_init);
452
611
  } else {
453
- if (TYPE(val) == T_HASH && upb_fielddef_issubmsg(f)) {
454
- val = create_submsg_from_hash(f, val);
455
- }
456
-
457
- layout_set(self->descriptor->layout, Message_data(self), f, val);
612
+ rb_raise(rb_eArgError, "Expected hash arguments or message, not %s",
613
+ rb_class2name(CLASS_OF(val)));
458
614
  }
459
- return 0;
460
615
  }
461
616
 
462
617
  /*
@@ -471,8 +626,13 @@ int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
471
626
  * have been added to a pool. The method definitions described here on the
472
627
  * Message class are provided on each concrete message class.
473
628
  */
474
- VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
475
- VALUE hash_args;
629
+ static VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
630
+ Message* self = ruby_to_Message(_self);
631
+ VALUE arena_rb = Arena_new();
632
+ upb_arena *arena = Arena_get(arena_rb);
633
+ upb_msg *msg = upb_msg_new(self->msgdef, arena);
634
+
635
+ Message_InitPtr(_self, msg, arena_rb);
476
636
 
477
637
  if (argc == 0) {
478
638
  return Qnil;
@@ -480,12 +640,7 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
480
640
  if (argc != 1) {
481
641
  rb_raise(rb_eArgError, "Expected 0 or 1 arguments.");
482
642
  }
483
- hash_args = argv[0];
484
- if (TYPE(hash_args) != T_HASH) {
485
- rb_raise(rb_eArgError, "Expected hash arguments.");
486
- }
487
-
488
- rb_hash_foreach(hash_args, Message_initialize_kwarg, _self);
643
+ Message_InitFromValue((upb_msg*)self->msg, self->msgdef, argv[0], arena);
489
644
  return Qnil;
490
645
  }
491
646
 
@@ -495,37 +650,40 @@ VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
495
650
  *
496
651
  * Performs a shallow copy of this message and returns the new copy.
497
652
  */
498
- VALUE Message_dup(VALUE _self) {
499
- MessageHeader* self;
500
- VALUE new_msg;
501
- MessageHeader* new_msg_self;
502
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
503
-
504
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
505
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
506
-
507
- layout_dup(self->descriptor->layout,
508
- Message_data(new_msg_self),
509
- Message_data(self));
510
-
653
+ static VALUE Message_dup(VALUE _self) {
654
+ Message* self = ruby_to_Message(_self);
655
+ VALUE new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
656
+ Message* new_msg_self = ruby_to_Message(new_msg);
657
+ size_t size = upb_msgdef_layout(self->msgdef)->size;
658
+
659
+ // TODO(copy unknown fields?)
660
+ // TODO(use official upb msg copy function)
661
+ memcpy((upb_msg*)new_msg_self->msg, self->msg, size);
662
+ Arena_fuse(self->arena, Arena_get(new_msg_self->arena));
511
663
  return new_msg;
512
664
  }
513
665
 
514
- // Internal only; used by Google::Protobuf.deep_copy.
515
- VALUE Message_deep_copy(VALUE _self) {
516
- MessageHeader* self;
517
- MessageHeader* new_msg_self;
518
- VALUE new_msg;
519
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
666
+ // Support function for Message_eq, and also used by other #eq functions.
667
+ bool Message_Equal(const upb_msg *m1, const upb_msg *m2, const upb_msgdef *m) {
668
+ if (m1 == m2) return true;
520
669
 
521
- new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
522
- TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);
670
+ size_t size1, size2;
671
+ int encode_opts = UPB_ENCODE_SKIPUNKNOWN | UPB_ENCODE_DETERMINISTIC;
672
+ upb_arena *arena_tmp = upb_arena_new();
673
+ const upb_msglayout *layout = upb_msgdef_layout(m);
523
674
 
524
- layout_deep_copy(self->descriptor->layout,
525
- Message_data(new_msg_self),
526
- Message_data(self));
675
+ // Compare deterministically serialized payloads with no unknown fields.
676
+ char *data1 = upb_encode_ex(m1, layout, encode_opts, arena_tmp, &size1);
677
+ char *data2 = upb_encode_ex(m2, layout, encode_opts, arena_tmp, &size2);
527
678
 
528
- return new_msg;
679
+ if (data1 && data2) {
680
+ bool ret = (size1 == size2) && (memcmp(data1, data2, size1) == 0);
681
+ upb_arena_free(arena_tmp);
682
+ return ret;
683
+ } else {
684
+ upb_arena_free(arena_tmp);
685
+ rb_raise(cParseError, "Error comparing messages");
686
+ }
529
687
  }
530
688
 
531
689
  /*
@@ -537,22 +695,34 @@ VALUE Message_deep_copy(VALUE _self) {
537
695
  * method's semantics (a more efficient comparison may actually be done if the
538
696
  * field is of a primitive type).
539
697
  */
540
- VALUE Message_eq(VALUE _self, VALUE _other) {
541
- MessageHeader* self;
542
- MessageHeader* other;
543
- if (TYPE(_self) != TYPE(_other)) {
544
- return Qfalse;
545
- }
546
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
547
- TypedData_Get_Struct(_other, MessageHeader, &Message_type, other);
698
+ static VALUE Message_eq(VALUE _self, VALUE _other) {
699
+ if (CLASS_OF(_self) != CLASS_OF(_other)) return Qfalse;
548
700
 
549
- if (self->descriptor != other->descriptor) {
550
- return Qfalse;
551
- }
701
+ Message* self = ruby_to_Message(_self);
702
+ Message* other = ruby_to_Message(_other);
703
+ assert(self->msgdef == other->msgdef);
704
+
705
+ return Message_Equal(self->msg, other->msg, self->msgdef) ? Qtrue : Qfalse;
706
+ }
707
+
708
+ uint64_t Message_Hash(const upb_msg* msg, const upb_msgdef* m, uint64_t seed) {
709
+ upb_arena *arena = upb_arena_new();
710
+ const char *data;
711
+ size_t size;
552
712
 
553
- return layout_eq(self->descriptor->layout,
554
- Message_data(self),
555
- Message_data(other));
713
+ // Hash a deterministically serialized payload with no unknown fields.
714
+ data = upb_encode_ex(msg, upb_msgdef_layout(m),
715
+ UPB_ENCODE_SKIPUNKNOWN | UPB_ENCODE_DETERMINISTIC, arena,
716
+ &size);
717
+
718
+ if (data) {
719
+ uint64_t ret = Wyhash(data, size, seed, kWyhashSalt);
720
+ upb_arena_free(arena);
721
+ return ret;
722
+ } else {
723
+ upb_arena_free(arena);
724
+ rb_raise(cParseError, "Error calculating hash");
725
+ }
556
726
  }
557
727
 
558
728
  /*
@@ -561,11 +731,12 @@ VALUE Message_eq(VALUE _self, VALUE _other) {
561
731
  *
562
732
  * Returns a hash value that represents this message's field values.
563
733
  */
564
- VALUE Message_hash(VALUE _self) {
565
- MessageHeader* self;
566
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
567
-
568
- return layout_hash(self->descriptor->layout, Message_data(self));
734
+ static VALUE Message_hash(VALUE _self) {
735
+ Message* self = ruby_to_Message(_self);
736
+ uint64_t hash_value = Message_Hash(self->msg, self->msgdef, 0);
737
+ // RUBY_FIXNUM_MAX should be one less than a power of 2.
738
+ assert((RUBY_FIXNUM_MAX & (RUBY_FIXNUM_MAX + 1)) == 0);
739
+ return INT2FIX(hash_value & RUBY_FIXNUM_MAX);
569
740
  }
570
741
 
571
742
  /*
@@ -576,75 +747,127 @@ VALUE Message_hash(VALUE _self) {
576
747
  * formatted as "<MessageType: field1: value1, field2: value2, ...>". Each
577
748
  * field's value is represented according to its own #inspect method.
578
749
  */
579
- VALUE Message_inspect(VALUE _self) {
580
- MessageHeader* self;
581
- VALUE str;
582
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
750
+ static VALUE Message_inspect(VALUE _self) {
751
+ Message* self = ruby_to_Message(_self);
583
752
 
584
- str = rb_str_new2("<");
585
- str = rb_str_append(str, rb_str_new2(rb_class2name(CLASS_OF(_self))));
586
- str = rb_str_cat2(str, ": ");
587
- str = rb_str_append(str, layout_inspect(
588
- self->descriptor->layout, Message_data(self)));
589
- str = rb_str_cat2(str, ">");
590
- return str;
753
+ StringBuilder* builder = StringBuilder_New();
754
+ Message_PrintMessage(builder, self->msg, self->msgdef);
755
+ VALUE ret = StringBuilder_ToRubyString(builder);
756
+ StringBuilder_Free(builder);
757
+ return ret;
591
758
  }
592
759
 
593
- /*
594
- * call-seq:
595
- * Message.to_h => {}
596
- *
597
- * Returns the message as a Ruby Hash object, with keys as symbols.
598
- */
599
- VALUE Message_to_h(VALUE _self) {
600
- MessageHeader* self;
601
- VALUE hash;
602
- upb_msg_field_iter it;
603
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
604
-
605
- hash = rb_hash_new();
606
-
607
- for (upb_msg_field_begin(&it, self->descriptor->msgdef);
608
- !upb_msg_field_done(&it);
609
- upb_msg_field_next(&it)) {
610
- const upb_fielddef* field = upb_msg_iter_field(&it);
611
-
612
- // For proto2, do not include fields which are not set.
613
- if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
614
- field_contains_hasbit(self->descriptor->layout, field) &&
615
- !layout_has(self->descriptor->layout, Message_data(self), field)) {
760
+ // Support functions for Message_to_h //////////////////////////////////////////
761
+
762
+ static VALUE RepeatedField_CreateArray(const upb_array* arr,
763
+ TypeInfo type_info) {
764
+ int size = arr ? upb_array_size(arr) : 0;
765
+ VALUE ary = rb_ary_new2(size);
766
+
767
+ for (int i = 0; i < size; i++) {
768
+ upb_msgval msgval = upb_array_get(arr, i);
769
+ VALUE val = Scalar_CreateHash(msgval, type_info);
770
+ rb_ary_push(ary, val);
771
+ }
772
+
773
+ return ary;
774
+ }
775
+
776
+ static VALUE Message_CreateHash(const upb_msg *msg, const upb_msgdef *m) {
777
+ if (!msg) return Qnil;
778
+
779
+ VALUE hash = rb_hash_new();
780
+ int n = upb_msgdef_fieldcount(m);
781
+ bool is_proto2;
782
+
783
+ // We currently have a few behaviors that are specific to proto2.
784
+ // This is unfortunate, we should key behaviors off field attributes (like
785
+ // whether a field has presence), not proto2 vs. proto3. We should see if we
786
+ // can change this without breaking users.
787
+ is_proto2 = upb_msgdef_syntax(m) == UPB_SYNTAX_PROTO2;
788
+
789
+ for (int i = 0; i < n; i++) {
790
+ const upb_fielddef* field = upb_msgdef_field(m, i);
791
+ TypeInfo type_info = TypeInfo_get(field);
792
+ upb_msgval msgval;
793
+ VALUE msg_value;
794
+ VALUE msg_key;
795
+
796
+ if (!is_proto2 && upb_fielddef_issubmsg(field) &&
797
+ !upb_fielddef_isseq(field) && !upb_msg_has(msg, field)) {
798
+ // TODO: Legacy behavior, remove when we fix the is_proto2 differences.
799
+ msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
800
+ rb_hash_aset(hash, msg_key, Qnil);
616
801
  continue;
617
802
  }
618
803
 
619
- VALUE msg_value = layout_get(self->descriptor->layout, Message_data(self),
620
- field);
621
- VALUE msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
622
- if (is_map_field(field)) {
623
- msg_value = Map_to_h(msg_value);
624
- } else if (upb_fielddef_label(field) == UPB_LABEL_REPEATED) {
625
- msg_value = RepeatedField_to_ary(msg_value);
626
- if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
627
- RARRAY_LEN(msg_value) == 0) {
628
- continue;
629
- }
804
+ // Do not include fields that are not present (oneof or optional fields).
805
+ if (is_proto2 && upb_fielddef_haspresence(field) &&
806
+ !upb_msg_has(msg, field)) {
807
+ continue;
808
+ }
630
809
 
631
- if (upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
632
- for (int i = 0; i < RARRAY_LEN(msg_value); i++) {
633
- VALUE elem = rb_ary_entry(msg_value, i);
634
- rb_ary_store(msg_value, i, Message_to_h(elem));
635
- }
636
- }
810
+ msg_key = ID2SYM(rb_intern(upb_fielddef_name(field)));
811
+ msgval = upb_msg_get(msg, field);
637
812
 
638
- } else if (msg_value != Qnil &&
639
- upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
640
- msg_value = Message_to_h(msg_value);
813
+ // Proto2 omits empty map/repeated fields also.
814
+
815
+ if (upb_fielddef_ismap(field)) {
816
+ const upb_msgdef *entry_m = upb_fielddef_msgsubdef(field);
817
+ const upb_fielddef *key_f = upb_msgdef_itof(entry_m, 1);
818
+ const upb_fielddef *val_f = upb_msgdef_itof(entry_m, 2);
819
+ upb_fieldtype_t key_type = upb_fielddef_type(key_f);
820
+ msg_value = Map_CreateHash(msgval.map_val, key_type, TypeInfo_get(val_f));
821
+ } else if (upb_fielddef_isseq(field)) {
822
+ if (is_proto2 &&
823
+ (!msgval.array_val || upb_array_size(msgval.array_val) == 0)) {
824
+ continue;
825
+ }
826
+ msg_value = RepeatedField_CreateArray(msgval.array_val, type_info);
827
+ } else {
828
+ msg_value = Scalar_CreateHash(msgval, type_info);
641
829
  }
830
+
642
831
  rb_hash_aset(hash, msg_key, msg_value);
643
832
  }
833
+
644
834
  return hash;
645
835
  }
646
836
 
837
+ VALUE Scalar_CreateHash(upb_msgval msgval, TypeInfo type_info) {
838
+ if (type_info.type == UPB_TYPE_MESSAGE) {
839
+ return Message_CreateHash(msgval.msg_val, type_info.def.msgdef);
840
+ } else {
841
+ return Convert_UpbToRuby(msgval, type_info, Qnil);
842
+ }
843
+ }
647
844
 
845
+ /*
846
+ * call-seq:
847
+ * Message.to_h => {}
848
+ *
849
+ * Returns the message as a Ruby Hash object, with keys as symbols.
850
+ */
851
+ static VALUE Message_to_h(VALUE _self) {
852
+ Message* self = ruby_to_Message(_self);
853
+ return Message_CreateHash(self->msg, self->msgdef);
854
+ }
855
+
856
+ /*
857
+ * call-seq:
858
+ * Message.freeze => self
859
+ *
860
+ * Freezes the message object. We have to intercept this so we can pin the
861
+ * Ruby object into memory so we don't forget it's frozen.
862
+ */
863
+ static VALUE Message_freeze(VALUE _self) {
864
+ Message* self = ruby_to_Message(_self);
865
+ if (!RB_OBJ_FROZEN(_self)) {
866
+ Arena_Pin(self->arena, _self);
867
+ RB_OBJ_FREEZE(_self);
868
+ }
869
+ return _self;
870
+ }
648
871
 
649
872
  /*
650
873
  * call-seq:
@@ -653,16 +876,18 @@ VALUE Message_to_h(VALUE _self) {
653
876
  * Accesses a field's value by field name. The provided field name should be a
654
877
  * string.
655
878
  */
656
- VALUE Message_index(VALUE _self, VALUE field_name) {
657
- MessageHeader* self;
879
+ static VALUE Message_index(VALUE _self, VALUE field_name) {
880
+ Message* self = ruby_to_Message(_self);
658
881
  const upb_fielddef* field;
659
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
882
+
660
883
  Check_Type(field_name, T_STRING);
661
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
884
+ field = upb_msgdef_ntofz(self->msgdef, RSTRING_PTR(field_name));
885
+
662
886
  if (field == NULL) {
663
887
  return Qnil;
664
888
  }
665
- return layout_get(self->descriptor->layout, Message_data(self), field);
889
+
890
+ return Message_getfield(_self, field);
666
891
  }
667
892
 
668
893
  /*
@@ -672,19 +897,209 @@ VALUE Message_index(VALUE _self, VALUE field_name) {
672
897
  * Sets a field's value by field name. The provided field name should be a
673
898
  * string.
674
899
  */
675
- VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
676
- MessageHeader* self;
677
- const upb_fielddef* field;
678
- TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
900
+ static VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
901
+ Message* self = ruby_to_Message(_self);
902
+ const upb_fielddef* f;
903
+ upb_msgval val;
904
+ upb_arena *arena = Arena_get(self->arena);
905
+
679
906
  Check_Type(field_name, T_STRING);
680
- field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
681
- if (field == NULL) {
907
+ f = upb_msgdef_ntofz(self->msgdef, RSTRING_PTR(field_name));
908
+
909
+ if (f == NULL) {
682
910
  rb_raise(rb_eArgError, "Unknown field: %s", RSTRING_PTR(field_name));
683
911
  }
684
- layout_set(self->descriptor->layout, Message_data(self), field, value);
912
+
913
+ val = Convert_RubyToUpb(value, upb_fielddef_name(f), TypeInfo_get(f), arena);
914
+ upb_msg_set(Message_GetMutable(_self, NULL), f, val, arena);
915
+
685
916
  return Qnil;
686
917
  }
687
918
 
919
+ /*
920
+ * call-seq:
921
+ * MessageClass.decode(data) => message
922
+ *
923
+ * Decodes the given data (as a string containing bytes in protocol buffers wire
924
+ * format) under the interpretation given by this message class's definition
925
+ * and returns a message object with the corresponding field values.
926
+ */
927
+ static VALUE Message_decode(VALUE klass, VALUE data) {
928
+ if (TYPE(data) != T_STRING) {
929
+ rb_raise(rb_eArgError, "Expected string for binary protobuf data.");
930
+ }
931
+
932
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
933
+ Message* msg = ruby_to_Message(msg_rb);
934
+
935
+ if (!upb_decode(RSTRING_PTR(data), RSTRING_LEN(data), (upb_msg*)msg->msg,
936
+ upb_msgdef_layout(msg->msgdef),
937
+ Arena_get(msg->arena))) {
938
+ rb_raise(cParseError, "Error occurred during parsing");
939
+ }
940
+
941
+ return msg_rb;
942
+ }
943
+
944
+ /*
945
+ * call-seq:
946
+ * MessageClass.decode_json(data, options = {}) => message
947
+ *
948
+ * Decodes the given data (as a string containing a JSON document)
949
+ * under the interpretation given by this message class's definition
950
+ * and returns a message object with the corresponding field values.
951
+ *
952
+ * @param options [Hash] options for the decoder
953
+ * ignore_unknown_fields: set true to ignore unknown fields (default is to
954
+ * raise an error)
955
+ */
956
+ static VALUE Message_decode_json(int argc, VALUE* argv, VALUE klass) {
957
+ VALUE data = argv[0];
958
+ int options = 0;
959
+ upb_status status;
960
+
961
+ // TODO(haberman): use this message's pool instead.
962
+ const upb_symtab *symtab = DescriptorPool_GetSymtab(generated_pool);
963
+
964
+ if (argc < 1 || argc > 2) {
965
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
966
+ }
967
+
968
+ if (argc == 2) {
969
+ VALUE hash_args = argv[1];
970
+ if (TYPE(hash_args) != T_HASH) {
971
+ rb_raise(rb_eArgError, "Expected hash arguments.");
972
+ }
973
+
974
+ if (RTEST(rb_hash_lookup2( hash_args, ID2SYM(rb_intern("ignore_unknown_fields")), Qfalse))) {
975
+ options |= UPB_JSONDEC_IGNOREUNKNOWN;
976
+ }
977
+ }
978
+
979
+ if (TYPE(data) != T_STRING) {
980
+ rb_raise(rb_eArgError, "Expected string for JSON data.");
981
+ }
982
+
983
+ // TODO(cfallin): Check and respect string encoding. If not UTF-8, we need to
984
+ // convert, because string handlers pass data directly to message string
985
+ // fields.
986
+
987
+ VALUE msg_rb = initialize_rb_class_with_no_args(klass);
988
+ Message* msg = ruby_to_Message(msg_rb);
989
+
990
+ // We don't allow users to decode a wrapper type directly.
991
+ if (upb_msgdef_iswrapper(msg->msgdef)) {
992
+ rb_raise(rb_eRuntimeError, "Cannot parse a wrapper directly.");
993
+ }
994
+
995
+ upb_status_clear(&status);
996
+ if (!upb_json_decode(RSTRING_PTR(data), RSTRING_LEN(data), (upb_msg*)msg->msg,
997
+ msg->msgdef, symtab, options,
998
+ Arena_get(msg->arena), &status)) {
999
+ rb_raise(cParseError, "Error occurred during parsing: %s",
1000
+ upb_status_errmsg(&status));
1001
+ }
1002
+
1003
+ return msg_rb;
1004
+ }
1005
+
1006
+ /*
1007
+ * call-seq:
1008
+ * MessageClass.encode(msg) => bytes
1009
+ *
1010
+ * Encodes the given message object to its serialized form in protocol buffers
1011
+ * wire format.
1012
+ */
1013
+ static VALUE Message_encode(VALUE klass, VALUE msg_rb) {
1014
+ Message* msg = ruby_to_Message(msg_rb);
1015
+ const char *data;
1016
+ size_t size;
1017
+
1018
+ if (CLASS_OF(msg_rb) != klass) {
1019
+ rb_raise(rb_eArgError, "Message of wrong type.");
1020
+ }
1021
+
1022
+ upb_arena *arena = upb_arena_new();
1023
+
1024
+ data = upb_encode(msg->msg, upb_msgdef_layout(msg->msgdef), arena,
1025
+ &size);
1026
+
1027
+ if (data) {
1028
+ VALUE ret = rb_str_new(data, size);
1029
+ rb_enc_associate(ret, rb_ascii8bit_encoding());
1030
+ upb_arena_free(arena);
1031
+ return ret;
1032
+ } else {
1033
+ upb_arena_free(arena);
1034
+ rb_raise(rb_eRuntimeError, "Exceeded maximum depth (possibly cycle)");
1035
+ }
1036
+ }
1037
+
1038
+ /*
1039
+ * call-seq:
1040
+ * MessageClass.encode_json(msg, options = {}) => json_string
1041
+ *
1042
+ * Encodes the given message object into its serialized JSON representation.
1043
+ * @param options [Hash] options for the encoder
1044
+ * preserve_proto_fieldnames: set true to use original fieldnames (default is to camelCase)
1045
+ * emit_defaults: set true to emit 0/false values (default is to omit them)
1046
+ */
1047
+ static VALUE Message_encode_json(int argc, VALUE* argv, VALUE klass) {
1048
+ Message* msg = ruby_to_Message(argv[0]);
1049
+ int options = 0;
1050
+ char buf[1024];
1051
+ size_t size;
1052
+ upb_status status;
1053
+
1054
+ // TODO(haberman): use this message's pool instead.
1055
+ const upb_symtab *symtab = DescriptorPool_GetSymtab(generated_pool);
1056
+
1057
+ if (argc < 1 || argc > 2) {
1058
+ rb_raise(rb_eArgError, "Expected 1 or 2 arguments.");
1059
+ }
1060
+
1061
+ if (argc == 2) {
1062
+ VALUE hash_args = argv[1];
1063
+ if (TYPE(hash_args) != T_HASH) {
1064
+ rb_raise(rb_eArgError, "Expected hash arguments.");
1065
+ }
1066
+
1067
+ if (RTEST(rb_hash_lookup2(hash_args,
1068
+ ID2SYM(rb_intern("preserve_proto_fieldnames")),
1069
+ Qfalse))) {
1070
+ options |= UPB_JSONENC_PROTONAMES;
1071
+ }
1072
+
1073
+ if (RTEST(rb_hash_lookup2(hash_args, ID2SYM(rb_intern("emit_defaults")),
1074
+ Qfalse))) {
1075
+ options |= UPB_JSONENC_EMITDEFAULTS;
1076
+ }
1077
+ }
1078
+
1079
+ upb_status_clear(&status);
1080
+ size = upb_json_encode(msg->msg, msg->msgdef, symtab, options, buf,
1081
+ sizeof(buf), &status);
1082
+
1083
+ if (!upb_ok(&status)) {
1084
+ rb_raise(cParseError, "Error occurred during encoding: %s",
1085
+ upb_status_errmsg(&status));
1086
+ }
1087
+
1088
+ VALUE ret;
1089
+ if (size >= sizeof(buf)) {
1090
+ char* buf2 = malloc(size + 1);
1091
+ upb_json_encode(msg->msg, msg->msgdef, symtab, options, buf2, size + 1,
1092
+ &status);
1093
+ ret = rb_str_new(buf2, size);
1094
+ free(buf2);
1095
+ } else {
1096
+ ret = rb_str_new(buf, size);
1097
+ }
1098
+
1099
+ rb_enc_associate(ret, rb_utf8_encoding());
1100
+ return ret;
1101
+ }
1102
+
688
1103
  /*
689
1104
  * call-seq:
690
1105
  * Message.descriptor => descriptor
@@ -692,22 +1107,15 @@ VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
692
1107
  * Class method that returns the Descriptor instance corresponding to this
693
1108
  * message class's type.
694
1109
  */
695
- VALUE Message_descriptor(VALUE klass) {
1110
+ static VALUE Message_descriptor(VALUE klass) {
696
1111
  return rb_ivar_get(klass, descriptor_instancevar_interned);
697
1112
  }
698
1113
 
699
- VALUE build_class_from_descriptor(Descriptor* desc) {
1114
+ VALUE build_class_from_descriptor(VALUE descriptor) {
700
1115
  const char *name;
701
1116
  VALUE klass;
702
1117
 
703
- if (desc->layout == NULL) {
704
- desc->layout = create_layout(desc->msgdef);
705
- }
706
- if (desc->fill_method == NULL) {
707
- desc->fill_method = new_fillmsg_decodermethod(desc, &desc->fill_method);
708
- }
709
-
710
- name = upb_msgdef_fullname(desc->msgdef);
1118
+ name = upb_msgdef_fullname(Descriptor_GetMsgDef(descriptor));
711
1119
  if (name == NULL) {
712
1120
  rb_raise(rb_eRuntimeError, "Descriptor does not have assigned name.");
713
1121
  }
@@ -717,8 +1125,7 @@ VALUE build_class_from_descriptor(Descriptor* desc) {
717
1125
  // their own toplevel constant class name.
718
1126
  rb_intern("Message"),
719
1127
  rb_cObject);
720
- rb_ivar_set(klass, descriptor_instancevar_interned,
721
- get_def_obj(desc->msgdef));
1128
+ rb_ivar_set(klass, descriptor_instancevar_interned, descriptor);
722
1129
  rb_define_alloc_func(klass, Message_alloc);
723
1130
  rb_require("google/protobuf/message_exts");
724
1131
  rb_include_module(klass, rb_eval_string("::Google::Protobuf::MessageExts"));
@@ -735,9 +1142,9 @@ VALUE build_class_from_descriptor(Descriptor* desc) {
735
1142
  rb_define_method(klass, "clone", Message_dup, 0);
736
1143
  rb_define_method(klass, "==", Message_eq, 1);
737
1144
  rb_define_method(klass, "eql?", Message_eq, 1);
1145
+ rb_define_method(klass, "freeze", Message_freeze, 0);
738
1146
  rb_define_method(klass, "hash", Message_hash, 0);
739
1147
  rb_define_method(klass, "to_h", Message_to_h, 0);
740
- rb_define_method(klass, "to_hash", Message_to_h, 0);
741
1148
  rb_define_method(klass, "inspect", Message_inspect, 0);
742
1149
  rb_define_method(klass, "to_s", Message_inspect, 0);
743
1150
  rb_define_method(klass, "[]", Message_index, 1);
@@ -758,12 +1165,12 @@ VALUE build_class_from_descriptor(Descriptor* desc) {
758
1165
  * This module method, provided on each generated enum module, looks up an enum
759
1166
  * value by number and returns its name as a Ruby symbol, or nil if not found.
760
1167
  */
761
- VALUE enum_lookup(VALUE self, VALUE number) {
1168
+ static VALUE enum_lookup(VALUE self, VALUE number) {
762
1169
  int32_t num = NUM2INT(number);
763
1170
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
764
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
1171
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(desc);
765
1172
 
766
- const char* name = upb_enumdef_iton(enumdesc->enumdef, num);
1173
+ const char* name = upb_enumdef_iton(e, num);
767
1174
  if (name == NULL) {
768
1175
  return Qnil;
769
1176
  } else {
@@ -778,13 +1185,13 @@ VALUE enum_lookup(VALUE self, VALUE number) {
778
1185
  * This module method, provided on each generated enum module, looks up an enum
779
1186
  * value by name (as a Ruby symbol) and returns its name, or nil if not found.
780
1187
  */
781
- VALUE enum_resolve(VALUE self, VALUE sym) {
1188
+ static VALUE enum_resolve(VALUE self, VALUE sym) {
782
1189
  const char* name = rb_id2name(SYM2ID(sym));
783
1190
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
784
- EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);
1191
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(desc);
785
1192
 
786
1193
  int32_t num = 0;
787
- bool found = upb_enumdef_ntoiz(enumdesc->enumdef, name, &num);
1194
+ bool found = upb_enumdef_ntoiz(e, name, &num);
788
1195
  if (!found) {
789
1196
  return Qnil;
790
1197
  } else {
@@ -799,16 +1206,16 @@ VALUE enum_resolve(VALUE self, VALUE sym) {
799
1206
  * This module method, provided on each generated enum module, returns the
800
1207
  * EnumDescriptor corresponding to this enum type.
801
1208
  */
802
- VALUE enum_descriptor(VALUE self) {
1209
+ static VALUE enum_descriptor(VALUE self) {
803
1210
  return rb_ivar_get(self, descriptor_instancevar_interned);
804
1211
  }
805
1212
 
806
- VALUE build_module_from_enumdesc(EnumDescriptor* enumdesc) {
807
- VALUE mod = rb_define_module_id(
808
- rb_intern(upb_enumdef_fullname(enumdesc->enumdef)));
1213
+ VALUE build_module_from_enumdesc(VALUE _enumdesc) {
1214
+ const upb_enumdef *e = EnumDescriptor_GetEnumDef(_enumdesc);
1215
+ VALUE mod = rb_define_module_id(rb_intern(upb_enumdef_fullname(e)));
809
1216
 
810
1217
  upb_enum_iter it;
811
- for (upb_enum_begin(&it, enumdesc->enumdef);
1218
+ for (upb_enum_begin(&it, e);
812
1219
  !upb_enum_done(&it);
813
1220
  upb_enum_next(&it)) {
814
1221
  const char* name = upb_enum_iter_name(&it);
@@ -824,26 +1231,99 @@ VALUE build_module_from_enumdesc(EnumDescriptor* enumdesc) {
824
1231
  rb_define_singleton_method(mod, "lookup", enum_lookup, 1);
825
1232
  rb_define_singleton_method(mod, "resolve", enum_resolve, 1);
826
1233
  rb_define_singleton_method(mod, "descriptor", enum_descriptor, 0);
827
- rb_ivar_set(mod, descriptor_instancevar_interned,
828
- get_def_obj(enumdesc->enumdef));
1234
+ rb_ivar_set(mod, descriptor_instancevar_interned, _enumdesc);
829
1235
 
830
1236
  return mod;
831
1237
  }
832
1238
 
833
- /*
834
- * call-seq:
835
- * Google::Protobuf.deep_copy(obj) => copy_of_obj
836
- *
837
- * Performs a deep copy of a RepeatedField instance, a Map instance, or a
838
- * message object, recursively copying its members.
839
- */
840
- VALUE Google_Protobuf_deep_copy(VALUE self, VALUE obj) {
841
- VALUE klass = CLASS_OF(obj);
842
- if (klass == cRepeatedField) {
843
- return RepeatedField_deep_copy(obj);
844
- } else if (klass == cMap) {
845
- return Map_deep_copy(obj);
846
- } else {
847
- return Message_deep_copy(obj);
1239
+ // Internal only; used by Google::Protobuf.deep_copy.
1240
+ upb_msg* Message_deep_copy(const upb_msg* msg, const upb_msgdef* m,
1241
+ upb_arena *arena) {
1242
+ // Serialize and parse.
1243
+ upb_arena *tmp_arena = upb_arena_new();
1244
+ const upb_msglayout *layout = upb_msgdef_layout(m);
1245
+ size_t size;
1246
+
1247
+ char* data = upb_encode_ex(msg, layout, 0, tmp_arena, &size);
1248
+ upb_msg* new_msg = upb_msg_new(m, arena);
1249
+
1250
+ if (!data || !upb_decode(data, size, new_msg, layout, arena)) {
1251
+ upb_arena_free(tmp_arena);
1252
+ rb_raise(cParseError, "Error occurred copying proto");
1253
+ }
1254
+
1255
+ upb_arena_free(tmp_arena);
1256
+ return new_msg;
1257
+ }
1258
+
1259
+ const upb_msg* Message_GetUpbMessage(VALUE value, const upb_msgdef* m,
1260
+ const char* name, upb_arena* arena) {
1261
+ if (value == Qnil) {
1262
+ rb_raise(cTypeError, "nil message not allowed here.");
848
1263
  }
1264
+
1265
+ VALUE klass = CLASS_OF(value);
1266
+ VALUE desc_rb = rb_ivar_get(klass, descriptor_instancevar_interned);
1267
+ const upb_msgdef* val_m =
1268
+ desc_rb == Qnil ? NULL : Descriptor_GetMsgDef(desc_rb);
1269
+
1270
+ if (val_m != m) {
1271
+ // Check for possible implicit conversions
1272
+ // TODO: hash conversion?
1273
+
1274
+ switch (upb_msgdef_wellknowntype(m)) {
1275
+ case UPB_WELLKNOWN_TIMESTAMP: {
1276
+ // Time -> Google::Protobuf::Timestamp
1277
+ upb_msg *msg = upb_msg_new(m, arena);
1278
+ upb_msgval sec, nsec;
1279
+ struct timespec time;
1280
+ const upb_fielddef *sec_f = upb_msgdef_itof(m, 1);
1281
+ const upb_fielddef *nsec_f = upb_msgdef_itof(m, 2);
1282
+
1283
+ if (!rb_obj_is_kind_of(value, rb_cTime)) goto badtype;
1284
+
1285
+ time = rb_time_timespec(value);
1286
+ sec.int64_val = time.tv_sec;
1287
+ nsec.int32_val = time.tv_nsec;
1288
+ upb_msg_set(msg, sec_f, sec, arena);
1289
+ upb_msg_set(msg, nsec_f, nsec, arena);
1290
+ return msg;
1291
+ }
1292
+ case UPB_WELLKNOWN_DURATION: {
1293
+ // Numeric -> Google::Protobuf::Duration
1294
+ upb_msg *msg = upb_msg_new(m, arena);
1295
+ upb_msgval sec, nsec;
1296
+ const upb_fielddef *sec_f = upb_msgdef_itof(m, 1);
1297
+ const upb_fielddef *nsec_f = upb_msgdef_itof(m, 2);
1298
+
1299
+ if (!rb_obj_is_kind_of(value, rb_cNumeric)) goto badtype;
1300
+
1301
+ sec.int64_val = NUM2LL(value);
1302
+ nsec.int32_val = round((NUM2DBL(value) - NUM2LL(value)) * 1000000000);
1303
+ upb_msg_set(msg, sec_f, sec, arena);
1304
+ upb_msg_set(msg, nsec_f, nsec, arena);
1305
+ return msg;
1306
+ }
1307
+ default:
1308
+ badtype:
1309
+ rb_raise(cTypeError,
1310
+ "Invalid type %s to assign to submessage field '%s'.",
1311
+ rb_class2name(CLASS_OF(value)), name);
1312
+ }
1313
+
1314
+ }
1315
+
1316
+ Message* self = ruby_to_Message(value);
1317
+ Arena_fuse(self->arena, arena);
1318
+
1319
+ return self->msg;
1320
+ }
1321
+
1322
+ void Message_register(VALUE protobuf) {
1323
+ cParseError = rb_const_get(protobuf, rb_intern("ParseError"));
1324
+
1325
+ // Ruby-interned string: "descriptor". We use this identifier to store an
1326
+ // instance variable on message classes we create in order to link them back
1327
+ // to their descriptors.
1328
+ descriptor_instancevar_interned = rb_intern("descriptor");
849
1329
  }