// Protocol Buffers - Google's data interchange format
// Copyright 2014 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

#include "protobuf.h"

// -----------------------------------------------------------------------------
// Class/module creation from msgdefs and enumdefs, respectively.
// -----------------------------------------------------------------------------

// Returns a pointer to the bytes that immediately follow the MessageHeader at
// the start of the allocation pointed to by |msg|.
void* Message_data(void* msg) {
  uint8_t* base = (uint8_t*)msg;
  return base + sizeof(MessageHeader);
}

// Mark callback listed in Message_type: forwards the message's layout and its
// data region to layout_mark().
void Message_mark(void* _self) {
  MessageHeader* header = (MessageHeader*)_self;
  void* data = Message_data(header);
  layout_mark(header->descriptor->layout, data);
}

void Message_free(void* self) {
47 48 49 50 51
  stringsink* unknown = ((MessageHeader *)self)->unknown_fields;
  if (unknown != NULL) {
    stringsink_uninit(unknown);
    free(unknown);
  }
Chris Fallin's avatar
Chris Fallin committed
52 53 54 55 56 57 58 59 60
  xfree(self);
}

// Typed-data descriptor passed to the TypedData_Wrap_Struct() and
// TypedData_Get_Struct() calls in this file for MessageHeader structs. It is
// named "Message" and lists Message_mark and Message_free as callbacks; the
// third callback slot is left NULL.
rb_data_type_t Message_type = {
  "Message",
  { Message_mark, Message_free, NULL },
};

// Allocates a new message object of class |klass|.
//
// The class's descriptor is read from its descriptor instance variable; the
// allocation holds a MessageHeader followed by desc->layout->size bytes of
// field storage. Returns the wrapping Ruby object.
VALUE Message_alloc(VALUE klass) {
  VALUE descriptor = rb_ivar_get(klass, descriptor_instancevar_interned);
  Descriptor* desc = ruby_to_Descriptor(descriptor);
  MessageHeader* msg = (MessageHeader*)ALLOC_N(
      uint8_t, sizeof(MessageHeader) + desc->layout->size);
  VALUE ret;

  // Initialize the header before the struct is handed to Ruby, so that
  // Message_mark()/Message_free() never observe indeterminate header fields
  // if a collection or an exception happens during the calls below.
  msg->descriptor = desc;
  msg->unknown_fields = NULL;
  memset(Message_data(msg), 0, desc->layout->size);

  // We wrap first so that everything in the message object is GC-rooted in case
  // a collection happens during object creation in layout_init().
  ret = TypedData_Wrap_Struct(klass, &Message_type, msg);
  rb_ivar_set(ret, descriptor_instancevar_interned, descriptor);

  layout_init(desc->layout, Message_data(msg));

  return ret;
}

// Returns the fielddef of the member of oneof |o| that is currently set in
// |self|, or NULL when the oneof has no fields or its case slot holds
// ONEOF_CASE_NONE.
static const upb_fielddef* which_oneof_field(MessageHeader* self, const upb_oneofdef* o) {
  upb_oneof_iter it;
  size_t case_ofs;
  uint32_t oneof_case;
  const upb_fielddef* first_field;
  const upb_fielddef* f;

  // If no fields in the oneof, always nil.
  if (upb_oneofdef_numfields(o) == 0) {
    return NULL;
  }
  // Grab the first field in the oneof so we can get its layout info to find the
  // oneof_case field.
  upb_oneof_begin(&it, o);
  assert(!upb_oneof_done(&it));
  first_field = upb_oneof_iter_field(&it);
  assert(upb_fielddef_containingoneof(first_field) != NULL);

  case_ofs =
      self->descriptor->layout->
      fields[upb_fielddef_index(first_field)].case_offset;
  oneof_case = *((uint32_t*)((char*)Message_data(self) + case_ofs));

  if (oneof_case == ONEOF_CASE_NONE) {
    return NULL;
  }

  // oneof_case is a field index, so find that field.
  f = upb_oneofdef_itof(o, oneof_case);
  assert(f != NULL);

  return f;
}

// Kinds of dynamic accessor that extract_method_call() can recognize from a
// method name.
enum {
  METHOD_UNKNOWN = 0,         // name does not map to a field or oneof
  METHOD_GETTER = 1,          // "<name>"
  METHOD_SETTER = 2,          // "<name>="
  METHOD_CLEAR = 3,           // "clear_<name>"
  METHOD_PRESENCE = 4,        // "has_<name>?"
  METHOD_ENUM_GETTER = 5,     // "<enum field>_const"
  METHOD_WRAPPER_GETTER = 6,  // "<wrapper field>_as_value"
  METHOD_WRAPPER_SETTER = 7   // "<wrapper field>_as_value="
};

// Check if the field is a well known wrapper type.
//
// Compares the Ruby class name of the field's type class against the fixed
// list of Google::Protobuf::*Value wrapper class names and returns true on an
// exact match.
static bool is_wrapper_type_field(const upb_fielddef* field) {
  static const char* const wrapper_type_names[] = {
    "Google::Protobuf::DoubleValue",
    "Google::Protobuf::FloatValue",
    "Google::Protobuf::Int32Value",
    "Google::Protobuf::Int64Value",
    "Google::Protobuf::UInt32Value",
    "Google::Protobuf::UInt64Value",
    "Google::Protobuf::BoolValue",
    "Google::Protobuf::StringValue",
    "Google::Protobuf::BytesValue",
  };
  // rb_class2name() hands back a const string; keep it const.
  const char* field_type_name = rb_class2name(field_type_class(field));
  size_t i;

  for (i = 0; i < sizeof(wrapper_type_names) / sizeof(wrapper_type_names[0]);
       i++) {
    if (strcmp(field_type_name, wrapper_type_names[i]) == 0) {
      return true;
    }
  }
  return false;
}

// Get a new Ruby wrapper type and set the initial value.
//
// When |field| is a wrapper-type field and |value| is not nil, builds the hash
// { "value" => value } and returns a new instance of the field's type class
// constructed from it. Otherwise returns nil.
//
// |value| is a Ruby VALUE (the caller passes argv[1] directly), not a pointer
// to one: it is compared against Qnil and stored in the hash as-is.
static VALUE ruby_wrapper_type(const upb_fielddef* field, VALUE value) {
  if (is_wrapper_type_field(field) && value != Qnil) {
    VALUE hash = rb_hash_new();
    VALUE args[1];
    rb_hash_aset(hash, rb_str_new2("value"), value);
    args[0] = hash;
    return rb_class_new_instance(1, args, field_type_class(field));
  }
  return Qnil;
}

// Classifies a dynamically dispatched method name.
//
// |method_name| must be a Symbol (Check_Type raises otherwise). The name is
// matched against the fields and oneofs of |self|'s message definition, taking
// into account the "=" suffix, the "clear_" prefix, the "has_...?" form, and
// the "_as_value" / "_const" suffixes.
//
// Returns one of the METHOD_* constants. Unless the result is METHOD_UNKNOWN,
// |*f| and |*o| are set from the lookup that matched. On METHOD_UNKNOWN they
// are left untouched.
static int extract_method_call(VALUE method_name, MessageHeader* self,
                               const upb_fielddef **f, const upb_oneofdef **o) {
  Check_Type(method_name, T_SYMBOL);

  VALUE method_str = rb_id2str(SYM2ID(method_name));
  const char* name = RSTRING_PTR(method_str);
  size_t name_len = RSTRING_LEN(method_str);
  int accessor_type;
  const upb_oneofdef* test_o;
  const upb_fielddef* test_f;

  // An empty name cannot match any accessor; return before name[name_len - 1]
  // is read below.
  if (name_len == 0) {
    return METHOD_UNKNOWN;
  }

  if (name[name_len - 1] == '=') {
    accessor_type = METHOD_SETTER;
    name_len--;
  // We want to ensure if the proto has something named clear_foo or has_foo?,
  // we don't strip the prefix.
  } else if (strncmp("clear_", name, 6) == 0 &&
             !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
                                    &test_f, &test_o)) {
    accessor_type = METHOD_CLEAR;
    name = name + 6;
    name_len = name_len - 6;
  } else if (strncmp("has_", name, 4) == 0 && name[name_len - 1] == '?' &&
             !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
                                    &test_f, &test_o)) {
    accessor_type = METHOD_PRESENCE;
    name = name + 4;
    // Drop both the "has_" prefix (4) and the trailing '?' (1).
    name_len = name_len - 5;
  } else {
    accessor_type = METHOD_GETTER;
  }

  bool has_field = upb_msgdef_lookupname(self->descriptor->msgdef, name,
                                         name_len, &test_f, &test_o);

  // Look for wrapper type accessor of the form <field_name>_as_value
  if (!has_field &&
      (accessor_type == METHOD_GETTER || accessor_type == METHOD_SETTER) &&
      name_len > 9 && strncmp(name + name_len - 9, "_as_value", 9) == 0) {
    // The lookup takes an explicit length, so the field name is simply the
    // first (name_len - 9) bytes of |name|; no temporary copy is needed.
    const upb_oneofdef* test_o_wrapper;
    const upb_fielddef* test_f_wrapper;
    if (upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len - 9,
                              &test_f_wrapper, &test_o_wrapper) &&
        test_f_wrapper != NULL &&
        upb_fielddef_type(test_f_wrapper) == UPB_TYPE_MESSAGE &&
        is_wrapper_type_field(test_f_wrapper)) {
      // It does exist!
      has_field = true;
      if (accessor_type == METHOD_SETTER) {
        accessor_type = METHOD_WRAPPER_SETTER;
      } else {
        accessor_type = METHOD_WRAPPER_GETTER;
      }
      test_o = test_o_wrapper;
      test_f = test_f_wrapper;
    }
  }

  // Look for enum accessor of the form <enum_name>_const
  if (!has_field && accessor_type == METHOD_GETTER &&
      name_len > 6 && strncmp(name + name_len - 6, "_const", 6) == 0) {
    // As above: the enum field name is the first (name_len - 6) bytes.
    const upb_oneofdef* test_o_enum;
    const upb_fielddef* test_f_enum;
    if (upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len - 6,
                              &test_f_enum, &test_o_enum) &&
        test_f_enum != NULL &&
        upb_fielddef_type(test_f_enum) == UPB_TYPE_ENUM) {
      // It does exist!
      has_field = true;
      accessor_type = METHOD_ENUM_GETTER;
      test_o = test_o_enum;
      test_f = test_f_enum;
    }
  }

  // Verify the name corresponds to a oneof or field in this message.
  if (!has_field) {
    return METHOD_UNKNOWN;
  }

  // Method calls like 'has_foo?' are not allowed if field "foo" does not have
  // a hasbit (e.g. repeated fields or non-message type fields for proto3
  // syntax).
  if (accessor_type == METHOD_PRESENCE && test_f != NULL &&
      !upb_fielddef_haspresence(test_f)) {
    return METHOD_UNKNOWN;
  }

  *o = test_o;
  *f = test_f;
  return accessor_type;
}

/*
 * call-seq:
 *     Message.method_missing(*args)
 *
 * Provides accessors and setters and methods to clear and check for presence of
 * message fields according to their field names.
 *
 * For any field whose name does not conflict with a built-in method, an
 * accessor is provided with the same name as the field, and a setter is
 * provided with the name of the field plus the '=' suffix. Thus, given a
 * message instance 'msg' with field 'foo', the following code is valid:
 *
 *     msg.foo = 42
 *     puts msg.foo
 *
 * This method also provides read-only accessors for oneofs. If a oneof exists
 * with name 'my_oneof', then msg.my_oneof will return a Ruby symbol equal to
 * the name of the field in that oneof that is currently set, or nil if none.
 *
 * It also provides methods of the form 'clear_fieldname' to clear the value
 * of the field 'fieldname'. For basic data types, this will set the default
 * value of the field.
 *
 * Additionally, it provides methods of the form 'has_fieldname?', which returns
 * true if the field 'fieldname' is set in the message object, else false. For
 * 'proto3' syntax, calling this for a basic type field will result in an error.
 *
 * For message fields of a well-known wrapper type, 'fieldname_as_value' returns
 * the result of calling #value on the field (or nil if the field is nil), and
 * 'fieldname_as_value=' stores a new wrapper instance built from the argument.
 * For enum fields, 'fieldname_const' returns the result of const_get on the
 * enum's class for the field value (element-wise for repeated fields).
 *
 * Names that do not match any of the above are forwarded to super.
 */
VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
  MessageHeader* self;
  const upb_oneofdef* o;
  const upb_fielddef* f;

  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  if (argc < 1) {
    rb_raise(rb_eArgError, "Expected method name as first argument.");
  }

  // |o| and |f| are only written when the name was recognized, so the
  // METHOD_UNKNOWN test must come first (short-circuit).
  int accessor_type = extract_method_call(argv[0], self, &f, &o);
  if (accessor_type == METHOD_UNKNOWN || (o == NULL && f == NULL) ) {
    return rb_call_super(argc, argv);
  } else if (accessor_type == METHOD_SETTER || accessor_type == METHOD_WRAPPER_SETTER) {
    if (argc != 2) {
      rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
    }
    rb_check_frozen(_self);
  } else if (argc != 1) {
    rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
  }
  // NOTE(review): only the setter kinds check for a frozen receiver;
  // 'clear_*' also modifies the message -- confirm whether that is intended.

  // Return which of the oneof fields are set
  if (o != NULL) {
    if (accessor_type == METHOD_SETTER) {
      rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
    }

    const upb_fielddef* oneof_field = which_oneof_field(self, o);
    if (accessor_type == METHOD_PRESENCE) {
      return oneof_field == NULL ? Qfalse : Qtrue;
    } else if (accessor_type == METHOD_CLEAR) {
      if (oneof_field != NULL) {
        layout_clear(self->descriptor->layout, Message_data(self), oneof_field);
      }
      return Qnil;
    } else {
      // METHOD_GETTER
      return oneof_field == NULL ? Qnil :
        ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
    }
  // Otherwise we're operating on a single proto field
  } else if (accessor_type == METHOD_SETTER) {
    layout_set(self->descriptor->layout, Message_data(self), f, argv[1]);
    return Qnil;
  } else if (accessor_type == METHOD_CLEAR) {
    layout_clear(self->descriptor->layout, Message_data(self), f);
    return Qnil;
  } else if (accessor_type == METHOD_PRESENCE) {
    return layout_has(self->descriptor->layout, Message_data(self), f);
  } else if (accessor_type == METHOD_WRAPPER_GETTER) {
    VALUE value = layout_get(self->descriptor->layout, Message_data(self), f);
    if (value != Qnil) {
      value = rb_funcall(value, rb_intern("value"), 0);
    }
    return value;
  } else if (accessor_type == METHOD_WRAPPER_SETTER) {
    VALUE wrapper = ruby_wrapper_type(f, argv[1]);
    layout_set(self->descriptor->layout, Message_data(self), f, wrapper);
    return Qnil;
  } else if (accessor_type == METHOD_ENUM_GETTER) {
    VALUE enum_type = field_type_class(f);
    // rb_intern() yields an ID, not a VALUE.
    ID method = rb_intern("const_get");
    VALUE raw_value = layout_get(self->descriptor->layout, Message_data(self), f);

    // Map repeated fields to a new type with ints
    if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
      int array_size = FIX2INT(rb_funcall(raw_value, rb_intern("length"), 0));
      VALUE array_args[1] = { ID2SYM(rb_intern("int64")) };
      VALUE array = rb_class_new_instance(1, array_args, CLASS_OF(raw_value));
      for (int i = 0; i < array_size; i++) {
        VALUE entry = rb_funcall(enum_type, method, 1, rb_funcall(raw_value,
                                 rb_intern("at"), 1, INT2NUM(i)));
        rb_funcall(array, rb_intern("push"), 1, entry);
      }
      return array;
    }
    // Convert the value for singular fields
    return rb_funcall(enum_type, method, 1, raw_value);
  } else {
    return layout_get(self->descriptor->layout, Message_data(self), f);
  }
}

// Implementation of respond_to_missing? for message classes.
//
// argv[0] is the method name. Names that extract_method_call() does not
// recognize are forwarded to super. For a oneof, everything except a setter is
// reported as supported; for a field, every recognized accessor is.
VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
  MessageHeader* self;
  const upb_oneofdef* o;
  const upb_fielddef* f;

  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  if (argc < 1) {
    rb_raise(rb_eArgError, "Expected method name as first argument.");
  }

  int accessor_type = extract_method_call(argv[0], self, &f, &o);
  if (accessor_type == METHOD_UNKNOWN) {
    return rb_call_super(argc, argv);
  } else if (o != NULL) {
    return accessor_type == METHOD_SETTER ? Qfalse : Qtrue;
  } else {
    return Qtrue;
  }
}

// Builds a new instance of the message class of submessage field |f|, passing
// |hash| as the single constructor argument. The class is obtained by calling
// #msgclass on the descriptor object of the field's sub-definition.
VALUE create_submsg_from_hash(const upb_fielddef *f, VALUE hash) {
  const upb_def *d = upb_fielddef_subdef(f);
  assert(d != NULL);

  VALUE descriptor = get_def_obj(d);
  VALUE msgclass = rb_funcall(descriptor, rb_intern("msgclass"), 0);

  VALUE args[1] = { hash };
  return rb_class_new_instance(1, args, msgclass);
}

// rb_hash_foreach() callback used by Message_initialize(): applies one
// key/value pair of the initializer hash to the message |_self|.
//
// |key| must be a String or Symbol naming a field of the message; otherwise an
// ArgumentError is raised. A nil |val| is ignored. Map fields require a Hash,
// which is merged into the existing map; repeated fields require an Array,
// whose entries are pushed one by one. Hash values given for submessage fields
// (or for elements of repeated submessage fields) are first converted with
// create_submsg_from_hash().
//
// Always returns 0.
int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
  MessageHeader* self;
  char *name;
  const upb_fielddef* f;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

  if (TYPE(key) == T_STRING) {
    name = RSTRING_PTR(key);
  } else if (TYPE(key) == T_SYMBOL) {
    name = RSTRING_PTR(rb_id2str(SYM2ID(key)));
  } else {
    rb_raise(rb_eArgError,
             "Expected string or symbols as hash keys when initializing proto from hash.");
  }

  f = upb_msgdef_ntofz(self->descriptor->msgdef, name);
  if (f == NULL) {
    rb_raise(rb_eArgError,
             "Unknown field name '%s' in initialization map entry.", name);
  }

  if (TYPE(val) == T_NIL) {
    return 0;
  }

  if (is_map_field(f)) {
    VALUE map;

    if (TYPE(val) != T_HASH) {
      rb_raise(rb_eArgError,
               "Expected Hash object as initializer value for map field '%s' (given %s).",
               name, rb_class2name(CLASS_OF(val)));
    }
    map = layout_get(self->descriptor->layout, Message_data(self), f);
    Map_merge_into_self(map, val);
  } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
    VALUE ary;

    if (TYPE(val) != T_ARRAY) {
      rb_raise(rb_eArgError,
               "Expected array as initializer value for repeated field '%s' (given %s).",
               name, rb_class2name(CLASS_OF(val)));
    }
    ary = layout_get(self->descriptor->layout, Message_data(self), f);
    // RARRAY_LEN() is a long; use a matching index type.
    for (long i = 0; i < RARRAY_LEN(val); i++) {
      VALUE entry = rb_ary_entry(val, i);
      if (TYPE(entry) == T_HASH && upb_fielddef_issubmsg(f)) {
        entry = create_submsg_from_hash(f, entry);
      }

      RepeatedField_push(ary, entry);
    }
  } else {
    if (TYPE(val) == T_HASH && upb_fielddef_issubmsg(f)) {
      val = create_submsg_from_hash(f, val);
    }

    layout_set(self->descriptor->layout, Message_data(self), f, val);
  }
  return 0;
}

/*
 * call-seq:
 *     Message.new(kwargs) => new_message
 *
 * Creates a new instance of the given message class. Keyword arguments may be
 * provided with keywords corresponding to field names.
 *
 * Note that no literal Message class exists. Only concrete classes per message
 * type exist, as provided by the #msgclass method on Descriptors after they
 * have been added to a pool. The method definitions described here on the
 * Message class are provided on each concrete message class.
 */
VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
  VALUE hash_args;

  // With no arguments there is nothing to apply.
  if (argc == 0) {
    return Qnil;
  }
  if (argc != 1) {
    rb_raise(rb_eArgError, "Expected 0 or 1 arguments.");
  }
  hash_args = argv[0];
  if (TYPE(hash_args) != T_HASH) {
    rb_raise(rb_eArgError, "Expected hash arguments.");
  }

  // Apply each key/value pair of the hash to the message.
  rb_hash_foreach(hash_args, Message_initialize_kwarg, _self);
  return Qnil;
}

/*
 * call-seq:
 *     Message.dup => new_message
 *
 * Performs a shallow copy of this message and returns the new copy.
 */
VALUE Message_dup(VALUE _self) {
  MessageHeader* self;
  VALUE new_msg;
  MessageHeader* new_msg_self;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

  // Create an empty instance of the same class, then copy the field data
  // into it with layout_dup().
  new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
  TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);

  layout_dup(self->descriptor->layout,
             Message_data(new_msg_self),
             Message_data(self));

  return new_msg;
}

// Internal only; used by Google::Protobuf.deep_copy.
//
// Creates an empty instance of |_self|'s class and fills it from |_self| with
// layout_deep_copy(). Returns the new message.
VALUE Message_deep_copy(VALUE _self) {
  MessageHeader* self;
  MessageHeader* new_msg_self;
  VALUE new_msg;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

  new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
  TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);

  layout_deep_copy(self->descriptor->layout,
                   Message_data(new_msg_self),
                   Message_data(self));

  return new_msg;
}

/*
 * call-seq:
 *     Message.==(other) => boolean
 *
 * Performs a deep comparison of this message with another. Messages are equal
 * if they have the same type and if each field is equal according to the :==
 * method's semantics (a more efficient comparison may actually be done if the
 * field is of a primitive type).
 */
VALUE Message_eq(VALUE _self, VALUE _other) {
  MessageHeader* self;
  MessageHeader* other;
  // Objects of a different built-in Ruby type can never be equal to a message.
  if (TYPE(_self) != TYPE(_other)) {
    return Qfalse;
  }
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  TypedData_Get_Struct(_other, MessageHeader, &Message_type, other);

  // Messages with different descriptors are never equal.
  if (self->descriptor != other->descriptor) {
    return Qfalse;
  }

  return layout_eq(self->descriptor->layout,
                   Message_data(self),
                   Message_data(other));
}

/*
 * call-seq:
 *     Message.hash => hash_value
 *
 * Returns a hash value computed from the field values of this message.
 */
VALUE Message_hash(VALUE _self) {
  MessageHeader* msg;
  void* data;

  TypedData_Get_Struct(_self, MessageHeader, &Message_type, msg);
  data = Message_data(msg);

  return layout_hash(msg->descriptor->layout, data);
}

/*
 * call-seq:
 *     Message.inspect => string
 *
 * Returns a human-readable string representing this message. It will be
 * formatted as "<MessageType: field1: value1, field2: value2, ...>". Each
 * field's value is represented according to its own #inspect method.
 */
VALUE Message_inspect(VALUE _self) {
  MessageHeader* self;
  VALUE str;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

  // "<" + class name + ": " + layout_inspect() output + ">"
  str = rb_str_new2("<");
  str = rb_str_append(str, rb_str_new2(rb_class2name(CLASS_OF(_self))));
  str = rb_str_cat2(str, ": ");
  str = rb_str_append(str, layout_inspect(
      self->descriptor->layout, Message_data(self)));
  str = rb_str_cat2(str, ">");
  return str;
}

/*
 * call-seq:
 *     Message.to_h => {}
 *
 * Returns the message as a Ruby Hash object, with keys as symbols.
 */
599 600
VALUE Message_to_h(VALUE _self) {
  MessageHeader* self;
601 602
  VALUE hash;
  upb_msg_field_iter it;
603 604
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

605
  hash = rb_hash_new();
606 607 608 609 610

  for (upb_msg_field_begin(&it, self->descriptor->msgdef);
       !upb_msg_field_done(&it);
       upb_msg_field_next(&it)) {
    const upb_fielddef* field = upb_msg_iter_field(&it);
611 612 613 614 615 616 617 618

    // For proto2, do not include fields which are not set.
    if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
	field_contains_hasbit(self->descriptor->layout, field) &&
	!layout_has(self->descriptor->layout, Message_data(self), field)) {
      continue;
    }

619 620
    VALUE msg_value = layout_get(self->descriptor->layout, Message_data(self),
                                 field);
621
    VALUE msg_key   = ID2SYM(rb_intern(upb_fielddef_name(field)));
622
    if (is_map_field(field)) {
623 624
      msg_value = Map_to_h(msg_value);
    } else if (upb_fielddef_label(field) == UPB_LABEL_REPEATED) {
625
      msg_value = RepeatedField_to_ary(msg_value);
626 627 628 629
      if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
          RARRAY_LEN(msg_value) == 0) {
        continue;
      }
630

Zachary Anker's avatar
Zachary Anker committed
631
      if (upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
632 633 634 635 636
        for (int i = 0; i < RARRAY_LEN(msg_value); i++) {
          VALUE elem = rb_ary_entry(msg_value, i);
          rb_ary_store(msg_value, i, Message_to_h(elem));
        }
      }
637

638 639 640
    } else if (msg_value != Qnil &&
               upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
      msg_value = Message_to_h(msg_value);
641 642 643 644 645 646 647 648
    }
    rb_hash_aset(hash, msg_key, msg_value);
  }
  return hash;
}



/*
 * call-seq:
 *     Message.[](index) => value
 *
 * Accesses a field's value by field name. The provided field name should be a
 * string. Returns nil if the message has no field with that name.
 */
VALUE Message_index(VALUE _self, VALUE field_name) {
  MessageHeader* self;
  const upb_fielddef* field;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  Check_Type(field_name, T_STRING);
  field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
  if (field == NULL) {
    return Qnil;
  }
  return layout_get(self->descriptor->layout, Message_data(self), field);
}

/*
 * call-seq:
 *     Message.[]=(index, value)
 *
 * Sets a field's value by field name. The provided field name should be a
 * string. Raises ArgumentError if the message has no field with that name.
 */
VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
  MessageHeader* self;
  const upb_fielddef* field;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  Check_Type(field_name, T_STRING);
  field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
  if (field == NULL) {
    rb_raise(rb_eArgError, "Unknown field: %s", RSTRING_PTR(field_name));
  }
  layout_set(self->descriptor->layout, Message_data(self), field, value);
  return Qnil;
}

/*
 * call-seq:
 *     Message.descriptor => descriptor
 *
 * Class method that returns the Descriptor instance corresponding to this
 * message class's type.
 */
VALUE Message_descriptor(VALUE klass) {
  return rb_ivar_get(klass, descriptor_instancevar_interned);
}

// Creates the Ruby class for the message type described by |desc|.
//
// Creates desc->layout and desc->fill_method if they are still NULL, raises
// RuntimeError if the message definition has no full name, stores the
// descriptor object on the new class, installs Message_alloc as its allocator,
// mixes in Google::Protobuf::MessageExts (and its ClassMethods), and defines
// the instance and singleton methods implemented in C. Returns the new class.
VALUE build_class_from_descriptor(Descriptor* desc) {
  const char *name;
  VALUE klass;

  if (desc->layout == NULL) {
    desc->layout = create_layout(desc->msgdef);
  }
  if (desc->fill_method == NULL) {
    desc->fill_method = new_fillmsg_decodermethod(desc, &desc->fill_method);
  }

  name = upb_msgdef_fullname(desc->msgdef);
  if (name == NULL) {
    rb_raise(rb_eRuntimeError, "Descriptor does not have assigned name.");
  }

  klass = rb_define_class_id(
      // Docs say this parameter is ignored. User will assign return value to
      // their own toplevel constant class name.
      rb_intern("Message"),
      rb_cObject);
  rb_ivar_set(klass, descriptor_instancevar_interned,
              get_def_obj(desc->msgdef));
  rb_define_alloc_func(klass, Message_alloc);
  rb_require("google/protobuf/message_exts");
  rb_include_module(klass, rb_eval_string("::Google::Protobuf::MessageExts"));
  rb_extend_object(
      klass, rb_eval_string("::Google::Protobuf::MessageExts::ClassMethods"));

  rb_define_method(klass, "method_missing",
                   Message_method_missing, -1);
  rb_define_method(klass, "respond_to_missing?",
                   Message_respond_to_missing, -1);
  rb_define_method(klass, "initialize", Message_initialize, -1);
  rb_define_method(klass, "dup", Message_dup, 0);
  // Also define #clone so that we don't inherit Object#clone.
  rb_define_method(klass, "clone", Message_dup, 0);
  rb_define_method(klass, "==", Message_eq, 1);
  rb_define_method(klass, "eql?", Message_eq, 1);
  rb_define_method(klass, "hash", Message_hash, 0);
  rb_define_method(klass, "to_h", Message_to_h, 0);
  rb_define_method(klass, "to_hash", Message_to_h, 0);
  rb_define_method(klass, "inspect", Message_inspect, 0);
  rb_define_method(klass, "to_s", Message_inspect, 0);
  rb_define_method(klass, "[]", Message_index, 1);
  rb_define_method(klass, "[]=", Message_index_set, 2);
  rb_define_singleton_method(klass, "decode", Message_decode, 1);
  rb_define_singleton_method(klass, "encode", Message_encode, 1);
  rb_define_singleton_method(klass, "decode_json", Message_decode_json, -1);
  rb_define_singleton_method(klass, "encode_json", Message_encode_json, -1);
  rb_define_singleton_method(klass, "descriptor", Message_descriptor, 0);

  return klass;
}

/*
 * call-seq:
 *     Enum.lookup(number) => name
 *
 * This module method, provided on each generated enum module, looks up an enum
 * value by number and returns its name as a Ruby symbol, or nil if not found.
 */
VALUE enum_lookup(VALUE self, VALUE number) {
  int32_t num = NUM2INT(number);
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
  EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);

  const char* name = upb_enumdef_iton(enumdesc->enumdef, num);
  if (name == NULL) {
    return Qnil;
  } else {
    return ID2SYM(rb_intern(name));
  }
}

/*
 * call-seq:
 *     Enum.resolve(name) => number
 *
 * This module method, provided on each generated enum module, looks up an enum
 * value by name (as a Ruby symbol) and returns its number, or nil if not found.
 */
VALUE enum_resolve(VALUE self, VALUE sym) {
  const char* name = rb_id2name(SYM2ID(sym));
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
  EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);

  int32_t num = 0;
  bool found = upb_enumdef_ntoiz(enumdesc->enumdef, name, &num);
  if (!found) {
    return Qnil;
  } else {
    return INT2NUM(num);
  }
}

/*
 * call-seq:
 *     Enum.descriptor
 *
 * This module method, provided on each generated enum module, returns the
 * EnumDescriptor corresponding to this enum type.
 */
VALUE enum_descriptor(VALUE self) {
  return rb_ivar_get(self, descriptor_instancevar_interned);
}

// Creates the Ruby module for the enum type described by |enumdesc|.
//
// Every enum value becomes an integer constant on the module (with a warning
// for names that do not start with an uppercase ASCII letter), the singleton
// methods lookup, resolve and descriptor are defined, and the descriptor
// object is stored on the module. Returns the new module.
VALUE build_module_from_enumdesc(EnumDescriptor* enumdesc) {
  VALUE mod = rb_define_module_id(
      rb_intern(upb_enumdef_fullname(enumdesc->enumdef)));

  upb_enum_iter it;
  for (upb_enum_begin(&it, enumdesc->enumdef);
       !upb_enum_done(&it);
       upb_enum_next(&it)) {
    const char* name = upb_enum_iter_name(&it);
    int32_t value = upb_enum_iter_number(&it);
    if (name[0] < 'A' || name[0] > 'Z') {
      rb_warn("Enum value '%s' does not start with an uppercase letter "
              "as is required for Ruby constants.",
              name);
    }
    rb_define_const(mod, name, INT2NUM(value));
  }

  rb_define_singleton_method(mod, "lookup", enum_lookup, 1);
  rb_define_singleton_method(mod, "resolve", enum_resolve, 1);
  rb_define_singleton_method(mod, "descriptor", enum_descriptor, 0);
  rb_ivar_set(mod, descriptor_instancevar_interned,
              get_def_obj(enumdesc->enumdef));

  return mod;
}

/*
 * call-seq:
 *     Google::Protobuf.deep_copy(obj) => copy_of_obj
 *
 * Performs a deep copy of a RepeatedField instance, a Map instance, or a
 * message object, recursively copying its members.
 */
VALUE Google_Protobuf_deep_copy(VALUE self, VALUE obj) {
  VALUE klass = CLASS_OF(obj);
  if (klass == cRepeatedField) {
    return RepeatedField_deep_copy(obj);
  } else if (klass == cMap) {
    return Map_deep_copy(obj);
  } else {
    // Anything that is neither a RepeatedField nor a Map is treated as a
    // message.
    return Message_deep_copy(obj);
  }
}