message.c 25.2 KB
Newer Older
Chris Fallin's avatar
Chris Fallin committed
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46
// Protocol Buffers - Google's data interchange format
// Copyright 2014 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

#include "protobuf.h"

// -----------------------------------------------------------------------------
// Class/module creation from msgdefs and enumdefs, respectively.
// -----------------------------------------------------------------------------

// Returns the address immediately past the MessageHeader at the start of the
// allocation |msg| points to, i.e. where the message's field storage begins.
void* Message_data(void* msg) {
  uint8_t* base = (uint8_t*)msg;
  return base + sizeof(MessageHeader);
}

// GC mark callback (installed through Message_type). Hands the message's
// layout and its field storage to layout_mark().
void Message_mark(void* _self) {
  MessageHeader* header = (MessageHeader*)_self;
  void* fields = Message_data(header);
  layout_mark(header->descriptor->layout, fields);
}

void Message_free(void* self) {
47 48 49 50 51
  stringsink* unknown = ((MessageHeader *)self)->unknown_fields;
  if (unknown != NULL) {
    stringsink_uninit(unknown);
    free(unknown);
  }
Chris Fallin's avatar
Chris Fallin committed
52 53 54 55 56 57 58 59 60
  xfree(self);
}

rb_data_type_t Message_type = {
  "Message",
  { Message_mark, Message_free, NULL },
};

// Allocation function for message classes (see rb_define_alloc_func in
// build_class_from_descriptor).
//
// Looks up the Descriptor stored on |klass|, lazily creates its layout, and
// allocates a MessageHeader followed by layout->size bytes of field storage.
// Returns the wrapped Ruby object.
VALUE Message_alloc(VALUE klass) {
  VALUE descriptor = rb_ivar_get(klass, descriptor_instancevar_interned);
  Descriptor* desc = ruby_to_Descriptor(descriptor);
  MessageHeader* msg;
  VALUE ret;

  if (desc->layout == NULL) {
    desc->layout = create_layout(desc);
  }

  msg = (MessageHeader*)ALLOC_N(
      uint8_t, sizeof(MessageHeader) + desc->layout->size);

  // Initialize the whole header and zero the field storage *before* the
  // struct is handed to the GC: Message_mark() dereferences msg->descriptor
  // and Message_free() reads msg->unknown_fields, so neither may ever be seen
  // uninitialized, even if a later call in this function raises.
  msg->descriptor = desc;
  msg->unknown_fields = NULL;
  memset(Message_data(msg), 0, desc->layout->size);

  // We wrap before layout_init() so that everything in the message object is
  // GC-rooted in case a collection happens during object creation there.
  ret = TypedData_Wrap_Struct(klass, &Message_type, msg);
  rb_ivar_set(ret, descriptor_instancevar_interned, descriptor);

  layout_init(desc->layout, Message_data(msg));

  return ret;
}

87
// Returns the fielddef of the member of oneof |o| that is currently set in
// |self|, or NULL when the oneof has no fields or no member is set.
static const upb_fielddef* which_oneof_field(MessageHeader* self, const upb_oneofdef* o) {
  upb_oneof_iter it;
  size_t case_ofs;
  uint32_t oneof_case;
  const upb_fielddef* first_field;
  const upb_fielddef* f;

  // If no fields in the oneof, always nil.
  if (upb_oneofdef_numfields(o) == 0) {
    return NULL;
  }

  // Grab the first field in the oneof so we can get its layout info to find the
  // oneof_case field.
  upb_oneof_begin(&it, o);
  assert(!upb_oneof_done(&it));
  first_field = upb_oneof_iter_field(&it);
  assert(upb_fielddef_containingoneof(first_field) != NULL);

  // The case slot is read from the message's field storage at the offset the
  // layout records for that first field.
  case_ofs =
      self->descriptor->layout->
      fields[upb_fielddef_index(first_field)].case_offset;
  oneof_case = *((uint32_t*)((char*)Message_data(self) + case_ofs));

  if (oneof_case == ONEOF_CASE_NONE) {
    return NULL;
  }

  // oneof_case is a field index, so find that field.
  f = upb_oneofdef_itof(o, oneof_case);
  assert(f != NULL);

  return f;
}

// Kinds of dynamically dispatched method call recognized by
// extract_method_call().
enum {
  METHOD_UNKNOWN = 0,      // name does not map to a field or oneof
  METHOD_GETTER = 1,       // "foo"
  METHOD_SETTER = 2,       // "foo="
  METHOD_CLEAR = 3,        // "clear_foo"
  METHOD_PRESENCE = 4,     // "has_foo?"
  METHOD_ENUM_GETTER = 5   // "foo_const" on an enum field
};

// Classifies a dynamically dispatched method name against the fields and
// oneofs of |self|'s message definition.
//
// |method_name| must be a Symbol (Check_Type raises otherwise). Recognized
// shapes are "foo" (getter), "foo=" (setter), "clear_foo", "has_foo?" and
// "foo_const" (enum getter, only when "foo" is an enum field).
//
// On a match, stores the lookup results in |*f| and |*o| and returns the
// corresponding METHOD_* code. Otherwise returns METHOD_UNKNOWN and leaves
// both outputs NULL.
static int extract_method_call(VALUE method_name, MessageHeader* self,
                               const upb_fielddef **f, const upb_oneofdef **o) {
  VALUE method_str;
  char* name;
  size_t name_len;
  int accessor_type;
  bool has_field;
  const upb_oneofdef* test_o;
  const upb_fielddef* test_f;

  *f = NULL;
  *o = NULL;

  Check_Type(method_name, T_SYMBOL);

  method_str = rb_id2str(SYM2ID(method_name));
  name = RSTRING_PTR(method_str);
  name_len = RSTRING_LEN(method_str);

  // An empty name cannot match anything; bail out before indexing
  // name[name_len - 1] below.
  if (name_len == 0) {
    return METHOD_UNKNOWN;
  }

  if (name[name_len - 1] == '=') {
    accessor_type = METHOD_SETTER;
    name_len--;
    // We want to ensure if the proto has something named clear_foo or has_foo?,
    // we don't strip the prefix.
  } else if (strncmp("clear_", name, 6) == 0 &&
             !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
                                    &test_f, &test_o)) {
    accessor_type = METHOD_CLEAR;
    name = name + 6;
    name_len = name_len - 6;
  } else if (strncmp("has_", name, 4) == 0 && name[name_len - 1] == '?' &&
             !upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
                                    &test_f, &test_o)) {
    accessor_type = METHOD_PRESENCE;
    name = name + 4;
    // Drop both the "has_" prefix and the trailing '?'.
    name_len = name_len - 5;
  } else {
    accessor_type = METHOD_GETTER;
  }

  has_field = upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len,
                                    &test_f, &test_o);

  // Look for enum accessor of the form <enum_name>_const
  if (!has_field && accessor_type == METHOD_GETTER &&
      name_len > 6 && strncmp(name + name_len - 6, "_const", 6) == 0) {
    const upb_oneofdef* test_o_enum;
    const upb_fielddef* test_f_enum;

    // The lookup is length-delimited, so the enum field name can be passed as
    // a prefix of |name| directly; no temporary copy is needed.
    if (upb_msgdef_lookupname(self->descriptor->msgdef, name, name_len - 6,
                              &test_f_enum, &test_o_enum) &&
        upb_fielddef_type(test_f_enum) == UPB_TYPE_ENUM) {
      // It does exist!
      has_field = true;
      accessor_type = METHOD_ENUM_GETTER;
      test_o = test_o_enum;
      test_f = test_f_enum;
    }
  }

  // Verify the name corresponds to a oneof or field in this message.
  if (!has_field) {
    return METHOD_UNKNOWN;
  }

  // Method calls like 'has_foo?' are not allowed if field "foo" does not have
  // a hasbit (e.g. repeated fields or non-message type fields for proto3
  // syntax).
  if (accessor_type == METHOD_PRESENCE && test_f != NULL &&
      !upb_fielddef_haspresence(test_f)) {
    return METHOD_UNKNOWN;
  }

  *o = test_o;
  *f = test_f;
  return accessor_type;
}

Chris Fallin's avatar
Chris Fallin committed
206 207 208 209
/*
 * call-seq:
 *     Message.method_missing(*args)
 *
 * Provides accessors and setters and methods to clear and check for presence of
 * message fields according to their field names.
 *
 * For any field whose name does not conflict with a built-in method, an
 * accessor is provided with the same name as the field, and a setter is
 * provided with the name of the field plus the '=' suffix. Thus, given a
 * message instance 'msg' with field 'foo', the following code is valid:
 *
 *     msg.foo = 42
 *     puts msg.foo
 *
 * This method also provides read-only accessors for oneofs. If a oneof exists
 * with name 'my_oneof', then msg.my_oneof will return a Ruby symbol equal to
 * the name of the field in that oneof that is currently set, or nil if none.
 *
 * It also provides methods of the form 'clear_fieldname' to clear the value
 * of the field 'fieldname'. For basic data types, this will set the default
 * value of the field.
 *
 * Additionally, it provides methods of the form 'has_fieldname?', which returns
 * true if the field 'fieldname' is set in the message object, else false. For
 * 'proto3' syntax, calling this for a basic type field will result in an error.
 *
 * For enum fields, a getter of the form 'fieldname_const' is also provided; it
 * passes the field's value (or each element, for repeated fields) through
 * const_get on the field's enum type.
 */
VALUE Message_method_missing(int argc, VALUE* argv, VALUE _self) {
  MessageHeader* self;
  const upb_oneofdef* o = NULL;
  const upb_fielddef* f = NULL;
  int accessor_type;

  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  if (argc < 1) {
    rb_raise(rb_eArgError, "Expected method name as first argument.");
  }

  accessor_type = extract_method_call(argv[0], self, &f, &o);
  if (accessor_type == METHOD_UNKNOWN || (o == NULL && f == NULL)) {
    // Not one of ours: defer to the superclass implementation.
    return rb_call_super(argc, argv);
  } else if (accessor_type == METHOD_SETTER) {
    if (argc != 2) {
      rb_raise(rb_eArgError, "Expected 2 arguments, received %d", argc);
    }
    rb_check_frozen(_self);
  } else if (argc != 1) {
    rb_raise(rb_eArgError, "Expected 1 argument, received %d", argc);
  }

  // Return which of the oneof fields are set
  if (o != NULL) {
    const upb_fielddef* oneof_field;

    if (accessor_type == METHOD_SETTER) {
      rb_raise(rb_eRuntimeError, "Oneof accessors are read-only.");
    }

    oneof_field = which_oneof_field(self, o);
    if (accessor_type == METHOD_PRESENCE) {
      return oneof_field == NULL ? Qfalse : Qtrue;
    } else if (accessor_type == METHOD_CLEAR) {
      if (oneof_field != NULL) {
        layout_clear(self->descriptor->layout, Message_data(self), oneof_field);
      }
      return Qnil;
    } else {
      // METHOD_GETTER: name of the member that is set, as a symbol.
      return oneof_field == NULL ? Qnil :
        ID2SYM(rb_intern(upb_fielddef_name(oneof_field)));
    }
  // Otherwise we're operating on a single proto field
  } else if (accessor_type == METHOD_SETTER) {
    layout_set(self->descriptor->layout, Message_data(self), f, argv[1]);
    return Qnil;
  } else if (accessor_type == METHOD_CLEAR) {
    layout_clear(self->descriptor->layout, Message_data(self), f);
    return Qnil;
  } else if (accessor_type == METHOD_PRESENCE) {
    return layout_has(self->descriptor->layout, Message_data(self), f);
  } else if (accessor_type == METHOD_ENUM_GETTER) {
    VALUE enum_type = field_type_class(self->descriptor->layout, f);
    ID const_get = rb_intern("const_get");
    VALUE raw_value = layout_get(self->descriptor->layout, Message_data(self), f);

    // Map repeated fields to a new type with ints
    if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
      int array_size = FIX2INT(rb_funcall(raw_value, rb_intern("length"), 0));
      VALUE array_args[1] = { ID2SYM(rb_intern("int64")) };
      VALUE array = rb_class_new_instance(1, array_args, CLASS_OF(raw_value));
      for (int i = 0; i < array_size; i++) {
        VALUE element = rb_funcall(raw_value, rb_intern("at"), 1, INT2NUM(i));
        VALUE entry = rb_funcall(enum_type, const_get, 1, element);
        rb_funcall(array, rb_intern("push"), 1, entry);
      }
      return array;
    }
    // Convert the value for singular fields
    return rb_funcall(enum_type, const_get, 1, raw_value);
  } else {
    return layout_get(self->descriptor->layout, Message_data(self), f);
  }
}

307

308 309 310 311 312 313 314 315 316 317
// Implements respond_to_missing? for message classes, mirroring the names
// Message_method_missing() handles. argv[0] is the method name symbol.
//
// Unknown names are deferred to the superclass. Oneof names respond to
// everything except the setter form; field names always respond.
VALUE Message_respond_to_missing(int argc, VALUE* argv, VALUE _self) {
  MessageHeader* self;
  const upb_oneofdef* o = NULL;
  const upb_fielddef* f = NULL;
  int accessor_type;

  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  if (argc < 1) {
    rb_raise(rb_eArgError, "Expected method name as first argument.");
  }

  accessor_type = extract_method_call(argv[0], self, &f, &o);
  if (accessor_type == METHOD_UNKNOWN) {
    return rb_call_super(argc, argv);
  } else if (o != NULL) {
    return accessor_type == METHOD_SETTER ? Qfalse : Qtrue;
  } else {
    return Qtrue;
  }
}

328 329 330
// Instantiates the message class of submessage field |f| (as resolved by
// field_type_class() against |layout|), passing |hash| as the sole
// constructor argument. Returns the new instance.
VALUE create_submsg_from_hash(const MessageLayout* layout,
                              const upb_fielddef* f, VALUE hash) {
  const upb_msgdef *d = upb_fielddef_msgsubdef(f);
  VALUE args[1] = { hash };

  assert(d != NULL);
  (void)d;  // Only consulted by the assert; keeps NDEBUG builds warning-free.

  return rb_class_new_instance(1, args, field_type_class(layout, f));
}

Chris Fallin's avatar
Chris Fallin committed
337 338
// rb_hash_foreach() callback used by Message_initialize(): applies a single
// key/value pair of the initializer hash to the message |_self|.
//
// |key| must be a String or Symbol naming a field; raises ArgumentError for
// any other key type or for an unknown field name. A nil |val| is skipped.
// Map fields require a Hash and repeated fields require an Array
// (ArgumentError otherwise). Hash values given for submessage fields (or
// elements of repeated submessage fields) are converted to message instances
// first.
//
// Always returns 0, so iteration over the hash continues.
int Message_initialize_kwarg(VALUE key, VALUE val, VALUE _self) {
  MessageHeader* self;
  char *name;
  const upb_fielddef* f;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

  if (TYPE(key) == T_STRING) {
    name = RSTRING_PTR(key);
  } else if (TYPE(key) == T_SYMBOL) {
    name = RSTRING_PTR(rb_id2str(SYM2ID(key)));
  } else {
    rb_raise(rb_eArgError,
             "Expected string or symbols as hash keys when initializing proto from hash.");
  }

  f = upb_msgdef_ntofz(self->descriptor->msgdef, name);
  if (f == NULL) {
    rb_raise(rb_eArgError,
             "Unknown field name '%s' in initialization map entry.", name);
  }

  // A nil value leaves the field untouched.
  if (TYPE(val) == T_NIL) {
    return 0;
  }

  if (is_map_field(f)) {
    VALUE map;

    if (TYPE(val) != T_HASH) {
      rb_raise(rb_eArgError,
               "Expected Hash object as initializer value for map field '%s' (given %s).",
               name, rb_class2name(CLASS_OF(val)));
    }
    map = layout_get(self->descriptor->layout, Message_data(self), f);
    Map_merge_into_self(map, val);
  } else if (upb_fielddef_label(f) == UPB_LABEL_REPEATED) {
    VALUE ary;

    if (TYPE(val) != T_ARRAY) {
      rb_raise(rb_eArgError,
               "Expected array as initializer value for repeated field '%s' (given %s).",
               name, rb_class2name(CLASS_OF(val)));
    }
    ary = layout_get(self->descriptor->layout, Message_data(self), f);
    // RARRAY_LEN() yields a long, so index with a long as well.
    for (long i = 0; i < RARRAY_LEN(val); i++) {
      VALUE entry = rb_ary_entry(val, i);
      if (TYPE(entry) == T_HASH && upb_fielddef_issubmsg(f)) {
        entry = create_submsg_from_hash(self->descriptor->layout, f, entry);
      }

      RepeatedField_push(ary, entry);
    }
  } else {
    if (TYPE(val) == T_HASH && upb_fielddef_issubmsg(f)) {
      val = create_submsg_from_hash(self->descriptor->layout, f, val);
    }

    layout_set(self->descriptor->layout, Message_data(self), f, val);
  }
  return 0;
}

/*
 * call-seq:
 *     Message.new(kwargs) => new_message
 *
 * Creates a new instance of the given message class. Keyword arguments may be
 * provided with keywords corresponding to field names.
 *
 * Raises ArgumentError if more than one argument is given or if the argument
 * is not a Hash.
 *
 * Note that no literal Message class exists. Only concrete classes per message
 * type exist, as provided by the #msgclass method on Descriptors after they
 * have been added to a pool. The method definitions described here on the
 * Message class are provided on each concrete message class.
 */
VALUE Message_initialize(int argc, VALUE* argv, VALUE _self) {
  VALUE hash_args;

  // No arguments: keep the state set up by the allocator.
  if (argc == 0) {
    return Qnil;
  }
  if (argc != 1) {
    rb_raise(rb_eArgError, "Expected 0 or 1 arguments.");
  }
  hash_args = argv[0];
  if (TYPE(hash_args) != T_HASH) {
    rb_raise(rb_eArgError, "Expected hash arguments.");
  }

  // Apply each key/value pair to the message.
  rb_hash_foreach(hash_args, Message_initialize_kwarg, _self);
  return Qnil;
}

/*
 * call-seq:
 *     Message.dup => new_message
 *
 * Performs a shallow copy of this message and returns the new copy.
 */
VALUE Message_dup(VALUE _self) {
  MessageHeader* self;
  VALUE new_msg;
  MessageHeader* new_msg_self;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

  // Create a fresh instance of the same class, then copy the field storage
  // into it.
  new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
  TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);

  layout_dup(self->descriptor->layout,
             Message_data(new_msg_self),
             Message_data(self));

  return new_msg;
}

// Internal only; used by Google::Protobuf.deep_copy.
//
// Creates a fresh instance of |_self|'s class and fills its field storage
// from |_self| via layout_deep_copy(). Returns the new message.
VALUE Message_deep_copy(VALUE _self) {
  MessageHeader* self;
  MessageHeader* new_msg_self;
  VALUE new_msg;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

  new_msg = rb_class_new_instance(0, NULL, CLASS_OF(_self));
  TypedData_Get_Struct(new_msg, MessageHeader, &Message_type, new_msg_self);

  layout_deep_copy(self->descriptor->layout,
                   Message_data(new_msg_self),
                   Message_data(self));

  return new_msg;
}

/*
 * call-seq:
 *     Message.==(other) => boolean
 *
 * Performs a deep comparison of this message with another. Messages are equal
 * if they have the same type and if each field is equal according to the :==
 * method's semantics (a more efficient comparison may actually be done if the
 * field is of a primitive type). Comparing against anything that is not a
 * message returns false.
 */
VALUE Message_eq(VALUE _self, VALUE _other) {
  MessageHeader* self;
  MessageHeader* other;

  // Reject anything that is not a message up front. Comparing only TYPE()
  // would let other typed-data objects through, and TypedData_Get_Struct()
  // would then raise instead of the comparison returning false.
  if (!rb_typeddata_is_kind_of(_other, &Message_type)) {
    return Qfalse;
  }

  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  TypedData_Get_Struct(_other, MessageHeader, &Message_type, other);

  // Messages of different descriptors are never equal.
  if (self->descriptor != other->descriptor) {
    return Qfalse;
  }

  return layout_eq(self->descriptor->layout,
                   Message_data(self),
                   Message_data(other));
}

/*
 * call-seq:
 *     Message.hash => hash_value
 *
 * Computes a hash value from the values of this message's fields.
 */
VALUE Message_hash(VALUE _self) {
  MessageHeader* msg;
  void* fields;

  TypedData_Get_Struct(_self, MessageHeader, &Message_type, msg);
  fields = Message_data(msg);

  return layout_hash(msg->descriptor->layout, fields);
}

/*
 * call-seq:
 *     Message.inspect => string
 *
 * Returns a human-readable string representing this message. It will be
 * formatted as "<MessageType: field1: value1, field2: value2, ...>". Each
 * field's value is represented according to its own #inspect method.
 */
VALUE Message_inspect(VALUE _self) {
  MessageHeader* self;
  VALUE str;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

  // "<" + class name + ": " + field listing + ">"
  str = rb_str_new2("<");
  str = rb_str_append(str, rb_str_new2(rb_class2name(CLASS_OF(_self))));
  str = rb_str_cat2(str, ": ");
  str = rb_str_append(str, layout_inspect(
      self->descriptor->layout, Message_data(self)));
  str = rb_str_cat2(str, ">");
  return str;
}

530 531 532 533 534 535
/*
 * call-seq:
 *     Message.to_h => {}
 *
 * Returns the message as a Ruby Hash object, with keys as symbols.
 */
536 537
VALUE Message_to_h(VALUE _self) {
  MessageHeader* self;
538 539
  VALUE hash;
  upb_msg_field_iter it;
540 541
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);

542
  hash = rb_hash_new();
543 544 545 546 547

  for (upb_msg_field_begin(&it, self->descriptor->msgdef);
       !upb_msg_field_done(&it);
       upb_msg_field_next(&it)) {
    const upb_fielddef* field = upb_msg_iter_field(&it);
548 549 550 551 552 553 554 555

    // For proto2, do not include fields which are not set.
    if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
	field_contains_hasbit(self->descriptor->layout, field) &&
	!layout_has(self->descriptor->layout, Message_data(self), field)) {
      continue;
    }

556 557
    VALUE msg_value = layout_get(self->descriptor->layout, Message_data(self),
                                 field);
558
    VALUE msg_key   = ID2SYM(rb_intern(upb_fielddef_name(field)));
559
    if (is_map_field(field)) {
560 561
      msg_value = Map_to_h(msg_value);
    } else if (upb_fielddef_label(field) == UPB_LABEL_REPEATED) {
562
      msg_value = RepeatedField_to_ary(msg_value);
563 564 565 566
      if (upb_msgdef_syntax(self->descriptor->msgdef) == UPB_SYNTAX_PROTO2 &&
          RARRAY_LEN(msg_value) == 0) {
        continue;
      }
567

Zachary Anker's avatar
Zachary Anker committed
568
      if (upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
569 570 571 572 573
        for (int i = 0; i < RARRAY_LEN(msg_value); i++) {
          VALUE elem = rb_ary_entry(msg_value, i);
          rb_ary_store(msg_value, i, Message_to_h(elem));
        }
      }
574

575 576 577
    } else if (msg_value != Qnil &&
               upb_fielddef_type(field) == UPB_TYPE_MESSAGE) {
      msg_value = Message_to_h(msg_value);
578 579 580 581 582 583 584 585
    }
    rb_hash_aset(hash, msg_key, msg_value);
  }
  return hash;
}



Chris Fallin's avatar
Chris Fallin committed
586 587 588 589 590 591 592 593 594
/*
 * call-seq:
 *     Message.[](index) => value
 *
 * Accesses a field's value by field name. The provided field name should be a
 * string. Returns nil if the message has no field with that name.
 */
VALUE Message_index(VALUE _self, VALUE field_name) {
  MessageHeader* self;
  const upb_fielddef* field;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  Check_Type(field_name, T_STRING);
  field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
  if (field == NULL) {
    return Qnil;
  }
  return layout_get(self->descriptor->layout, Message_data(self), field);
}

/*
 * call-seq:
 *     Message.[]=(index, value)
 *
 * Sets a field's value by field name. The provided field name should be a
 * string. Raises ArgumentError if the message has no field with that name.
 */
VALUE Message_index_set(VALUE _self, VALUE field_name, VALUE value) {
  MessageHeader* self;
  const upb_fielddef* field;
  TypedData_Get_Struct(_self, MessageHeader, &Message_type, self);
  Check_Type(field_name, T_STRING);
  field = upb_msgdef_ntofz(self->descriptor->msgdef, RSTRING_PTR(field_name));
  if (field == NULL) {
    rb_raise(rb_eArgError, "Unknown field: %s", RSTRING_PTR(field_name));
  }
  // NOTE(review): the 'foo=' setter in Message_method_missing() calls
  // rb_check_frozen() before writing; this path does not. Confirm whether
  // frozen messages are meant to be writable through []=.
  layout_set(self->descriptor->layout, Message_data(self), field, value);
  return Qnil;
}

/*
 * call-seq:
 *     Message.descriptor => descriptor
 *
 * Class method that returns the Descriptor instance corresponding to this
 * message class's type.
 */
VALUE Message_descriptor(VALUE klass) {
  return rb_ivar_get(klass, descriptor_instancevar_interned);
}

636 637
// Builds and returns a new Ruby class for the message type described by
// |descriptor|. The descriptor is stored on the class, Message_alloc is
// installed as its allocator, the MessageExts modules are mixed in, and the
// instance and singleton methods implemented in this file are defined on it.
//
// Raises RuntimeError if the descriptor's msgdef has no full name.
VALUE build_class_from_descriptor(VALUE descriptor) {
  Descriptor* desc = ruby_to_Descriptor(descriptor);
  const char *name;
  VALUE klass;

  name = upb_msgdef_fullname(desc->msgdef);
  if (name == NULL) {
    rb_raise(rb_eRuntimeError, "Descriptor does not have assigned name.");
  }

  klass = rb_define_class_id(
      // Docs say this parameter is ignored. User will assign return value to
      // their own toplevel constant class name.
      rb_intern("Message"),
      rb_cObject);
  rb_ivar_set(klass, descriptor_instancevar_interned, descriptor);
  rb_define_alloc_func(klass, Message_alloc);
  rb_require("google/protobuf/message_exts");
  rb_include_module(klass, rb_eval_string("::Google::Protobuf::MessageExts"));
  rb_extend_object(
      klass, rb_eval_string("::Google::Protobuf::MessageExts::ClassMethods"));

  rb_define_method(klass, "method_missing",
                   Message_method_missing, -1);
  rb_define_method(klass, "respond_to_missing?",
                   Message_respond_to_missing, -1);
  rb_define_method(klass, "initialize", Message_initialize, -1);
  rb_define_method(klass, "dup", Message_dup, 0);
  // Also define #clone so that we don't inherit Object#clone.
  rb_define_method(klass, "clone", Message_dup, 0);
  rb_define_method(klass, "==", Message_eq, 1);
  rb_define_method(klass, "eql?", Message_eq, 1);
  rb_define_method(klass, "hash", Message_hash, 0);
  rb_define_method(klass, "to_h", Message_to_h, 0);
  rb_define_method(klass, "to_hash", Message_to_h, 0);
  rb_define_method(klass, "inspect", Message_inspect, 0);
  rb_define_method(klass, "to_s", Message_inspect, 0);
  rb_define_method(klass, "[]", Message_index, 1);
  rb_define_method(klass, "[]=", Message_index_set, 2);
  rb_define_singleton_method(klass, "decode", Message_decode, 1);
  rb_define_singleton_method(klass, "encode", Message_encode, 1);
  rb_define_singleton_method(klass, "decode_json", Message_decode_json, -1);
  rb_define_singleton_method(klass, "encode_json", Message_encode_json, -1);
  rb_define_singleton_method(klass, "descriptor", Message_descriptor, 0);

  return klass;
}

/*
 * call-seq:
 *     Enum.lookup(number) => name
 *
 * This module method, provided on each generated enum module, looks up an enum
 * value by number and returns its name as a Ruby symbol, or nil if not found.
 */
VALUE enum_lookup(VALUE self, VALUE number) {
  int32_t num = NUM2INT(number);
  VALUE desc = rb_ivar_get(self, descriptor_instancevar_interned);
  EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(desc);

  const char* name = upb_enumdef_iton(enumdesc->enumdef, num);
  if (name == NULL) {
    return Qnil;
  } else {
    return ID2SYM(rb_intern(name));
  }
}

/*
 * call-seq:
 *     Enum.resolve(name) => number
 *
 * This module method, provided on each generated enum module, looks up an enum
 * value by name (as a Ruby symbol) and returns its number, or nil if not found.
 */
VALUE enum_resolve(VALUE self, VALUE sym) {
  const char* name;
  VALUE desc;
  EnumDescriptor* enumdesc;
  int32_t num = 0;
  bool found;

  // SYM2ID() is only meaningful for symbols; reject anything else explicitly.
  Check_Type(sym, T_SYMBOL);

  name = rb_id2name(SYM2ID(sym));
  desc = rb_ivar_get(self, descriptor_instancevar_interned);
  enumdesc = ruby_to_EnumDescriptor(desc);

  found = upb_enumdef_ntoiz(enumdesc->enumdef, name, &num);
  if (!found) {
    return Qnil;
  } else {
    return INT2NUM(num);
  }
}

/*
 * call-seq:
 *     Enum.descriptor
 *
 * This module method, provided on each generated enum module, returns the
 * EnumDescriptor corresponding to this enum type.
 */
VALUE enum_descriptor(VALUE self) {
  return rb_ivar_get(self, descriptor_instancevar_interned);
}

736 737
// Builds and returns a new Ruby module for the enum described by |_enumdesc|.
// Every enum value becomes a constant on the module holding its number, the
// lookup/resolve/descriptor singleton methods are defined, and the descriptor
// is stored on the module.
VALUE build_module_from_enumdesc(VALUE _enumdesc) {
  EnumDescriptor* enumdesc = ruby_to_EnumDescriptor(_enumdesc);
  VALUE mod = rb_define_module_id(
      rb_intern(upb_enumdef_fullname(enumdesc->enumdef)));

  upb_enum_iter it;
  for (upb_enum_begin(&it, enumdesc->enumdef);
       !upb_enum_done(&it);
       upb_enum_next(&it)) {
    const char* name = upb_enum_iter_name(&it);
    int32_t value = upb_enum_iter_number(&it);
    // Only warn here; the constant is still defined below.
    if (name[0] < 'A' || name[0] > 'Z') {
      rb_warn("Enum value '%s' does not start with an uppercase letter "
              "as is required for Ruby constants.",
              name);
    }
    rb_define_const(mod, name, INT2NUM(value));
  }

  rb_define_singleton_method(mod, "lookup", enum_lookup, 1);
  rb_define_singleton_method(mod, "resolve", enum_resolve, 1);
  rb_define_singleton_method(mod, "descriptor", enum_descriptor, 0);
  rb_ivar_set(mod, descriptor_instancevar_interned, _enumdesc);

  return mod;
}

/*
 * call-seq:
 *     Google::Protobuf.deep_copy(obj) => copy_of_obj
 *
 * Performs a deep copy of a RepeatedField instance, a Map instance, or a
 * message object, recursively copying its members.
 */
VALUE Google_Protobuf_deep_copy(VALUE self, VALUE obj) {
  VALUE klass = CLASS_OF(obj);
  if (klass == cRepeatedField) {
    return RepeatedField_deep_copy(obj);
  } else if (klass == cMap) {
    return Map_deep_copy(obj);
  } else {
    // Anything else is treated as a message object.
    return Message_deep_copy(obj);
  }
}