/* protobuf_lang_tree.c * * Routines of building and reading Protocol Buffers Language grammar tree. * Copyright 2019, Huang Qiangxiong * * Wireshark - Network traffic analyzer * By Gerald Combs * Copyright 1998 Gerald Combs * * SPDX-License-Identifier: GPL-2.0-or-later */ #include #include #include #include #include #include "protobuf_lang_tree.h" #include "protobuf-helper.h" /* only for PROTOBUF_TYPE_XXX enumeration */ #define MAX_PROTOBUF_NODE_DEPTH 100 static bool check_node_depth(const pbl_node_t *node) { int depth = 1; for (const pbl_node_t *parent = node; parent ; parent = parent->parent) { depth++; } if (depth > MAX_PROTOBUF_NODE_DEPTH) { return false; } return true; } extern void pbl_parser_error(protobuf_lang_state_t *state, const char *fmt, ...); /* Unescape string to bytes according to: * * strLit = ( { charValue } ) | ( "'" { charValue } "'" ) | ( '"' { charValue } '"' ) * charValue = hexEscape | octEscape | charEscape | /[^\0\n\\]/ * hexEscape = '\' ( "x" | "X" ) hexDigit hexDigit * octEscape = '\' octalDigit octalDigit octalDigit * charEscape = '\' ( "a" | "b" | "f" | "n" | "r" | "t" | "v" | '\' | "'" | '"' ) * * @param src the source escaped string terminated by '\0' * @param [out] size the length of the output byte array. * @return the unescaped byte array, should be released by g_free() */ static char* protobuf_string_unescape(const char* src, int* size) { int src_len; uint8_t* dst, * q; const char* p = src; if (!(src && size && (src_len = (int)strlen(src)))) return NULL; dst = q = (uint8_t *) g_malloc0(src_len + 1); while (p < src + src_len && *p) { if (*p == '\\') { p++; if (*p == 'x' || *p == 'X') { /* unescape hex byte */ *q++ = (uint8_t)strtol(p + 1, (char**)&p, 16); continue; } if (*p >= '0' && *p <= '7') { /* unescape octal byte */ *q++ = (uint8_t)strtol(p, (char**)&p, 8); continue; } switch (*p) { case 'a': *q++ = '\a'; break; case 'b': *q++ = '\b'; break; case 'f': *q++ = '\f'; break; case 'n': *q++ = '\n'; break; case 'r': *q++ = '\r'; break; case 't': *q++ = '\t'; break; case 'v': *q++ = '\v'; break; default: /* include copying '\', "'" or '"' */ *q++ = *p; break; } } else { *q++ = *p; } p++; } *q = 0; *size = (int)(q - dst); return (char*) dst; } /** Reinitialize the protocol buffers pool according to proto files directories. @param ppool The output descriptor_pool will be created. If *pool is not NULL, it will free it first. @param directories The root directories containing proto files. Must end with NULL element. @param error_cb The error reporter callback function. */ void pbl_reinit_descriptor_pool(pbl_descriptor_pool_t** ppool, const char** directories, pbl_report_error_cb_t error_cb) { unsigned i; pbl_free_pool(*ppool); pbl_descriptor_pool_t* p = g_new0(pbl_descriptor_pool_t, 1); p->source_paths = g_queue_new(); for (i = 0; directories[i] != NULL; i++) { g_queue_push_tail(p->source_paths, g_strdup(directories[i])); } p->error_cb = error_cb ? error_cb : pbl_printf; p->packages = g_hash_table_new_full(g_str_hash, g_str_equal, g_free, pbl_free_node); p->proto_files = g_hash_table_new_full(g_str_hash, g_str_equal, g_free, g_free); p->proto_files_to_be_parsed = g_queue_new(); *ppool = p; } /* free all memory used by this protocol buffers language pool */ void pbl_free_pool(pbl_descriptor_pool_t* pool) { if (pool == NULL) return; g_queue_free_full(pool->source_paths, g_free); g_hash_table_destroy(pool->packages); g_queue_free(pool->proto_files_to_be_parsed); /* elements will be removed in p->proto_files */ g_hash_table_destroy(pool->proto_files); g_free(pool); } /* Canonicalize absolute file path. We only accept path like: * /home/test/protos/example.proto * D:/mydir/test/example.proto * d:\mydir\test\example.proto * This function will replace all '\' to '/', and change '//' to '/'. * May use _fullpath() in windows or realpath() in *NIX. * Return a newly-allocated path, NULL if failed (file * does not exist, or file path contains '/../'). */ static char* pbl_canonicalize_absolute_filepath(const char* path) { int i, j; char* canon_path = g_new(char, strlen(path) + 1); /* replace all '\' to '/', and change '//' to '/' */ for (i = 0, j = 0; path[i] != '\0'; i++) { if (path[i] == '\\' || path[i] == '/') { if (j > 0 && canon_path[j-1] == '/') { /* ignore redundant slash */ } else { canon_path[j++] = '/'; } } else { #ifdef _WIN32 canon_path[j++] = g_ascii_tolower(path[i]); #else canon_path[j++] = path[i]; #endif } } canon_path[j] = '\0'; if (g_path_is_absolute(canon_path) && g_file_test(canon_path, G_FILE_TEST_IS_REGULAR) && strstr(canon_path, "/../") == NULL) { return canon_path; } else { g_free(canon_path); return NULL; } } /* Add a file into to do list */ bool pbl_add_proto_file_to_be_parsed(pbl_descriptor_pool_t* pool, const char* filepath) { char* path = NULL; GList* it = NULL; char* concat_path = NULL; /* Try to get the absolute path of the file */ if (g_path_is_absolute(filepath)) { path = pbl_canonicalize_absolute_filepath(filepath); } if (path == NULL) { /* try to concat with source directories */ for (it = g_queue_peek_head_link(pool->source_paths); it; it = it->next) { concat_path = g_build_filename((char*)it->data, filepath, NULL); path = pbl_canonicalize_absolute_filepath(concat_path); g_free(concat_path); if (path) break; } } if (path == NULL) { if (pool->parser_state) { /* only happened during parsing an 'import' line of a .proto file */ pbl_parser_error(pool->parser_state, "file [%s] does not exist!\n", filepath); } else { /* normally happened during initializing a pool by adding files that need be loaded */ pool->error_cb("Protobuf: file [%s] does not exist!\n", filepath); } return false; } if (!g_hash_table_lookup(pool->proto_files, path)) { /* create file descriptor info */ pbl_file_descriptor_t* file = g_new0(pbl_file_descriptor_t, 1); file->filename = path; file->syntax_version = 2; file->package_name = PBL_DEFAULT_PACKAGE_NAME; file->package_name_lineno = -1; file->pool = pool; /* store in hash table and list */ g_hash_table_insert(pool->proto_files, path, file); g_queue_push_tail(pool->proto_files_to_be_parsed, path); } else { /* The file is already in the proto_files */ g_free(path); } return true; } /* find node according to full_name */ static pbl_node_t* pbl_find_node_in_pool(const pbl_descriptor_pool_t* pool, const char* full_name, pbl_node_type_t nodetype) { char* full_name_buf; int len, i; pbl_node_t* package; pbl_node_t* node = NULL; GSList* names = NULL; /* NULL terminated name retrieved from full_name */ GSList* it = NULL; if (pool == NULL || full_name == NULL || pool->packages == NULL) { return NULL; } if (full_name[0] == '.') { full_name++; /* skip leading dot */ } full_name_buf = g_strdup(full_name); len = (int)strlen(full_name_buf); /* scan from end to begin, and replace '.' to '\0' */ for (i = len-1; i >= 0; i--) { if (full_name_buf[i] == '.' || i == 0) { if (i == 0) { /* no dot any more, we search in default package */ names = g_slist_prepend(names, full_name_buf); package = (pbl_node_t*) g_hash_table_lookup(pool->packages, PBL_DEFAULT_PACKAGE_NAME); } else { /* replace middle dot with '\0' */ /* push name at top of names */ names = g_slist_prepend(names, full_name_buf + i + 1); full_name_buf[i] = 0; /* take 0~i of full_name_buf as package name */ package = (pbl_node_t*) g_hash_table_lookup(pool->packages, full_name_buf); } if (package) { node = package; /* search node in this package */ for (it = names; (it && node && node->children_by_name); it = it->next) { node = (pbl_node_t*) g_hash_table_lookup(node->children_by_name, it->data); } if (it == NULL && node && node->nodetype == nodetype) { break; /* found */ } node = NULL; } } } if (names) { g_slist_free(names); } g_free(full_name_buf); return node; } /* get the full name of node. if it is NULL, it will be built. */ const char* // NOLINTNEXTLINE(misc-no-recursion) pbl_get_node_full_name(pbl_node_t* node) { const char* parent_full_name; if (node == NULL || node->nodetype == PBL_UNKNOWN || node->nodetype == PBL_OPTIONS || node->nodetype == PBL_OPTION) { return NULL; } if (node->full_name) { return node->full_name; } if (node->nodetype == PBL_ONEOF) { if (!check_node_depth(node)) { return NULL; } return pbl_get_node_full_name(node->parent); } if (node->nodetype == PBL_PACKAGE) { node->full_name = g_strdup(node->name); } else { parent_full_name = pbl_get_node_full_name(node->parent); if (parent_full_name && parent_full_name[0] != 0) { node->full_name = g_strconcat(parent_full_name, ".", node->name, NULL); } else { node->full_name = g_strdup(node->name); } } return node->full_name; } /* try to find node globally or in the context or parents (message or package) of the context */ static const pbl_node_t* pbl_find_node_in_context(const pbl_node_t* context, const char* name, pbl_node_type_t nodetype) { const pbl_node_t* node = NULL; pbl_descriptor_pool_t* pool = NULL; char* parent_name; char* full_name; if (context == NULL || name == NULL) { return NULL; } if (name[0] == '.') { /* A leading '.' (for example, .foo.bar.Baz) means to start from the outermost scope. */ if (context->file && context->file->pool) { return pbl_find_node_in_pool(context->file->pool, name, nodetype); } else { return NULL; } } /* find pool */ if (context->file) { pool = context->file->pool; } /* try find node in the context or parents (message or package) of the context */ if (pool) { int remaining; parent_name = g_strdup(pbl_get_node_full_name((pbl_node_t*) context)); remaining = (int)strlen(parent_name); while (remaining > 0) { full_name = g_strconcat(parent_name, ".", name, NULL); node = pbl_find_node_in_pool(pool, full_name, nodetype); g_free(full_name); if (node) { g_free(parent_name); return node; } /* scan from end to begin, and replace first '.' to '\0' */ for (remaining--; remaining > 0; remaining--) { if (parent_name[remaining] == '.') { /* found a potential parent node name */ parent_name[remaining] = '\0'; break; /* break from the 'for' loop, continue 'while' loop */ } } } g_free(parent_name); /* try find node in pool directly */ return pbl_find_node_in_pool(pool, name, nodetype); } return NULL; } /* like descriptor_pool::FindMethodByName */ const pbl_method_descriptor_t* pbl_message_descriptor_pool_FindMethodByName(const pbl_descriptor_pool_t* pool, const char* full_name) { pbl_node_t* n = pbl_find_node_in_pool(pool, full_name, PBL_METHOD); return n ? (pbl_method_descriptor_t*)n : NULL; } /* like MethodDescriptor::name() */ const char* pbl_method_descriptor_name(const pbl_method_descriptor_t* method) { return pbl_get_node_name((pbl_node_t*)method); } /* like MethodDescriptor::full_name() */ const char* pbl_method_descriptor_full_name(const pbl_method_descriptor_t* method) { return pbl_get_node_full_name((pbl_node_t*)method); } /* like MethodDescriptor::input_type() */ const pbl_message_descriptor_t* pbl_method_descriptor_input_type(const pbl_method_descriptor_t* method) { const pbl_node_t* n = pbl_find_node_in_context((pbl_node_t*)method, method->in_msg_type, PBL_MESSAGE); return n ? (const pbl_message_descriptor_t*)n : NULL; } /* like MethodDescriptor::output_type() */ const pbl_message_descriptor_t* pbl_method_descriptor_output_type(const pbl_method_descriptor_t* method) { const pbl_node_t* n = pbl_find_node_in_context((pbl_node_t*)method, method->out_msg_type, PBL_MESSAGE); return n ? (const pbl_message_descriptor_t*)n : NULL; } /* like descriptor_pool::FindMessageTypeByName() */ const pbl_message_descriptor_t* pbl_message_descriptor_pool_FindMessageTypeByName(const pbl_descriptor_pool_t* pool, const char* name) { pbl_node_t* n = pbl_find_node_in_pool(pool, name, PBL_MESSAGE); return n ? (pbl_message_descriptor_t*)n : NULL; } /* like Descriptor::name() */ const char* pbl_message_descriptor_name(const pbl_message_descriptor_t* message) { return pbl_get_node_name((pbl_node_t*)message); } /* like Descriptor::full_name() */ const char* pbl_message_descriptor_full_name(const pbl_message_descriptor_t* message) { return pbl_get_node_full_name((pbl_node_t*)message); } /* like Descriptor::field_count() */ int pbl_message_descriptor_field_count(const pbl_message_descriptor_t* message) { return (message && message->fields) ? g_queue_get_length(message->fields) : 0; } /* like Descriptor::field() */ const pbl_field_descriptor_t* pbl_message_descriptor_field(const pbl_message_descriptor_t* message, int field_index) { return (message && message->fields) ? (pbl_field_descriptor_t*) g_queue_peek_nth(message->fields, field_index) : NULL; } /* like Descriptor::FindFieldByNumber() */ const pbl_field_descriptor_t* pbl_message_descriptor_FindFieldByNumber(const pbl_message_descriptor_t* message, int number) { if (message && message->fields_by_number) { return (pbl_field_descriptor_t*) g_hash_table_lookup(message->fields_by_number, GINT_TO_POINTER(number)); } else { return NULL; } } /* like Descriptor::FindFieldByName() */ const pbl_field_descriptor_t* pbl_message_descriptor_FindFieldByName(const pbl_message_descriptor_t* message, const char* name) { if (message && ((pbl_node_t*)message)->children_by_name) { return (pbl_field_descriptor_t*) g_hash_table_lookup(((pbl_node_t*)message)->children_by_name, name); } else { return NULL; } } /* like FieldDescriptor::full_name() */ const char* pbl_field_descriptor_full_name(const pbl_field_descriptor_t* field) { return pbl_get_node_full_name((pbl_node_t*)field); } /* like FieldDescriptor::name() */ const char* pbl_field_descriptor_name(const pbl_field_descriptor_t* field) { return pbl_get_node_name((pbl_node_t*)field); } /* like FieldDescriptor::number() */ int pbl_field_descriptor_number(const pbl_field_descriptor_t* field) { return GPOINTER_TO_INT(field->number); } /* like FieldDescriptor::type() */ int pbl_field_descriptor_type(const pbl_field_descriptor_t* field) { const pbl_node_t* node; if (field->type == PROTOBUF_TYPE_NONE) { /* try to lookup as ENUM */ node = pbl_find_node_in_context(((pbl_node_t*)field)->parent, field->type_name, PBL_ENUM); if (node) { ((pbl_field_descriptor_t*)field)->type = PROTOBUF_TYPE_ENUM; } else { /* try to lookup as MESSAGE */ node = pbl_find_node_in_context(((pbl_node_t*)field)->parent, field->type_name, PBL_MESSAGE); if (node) { ((pbl_field_descriptor_t*)field)->type = PROTOBUF_TYPE_MESSAGE; } } } return field->type; } /* like FieldDescriptor::is_repeated() */ int pbl_field_descriptor_is_repeated(const pbl_field_descriptor_t* field) { return field->is_repeated ? 1 : 0; } /* like FieldDescriptor::is_packed() */ int pbl_field_descriptor_is_packed(const pbl_field_descriptor_t* field) { bool has_packed_option; bool packed_option_value; int syntax_version = ((pbl_node_t*)field)->file->syntax_version; /* determine packed flag */ if (field->is_repeated == false) { return false; } /* note: field->type may be undetermined until calling pbl_field_descriptor_type() */ switch (pbl_field_descriptor_type(field)) { case PROTOBUF_TYPE_STRING: case PROTOBUF_TYPE_GROUP: case PROTOBUF_TYPE_MESSAGE: case PROTOBUF_TYPE_BYTES: return false; default: /* only repeated fields of primitive numeric types can be declared "packed". */ has_packed_option = field->options_node && field->options_node->children_by_name && g_hash_table_lookup(field->options_node->children_by_name, "packed"); packed_option_value = (has_packed_option ? g_strcmp0( ((pbl_option_descriptor_t*)g_hash_table_lookup( field->options_node->children_by_name, "packed"))->value, "true") == 0 : false); if (syntax_version == 2) { return packed_option_value; } else { /* packed default in syntax_version = 3 */ return has_packed_option ? packed_option_value : true; } } } /* like FieldDescriptor::TypeName() */ const char* pbl_field_descriptor_TypeName(int field_type) { return val_to_str(field_type, protobuf_field_type, "UNKNOWN_FIELD_TYPE(%d)"); } /* like FieldDescriptor::message_type() type = TYPE_MESSAGE or TYPE_GROUP */ const pbl_message_descriptor_t* pbl_field_descriptor_message_type(const pbl_field_descriptor_t* field) { const pbl_node_t* n; if (field->type == PROTOBUF_TYPE_MESSAGE || field->type == PROTOBUF_TYPE_GROUP) { n = pbl_find_node_in_context(((pbl_node_t*)field)->parent, field->type_name, PBL_MESSAGE); return n ? (const pbl_message_descriptor_t*)n : NULL; } return NULL; } /* like FieldDescriptor::enum_type() type = TYPE_ENUM */ const pbl_enum_descriptor_t* pbl_field_descriptor_enum_type(const pbl_field_descriptor_t* field) { const pbl_node_t* n; if (field->type == PROTOBUF_TYPE_ENUM) { n = pbl_find_node_in_context(((pbl_node_t*)field)->parent, field->type_name, PBL_ENUM); return n ? (const pbl_enum_descriptor_t*)n : NULL; } return NULL; } /* like FieldDescriptor::is_required() */ bool pbl_field_descriptor_is_required(const pbl_field_descriptor_t* field) { return field->is_required; } /* like FieldDescriptor::has_default_value() */ bool pbl_field_descriptor_has_default_value(const pbl_field_descriptor_t* field) { return field->has_default_value; } /* like FieldDescriptor::default_value_int32() */ int32_t pbl_field_descriptor_default_value_int32(const pbl_field_descriptor_t* field) { return field->default_value.i32; } /* like FieldDescriptor::default_value_int64() */ int64_t pbl_field_descriptor_default_value_int64(const pbl_field_descriptor_t* field) { return field->default_value.i64; } /* like FieldDescriptor::default_value_uint32() */ uint32_t pbl_field_descriptor_default_value_uint32(const pbl_field_descriptor_t* field) { return field->default_value.u32; } /* like FieldDescriptor::default_value_uint64() */ uint64_t pbl_field_descriptor_default_value_uint64(const pbl_field_descriptor_t* field) { return field->default_value.u64; } /* like FieldDescriptor::default_value_float() */ float pbl_field_descriptor_default_value_float(const pbl_field_descriptor_t* field) { return field->default_value.f; } /* like FieldDescriptor::default_value_double() */ double pbl_field_descriptor_default_value_double(const pbl_field_descriptor_t* field) { return field->default_value.d; } /* like FieldDescriptor::default_value_bool() */ bool pbl_field_descriptor_default_value_bool(const pbl_field_descriptor_t* field) { return field->default_value.b; } /* like FieldDescriptor::default_value_string() */ const char* pbl_field_descriptor_default_value_string(const pbl_field_descriptor_t* field, int* size) { *size = field->string_or_bytes_default_value_length; return field->default_value.s; } /* like FieldDescriptor::default_value_enum() */ const pbl_enum_value_descriptor_t* pbl_field_descriptor_default_value_enum(const pbl_field_descriptor_t* field) { const pbl_enum_descriptor_t* enum_desc; if (pbl_field_descriptor_type(field) == PROTOBUF_TYPE_ENUM && field->default_value.e == NULL && (enum_desc = pbl_field_descriptor_enum_type(field))) { if (field->orig_default_value) { /* find enum_value according to the name of default value */ ((pbl_field_descriptor_t*)field)->default_value.e = pbl_enum_descriptor_FindValueByName(enum_desc, field->orig_default_value); } else { /* the default value is the first defined enum value */ ((pbl_field_descriptor_t*)field)->default_value.e = pbl_enum_descriptor_value(enum_desc, 0); } } return field->default_value.e; } /* like EnumDescriptor::name() */ const char* pbl_enum_descriptor_name(const pbl_enum_descriptor_t* anEnum) { return pbl_get_node_name((pbl_node_t*)anEnum); } /* like EnumDescriptor::full_name() */ const char* pbl_enum_descriptor_full_name(const pbl_enum_descriptor_t* anEnum) { return pbl_get_node_full_name((pbl_node_t*)anEnum); } /* like EnumDescriptor::value_count() */ int pbl_enum_descriptor_value_count(const pbl_enum_descriptor_t* anEnum) { return (anEnum && anEnum->values) ? g_queue_get_length(anEnum->values) : 0; } /* like EnumDescriptor::value() */ const pbl_enum_value_descriptor_t* pbl_enum_descriptor_value(const pbl_enum_descriptor_t* anEnum, int value_index) { return (anEnum && anEnum->values) ? (pbl_enum_value_descriptor_t*) g_queue_peek_nth(anEnum->values, value_index) : NULL; } /* like EnumDescriptor::FindValueByNumber() */ const pbl_enum_value_descriptor_t* pbl_enum_descriptor_FindValueByNumber(const pbl_enum_descriptor_t* anEnum, int number) { if (anEnum && anEnum->values_by_number) { return (pbl_enum_value_descriptor_t*) g_hash_table_lookup(anEnum->values_by_number, GINT_TO_POINTER(number)); } else { return NULL; } } /* like EnumDescriptor::FindValueByName() */ const pbl_enum_value_descriptor_t* pbl_enum_descriptor_FindValueByName(const pbl_enum_descriptor_t* anEnum, const char* name) { if (anEnum && ((pbl_node_t*)anEnum)->children_by_name) { return (pbl_enum_value_descriptor_t*)g_hash_table_lookup(((pbl_node_t*)anEnum)->children_by_name, name); } else { return NULL; } } /* like EnumValueDescriptor::name() */ const char* pbl_enum_value_descriptor_name(const pbl_enum_value_descriptor_t* enumValue) { return pbl_get_node_name((pbl_node_t*)enumValue); } /* like EnumValueDescriptor::full_name() */ const char* pbl_enum_value_descriptor_full_name(const pbl_enum_value_descriptor_t* enumValue) { return pbl_get_node_full_name((pbl_node_t*)enumValue); } /* like EnumValueDescriptor::number() */ int pbl_enum_value_descriptor_number(const pbl_enum_value_descriptor_t* enumValue) { return GPOINTER_TO_INT(enumValue->number); } static void // NOLINTNEXTLINE(misc-no-recursion) pbl_traverse_sub_tree(const pbl_node_t* node, void (*cb)(const pbl_message_descriptor_t*, void*), void* userdata) { GList* it; if (node == NULL) { return; } if (node->nodetype == PBL_MESSAGE) { (*cb)((const pbl_message_descriptor_t*) node, userdata); } if (node->children) { if (!check_node_depth(node)) { return; } for (it = g_queue_peek_head_link(node->children); it; it = it->next) { pbl_traverse_sub_tree((const pbl_node_t*) it->data, cb, userdata); } } } /* visit all message in this pool */ void pbl_foreach_message(const pbl_descriptor_pool_t* pool, void (*cb)(const pbl_message_descriptor_t*, void*), void* userdata) { GHashTableIter it; gpointer key, value; g_hash_table_iter_init (&it, pool->packages); while (g_hash_table_iter_next (&it, &key, &value)) { pbl_traverse_sub_tree((const pbl_node_t*)value, cb, userdata); } } /* * Following are tree building functions that should only be invoked by protobuf_lang parser. */ static void pbl_init_node(pbl_node_t* node, pbl_file_descriptor_t* file, int lineno, pbl_node_type_t nodetype, const char* name) { node->nodetype = nodetype; node->name = g_strdup(name); node->file = file; node->lineno = (lineno > -1) ? lineno : -1; } /* create a normal node */ pbl_node_t* pbl_create_node(pbl_file_descriptor_t* file, int lineno, pbl_node_type_t nodetype, const char* name) { pbl_node_t* node = NULL; switch (nodetype) { case PBL_METHOD: /* should use pbl_create_method_node() */ case PBL_FIELD: /* should use pbl_create_field_node() */ case PBL_MAP_FIELD: /* should use pbl_create_map_field_node() */ case PBL_ENUM_VALUE: /* should use pbl_create_enum_value_node() */ case PBL_OPTION: /* should use pbl_create_option_node() */ return NULL; case PBL_MESSAGE: node = (pbl_node_t*) g_malloc0(sizeof(pbl_message_descriptor_t)); break; case PBL_ENUM: node = (pbl_node_t*) g_malloc0(sizeof(pbl_enum_descriptor_t)); break; default: node = g_new0(pbl_node_t, 1); } pbl_init_node(node, file, lineno, nodetype, name); return node; } pbl_node_t* pbl_set_node_name(pbl_node_t* node, int lineno, const char* newname) { g_free(node->name); node->name = g_strdup(newname); if (lineno > -1) { node->lineno = lineno; } return node; } static pbl_option_descriptor_t* pbl_get_option_by_name(pbl_node_t* options, const char* name) { if (options && options->children_by_name) { return (pbl_option_descriptor_t*)g_hash_table_lookup(options->children_by_name, name); } else { return NULL; } } /* create a method (rpc or stream of service) node */ pbl_node_t* pbl_create_method_node(pbl_file_descriptor_t* file, int lineno, const char* name, const char* in_msg_type, bool in_is_stream, const char* out_msg_type, bool out_is_stream) { pbl_method_descriptor_t* node = g_new0(pbl_method_descriptor_t, 1); pbl_init_node(&node->basic_info, file, lineno, PBL_METHOD, name); node->in_msg_type = g_strdup(in_msg_type); node->in_is_stream = in_is_stream; node->out_msg_type = g_strdup(out_msg_type); node->out_is_stream = out_is_stream; return (pbl_node_t*)node; } /* Get type simple type enum value according to the type name. Return 0 means undetermined. */ static int pbl_get_simple_type_enum_value_by_typename(const char* type_name) { int i = str_to_val(type_name, protobuf_field_type, 0); if (i == PROTOBUF_TYPE_GROUP || i == PROTOBUF_TYPE_MESSAGE || i == PROTOBUF_TYPE_ENUM) { i = PROTOBUF_TYPE_NONE; /* complex type will find after parsing */ } return i; } /* create a field node */ pbl_node_t* pbl_create_field_node(pbl_file_descriptor_t* file, int lineno, const char* label, const char* type_name, const char* name, int number, pbl_node_t* options) { pbl_option_descriptor_t* default_option; pbl_field_descriptor_t* node = g_new0(pbl_field_descriptor_t, 1); pbl_init_node(&node->basic_info, file, lineno, PBL_FIELD, name); node->number = number; node->options_node = options; node->is_repeated = (g_strcmp0(label, "repeated") == 0); node->type_name = g_strdup(type_name); /* type 0 means undetermined, it will be determined on calling pbl_field_descriptor_type() later */ node->type = pbl_get_simple_type_enum_value_by_typename(type_name); node->is_required = (g_strcmp0(label, "required") == 0); /* Try to get default value for proto2. * There is nothing to do for proto3, because the default value * is zero or false in proto3. */ default_option = pbl_get_option_by_name(options, "default"); if (default_option && default_option->value) { node->has_default_value = true; node->orig_default_value = g_strdup(default_option->value); /* get default value for simple type */ switch (node->type) { case PROTOBUF_TYPE_INT32: case PROTOBUF_TYPE_SINT32: case PROTOBUF_TYPE_SFIXED32: sscanf(node->orig_default_value, "%" SCNd32, &node->default_value.i32); break; case PROTOBUF_TYPE_INT64: case PROTOBUF_TYPE_SINT64: case PROTOBUF_TYPE_SFIXED64: node->default_value.i64 = g_ascii_strtoll(node->orig_default_value, NULL, 10); break; case PROTOBUF_TYPE_UINT32: case PROTOBUF_TYPE_FIXED32: sscanf(node->orig_default_value, "%" SCNu32, &node->default_value.u32); break; case PROTOBUF_TYPE_UINT64: case PROTOBUF_TYPE_FIXED64: node->default_value.u64 = g_ascii_strtoull(node->orig_default_value, NULL, 10); break; case PROTOBUF_TYPE_BOOL: node->default_value.b = (g_strcmp0(node->orig_default_value, "true") == 0); break; case PROTOBUF_TYPE_DOUBLE: node->default_value.d = g_ascii_strtod(node->orig_default_value, NULL); break; case PROTOBUF_TYPE_FLOAT: node->default_value.f = (float) g_ascii_strtod(node->orig_default_value, NULL); break; case PROTOBUF_TYPE_STRING: case PROTOBUF_TYPE_BYTES: node->default_value.s = protobuf_string_unescape(node->orig_default_value, &node->string_or_bytes_default_value_length); break; default: /* The default value of ENUM type will be generated * in pbl_field_descriptor_default_value_enum(). * Message or group will be ignore. */ break; } } return (pbl_node_t*)node; } /* create a map field node */ pbl_node_t* pbl_create_map_field_node(pbl_file_descriptor_t* file, int lineno, const char* name, int number, pbl_node_t* options) { pbl_field_descriptor_t* node = g_new0(pbl_field_descriptor_t, 1); pbl_init_node(&node->basic_info, file, lineno, PBL_MAP_FIELD, name); node->number = number; node->type_name = g_strconcat(name, "MapEntry", NULL); node->type = PROTOBUF_TYPE_MESSAGE; node->is_repeated = true; node->options_node = options; return (pbl_node_t*)node; } /* create an enumeration field node */ pbl_node_t* pbl_create_enum_value_node(pbl_file_descriptor_t* file, int lineno, const char* name, int number) { pbl_enum_value_descriptor_t* node = g_new0(pbl_enum_value_descriptor_t, 1); pbl_init_node(&node->basic_info, file, lineno, PBL_ENUM_VALUE, name); node->number = number; return (pbl_node_t*)node; } /* create an option node */ pbl_node_t* pbl_create_option_node(pbl_file_descriptor_t* file, int lineno, const char* name, const char* value) { pbl_option_descriptor_t* node = g_new0(pbl_option_descriptor_t, 1); pbl_init_node(&node->basic_info, file, lineno, PBL_OPTION, name); if (value) node->value = g_strdup(value); return (pbl_node_t*)node; } /* add a node as a child of parent node, and return the parent pointer */ pbl_node_t* // NOLINTNEXTLINE(misc-no-recursion) pbl_add_child(pbl_node_t* parent, pbl_node_t* child) { pbl_node_t* node = NULL; if (child == NULL || parent == NULL) { return parent; } if (!check_node_depth(parent)) { return NULL; } /* add a message node for mapField first */ if (child->nodetype == PBL_MAP_FIELD) { node = pbl_create_node(child->file, child->lineno, PBL_MESSAGE, ((pbl_field_descriptor_t*)child)->type_name); pbl_merge_children(node, child); pbl_add_child(parent, node); } child->parent = parent; /* add child to children list */ if (parent->children == NULL) { parent->children = g_queue_new(); } g_queue_push_tail(parent->children, child); /* add child to children_by_name table */ if (parent->children_by_name == NULL) { parent->children_by_name = g_hash_table_new_full(g_str_hash, g_str_equal, NULL, NULL); } node = (pbl_node_t*) g_hash_table_lookup(parent->children_by_name, child->name); if (node && node->nodetype == PBL_OPTION && child->nodetype == PBL_OPTION && ((pbl_option_descriptor_t*)node)->value && ((pbl_option_descriptor_t*)child)->value) { /* repeated option can be set many times like: string fieldWithComplexOption5 = 5 [(rules).repeated_int = 1, (rules).repeated_int = 2]; we just merge the old value and new value in format /old_value "," new_value/. */ char* oval = ((pbl_option_descriptor_t*)node)->value; char* nval = ((pbl_option_descriptor_t*)child)->value; ((pbl_option_descriptor_t*)child)->value = g_strconcat(oval, ",", nval, NULL); g_free(nval); } else if (node && child->file && parent->file && child->file->pool && child->file->pool->error_cb /* Let's assume that any set of base types we point at are valid.. */ && !strstr(node->file->filename, "google")) { child->file->pool->error_cb( "Protobuf: Warning: \"%s\" of [%s:%d] is already defined in file [%s:%d].\n", child->name, child->file->filename, child->lineno, node->file->filename, node->lineno); } g_hash_table_insert(parent->children_by_name, child->name, child); if (parent->nodetype == PBL_MESSAGE) { pbl_message_descriptor_t* msg = (pbl_message_descriptor_t*) parent; /* add child to fields_by_number table */ if (child->nodetype == PBL_FIELD || child->nodetype == PBL_MAP_FIELD) { if (msg->fields == NULL) { msg->fields = g_queue_new(); } g_queue_push_tail(msg->fields, child); if (msg->fields_by_number == NULL) { msg->fields_by_number = g_hash_table_new_full(g_direct_hash, g_direct_equal, NULL, NULL); } g_hash_table_insert(msg->fields_by_number, GINT_TO_POINTER(((pbl_field_descriptor_t*)child)->number), child); } } else if (parent->nodetype == PBL_ENUM && child->nodetype == PBL_ENUM_VALUE) { pbl_enum_descriptor_t* anEnum = (pbl_enum_descriptor_t*) parent; if (anEnum->values == NULL) { anEnum->values = g_queue_new(); } g_queue_push_tail(anEnum->values, child); /* add child to values_by_number table */ if (anEnum->values_by_number == NULL) { anEnum->values_by_number = g_hash_table_new_full(g_direct_hash, g_direct_equal, NULL, NULL); } g_hash_table_insert(anEnum->values_by_number, GINT_TO_POINTER(((pbl_enum_value_descriptor_t*)child)->number), child); } return parent; } /* merge one('from') node's children to another('to') node, and return the 'to' pointer */ pbl_node_t* // NOLINTNEXTLINE(misc-no-recursion) pbl_merge_children(pbl_node_t* to, pbl_node_t* from) { GList* it; pbl_node_t* child; if (to == NULL || from == NULL) { return to; } if (from->children) { for (it = g_queue_peek_head_link(from->children); it; it = it->next) { child = (pbl_node_t*)it->data; pbl_add_child(to, child); } g_queue_free(from->children); from->children = NULL; if (from->children_by_name) { g_hash_table_destroy(from->children_by_name); } from->children_by_name = NULL; if (from->nodetype == PBL_MESSAGE) { pbl_message_descriptor_t* msg = (pbl_message_descriptor_t*) from; if (msg->fields) { g_queue_free(msg->fields); msg->fields = NULL; } if (msg->fields_by_number) { g_hash_table_destroy(msg->fields_by_number); msg->fields_by_number = NULL; } } else if (from->nodetype == PBL_ENUM) { pbl_enum_descriptor_t* anEnum = (pbl_enum_descriptor_t*) from; if (anEnum->values) { g_queue_free(anEnum->values); anEnum->values = NULL; } if (anEnum->values_by_number) { g_hash_table_destroy(anEnum->values_by_number); anEnum->values_by_number = NULL; } } } return to; } /* free a pbl_node_t and its children. */ void // NOLINTNEXTLINE(misc-no-recursion) pbl_free_node(void *anode) { pbl_method_descriptor_t* method_node; pbl_message_descriptor_t* message_node; pbl_field_descriptor_t* field_node; pbl_enum_descriptor_t* enum_node; pbl_option_descriptor_t* option_node; pbl_node_t* node = (pbl_node_t*) anode; if (node == NULL) return; switch (node->nodetype) { case PBL_METHOD: method_node = (pbl_method_descriptor_t*) node; g_free(method_node->in_msg_type); g_free(method_node->out_msg_type); break; case PBL_MESSAGE: message_node = (pbl_message_descriptor_t*) node; if (message_node->fields) { g_queue_free(message_node->fields); } if (message_node->fields_by_number) { g_hash_table_destroy(message_node->fields_by_number); } break; case PBL_FIELD: case PBL_MAP_FIELD: field_node = (pbl_field_descriptor_t*) node; g_free(field_node->type_name); if (field_node->orig_default_value) { g_free(field_node->orig_default_value); } if ((field_node->type == PROTOBUF_TYPE_STRING || field_node->type == PROTOBUF_TYPE_BYTES) && field_node->default_value.s) { g_free(field_node->default_value.s); } if (field_node->options_node) { // We recurse here, but we're limited by depth checks at allocation time pbl_free_node(field_node->options_node); } break; case PBL_ENUM: enum_node = (pbl_enum_descriptor_t*) node; if (enum_node->values) { g_queue_free(enum_node->values); } if (enum_node->values_by_number) { g_hash_table_destroy(enum_node->values_by_number); } break; case PBL_OPTION: option_node = (pbl_option_descriptor_t*) node; g_free(option_node->value); break; default: /* do nothing */ break; } g_free(node->name); g_free(node->full_name); if (node->children) { g_queue_free_full(node->children, pbl_free_node); } if (node->children_by_name) { g_hash_table_destroy(node->children_by_name); } g_free(node); } /* * Editor modelines - https://www.wireshark.org/tools/modelines.html * * Local variables: * c-basic-offset: 4 * tab-width: 8 * indent-tabs-mode: nil * End: * * vi: set shiftwidth=4 tabstop=8 expandtab: * :indentSize=4:tabSize=8:noTabs=true: */