diff options
author | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-10 20:34:10 +0000 |
---|---|---|
committer | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-10 20:34:10 +0000 |
commit | e4ba6dbc3f1e76890b22773807ea37fe8fa2b1bc (patch) | |
tree | 68cb5ef9081156392f1dd62a00c6ccc1451b93df /epan/dfilter/gencode.c | |
parent | Initial commit. (diff) | |
download | wireshark-e4ba6dbc3f1e76890b22773807ea37fe8fa2b1bc.tar.xz wireshark-e4ba6dbc3f1e76890b22773807ea37fe8fa2b1bc.zip |
Adding upstream version 4.2.2. upstream/4.2.2
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'epan/dfilter/gencode.c')
-rw-r--r-- | epan/dfilter/gencode.c | 897 |
1 files changed, 897 insertions, 0 deletions
diff --git a/epan/dfilter/gencode.c b/epan/dfilter/gencode.c new file mode 100644 index 0000000..6c4da95 --- /dev/null +++ b/epan/dfilter/gencode.c @@ -0,0 +1,897 @@ +/* + * Wireshark - Network traffic analyzer + * By Gerald Combs <gerald@wireshark.org> + * Copyright 2001 Gerald Combs + * + * SPDX-License-Identifier: GPL-2.0-or-later + */ + +#include "config.h" + +#include "gencode.h" +#include "dfvm.h" +#include "syntax-tree.h" +#include "sttype-field.h" +#include "sttype-slice.h" +#include "sttype-op.h" +#include "sttype-set.h" +#include "sttype-function.h" +#include "ftypes/ftypes.h" +#include <wsutil/ws_assert.h> + +static void +fixup_jumps(void *data, void *user_data); + +static void +gencode(dfwork_t *dfw, stnode_t *st_node); + +static dfvm_value_t * +gen_entity(dfwork_t *dfw, stnode_t *st_arg, GSList **jumps_ptr); + +static dfvm_opcode_t +select_opcode(dfvm_opcode_t op, stmatch_t how) +{ + if (how == STNODE_MATCH_DEF) + return op; + + switch (op) { + case DFVM_ALL_EQ: + case DFVM_ALL_NE: + case DFVM_ALL_GT: + case DFVM_ALL_GE: + case DFVM_ALL_LT: + case DFVM_ALL_LE: + case DFVM_ALL_CONTAINS: + case DFVM_ALL_MATCHES: + case DFVM_SET_ALL_IN: + case DFVM_SET_ALL_NOT_IN: + return how == STNODE_MATCH_ALL ? op : op + 1; + case DFVM_ANY_EQ: + case DFVM_ANY_NE: + case DFVM_ANY_GT: + case DFVM_ANY_GE: + case DFVM_ANY_LT: + case DFVM_ANY_LE: + case DFVM_ANY_CONTAINS: + case DFVM_ANY_MATCHES: + case DFVM_SET_ANY_IN: + case DFVM_SET_ANY_NOT_IN: + return how == STNODE_MATCH_ANY ? 
op : op - 1; + default: + break; + } + ws_assert_not_reached(); +} + +static void +dfw_append_insn(dfwork_t *dfw, dfvm_insn_t *insn) +{ + insn->id = dfw->next_insn_id; + dfw->next_insn_id++; + g_ptr_array_add(dfw->insns, insn); +} + +static void +dfw_append_stack_push(dfwork_t *dfw, dfvm_value_t *arg1) +{ + dfvm_insn_t *insn; + + insn = dfvm_insn_new(DFVM_STACK_PUSH); + insn->arg1 = dfvm_value_ref(arg1); + dfw_append_insn(dfw, insn); +} + +static void +dfw_append_stack_pop(dfwork_t *dfw, unsigned count) +{ + dfvm_insn_t *insn; + dfvm_value_t *val; + + insn = dfvm_insn_new(DFVM_STACK_POP); + val = dfvm_value_new_guint(count); + insn->arg1 = dfvm_value_ref(val); + dfw_append_insn(dfw, insn); +} + +static void +dfw_append_set_add_range(dfwork_t *dfw, dfvm_value_t *arg1, dfvm_value_t *arg2) +{ + dfvm_insn_t *insn; + + insn = dfvm_insn_new(DFVM_SET_ADD_RANGE); + insn->arg1 = dfvm_value_ref(arg1); + insn->arg2 = dfvm_value_ref(arg2); + dfw_append_insn(dfw, insn); +} + +static void +dfw_append_set_add(dfwork_t *dfw, dfvm_value_t *arg1) +{ + dfvm_insn_t *insn; + + insn = dfvm_insn_new(DFVM_SET_ADD); + insn->arg1 = dfvm_value_ref(arg1); + dfw_append_insn(dfw, insn); +} + +static dfvm_value_t * +dfw_append_jump(dfwork_t *dfw) +{ + dfvm_insn_t *insn; + dfvm_value_t *jmp; + + insn = dfvm_insn_new(DFVM_IF_FALSE_GOTO); + jmp = dfvm_value_new(INSN_NUMBER); + insn->arg1 = dfvm_value_ref(jmp); + dfw_append_insn(dfw, insn); + return jmp; +} + +/* returns register number */ +static dfvm_value_t * +dfw_append_read_tree(dfwork_t *dfw, header_field_info *hfinfo, + drange_t *range, + bool raw) +{ + dfvm_insn_t *insn; + int reg = -1; + dfvm_value_t *reg_val, *val1, *val3; + bool added_new_hfinfo = false; + GHashTable *loaded_fields; + void *loaded_key; + + /* Rewind to find the first field of this name. 
*/ + while (hfinfo->same_name_prev_id != -1) { + hfinfo = proto_registrar_get_nth(hfinfo->same_name_prev_id); + } + + if (raw) + loaded_fields = dfw->loaded_raw_fields; + else + loaded_fields = dfw->loaded_fields; + + /* Keep track of which registers + * were used for which hfinfo's so that we + * can re-use registers. */ + /* Re-use only if we are not using a range (layer filter). */ + loaded_key = g_hash_table_lookup(loaded_fields, hfinfo); + if (loaded_key != NULL) { + if (range == NULL) { + /* + * Reg's are stored in has as reg+1, so + * that the non-existence of a hfinfo in + * the hash, or 0, can be differentiated from + * a hfinfo being loaded into register #0. + */ + reg = GPOINTER_TO_INT(loaded_key) - 1; + } + else { + reg = dfw->next_register++; + } + } + else { + reg = dfw->next_register++; + g_hash_table_insert(loaded_fields, + hfinfo, GINT_TO_POINTER(reg + 1)); + + added_new_hfinfo = true; + } + + val1 = dfvm_value_new_hfinfo(hfinfo, raw); + reg_val = dfvm_value_new_register(reg); + if (range) { + val3 = dfvm_value_new_drange(range); + insn = dfvm_insn_new(DFVM_READ_TREE_R); + } + else { + val3 = NULL; + insn = dfvm_insn_new(DFVM_READ_TREE); + } + insn->arg1 = dfvm_value_ref(val1); + insn->arg2 = dfvm_value_ref(reg_val); + insn->arg3 = dfvm_value_ref(val3); + dfw_append_insn(dfw, insn); + + if (added_new_hfinfo) { + while (hfinfo) { + /* Record the FIELD_ID in hash of interesting fields. */ + g_hash_table_add(dfw->interesting_fields, &hfinfo->id); + hfinfo = hfinfo->same_name_next; + } + } + + return reg_val; +} + +/* returns register number */ +static dfvm_value_t * +dfw_append_read_reference(dfwork_t *dfw, header_field_info *hfinfo, + drange_t *range, + bool raw) +{ + dfvm_insn_t *insn; + dfvm_value_t *reg_val, *val1, *val3; + GPtrArray *refs_array; + + /* Rewind to find the first field of this name. 
*/ + while (hfinfo->same_name_prev_id != -1) { + hfinfo = proto_registrar_get_nth(hfinfo->same_name_prev_id); + } + + /* We can't reuse registers with a filter so just skip + * that optimization and don't reuse them at all. */ + val1 = dfvm_value_new_hfinfo(hfinfo, raw); + reg_val = dfvm_value_new_register(dfw->next_register++); + if (range) { + val3 = dfvm_value_new_drange(range); + insn = dfvm_insn_new(DFVM_READ_REFERENCE_R); + } + else { + val3 = NULL; + insn = dfvm_insn_new(DFVM_READ_REFERENCE); + } + insn->arg1 = dfvm_value_ref(val1); + insn->arg2 = dfvm_value_ref(reg_val); + insn->arg3 = dfvm_value_ref(val3); + dfw_append_insn(dfw, insn); + + refs_array = g_ptr_array_new_with_free_func((GDestroyNotify)reference_free); + if (raw) + g_hash_table_insert(dfw->raw_references, hfinfo, refs_array); + else + g_hash_table_insert(dfw->references, hfinfo, refs_array); + + /* Record the FIELD_ID in hash of interesting fields. */ + while (hfinfo) { + /* Record the FIELD_ID in hash of interesting fields. 
*/ + g_hash_table_add(dfw->interesting_fields, &hfinfo->id); + hfinfo = hfinfo->same_name_next; + } + + return reg_val; +} + +/* returns register number */ +static dfvm_value_t * +dfw_append_mk_slice(dfwork_t *dfw, stnode_t *node, GSList **jumps_ptr) +{ + stnode_t *entity; + dfvm_insn_t *insn; + dfvm_value_t *reg_val, *val1, *val3; + + entity = sttype_slice_entity(node); + + insn = dfvm_insn_new(DFVM_SLICE); + val1 = gen_entity(dfw, entity, jumps_ptr); + insn->arg1 = dfvm_value_ref(val1); + reg_val = dfvm_value_new_register(dfw->next_register++); + insn->arg2 = dfvm_value_ref(reg_val); + val3 = dfvm_value_new_drange(sttype_slice_drange_steal(node)); + insn->arg3 = dfvm_value_ref(val3); + sttype_slice_remove_drange(node); + dfw_append_insn(dfw, insn); + + return reg_val; +} + +/* returns register number */ +_U_ static dfvm_value_t * +dfw_append_put_fvalue(dfwork_t *dfw, fvalue_t *fv) +{ + dfvm_insn_t *insn; + dfvm_value_t *reg_val, *val1; + + insn = dfvm_insn_new(DFVM_PUT_FVALUE); + val1 = dfvm_value_new_fvalue(fv); + insn->arg1 = dfvm_value_ref(val1); + reg_val = dfvm_value_new_register(dfw->next_register++); + insn->arg2 = dfvm_value_ref(reg_val); + dfw_append_insn(dfw, insn); + + return reg_val; +} + +/* returns register number that the length's result will be in. */ +static dfvm_value_t * +dfw_append_length(dfwork_t *dfw, stnode_t *node, GSList **jumps_ptr) +{ + GSList *params; + dfvm_insn_t *insn; + dfvm_value_t *reg_val, *val_arg; + + /* Create the new DFVM instruction */ + insn = dfvm_insn_new(DFVM_LENGTH); + /* Create input argument */ + params = sttype_function_params(node); + ws_assert(params); + ws_assert(g_slist_length(params) == 1); + val_arg = gen_entity(dfw, params->data, jumps_ptr); + insn->arg1 = dfvm_value_ref(val_arg); + /* Destination. 
*/ + reg_val = dfvm_value_new_register(dfw->next_register++); + insn->arg2 = dfvm_value_ref(reg_val); + + dfw_append_insn(dfw, insn); + return reg_val; +} + +/* returns register number that the functions's result will be in. */ +static dfvm_value_t * +dfw_append_function(dfwork_t *dfw, stnode_t *node, GSList **jumps_ptr) +{ + GSList *params; + dfvm_value_t *jmp; + dfvm_insn_t *insn; + dfvm_value_t *reg_val, *val1, *val3, *val_arg; + unsigned count; + GSList *params_jumps = NULL; + + if (strcmp(sttype_function_name(node), "len") == 0) { + /* Replace len() function call with DFVM_LENGTH instruction. */ + return dfw_append_length(dfw, node, jumps_ptr); + } + + /* Create the new DFVM instruction */ + insn = dfvm_insn_new(DFVM_CALL_FUNCTION); + val1 = dfvm_value_new_funcdef(sttype_function_funcdef(node)); + insn->arg1 = dfvm_value_ref(val1); + reg_val = dfvm_value_new_register(dfw->next_register++); + insn->arg2 = dfvm_value_ref(reg_val); + + /* Create input arguments */ + params = sttype_function_params(node); + ws_assert(params); + count = 0; + while (params) { + val_arg = gen_entity(dfw, params->data, ¶ms_jumps); + /* If a parameter fails to generate jump here. + * Note: stack_push NULL register is valid. 
*/ + g_slist_foreach(params_jumps, fixup_jumps, dfw); + g_slist_free(params_jumps); + params_jumps = NULL; + dfw_append_stack_push(dfw, val_arg); + count++; + params = params->next; + } + val3 = dfvm_value_new_guint(count); + insn->arg3 = dfvm_value_ref(val3); + dfw_append_insn(dfw, insn); + dfw_append_stack_pop(dfw, count); + + /* We need another instruction to jump to another exit + * place, if the call() of our function failed for some reason */ + insn = dfvm_insn_new(DFVM_IF_FALSE_GOTO); + jmp = dfvm_value_new(INSN_NUMBER); + insn->arg1 = dfvm_value_ref(jmp); + dfw_append_insn(dfw, insn); + *jumps_ptr = g_slist_prepend(*jumps_ptr, jmp); + + return reg_val; +} + +/** + * Adds an instruction for a relation operator where the values are already + * loaded in registers. + */ +static void +gen_relation_insn(dfwork_t *dfw, dfvm_opcode_t op, + dfvm_value_t *arg1, dfvm_value_t *arg2, + dfvm_value_t *arg3) +{ + dfvm_insn_t *insn; + + insn = dfvm_insn_new(op); + insn->arg1 = dfvm_value_ref(arg1); + insn->arg2 = dfvm_value_ref(arg2); + insn->arg3 = dfvm_value_ref(arg3); + dfw_append_insn(dfw, insn); +} + +static void +gen_relation(dfwork_t *dfw, dfvm_opcode_t op, stmatch_t how, + stnode_t *st_arg1, stnode_t *st_arg2) +{ + GSList *jumps = NULL; + dfvm_value_t *val1, *val2; + + /* Create code for the LHS and RHS of the relation */ + val1 = gen_entity(dfw, st_arg1, &jumps); + val2 = gen_entity(dfw, st_arg2, &jumps); + + /* Then combine them in a DFVM insruction */ + op = select_opcode(op, how); + gen_relation_insn(dfw, op, val1, val2, NULL); + + /* If either of the relation arguments need an "exit" instruction + * to jump to (on failure), mark them */ + g_slist_foreach(jumps, fixup_jumps, dfw); + g_slist_free(jumps); + jumps = NULL; +} + +static void +fixup_jumps(void *data, void *user_data) +{ + dfvm_value_t *jmp = (dfvm_value_t*)data; + dfwork_t *dfw = (dfwork_t*)user_data; + + if (jmp) { + jmp->value.numeric = dfw->next_insn_id; + } +} + +/* Generate the code for the in 
operator. Pushes set values into a stack + * and then evaluates membership in a single instruction. */ +static void +gen_relation_in(dfwork_t *dfw, dfvm_opcode_t op, stmatch_t how, + stnode_t *st_arg1, stnode_t *st_arg2) +{ + dfvm_insn_t *insn; + GSList *jumps = NULL; + GSList *node_jumps = NULL; + dfvm_value_t *val1, *val2, *val3; + stnode_t *node1, *node2; + GSList *nodelist_head, *nodelist; + + /* Create code for the LHS of the relation */ + val1 = gen_entity(dfw, st_arg1, &jumps); + + /* Create code to populate the set stack */ + nodelist_head = nodelist = stnode_steal_data(st_arg2); + while (nodelist) { + node1 = nodelist->data; + nodelist = g_slist_next(nodelist); + node2 = nodelist->data; + nodelist = g_slist_next(nodelist); + + if (node2) { + /* Range element. */ + val2 = gen_entity(dfw, node1, &node_jumps); + val3 = gen_entity(dfw, node2, &node_jumps); + dfw_append_set_add_range(dfw, val2, val3); + } else { + /* Normal element. */ + val2 = gen_entity(dfw, node1, &node_jumps); + dfw_append_set_add(dfw, val2); + } + + /* If an item is not present, just jump to the next item */ + g_slist_foreach(node_jumps, fixup_jumps, dfw); + g_slist_free(node_jumps); + node_jumps = NULL; + } + set_nodelist_free(nodelist_head); + + /* Create code for the set on the RHS of the relation */ + insn = dfvm_insn_new(select_opcode(op, how)); + insn->arg1 = dfvm_value_ref(val1); + dfw_append_insn(dfw, insn); + + /* Add instruction to clear the whole stack */ + insn = dfvm_insn_new(DFVM_SET_CLEAR); + dfw_append_insn(dfw, insn); + + /* Jump here if the LHS entity was not present */ + g_slist_foreach(jumps, fixup_jumps, dfw); + g_slist_free(jumps); + jumps = NULL; +} + +static dfvm_value_t * +gen_arithmetic(dfwork_t *dfw, stnode_t *st_arg, GSList **jumps_ptr) +{ + stnode_t *left, *right; + stnode_op_t st_op; + dfvm_value_t *reg_val, *val1, *val2 = NULL; + dfvm_opcode_t op; + + sttype_oper_get(st_arg, &st_op, &left, &right); + + if (st_op == STNODE_OP_UNARY_MINUS) { + op = 
DFVM_UNARY_MINUS; + } + else if (st_op == STNODE_OP_ADD) { + op = DFVM_ADD; + } + else if (st_op == STNODE_OP_SUBTRACT) { + op = DFVM_SUBTRACT; + } + else if (st_op == STNODE_OP_MULTIPLY) { + op = DFVM_MULTIPLY; + } + else if (st_op == STNODE_OP_DIVIDE) { + op = DFVM_DIVIDE; + } + else if (st_op == STNODE_OP_MODULO) { + op = DFVM_MODULO; + } + else if (st_op == STNODE_OP_BITWISE_AND) { + op = DFVM_BITWISE_AND; + } + else { + ws_assert_not_reached(); + } + + val1 = gen_entity(dfw, left, jumps_ptr); + if (right == NULL) { + /* Generate unary DFVM instruction. */ + reg_val = dfvm_value_new_register(dfw->next_register++); + gen_relation_insn(dfw, op, val1, reg_val, NULL); + return reg_val; + } + + val2 = gen_entity(dfw, right, jumps_ptr); + reg_val = dfvm_value_new_register(dfw->next_register++); + gen_relation_insn(dfw, op, val1, val2, reg_val); + return reg_val; +} + +/* Parse an entity, returning the reg that it gets put into. + * p_jmp will be set if it has to be set by the calling code; it should + * be set to the place to jump to, to return to the calling code, + * if the load of a field from the proto_tree fails. 
*/ +static dfvm_value_t * +gen_entity(dfwork_t *dfw, stnode_t *st_arg, GSList **jumps_ptr) +{ + sttype_id_t e_type; + dfvm_value_t *val; + header_field_info *hfinfo; + drange_t *range = NULL; + bool raw; + e_type = stnode_type_id(st_arg); + + if (e_type == STTYPE_FIELD) { + hfinfo = sttype_field_hfinfo(st_arg); + range = sttype_field_drange_steal(st_arg); + raw = sttype_field_raw(st_arg); + val = dfw_append_read_tree(dfw, hfinfo, range, raw); + if (jumps_ptr != NULL) { + *jumps_ptr = g_slist_prepend(*jumps_ptr, dfw_append_jump(dfw)); + } + } + else if (e_type == STTYPE_REFERENCE) { + hfinfo = sttype_field_hfinfo(st_arg); + range = sttype_field_drange_steal(st_arg); + raw = sttype_field_raw(st_arg); + val = dfw_append_read_reference(dfw, hfinfo, range, raw); + if (jumps_ptr != NULL) { + *jumps_ptr = g_slist_prepend(*jumps_ptr, dfw_append_jump(dfw)); + } + } + else if (e_type == STTYPE_FVALUE) { + val = dfvm_value_new_fvalue(stnode_steal_data(st_arg)); + } + else if (e_type == STTYPE_SLICE) { + val = dfw_append_mk_slice(dfw, st_arg, jumps_ptr); + } + else if (e_type == STTYPE_FUNCTION) { + val = dfw_append_function(dfw, st_arg, jumps_ptr); + } + else if (e_type == STTYPE_PCRE) { + val = dfvm_value_new_pcre(stnode_steal_data(st_arg)); + } + else if (e_type == STTYPE_ARITHMETIC) { + val = gen_arithmetic(dfw, st_arg, jumps_ptr); + } + else { + ws_error("Invalid sttype: %s", stnode_type_name(st_arg)); + } + return val; +} + +static void +gen_exists(dfwork_t *dfw, stnode_t *st_node) +{ + dfvm_insn_t *insn; + dfvm_value_t *val1, *val2 = NULL; + header_field_info *hfinfo; + drange_t *range = NULL; + + hfinfo = sttype_field_hfinfo(st_node); + range = sttype_field_drange_steal(st_node); + + /* Rewind to find the first field of this name. */ + while (hfinfo->same_name_prev_id != -1) { + hfinfo = proto_registrar_get_nth(hfinfo->same_name_prev_id); + } + + /* Ignore "rawness" for existence tests. 
*/ + val1 = dfvm_value_new_hfinfo(hfinfo, false); + if (range) { + val2 = dfvm_value_new_drange(range); + } + + if (val2) { + insn = dfvm_insn_new(DFVM_CHECK_EXISTS_R); + insn->arg1 = dfvm_value_ref(val1); + insn->arg2 = dfvm_value_ref(val2); + } + else { + insn = dfvm_insn_new(DFVM_CHECK_EXISTS); + insn->arg1 = dfvm_value_ref(val1); + } + dfw_append_insn(dfw, insn); + + /* Record the FIELD_ID in hash of interesting fields. */ + while (hfinfo) { + g_hash_table_add(dfw->interesting_fields, &hfinfo->id); + hfinfo = hfinfo->same_name_next; + } +} + +static void +gen_notzero(dfwork_t *dfw, stnode_t *st_node) +{ + dfvm_insn_t *insn; + dfvm_value_t *val1; + GSList *jumps = NULL; + + val1 = gen_arithmetic(dfw, st_node, &jumps); + insn = dfvm_insn_new(DFVM_NOT_ALL_ZERO); + insn->arg1 = dfvm_value_ref(val1); + dfw_append_insn(dfw, insn); + g_slist_foreach(jumps, fixup_jumps, dfw); + g_slist_free(jumps); +} + +static void +gen_exists_slice(dfwork_t *dfw, stnode_t *st_node) +{ + dfvm_insn_t *insn; + dfvm_value_t *val1, *reg_val; + GSList *jumps = NULL; + + val1 = gen_entity(dfw, st_node, &jumps); + /* Compute length. */ + insn = dfvm_insn_new(DFVM_LENGTH); + insn->arg1 = dfvm_value_ref(val1); + reg_val = dfvm_value_new_register(dfw->next_register++); + insn->arg2 = dfvm_value_ref(reg_val); + dfw_append_insn(dfw, insn); + /* Check length is not zero. */ + insn = dfvm_insn_new(DFVM_NOT_ALL_ZERO); + insn->arg1 = dfvm_value_ref(reg_val); + dfw_append_insn(dfw, insn); + /* Fixup jumps. 
*/ + g_slist_foreach(jumps, fixup_jumps, dfw); + g_slist_free(jumps); +} + +static void +gen_test(dfwork_t *dfw, stnode_t *st_node) +{ + stnode_op_t st_op; + stmatch_t st_how; + stnode_t *st_arg1, *st_arg2; + dfvm_insn_t *insn; + dfvm_value_t *jmp; + + + sttype_oper_get(st_node, &st_op, &st_arg1, &st_arg2); + st_how = sttype_test_get_match(st_node); + + switch (st_op) { + case STNODE_OP_UNINITIALIZED: + ws_assert_not_reached(); + break; + + case STNODE_OP_NOT: + gencode(dfw, st_arg1); + insn = dfvm_insn_new(DFVM_NOT); + dfw_append_insn(dfw, insn); + break; + + case STNODE_OP_AND: + gencode(dfw, st_arg1); + + insn = dfvm_insn_new(DFVM_IF_FALSE_GOTO); + jmp = dfvm_value_new(INSN_NUMBER); + insn->arg1 = dfvm_value_ref(jmp); + dfw_append_insn(dfw, insn); + + gencode(dfw, st_arg2); + jmp->value.numeric = dfw->next_insn_id; + break; + + case STNODE_OP_OR: + gencode(dfw, st_arg1); + + insn = dfvm_insn_new(DFVM_IF_TRUE_GOTO); + jmp = dfvm_value_new(INSN_NUMBER); + insn->arg1 = dfvm_value_ref(jmp); + dfw_append_insn(dfw, insn); + + gencode(dfw, st_arg2); + jmp->value.numeric = dfw->next_insn_id; + break; + + case STNODE_OP_ALL_EQ: + gen_relation(dfw, DFVM_ALL_EQ, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_ANY_EQ: + gen_relation(dfw, DFVM_ANY_EQ, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_ALL_NE: + gen_relation(dfw, DFVM_ALL_NE, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_ANY_NE: + gen_relation(dfw, DFVM_ANY_NE, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_GT: + gen_relation(dfw, DFVM_ANY_GT, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_GE: + gen_relation(dfw, DFVM_ANY_GE, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_LT: + gen_relation(dfw, DFVM_ANY_LT, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_LE: + gen_relation(dfw, DFVM_ANY_LE, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_CONTAINS: + gen_relation(dfw, DFVM_ANY_CONTAINS, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_MATCHES: + 
gen_relation(dfw, DFVM_ANY_MATCHES, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_IN: + gen_relation_in(dfw, DFVM_SET_ANY_IN, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_NOT_IN: + gen_relation_in(dfw, DFVM_SET_ANY_NOT_IN, st_how, st_arg1, st_arg2); + break; + + case STNODE_OP_BITWISE_AND: + case STNODE_OP_UNARY_MINUS: + case STNODE_OP_ADD: + case STNODE_OP_SUBTRACT: + case STNODE_OP_MULTIPLY: + case STNODE_OP_DIVIDE: + case STNODE_OP_MODULO: + ws_assert_not_reached(); + break; + } +} + +static void +gencode(dfwork_t *dfw, stnode_t *st_node) +{ + switch (stnode_type_id(st_node)) { + case STTYPE_TEST: + gen_test(dfw, st_node); + break; + case STTYPE_FIELD: + gen_exists(dfw, st_node); + break; + case STTYPE_ARITHMETIC: + gen_notzero(dfw, st_node); + break; + case STTYPE_SLICE: + gen_exists_slice(dfw, st_node); + break; + default: + ws_assert_not_reached(); + } +} + + +static void +optimize(dfwork_t *dfw) +{ + int id, id1, length; + dfvm_insn_t *insn, *insn1, *prev; + dfvm_value_t *arg1; + + length = dfw->insns->len; + + for (id = 0, prev = NULL; id < length; prev = insn, id++) { + insn = (dfvm_insn_t *)g_ptr_array_index(dfw->insns, id); + arg1 = insn->arg1; + if (insn->op == DFVM_IF_TRUE_GOTO || insn->op == DFVM_IF_FALSE_GOTO) { + /* Try to optimize branch jumps */ + dfvm_opcode_t revert = (insn->op == DFVM_IF_FALSE_GOTO) ? 
DFVM_IF_TRUE_GOTO : DFVM_IF_FALSE_GOTO; + id1 = arg1->value.numeric; + for (;;) { + insn1 = (dfvm_insn_t*)g_ptr_array_index(dfw->insns, id1); + if (insn1->op == revert) { + /* Skip this one; it is always false and the branch is not taken */ + id1 = id1 +1; + continue; + } + if (insn1->op == DFVM_READ_TREE && prev && prev->op == DFVM_READ_TREE && + prev->arg2->value.numeric == insn1->arg2->value.numeric) { + /* Skip this one; hack if it's the same register it's the same field + * and it returns the same value */ + id1 = id1 +1; + continue; + } + if (insn1->op == insn->op) { + /* The branch jumps to the same branch instruction so + * coalesce the jumps */ + arg1 = insn1->arg1; + id1 = arg1->value.numeric; + continue; + } + /* Finished */ + arg1 = insn->arg1; + arg1->value.numeric = id1; + break; + } + } + } +} + +void +dfw_gencode(dfwork_t *dfw) +{ + dfw->insns = g_ptr_array_new(); + dfw->loaded_fields = g_hash_table_new(g_direct_hash, g_direct_equal); + dfw->loaded_raw_fields = g_hash_table_new(g_direct_hash, g_direct_equal); + dfw->interesting_fields = g_hash_table_new(g_int_hash, g_int_equal); + gencode(dfw, dfw->st_root); + dfw_append_insn(dfw, dfvm_insn_new(DFVM_RETURN)); + if (dfw->flags & DF_OPTIMIZE) { + optimize(dfw); + } +} + + +typedef struct { + int i; + int *fields; +} hash_key_iterator; + +static void +get_hash_key(void *key, void *value _U_, void *user_data) +{ + int field_id = *(int *)key; + hash_key_iterator *hki = (hash_key_iterator *)user_data; + + hki->fields[hki->i] = field_id; + hki->i++; +} + +int* +dfw_interesting_fields(dfwork_t *dfw, int *caller_num_fields) +{ + int num_fields = g_hash_table_size(dfw->interesting_fields); + + hash_key_iterator hki; + + if (num_fields == 0) { + *caller_num_fields = 0; + return NULL; + } + + hki.fields = g_new(int, num_fields); + hki.i = 0; + + g_hash_table_foreach(dfw->interesting_fields, get_hash_key, &hki); + *caller_num_fields = num_fields; + return hki.fields; +} + +/* + * Editor modelines - 
https://www.wireshark.org/tools/modelines.html + * + * Local variables: + * c-basic-offset: 8 + * tab-width: 8 + * indent-tabs-mode: t + * End: + * + * vi: set shiftwidth=8 tabstop=8 noexpandtab: + * :indentSize=8:tabSize=8:noTabs=false: + */ |