diff options
Diffstat (limited to '')
-rw-r--r-- | src/http_conv.c | 453 |
1 files changed, 453 insertions, 0 deletions
diff --git a/src/http_conv.c b/src/http_conv.c new file mode 100644 index 0000000..cf515a8 --- /dev/null +++ b/src/http_conv.c @@ -0,0 +1,453 @@ +/* + * HTTP sample conversion + * + * Copyright 2000-2018 Willy Tarreau <w@1wt.eu> + * + * This program is free software; you can redistribute it and/or + * modify it under the terms of the GNU General Public License + * as published by the Free Software Foundation; either version + * 2 of the License, or (at your option) any later version. + * + */ + +#include <sys/types.h> + +#include <ctype.h> +#include <string.h> +#include <time.h> + +#include <haproxy/api.h> +#include <haproxy/arg.h> +#include <haproxy/capture-t.h> +#include <haproxy/chunk.h> +#include <haproxy/http.h> +#include <haproxy/pool.h> +#include <haproxy/sample.h> +#include <haproxy/stream.h> +#include <haproxy/tools.h> +#include <haproxy/version.h> + +static int smp_check_http_date_unit(struct arg *args, struct sample_conv *conv, + const char *file, int line, char **err) +{ + return smp_check_date_unit(args, err); +} + +/* takes an UINT value on input supposed to represent the time since EPOCH, + * adds an optional offset found in args[0] and emits a string representing + * the date in RFC-1123/5322 format. If optional unit param in args[1] is + * provided, decode timestamp in milliseconds ("ms") or microseconds("us"), + * and use relevant output date format. + */ +static int sample_conv_http_date(const struct arg *args, struct sample *smp, void *private) +{ + const char day[7][4] = { "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat" }; + const char mon[12][4] = { "Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec" }; + struct buffer *temp; + struct tm tm; + int sec_frac = 0; + time_t curr_date; + + /* add offset */ + if (args[0].type == ARGT_SINT) + smp->data.u.sint += args[0].data.sint; + + /* report in milliseconds */ + if (args[1].type == ARGT_SINT && args[1].data.sint == TIME_UNIT_MS) { + sec_frac = smp->data.u.sint % 1000; + smp->data.u.sint /= 1000; + } + /* report in microseconds */ + else if (args[1].type == ARGT_SINT && args[1].data.sint == TIME_UNIT_US) { + sec_frac = smp->data.u.sint % 1000000; + smp->data.u.sint /= 1000000; + } + + /* With high numbers, the date returned can be negative, the 55 bits mask prevent this. */ + curr_date = smp->data.u.sint & 0x007fffffffffffffLL; + + get_gmtime(curr_date, &tm); + + temp = get_trash_chunk(); + if (args[1].type == ARGT_SINT && args[1].data.sint != TIME_UNIT_S) { + temp->data = snprintf(temp->area, temp->size - temp->data, + "%s, %02d %s %04d %02d:%02d:%02d.%d GMT", + day[tm.tm_wday], tm.tm_mday, mon[tm.tm_mon], + 1900+tm.tm_year, + tm.tm_hour, tm.tm_min, tm.tm_sec, sec_frac); + } else { + temp->data = snprintf(temp->area, temp->size - temp->data, + "%s, %02d %s %04d %02d:%02d:%02d GMT", + day[tm.tm_wday], tm.tm_mday, mon[tm.tm_mon], + 1900+tm.tm_year, + tm.tm_hour, tm.tm_min, tm.tm_sec); + } + + smp->data.u.str = *temp; + smp->data.type = SMP_T_STR; + return 1; +} + +/* Arguments: The list of expected value, the number of parts returned and the separator */ +static int sample_conv_q_preferred(const struct arg *args, struct sample *smp, void *private) +{ + const char *al = smp->data.u.str.area; + const char *end = al + smp->data.u.str.data; + const char *token; + int toklen; + int qvalue; + const char *str; + const char *w; + int best_q = 0; + + /* Set the constant to the sample, because the output of the + * function will be peek in the constant configuration string. + */ + smp->flags |= SMP_F_CONST; + smp->data.u.str.size = 0; + smp->data.u.str.area = ""; + smp->data.u.str.data = 0; + + /* Parse the accept language */ + while (1) { + + /* Jump spaces, quit if the end is detected. */ + while (al < end && isspace((unsigned char)*al)) + al++; + if (al >= end) + break; + + /* Start of the first word. */ + token = al; + + /* Look for separator: isspace(), ',' or ';'. Next value if 0 length word. */ + while (al < end && *al != ';' && *al != ',' && !isspace((unsigned char)*al)) + al++; + if (al == token) + goto expect_comma; + + /* Length of the token. */ + toklen = al - token; + qvalue = 1000; + + /* Check if the token exists in the list. If the token not exists, + * jump to the next token. + */ + str = args[0].data.str.area; + w = str; + while (1) { + if (*str == ';' || *str == '\0') { + if (http_language_range_match(token, toklen, w, str - w)) + goto look_for_q; + if (*str == '\0') + goto expect_comma; + w = str + 1; + } + str++; + } + goto expect_comma; + +look_for_q: + + /* Jump spaces, quit if the end is detected. */ + while (al < end && isspace((unsigned char)*al)) + al++; + if (al >= end) + goto process_value; + + /* If ',' is found, process the result */ + if (*al == ',') + goto process_value; + + /* If the character is different from ';', look + * for the end of the header part in best effort. + */ + if (*al != ';') + goto expect_comma; + + /* Assumes that the char is ';', now expect "q=". */ + al++; + + /* Jump spaces, process value if the end is detected. */ + while (al < end && isspace((unsigned char)*al)) + al++; + if (al >= end) + goto process_value; + + /* Expect 'q'. If no 'q', continue in best effort */ + if (*al != 'q') + goto process_value; + al++; + + /* Jump spaces, process value if the end is detected. */ + while (al < end && isspace((unsigned char)*al)) + al++; + if (al >= end) + goto process_value; + + /* Expect '='. If no '=', continue in best effort */ + if (*al != '=') + goto process_value; + al++; + + /* Jump spaces, process value if the end is detected. */ + while (al < end && isspace((unsigned char)*al)) + al++; + if (al >= end) + goto process_value; + + /* Parse the q value. */ + qvalue = http_parse_qvalue(al, &al); + +process_value: + + /* If the new q value is the best q value, then store the associated + * language in the response. If qvalue is the biggest value (1000), + * break the process. + */ + if (qvalue > best_q) { + smp->data.u.str.area = (char *)w; + smp->data.u.str.data = str - w; + if (qvalue >= 1000) + break; + best_q = qvalue; + } + +expect_comma: + + /* Expect comma or end. If the end is detected, quit the loop. */ + while (al < end && *al != ',') + al++; + if (al >= end) + break; + + /* Comma is found, jump it and restart the analyzer. */ + al++; + } + + /* Set default value if required. */ + if (smp->data.u.str.data == 0 && args[1].type == ARGT_STR) { + smp->data.u.str.area = args[1].data.str.area; + smp->data.u.str.data = args[1].data.str.data; + } + + /* Return true only if a matching language was found. */ + return smp->data.u.str.data != 0; +} + +/* This fetch url-decode any input string. */ +static int sample_conv_url_dec(const struct arg *args, struct sample *smp, void *private) +{ + int in_form = 0; + int len; + + /* If the constant flag is set or if not size is available at + * the end of the buffer, copy the string in other buffer + * before decoding. + */ + if (smp->flags & SMP_F_CONST || smp->data.u.str.size <= smp->data.u.str.data) { + struct buffer *str = get_trash_chunk(); + memcpy(str->area, smp->data.u.str.area, smp->data.u.str.data); + smp->data.u.str.area = str->area; + smp->data.u.str.size = str->size; + smp->flags &= ~SMP_F_CONST; + } + + /* Add final \0 required by url_decode(), and convert the input string. */ + smp->data.u.str.area[smp->data.u.str.data] = '\0'; + + if (args[0].type == ARGT_SINT) + in_form = !!args[0].data.sint; + + len = url_decode(smp->data.u.str.area, in_form); + if (len < 0) + return 0; + smp->data.u.str.data = len; + return 1; +} + +/* url-encode types and encode maps */ +enum encode_type { + ENC_QUERY = 0, +}; +long query_encode_map[(256 / 8) / sizeof(long)]; + +/* Check url-encode type */ +static int sample_conv_url_enc_check(struct arg *arg, struct sample_conv *conv, + const char *file, int line, char **err) +{ + enum encode_type enc_type; + + if (strcmp(arg->data.str.area, "") == 0) + enc_type = ENC_QUERY; + else if (strcmp(arg->data.str.area, "query") == 0) + enc_type = ENC_QUERY; + else { + memprintf(err, "Unexpected encode type. " + "Allowed value is 'query'"); + return 0; + } + + chunk_destroy(&arg->data.str); + arg->type = ARGT_SINT; + arg->data.sint = enc_type; + return 1; +} + +/* Initializes some url encode data at boot */ +static void sample_conf_url_enc_init() +{ + int i; + + memset(query_encode_map, 0, sizeof(query_encode_map)); + /* use rfc3986 to determine list of characters to keep unchanged for + * query string */ + for (i = 0; i < 256; i++) { + if (!((i >= 'a' && i <= 'z') || (i >= 'A' && i <= 'Z') + || (i >= '0' && i <= '9') || + i == '-' || i == '.' || i == '_' || i == '~')) + ha_bit_set(i, query_encode_map); + } +} + +INITCALL0(STG_PREPARE, sample_conf_url_enc_init); + +/* This fetch url-encode any input string. Only support query string for now */ +static int sample_conv_url_enc(const struct arg *args, struct sample *smp, void + *private) +{ + enum encode_type enc_type; + struct buffer *trash = get_trash_chunk(); + long *encode_map; + char *ret; + + enc_type = ENC_QUERY; + enc_type = args->data.sint; + + if (enc_type == ENC_QUERY) + encode_map = query_encode_map; + else + return 0; + + ret = encode_chunk(trash->area, trash->area + trash->size, '%', + encode_map, &smp->data.u.str); + if (ret == NULL || *ret != '\0') + return 0; + trash->data = ret - trash->area; + smp->data.u.str = *trash; + return 1; +} + +static int smp_conv_req_capture(const struct arg *args, struct sample *smp, void *private) +{ + struct proxy *fe; + int idx, i; + struct cap_hdr *hdr; + int len; + + if (args->type != ARGT_SINT) + return 0; + + if (!smp->strm) + return 0; + + fe = strm_fe(smp->strm); + idx = args->data.sint; + + /* Check the availability of the capture id. */ + if (idx > fe->nb_req_cap - 1) + return 0; + + /* Look for the original configuration. */ + for (hdr = fe->req_cap, i = fe->nb_req_cap - 1; + hdr != NULL && i != idx ; + i--, hdr = hdr->next); + if (!hdr) + return 0; + + /* check for the memory allocation */ + if (smp->strm->req_cap[hdr->index] == NULL) + smp->strm->req_cap[hdr->index] = pool_alloc(hdr->pool); + if (smp->strm->req_cap[hdr->index] == NULL) + return 0; + + /* Check length. */ + len = smp->data.u.str.data; + if (len > hdr->len) + len = hdr->len; + + /* Capture input data. */ + memcpy(smp->strm->req_cap[idx], smp->data.u.str.area, len); + smp->strm->req_cap[idx][len] = '\0'; + + return 1; +} + +static int smp_conv_res_capture(const struct arg *args, struct sample *smp, void *private) +{ + struct proxy *fe; + int idx, i; + struct cap_hdr *hdr; + int len; + + if (args->type != ARGT_SINT) + return 0; + + if (!smp->strm) + return 0; + + fe = strm_fe(smp->strm); + idx = args->data.sint; + + /* Check the availability of the capture id. */ + if (idx > fe->nb_rsp_cap - 1) + return 0; + + /* Look for the original configuration. */ + for (hdr = fe->rsp_cap, i = fe->nb_rsp_cap - 1; + hdr != NULL && i != idx ; + i--, hdr = hdr->next); + if (!hdr) + return 0; + + /* check for the memory allocation */ + if (smp->strm->res_cap[hdr->index] == NULL) + smp->strm->res_cap[hdr->index] = pool_alloc(hdr->pool); + if (smp->strm->res_cap[hdr->index] == NULL) + return 0; + + /* Check length. */ + len = smp->data.u.str.data; + if (len > hdr->len) + len = hdr->len; + + /* Capture input data. */ + memcpy(smp->strm->res_cap[idx], smp->data.u.str.area, len); + smp->strm->res_cap[idx][len] = '\0'; + + return 1; +} + +/************************************************************************/ +/* All supported converter keywords must be declared here. */ +/************************************************************************/ + +/* Note: must not be declared <const> as its list will be overwritten */ +static struct sample_conv_kw_list sample_conv_kws = {ILH, { + { "http_date", sample_conv_http_date, ARG2(0,SINT,STR), smp_check_http_date_unit, SMP_T_SINT, SMP_T_STR}, + { "language", sample_conv_q_preferred, ARG2(1,STR,STR), NULL, SMP_T_STR, SMP_T_STR}, + { "capture-req", smp_conv_req_capture, ARG1(1,SINT), NULL, SMP_T_STR, SMP_T_STR}, + { "capture-res", smp_conv_res_capture, ARG1(1,SINT), NULL, SMP_T_STR, SMP_T_STR}, + { "url_dec", sample_conv_url_dec, ARG1(0,SINT), NULL, SMP_T_STR, SMP_T_STR}, + { "url_enc", sample_conv_url_enc, ARG1(1,STR), sample_conv_url_enc_check, SMP_T_STR, SMP_T_STR}, + { NULL, NULL, 0, 0, 0 }, +}}; + +INITCALL1(STG_REGISTER, sample_register_convs, &sample_conv_kws); + +/* + * Local variables: + * c-indent-level: 8 + * c-basic-offset: 8 + * End: + */ |