/* * HTTP sample conversion * * Copyright 2000-2018 Willy Tarreau * * This program is free software; you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation; either version * 2 of the License, or (at your option) any later version. * */ #include #include #include #include #include #include #include #include #include #include #include #include #include #include static int smp_check_http_date_unit(struct arg *args, struct sample_conv *conv, const char *file, int line, char **err) { return smp_check_date_unit(args, err); } /* takes an UINT value on input supposed to represent the time since EPOCH, * adds an optional offset found in args[0] and emits a string representing * the date in RFC-1123/5322 format. If optional unit param in args[1] is * provided, decode timestamp in milliseconds ("ms") or microseconds("us"), * and use relevant output date format. */ static int sample_conv_http_date(const struct arg *args, struct sample *smp, void *private) { const char day[7][4] = { "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat" }; const char mon[12][4] = { "Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec" }; struct buffer *temp; struct tm tm; int sec_frac = 0; time_t curr_date; /* add offset */ if (args[0].type == ARGT_SINT) smp->data.u.sint += args[0].data.sint; /* report in milliseconds */ if (args[1].type == ARGT_SINT && args[1].data.sint == TIME_UNIT_MS) { sec_frac = smp->data.u.sint % 1000; smp->data.u.sint /= 1000; } /* report in microseconds */ else if (args[1].type == ARGT_SINT && args[1].data.sint == TIME_UNIT_US) { sec_frac = smp->data.u.sint % 1000000; smp->data.u.sint /= 1000000; } /* With high numbers, the date returned can be negative, the 55 bits mask prevent this. */ curr_date = smp->data.u.sint & 0x007fffffffffffffLL; get_gmtime(curr_date, &tm); temp = get_trash_chunk(); if (args[1].type == ARGT_SINT && args[1].data.sint != TIME_UNIT_S) { temp->data = snprintf(temp->area, temp->size - temp->data, "%s, %02d %s %04d %02d:%02d:%02d.%d GMT", day[tm.tm_wday], tm.tm_mday, mon[tm.tm_mon], 1900+tm.tm_year, tm.tm_hour, tm.tm_min, tm.tm_sec, sec_frac); } else { temp->data = snprintf(temp->area, temp->size - temp->data, "%s, %02d %s %04d %02d:%02d:%02d GMT", day[tm.tm_wday], tm.tm_mday, mon[tm.tm_mon], 1900+tm.tm_year, tm.tm_hour, tm.tm_min, tm.tm_sec); } smp->data.u.str = *temp; smp->data.type = SMP_T_STR; return 1; } /* Arguments: The list of expected value, the number of parts returned and the separator */ static int sample_conv_q_preferred(const struct arg *args, struct sample *smp, void *private) { const char *al = smp->data.u.str.area; const char *end = al + smp->data.u.str.data; const char *token; int toklen; int qvalue; const char *str; const char *w; int best_q = 0; /* Set the constant to the sample, because the output of the * function will be peek in the constant configuration string. */ smp->flags |= SMP_F_CONST; smp->data.u.str.size = 0; smp->data.u.str.area = ""; smp->data.u.str.data = 0; /* Parse the accept language */ while (1) { /* Jump spaces, quit if the end is detected. */ while (al < end && isspace((unsigned char)*al)) al++; if (al >= end) break; /* Start of the first word. */ token = al; /* Look for separator: isspace(), ',' or ';'. Next value if 0 length word. */ while (al < end && *al != ';' && *al != ',' && !isspace((unsigned char)*al)) al++; if (al == token) goto expect_comma; /* Length of the token. */ toklen = al - token; qvalue = 1000; /* Check if the token exists in the list. If the token not exists, * jump to the next token. */ str = args[0].data.str.area; w = str; while (1) { if (*str == ';' || *str == '\0') { if (http_language_range_match(token, toklen, w, str - w)) goto look_for_q; if (*str == '\0') goto expect_comma; w = str + 1; } str++; } goto expect_comma; look_for_q: /* Jump spaces, quit if the end is detected. */ while (al < end && isspace((unsigned char)*al)) al++; if (al >= end) goto process_value; /* If ',' is found, process the result */ if (*al == ',') goto process_value; /* If the character is different from ';', look * for the end of the header part in best effort. */ if (*al != ';') goto expect_comma; /* Assumes that the char is ';', now expect "q=". */ al++; /* Jump spaces, process value if the end is detected. */ while (al < end && isspace((unsigned char)*al)) al++; if (al >= end) goto process_value; /* Expect 'q'. If no 'q', continue in best effort */ if (*al != 'q') goto process_value; al++; /* Jump spaces, process value if the end is detected. */ while (al < end && isspace((unsigned char)*al)) al++; if (al >= end) goto process_value; /* Expect '='. If no '=', continue in best effort */ if (*al != '=') goto process_value; al++; /* Jump spaces, process value if the end is detected. */ while (al < end && isspace((unsigned char)*al)) al++; if (al >= end) goto process_value; /* Parse the q value. */ qvalue = http_parse_qvalue(al, &al); process_value: /* If the new q value is the best q value, then store the associated * language in the response. If qvalue is the biggest value (1000), * break the process. */ if (qvalue > best_q) { smp->data.u.str.area = (char *)w; smp->data.u.str.data = str - w; if (qvalue >= 1000) break; best_q = qvalue; } expect_comma: /* Expect comma or end. If the end is detected, quit the loop. */ while (al < end && *al != ',') al++; if (al >= end) break; /* Comma is found, jump it and restart the analyzer. */ al++; } /* Set default value if required. */ if (smp->data.u.str.data == 0 && args[1].type == ARGT_STR) { smp->data.u.str.area = args[1].data.str.area; smp->data.u.str.data = args[1].data.str.data; } /* Return true only if a matching language was found. */ return smp->data.u.str.data != 0; } /* This fetch url-decode any input string. */ static int sample_conv_url_dec(const struct arg *args, struct sample *smp, void *private) { int in_form = 0; int len; /* If the constant flag is set or if not size is available at * the end of the buffer, copy the string in other buffer * before decoding. */ if (smp->flags & SMP_F_CONST || smp->data.u.str.size <= smp->data.u.str.data) { struct buffer *str = get_trash_chunk(); memcpy(str->area, smp->data.u.str.area, smp->data.u.str.data); smp->data.u.str.area = str->area; smp->data.u.str.size = str->size; smp->flags &= ~SMP_F_CONST; } /* Add final \0 required by url_decode(), and convert the input string. */ smp->data.u.str.area[smp->data.u.str.data] = '\0'; if (args[0].type == ARGT_SINT) in_form = !!args[0].data.sint; len = url_decode(smp->data.u.str.area, in_form); if (len < 0) return 0; smp->data.u.str.data = len; return 1; } /* url-encode types and encode maps */ enum encode_type { ENC_QUERY = 0, }; long query_encode_map[(256 / 8) / sizeof(long)]; /* Check url-encode type */ static int sample_conv_url_enc_check(struct arg *arg, struct sample_conv *conv, const char *file, int line, char **err) { enum encode_type enc_type; if (strcmp(arg->data.str.area, "") == 0) enc_type = ENC_QUERY; else if (strcmp(arg->data.str.area, "query") == 0) enc_type = ENC_QUERY; else { memprintf(err, "Unexpected encode type. " "Allowed value is 'query'"); return 0; } chunk_destroy(&arg->data.str); arg->type = ARGT_SINT; arg->data.sint = enc_type; return 1; } /* Initializes some url encode data at boot */ static void sample_conf_url_enc_init() { int i; memset(query_encode_map, 0, sizeof(query_encode_map)); /* use rfc3986 to determine list of characters to keep unchanged for * query string */ for (i = 0; i < 256; i++) { if (!((i >= 'a' && i <= 'z') || (i >= 'A' && i <= 'Z') || (i >= '0' && i <= '9') || i == '-' || i == '.' || i == '_' || i == '~')) ha_bit_set(i, query_encode_map); } } INITCALL0(STG_PREPARE, sample_conf_url_enc_init); /* This fetch url-encode any input string. Only support query string for now */ static int sample_conv_url_enc(const struct arg *args, struct sample *smp, void *private) { enum encode_type enc_type; struct buffer *trash = get_trash_chunk(); long *encode_map; char *ret; enc_type = ENC_QUERY; enc_type = args->data.sint; if (enc_type == ENC_QUERY) encode_map = query_encode_map; else return 0; ret = encode_chunk(trash->area, trash->area + trash->size, '%', encode_map, &smp->data.u.str); if (ret == NULL || *ret != '\0') return 0; trash->data = ret - trash->area; smp->data.u.str = *trash; return 1; } static int smp_conv_req_capture(const struct arg *args, struct sample *smp, void *private) { struct proxy *fe; int idx, i; struct cap_hdr *hdr; int len; if (args->type != ARGT_SINT) return 0; if (!smp->strm) return 0; fe = strm_fe(smp->strm); idx = args->data.sint; /* Check the availability of the capture id. */ if (idx > fe->nb_req_cap - 1) return 0; /* Look for the original configuration. */ for (hdr = fe->req_cap, i = fe->nb_req_cap - 1; hdr != NULL && i != idx ; i--, hdr = hdr->next); if (!hdr) return 0; /* check for the memory allocation */ if (smp->strm->req_cap[hdr->index] == NULL) smp->strm->req_cap[hdr->index] = pool_alloc(hdr->pool); if (smp->strm->req_cap[hdr->index] == NULL) return 0; /* Check length. */ len = smp->data.u.str.data; if (len > hdr->len) len = hdr->len; /* Capture input data. */ memcpy(smp->strm->req_cap[idx], smp->data.u.str.area, len); smp->strm->req_cap[idx][len] = '\0'; return 1; } static int smp_conv_res_capture(const struct arg *args, struct sample *smp, void *private) { struct proxy *fe; int idx, i; struct cap_hdr *hdr; int len; if (args->type != ARGT_SINT) return 0; if (!smp->strm) return 0; fe = strm_fe(smp->strm); idx = args->data.sint; /* Check the availability of the capture id. */ if (idx > fe->nb_rsp_cap - 1) return 0; /* Look for the original configuration. */ for (hdr = fe->rsp_cap, i = fe->nb_rsp_cap - 1; hdr != NULL && i != idx ; i--, hdr = hdr->next); if (!hdr) return 0; /* check for the memory allocation */ if (smp->strm->res_cap[hdr->index] == NULL) smp->strm->res_cap[hdr->index] = pool_alloc(hdr->pool); if (smp->strm->res_cap[hdr->index] == NULL) return 0; /* Check length. */ len = smp->data.u.str.data; if (len > hdr->len) len = hdr->len; /* Capture input data. */ memcpy(smp->strm->res_cap[idx], smp->data.u.str.area, len); smp->strm->res_cap[idx][len] = '\0'; return 1; } /************************************************************************/ /* All supported converter keywords must be declared here. */ /************************************************************************/ /* Note: must not be declared as its list will be overwritten */ static struct sample_conv_kw_list sample_conv_kws = {ILH, { { "http_date", sample_conv_http_date, ARG2(0,SINT,STR), smp_check_http_date_unit, SMP_T_SINT, SMP_T_STR}, { "language", sample_conv_q_preferred, ARG2(1,STR,STR), NULL, SMP_T_STR, SMP_T_STR}, { "capture-req", smp_conv_req_capture, ARG1(1,SINT), NULL, SMP_T_STR, SMP_T_STR}, { "capture-res", smp_conv_res_capture, ARG1(1,SINT), NULL, SMP_T_STR, SMP_T_STR}, { "url_dec", sample_conv_url_dec, ARG1(0,SINT), NULL, SMP_T_STR, SMP_T_STR}, { "url_enc", sample_conv_url_enc, ARG1(1,STR), sample_conv_url_enc_check, SMP_T_STR, SMP_T_STR}, { NULL, NULL, 0, 0, 0 }, }}; INITCALL1(STG_REGISTER, sample_register_convs, &sample_conv_kws); /* * Local variables: * c-indent-level: 8 * c-basic-offset: 8 * End: */