| /* |
| * HTTP sample conversion |
| * |
| * Copyright 2000-2018 Willy Tarreau <w@1wt.eu> |
| * |
| * This program is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU General Public License |
| * as published by the Free Software Foundation; either version |
| * 2 of the License, or (at your option) any later version. |
| * |
| */ |
| |
| #include <sys/types.h> |
| |
| #include <ctype.h> |
| #include <string.h> |
| #include <time.h> |
| |
| #include <haproxy/api.h> |
| #include <haproxy/arg.h> |
| #include <haproxy/capture-t.h> |
| #include <haproxy/chunk.h> |
| #include <haproxy/http.h> |
| #include <haproxy/pool.h> |
| #include <haproxy/sample.h> |
| #include <haproxy/stream.h> |
| #include <haproxy/tools.h> |
| #include <haproxy/version.h> |
| |
| static int smp_check_http_date_unit(struct arg *args, struct sample_conv *conv, |
| const char *file, int line, char **err) |
| { |
| return smp_check_date_unit(args, err); |
| } |
| |
| /* takes an UINT value on input supposed to represent the time since EPOCH, |
| * adds an optional offset found in args[0] and emits a string representing |
| * the date in RFC-1123/5322 format. If optional unit param in args[1] is |
| * provided, decode timestamp in milliseconds ("ms") or microseconds("us"), |
| * and use relevant output date format. |
| */ |
| static int sample_conv_http_date(const struct arg *args, struct sample *smp, void *private) |
| { |
| const char day[7][4] = { "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat" }; |
| const char mon[12][4] = { "Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec" }; |
| struct buffer *temp; |
| struct tm tm; |
| int sec_frac = 0; |
| time_t curr_date; |
| |
| /* add offset */ |
| if (args[0].type == ARGT_SINT) |
| smp->data.u.sint += args[0].data.sint; |
| |
| /* report in milliseconds */ |
| if (args[1].type == ARGT_SINT && args[1].data.sint == TIME_UNIT_MS) { |
| sec_frac = smp->data.u.sint % 1000; |
| smp->data.u.sint /= 1000; |
| } |
| /* report in microseconds */ |
| else if (args[1].type == ARGT_SINT && args[1].data.sint == TIME_UNIT_US) { |
| sec_frac = smp->data.u.sint % 1000000; |
| smp->data.u.sint /= 1000000; |
| } |
| |
| /* With high numbers, the date returned can be negative, the 55 bits mask prevent this. */ |
| curr_date = smp->data.u.sint & 0x007fffffffffffffLL; |
| |
| get_gmtime(curr_date, &tm); |
| |
| temp = get_trash_chunk(); |
| if (args[1].type == ARGT_SINT && args[1].data.sint != TIME_UNIT_S) { |
| temp->data = snprintf(temp->area, temp->size - temp->data, |
| "%s, %02d %s %04d %02d:%02d:%02d.%d GMT", |
| day[tm.tm_wday], tm.tm_mday, mon[tm.tm_mon], |
| 1900+tm.tm_year, |
| tm.tm_hour, tm.tm_min, tm.tm_sec, sec_frac); |
| } else { |
| temp->data = snprintf(temp->area, temp->size - temp->data, |
| "%s, %02d %s %04d %02d:%02d:%02d GMT", |
| day[tm.tm_wday], tm.tm_mday, mon[tm.tm_mon], |
| 1900+tm.tm_year, |
| tm.tm_hour, tm.tm_min, tm.tm_sec); |
| } |
| |
| smp->data.u.str = *temp; |
| smp->data.type = SMP_T_STR; |
| return 1; |
| } |
| |
| /* Arguments: The list of expected value, the number of parts returned and the separator */ |
| static int sample_conv_q_preferred(const struct arg *args, struct sample *smp, void *private) |
| { |
| const char *al = smp->data.u.str.area; |
| const char *end = al + smp->data.u.str.data; |
| const char *token; |
| int toklen; |
| int qvalue; |
| const char *str; |
| const char *w; |
| int best_q = 0; |
| |
| /* Set the constant to the sample, because the output of the |
| * function will be peek in the constant configuration string. |
| */ |
| smp->flags |= SMP_F_CONST; |
| smp->data.u.str.size = 0; |
| smp->data.u.str.area = ""; |
| smp->data.u.str.data = 0; |
| |
| /* Parse the accept language */ |
| while (1) { |
| |
| /* Jump spaces, quit if the end is detected. */ |
| while (al < end && isspace((unsigned char)*al)) |
| al++; |
| if (al >= end) |
| break; |
| |
| /* Start of the first word. */ |
| token = al; |
| |
| /* Look for separator: isspace(), ',' or ';'. Next value if 0 length word. */ |
| while (al < end && *al != ';' && *al != ',' && !isspace((unsigned char)*al)) |
| al++; |
| if (al == token) |
| goto expect_comma; |
| |
| /* Length of the token. */ |
| toklen = al - token; |
| qvalue = 1000; |
| |
| /* Check if the token exists in the list. If the token not exists, |
| * jump to the next token. |
| */ |
| str = args[0].data.str.area; |
| w = str; |
| while (1) { |
| if (*str == ';' || *str == '\0') { |
| if (http_language_range_match(token, toklen, w, str - w)) |
| goto look_for_q; |
| if (*str == '\0') |
| goto expect_comma; |
| w = str + 1; |
| } |
| str++; |
| } |
| goto expect_comma; |
| |
| look_for_q: |
| |
| /* Jump spaces, quit if the end is detected. */ |
| while (al < end && isspace((unsigned char)*al)) |
| al++; |
| if (al >= end) |
| goto process_value; |
| |
| /* If ',' is found, process the result */ |
| if (*al == ',') |
| goto process_value; |
| |
| /* If the character is different from ';', look |
| * for the end of the header part in best effort. |
| */ |
| if (*al != ';') |
| goto expect_comma; |
| |
| /* Assumes that the char is ';', now expect "q=". */ |
| al++; |
| |
| /* Jump spaces, process value if the end is detected. */ |
| while (al < end && isspace((unsigned char)*al)) |
| al++; |
| if (al >= end) |
| goto process_value; |
| |
| /* Expect 'q'. If no 'q', continue in best effort */ |
| if (*al != 'q') |
| goto process_value; |
| al++; |
| |
| /* Jump spaces, process value if the end is detected. */ |
| while (al < end && isspace((unsigned char)*al)) |
| al++; |
| if (al >= end) |
| goto process_value; |
| |
| /* Expect '='. If no '=', continue in best effort */ |
| if (*al != '=') |
| goto process_value; |
| al++; |
| |
| /* Jump spaces, process value if the end is detected. */ |
| while (al < end && isspace((unsigned char)*al)) |
| al++; |
| if (al >= end) |
| goto process_value; |
| |
| /* Parse the q value. */ |
| qvalue = http_parse_qvalue(al, &al); |
| |
| process_value: |
| |
| /* If the new q value is the best q value, then store the associated |
| * language in the response. If qvalue is the biggest value (1000), |
| * break the process. |
| */ |
| if (qvalue > best_q) { |
| smp->data.u.str.area = (char *)w; |
| smp->data.u.str.data = str - w; |
| if (qvalue >= 1000) |
| break; |
| best_q = qvalue; |
| } |
| |
| expect_comma: |
| |
| /* Expect comma or end. If the end is detected, quit the loop. */ |
| while (al < end && *al != ',') |
| al++; |
| if (al >= end) |
| break; |
| |
| /* Comma is found, jump it and restart the analyzer. */ |
| al++; |
| } |
| |
| /* Set default value if required. */ |
| if (smp->data.u.str.data == 0 && args[1].type == ARGT_STR) { |
| smp->data.u.str.area = args[1].data.str.area; |
| smp->data.u.str.data = args[1].data.str.data; |
| } |
| |
| /* Return true only if a matching language was found. */ |
| return smp->data.u.str.data != 0; |
| } |
| |
| /* This fetch url-decode any input string. */ |
| static int sample_conv_url_dec(const struct arg *args, struct sample *smp, void *private) |
| { |
| int in_form = 0; |
| int len; |
| |
| /* If the constant flag is set or if not size is available at |
| * the end of the buffer, copy the string in other buffer |
| * before decoding. |
| */ |
| if (smp->flags & SMP_F_CONST || smp->data.u.str.size <= smp->data.u.str.data) { |
| struct buffer *str = get_trash_chunk(); |
| memcpy(str->area, smp->data.u.str.area, smp->data.u.str.data); |
| smp->data.u.str.area = str->area; |
| smp->data.u.str.size = str->size; |
| smp->flags &= ~SMP_F_CONST; |
| } |
| |
| /* Add final \0 required by url_decode(), and convert the input string. */ |
| smp->data.u.str.area[smp->data.u.str.data] = '\0'; |
| |
| if (args[0].type == ARGT_SINT) |
| in_form = !!args[0].data.sint; |
| |
| len = url_decode(smp->data.u.str.area, in_form); |
| if (len < 0) |
| return 0; |
| smp->data.u.str.data = len; |
| return 1; |
| } |
| |
| /* url-encode types and encode maps */ |
| enum encode_type { |
| ENC_QUERY = 0, |
| }; |
| long query_encode_map[(256 / 8) / sizeof(long)]; |
| |
| /* Check url-encode type */ |
| static int sample_conv_url_enc_check(struct arg *arg, struct sample_conv *conv, |
| const char *file, int line, char **err) |
| { |
| enum encode_type enc_type; |
| |
| if (strcmp(arg->data.str.area, "") == 0) |
| enc_type = ENC_QUERY; |
| else if (strcmp(arg->data.str.area, "query") == 0) |
| enc_type = ENC_QUERY; |
| else { |
| memprintf(err, "Unexpected encode type. " |
| "Allowed value is 'query'"); |
| return 0; |
| } |
| |
| chunk_destroy(&arg->data.str); |
| arg->type = ARGT_SINT; |
| arg->data.sint = enc_type; |
| return 1; |
| } |
| |
| /* Initializes some url encode data at boot */ |
| static void sample_conf_url_enc_init() |
| { |
| int i; |
| |
| memset(query_encode_map, 0, sizeof(query_encode_map)); |
| /* use rfc3986 to determine list of characters to keep unchanged for |
| * query string */ |
| for (i = 0; i < 256; i++) { |
| if (!((i >= 'a' && i <= 'z') || (i >= 'A' && i <= 'Z') |
| || (i >= '0' && i <= '9') || |
| i == '-' || i == '.' || i == '_' || i == '~')) |
| ha_bit_set(i, query_encode_map); |
| } |
| } |
| |
| INITCALL0(STG_PREPARE, sample_conf_url_enc_init); |
| |
| /* This fetch url-encode any input string. Only support query string for now */ |
| static int sample_conv_url_enc(const struct arg *args, struct sample *smp, void |
| *private) |
| { |
| enum encode_type enc_type; |
| struct buffer *trash = get_trash_chunk(); |
| long *encode_map; |
| char *ret; |
| |
| enc_type = ENC_QUERY; |
| enc_type = args->data.sint; |
| |
| if (enc_type == ENC_QUERY) |
| encode_map = query_encode_map; |
| else |
| return 0; |
| |
| ret = encode_chunk(trash->area, trash->area + trash->size, '%', |
| encode_map, &smp->data.u.str); |
| if (ret == NULL || *ret != '\0') |
| return 0; |
| trash->data = ret - trash->area; |
| smp->data.u.str = *trash; |
| return 1; |
| } |
| |
| static int smp_conv_req_capture(const struct arg *args, struct sample *smp, void *private) |
| { |
| struct proxy *fe; |
| int idx, i; |
| struct cap_hdr *hdr; |
| int len; |
| |
| if (args->type != ARGT_SINT) |
| return 0; |
| |
| if (!smp->strm) |
| return 0; |
| |
| fe = strm_fe(smp->strm); |
| idx = args->data.sint; |
| |
| /* Check the availability of the capture id. */ |
| if (idx > fe->nb_req_cap - 1) |
| return 0; |
| |
| /* Look for the original configuration. */ |
| for (hdr = fe->req_cap, i = fe->nb_req_cap - 1; |
| hdr != NULL && i != idx ; |
| i--, hdr = hdr->next); |
| if (!hdr) |
| return 0; |
| |
| /* check for the memory allocation */ |
| if (smp->strm->req_cap[hdr->index] == NULL) |
| smp->strm->req_cap[hdr->index] = pool_alloc(hdr->pool); |
| if (smp->strm->req_cap[hdr->index] == NULL) |
| return 0; |
| |
| /* Check length. */ |
| len = smp->data.u.str.data; |
| if (len > hdr->len) |
| len = hdr->len; |
| |
| /* Capture input data. */ |
| memcpy(smp->strm->req_cap[idx], smp->data.u.str.area, len); |
| smp->strm->req_cap[idx][len] = '\0'; |
| |
| return 1; |
| } |
| |
| static int smp_conv_res_capture(const struct arg *args, struct sample *smp, void *private) |
| { |
| struct proxy *fe; |
| int idx, i; |
| struct cap_hdr *hdr; |
| int len; |
| |
| if (args->type != ARGT_SINT) |
| return 0; |
| |
| if (!smp->strm) |
| return 0; |
| |
| fe = strm_fe(smp->strm); |
| idx = args->data.sint; |
| |
| /* Check the availability of the capture id. */ |
| if (idx > fe->nb_rsp_cap - 1) |
| return 0; |
| |
| /* Look for the original configuration. */ |
| for (hdr = fe->rsp_cap, i = fe->nb_rsp_cap - 1; |
| hdr != NULL && i != idx ; |
| i--, hdr = hdr->next); |
| if (!hdr) |
| return 0; |
| |
| /* check for the memory allocation */ |
| if (smp->strm->res_cap[hdr->index] == NULL) |
| smp->strm->res_cap[hdr->index] = pool_alloc(hdr->pool); |
| if (smp->strm->res_cap[hdr->index] == NULL) |
| return 0; |
| |
| /* Check length. */ |
| len = smp->data.u.str.data; |
| if (len > hdr->len) |
| len = hdr->len; |
| |
| /* Capture input data. */ |
| memcpy(smp->strm->res_cap[idx], smp->data.u.str.area, len); |
| smp->strm->res_cap[idx][len] = '\0'; |
| |
| return 1; |
| } |
| |
| /************************************************************************/ |
| /* All supported converter keywords must be declared here. */ |
| /************************************************************************/ |
| |
| /* Note: must not be declared <const> as its list will be overwritten */ |
| static struct sample_conv_kw_list sample_conv_kws = {ILH, { |
| { "http_date", sample_conv_http_date, ARG2(0,SINT,STR), smp_check_http_date_unit, SMP_T_SINT, SMP_T_STR}, |
| { "language", sample_conv_q_preferred, ARG2(1,STR,STR), NULL, SMP_T_STR, SMP_T_STR}, |
| { "capture-req", smp_conv_req_capture, ARG1(1,SINT), NULL, SMP_T_STR, SMP_T_STR}, |
| { "capture-res", smp_conv_res_capture, ARG1(1,SINT), NULL, SMP_T_STR, SMP_T_STR}, |
| { "url_dec", sample_conv_url_dec, ARG1(0,SINT), NULL, SMP_T_STR, SMP_T_STR}, |
| { "url_enc", sample_conv_url_enc, ARG1(1,STR), sample_conv_url_enc_check, SMP_T_STR, SMP_T_STR}, |
| { NULL, NULL, 0, 0, 0 }, |
| }}; |
| |
| INITCALL1(STG_REGISTER, sample_register_convs, &sample_conv_kws); |
| |
| /* |
| * Local variables: |
| * c-indent-level: 8 |
| * c-basic-offset: 8 |
| * End: |
| */ |