| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388 |
- /*
- * Utility functions for protocol examples
- *
- * SPDX-FileCopyrightText: 2002-2021 Igor Sysoev
- * 2011-2022 Nginx, Inc.
- *
- * SPDX-License-Identifier: BSD-2-Clause
- *
- * SPDX-FileContributor: 2023 Espressif Systems (Shanghai) CO LTD
- */
- /*
- * Copyright (C) 2002-2021 Igor Sysoev
- * Copyright (C) 2011-2022 Nginx, Inc.
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in the
- * documentation and/or other materials provided with the distribution.
- *
- * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
- * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
- * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
- * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
- * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
- * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
- * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
- * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
- * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
- * SUCH DAMAGE.
- */
- #include <stdio.h>
- #include <stdlib.h>
- #include <string.h>
- #include <sys/types.h>
- #include "protocol_examples_utils.h"
/*
 * Escape rule sets accepted by ngx_escape_uri().
 *
 * The value is used directly as an index into that function's table of
 * bitmaps, so the numbering has to stay dense and in this order.
 */
#define NGX_ESCAPE_URI            (0)
#define NGX_ESCAPE_ARGS           (1)
#define NGX_ESCAPE_URI_COMPONENT  (2)
#define NGX_ESCAPE_HTML           (3)
#define NGX_ESCAPE_REFRESH        (4)
#define NGX_ESCAPE_MEMCACHED      (5)
#define NGX_ESCAPE_MAIL_AUTH      (6)   /* shares the memcached bitmap */

/*
 * Unescape modes accepted by ngx_unescape_uri().
 *
 * They are tested there with bitwise AND, so each mode occupies its own bit.
 */
#define NGX_UNESCAPE_URI          (1)
#define NGX_UNESCAPE_REDIRECT     (2)
/**
 * Percent-encode a byte buffer using one of the NGX_ESCAPE_* rule sets.
 *
 * The function has two modes, selected by dst:
 *  - dst == NULL: nothing is written. The return value is the number of
 *    bytes of src that need escaping; each of them makes the encoded output
 *    two bytes longer than the input.
 *  - dst != NULL: every byte that needs escaping is written as "%XX"
 *    (upper-case hex), every other byte is copied unchanged. The return value
 *    is the address one past the last byte written, cast to uintptr_t.
 *    No NUL terminator is appended.
 *
 * @param dst   Output buffer or NULL. When non-NULL it must have room for
 *              size + 2 * (number of escaped bytes) bytes.
 * @param src   Input bytes; exactly size bytes are read, a NUL terminator is
 *              neither required nor treated specially.
 * @param size  Number of input bytes.
 * @param type  Rule set, NGX_ESCAPE_URI .. NGX_ESCAPE_MAIL_AUTH (0..6). The
 *              value indexes an internal table without a range check, so the
 *              caller must pass a valid value.
 *
 * @return See the mode description above.
 */
uintptr_t ngx_escape_uri(u_char *dst, u_char *src, size_t size, unsigned int type)
{
    static const u_char hex[] = "0123456789ABCDEF";

    /*
     * Each table below is a 256-bit bitmap stored as eight 32-bit words:
     * byte c must be escaped when bit (c & 0x1f) of word (c >> 5) is set.
     * The legend comment above a word lists the characters for bits 31..0.
     *
     * Per RFC 3986 only the following chars are allowed in URIs unescaped:
     *
     * unreserved    = ALPHA / DIGIT / "-" / "." / "_" / "~"
     * gen-delims    = ":" / "/" / "?" / "#" / "[" / "]" / "@"
     * sub-delims    = "!" / "$" / "&" / "'" / "(" / ")"
     *               / "*" / "+" / "," / ";" / "="
     *
     * And "%" can appear as a part of escaping itself.  The following
     * characters are not allowed and need to be escaped: %00-%1F, %7F-%FF,
     * " ", """, "<", ">", "\", "^", "`", "{", "|", "}".
     */

    /* " ", "#", "%", "?", not allowed */
    static const uint32_t uri[] = {
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */

                    /* ?>=< ;:98 7654 3210  /.-, +*)( '&%$ #"!  */
        0xd000002d, /* 1101 0000 0000 0000  0000 0000 0010 1101 */

                    /* _^]\ [ZYX WVUT SRQP  ONML KJIH GFED CBA@ */
        0x50000000, /* 0101 0000 0000 0000  0000 0000 0000 0000 */

                    /*  ~}| {zyx wvut srqp  onml kjih gfed cba` */
        0xb8000001, /* 1011 1000 0000 0000  0000 0000 0000 0001 */

        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff  /* 1111 1111 1111 1111  1111 1111 1111 1111 */
    };

    /* " ", "#", "%", "&", "+", ";", "?", not allowed */
    static const uint32_t args[] = {
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */

                    /* ?>=< ;:98 7654 3210  /.-, +*)( '&%$ #"!  */
        0xd800086d, /* 1101 1000 0000 0000  0000 1000 0110 1101 */

                    /* _^]\ [ZYX WVUT SRQP  ONML KJIH GFED CBA@ */
        0x50000000, /* 0101 0000 0000 0000  0000 0000 0000 0000 */

                    /*  ~}| {zyx wvut srqp  onml kjih gfed cba` */
        0xb8000001, /* 1011 1000 0000 0000  0000 0000 0000 0001 */

        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff  /* 1111 1111 1111 1111  1111 1111 1111 1111 */
    };

    /* not ALPHA, DIGIT, "-", ".", "_", "~" */
    static const uint32_t uri_component[] = {
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */

                    /* ?>=< ;:98 7654 3210  /.-, +*)( '&%$ #"!  */
        0xfc009fff, /* 1111 1100 0000 0000  1001 1111 1111 1111 */

                    /* _^]\ [ZYX WVUT SRQP  ONML KJIH GFED CBA@ */
        0x78000001, /* 0111 1000 0000 0000  0000 0000 0000 0001 */

                    /*  ~}| {zyx wvut srqp  onml kjih gfed cba` */
        0xb8000001, /* 1011 1000 0000 0000  0000 0000 0000 0001 */

        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff  /* 1111 1111 1111 1111  1111 1111 1111 1111 */
    };

    /* " ", "#", """, "%", "'", not allowed */
    static const uint32_t html[] = {
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */

                    /* ?>=< ;:98 7654 3210  /.-, +*)( '&%$ #"!  */
        0x500000ad, /* 0101 0000 0000 0000  0000 0000 1010 1101 */

                    /* _^]\ [ZYX WVUT SRQP  ONML KJIH GFED CBA@ */
        0x50000000, /* 0101 0000 0000 0000  0000 0000 0000 0000 */

                    /*  ~}| {zyx wvut srqp  onml kjih gfed cba` */
        0xb8000001, /* 1011 1000 0000 0000  0000 0000 0000 0001 */

        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff  /* 1111 1111 1111 1111  1111 1111 1111 1111 */
    };

    /* " ", """, "'", not allowed */
    static const uint32_t refresh[] = {
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */

                    /* ?>=< ;:98 7654 3210  /.-, +*)( '&%$ #"!  */
        0x50000085, /* 0101 0000 0000 0000  0000 0000 1000 0101 */

                    /* _^]\ [ZYX WVUT SRQP  ONML KJIH GFED CBA@ */
        0x50000000, /* 0101 0000 0000 0000  0000 0000 0000 0000 */

                    /*  ~}| {zyx wvut srqp  onml kjih gfed cba` */
        /*
         * Was 0xd8000001, which contradicted the bit pattern documented on
         * this line: it escaped the unreserved "~" and let "}" through.
         */
        0xb8000001, /* 1011 1000 0000 0000  0000 0000 0000 0001 */

        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */
        0xffffffff  /* 1111 1111 1111 1111  1111 1111 1111 1111 */
    };

    /* " ", "%", %00-%1F */
    static const uint32_t memcached[] = {
        0xffffffff, /* 1111 1111 1111 1111  1111 1111 1111 1111 */

                    /* ?>=< ;:98 7654 3210  /.-, +*)( '&%$ #"!  */
        0x00000021, /* 0000 0000 0000 0000  0000 0000 0010 0001 */

                    /* _^]\ [ZYX WVUT SRQP  ONML KJIH GFED CBA@ */
        0x00000000, /* 0000 0000 0000 0000  0000 0000 0000 0000 */

                    /*  ~}| {zyx wvut srqp  onml kjih gfed cba` */
        0x00000000, /* 0000 0000 0000 0000  0000 0000 0000 0000 */

        0x00000000, /* 0000 0000 0000 0000  0000 0000 0000 0000 */
        0x00000000, /* 0000 0000 0000 0000  0000 0000 0000 0000 */
        0x00000000, /* 0000 0000 0000 0000  0000 0000 0000 0000 */
        0x00000000, /* 0000 0000 0000 0000  0000 0000 0000 0000 */
    };

    /* Indexed by the NGX_ESCAPE_* value; mail_auth is the same as memcached */
    static const uint32_t *const map[] = {
        uri, args, uri_component, html, refresh, memcached, memcached
    };

    const uint32_t *escape = map[type];

    if (dst == NULL) {
        /* Count-only mode: find the number of the characters to be escaped */
        size_t n = 0;

        for (; size != 0; size--, src++) {
            if (escape[*src >> 5] & (1U << (*src & 0x1f))) {
                n++;
            }
        }

        return (uintptr_t) n;
    }

    for (; size != 0; size--, src++) {
        if (escape[*src >> 5] & (1U << (*src & 0x1f))) {
            *dst++ = '%';
            *dst++ = hex[*src >> 4];
            *dst++ = hex[*src & 0xf];
        } else {
            *dst++ = *src;
        }
    }

    return (uintptr_t) dst;
}
- void ngx_unescape_uri(u_char **dst, u_char **src, size_t size, unsigned int type)
- {
- u_char *d, *s, ch, c, decoded;
- enum {
- sw_usual = 0,
- sw_quoted,
- sw_quoted_second
- } state;
- d = *dst;
- s = *src;
- state = 0;
- decoded = 0;
- while (size--) {
- ch = *s++;
- switch (state) {
- case sw_usual:
- if (ch == '?'
- && (type & (NGX_UNESCAPE_URI | NGX_UNESCAPE_REDIRECT))) {
- *d++ = ch;
- goto done;
- }
- if (ch == '%') {
- state = sw_quoted;
- break;
- }
- *d++ = ch;
- break;
- case sw_quoted:
- if (ch >= '0' && ch <= '9') {
- decoded = (u_char) (ch - '0');
- state = sw_quoted_second;
- break;
- }
- c = (u_char) (ch | 0x20);
- if (c >= 'a' && c <= 'f') {
- decoded = (u_char) (c - 'a' + 10);
- state = sw_quoted_second;
- break;
- }
- /* the invalid quoted character */
- state = sw_usual;
- *d++ = ch;
- break;
- case sw_quoted_second:
- state = sw_usual;
- if (ch >= '0' && ch <= '9') {
- ch = (u_char) ((decoded << 4) + (ch - '0'));
- if (type & NGX_UNESCAPE_REDIRECT) {
- if (ch > '%' && ch < 0x7f) {
- *d++ = ch;
- break;
- }
- *d++ = '%'; *d++ = *(s - 2); *d++ = *(s - 1);
- break;
- }
- *d++ = ch;
- break;
- }
- c = (u_char) (ch | 0x20);
- if (c >= 'a' && c <= 'f') {
- ch = (u_char) ((decoded << 4) + (c - 'a') + 10);
- if (type & NGX_UNESCAPE_URI) {
- if (ch == '?') {
- *d++ = ch;
- goto done;
- }
- *d++ = ch;
- break;
- }
- if (type & NGX_UNESCAPE_REDIRECT) {
- if (ch == '?') {
- *d++ = ch;
- goto done;
- }
- if (ch > '%' && ch < 0x7f) {
- *d++ = ch;
- break;
- }
- *d++ = '%'; *d++ = *(s - 2); *d++ = *(s - 1);
- break;
- }
- *d++ = ch;
- break;
- }
- /* the invalid quoted character */
- break;
- }
- }
- done:
- *dst = d;
- *src = s;
- }
- uint32_t example_uri_encode(char *dest, const char *src, size_t len)
- {
- if (!src || !dest) {
- return 0;
- }
- uintptr_t ret = ngx_escape_uri((unsigned char *)dest, (unsigned char *)src, len, NGX_ESCAPE_URI_COMPONENT);
- return (uint32_t)(ret - (uintptr_t)dest);
- }
- void example_uri_decode(char *dest, const char *src, size_t len)
- {
- if (!src || !dest) {
- return;
- }
- unsigned char *src_ptr = (unsigned char *)src;
- unsigned char *dst_ptr = (unsigned char *)dest;
- ngx_unescape_uri(&dst_ptr, &src_ptr, len, NGX_UNESCAPE_URI);
- }
|