s3/lib/ctdbd_conn: assert hdr following read/recv
[Samba.git] / lib / util / rfc1738.c
bloba6c54ce61a9cf8f8e8c3b007df1f6433f4c7509d
1 /*
2 * Functions for RFC 3986 percent-encoding.
4 * NOTE:
6 * This file was originally imported from the Squid project but has been
7 * significantly altered. The licence below is reproduced intact, but refers
8 * to files in Squid's repository, not in Samba. See COPYING for the GPLv3
9 * notice (being the later version mentioned below).
13 * $Id$
15 * DEBUG:
16 * AUTHOR: Harvest Derived
18 * SQUID Web Proxy Cache http://www.squid-cache.org/
19 * ----------------------------------------------------------
21 * Squid is the result of efforts by numerous individuals from
22 * the Internet community; see the CONTRIBUTORS file for full
23 * details. Many organizations have provided support for Squid's
24 * development; see the SPONSORS file for full details. Squid is
25 * Copyrighted (C) 2001 by the Regents of the University of
26 * California; see the COPYRIGHT file for full details. Squid
27 * incorporates software developed and/or copyrighted by other
28 * sources; see the CREDITS file for full details.
30 * This program is free software; you can redistribute it and/or modify
31 * it under the terms of the GNU General Public License as published by
32 * the Free Software Foundation; either version 2 of the License, or
33 * (at your option) any later version.
35 * This program is distributed in the hope that it will be useful,
36 * but WITHOUT ANY WARRANTY; without even the implied warranty of
37 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
38 * GNU General Public License for more details.
40 * You should have received a copy of the GNU General Public License
41 * along with this program; if not, write to the Free Software
42 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111, USA.
46 #include "replace.h"
47 #include <talloc.h>
48 #include "lib/util/samba_util.h"
49 #include "lib/util/util_str_hex.h"
51 #define RFC1738_ENCODE 1
52 #define RFC1738_RESERVED 2
55 * According to RFC 1738, "$-_.+!*'()," are not reserved or unsafe, but as
56 * that has been obsolete since 2004, we aim instead for RFC 3986, where:
58 * reserved = : / ? # [ ] @ ! $ & ' ( ) * + , ; =
59 * unreserved = ALPHA DIGIT - . _ ~
61 * and whatever is not in either of those is what RFC 1738 called "unsafe",
62 * meaning that they are canonically but not mandatorily escaped.
64 * Characters below 0x20 or above 0x7E are always encoded.
67 static const unsigned char escapees[127] = {
68 [' '] = RFC1738_ENCODE,
69 ['"'] = RFC1738_ENCODE,
70 ['%'] = RFC1738_ENCODE,
71 ['<'] = RFC1738_ENCODE,
72 ['>'] = RFC1738_ENCODE,
73 ['\\'] = RFC1738_ENCODE,
74 ['^'] = RFC1738_ENCODE,
75 ['`'] = RFC1738_ENCODE,
76 ['{'] = RFC1738_ENCODE,
77 ['|'] = RFC1738_ENCODE,
78 ['}'] = RFC1738_ENCODE,
79 /* reserved : / ? # [ ] @ ! $ & ' ( ) * + , ; = */
80 [':'] = RFC1738_RESERVED,
81 ['/'] = RFC1738_RESERVED,
82 ['?'] = RFC1738_RESERVED,
83 ['#'] = RFC1738_RESERVED,
84 ['['] = RFC1738_RESERVED,
85 [']'] = RFC1738_RESERVED,
86 ['@'] = RFC1738_RESERVED,
87 ['!'] = RFC1738_RESERVED,
88 ['$'] = RFC1738_RESERVED,
89 ['&'] = RFC1738_RESERVED,
90 ['\''] = RFC1738_RESERVED,
91 ['('] = RFC1738_RESERVED,
92 [')'] = RFC1738_RESERVED,
93 ['*'] = RFC1738_RESERVED,
94 ['+'] = RFC1738_RESERVED,
95 [','] = RFC1738_RESERVED,
96 [';'] = RFC1738_RESERVED,
97 ['='] = RFC1738_RESERVED,
101 * rfc1738_do_escape - fills a preallocated buffer with an escaped version of
102 * the given string.
104 * For canonical escaping, mask should be RFC1738_ENCODE | RFC1738_RESERVED.
105 * For mandatory escaping, mask should be RFC1738_RESERVED.
107 static char *
108 rfc1738_do_escape(char *buf, size_t bufsize,
109 const char *url, size_t len, unsigned char mask)
111 size_t i;
112 size_t j = 0;
113 for (i = 0; i < len; i++) {
114 unsigned int c = (unsigned char) url[i];
115 if (c > 126 || c < 32 || (escapees[c] & mask)) {
116 if (j + 3 >= bufsize) {
117 return NULL;
119 (void) snprintf(&buf[j], 4, "%%%02X", c);
120 j += 3;
121 } else {
122 if (j + 1 >= bufsize) {
123 return NULL;
125 buf[j] = c;
126 j++;
129 buf[j] = '\0';
130 return buf;
134 * rfc1738_escape_part - Returns a talloced buffer that contains the RFC 3986
135 * compliant, escaped version of the given url segment.
137 char *
138 rfc1738_escape_part(TALLOC_CTX *mem_ctx, const char *url)
140 size_t bufsize = 0;
141 char *buf = NULL;
143 size_t len = strlen(url);
144 if (len >= SIZE_MAX / 3) {
145 return NULL;
148 bufsize = len * 3 + 1;
149 buf = talloc_array(mem_ctx, char, bufsize);
150 if (buf == NULL) {
151 return NULL;
154 talloc_set_name_const(buf, buf);
156 return rfc1738_do_escape(buf, bufsize, url, len,
157 RFC1738_ENCODE | RFC1738_RESERVED);
161 * rfc1738_unescape() - Converts url-escaped characters in the string.
163 * The two characters following a '%' in a string should be hex digits that
164 * describe an encoded byte. For example, "%25" is hex 0x25 or '%' in ASCII;
165 * this is the only way to include a % in the unescaped string. Any character
166 * can be escaped, including plain letters (e.g. "%61" for "a"). Anything
167 * other than 2 hex characters following the % is an error.
169 * The conversion is done in-place, which is always safe as unescapes can only
170 * shorten the string.
172 * Returns a pointer to the end of the string (that is, the '\0' byte), or
173 * NULL on error, at which point s is in an undefined state.
175 * Note that after `char *e = rfc_unescape(s)`, `strlen(s)` will not equal
176 * `e - s` if s originally contained "%00". You might want to check for this.
179 _PUBLIC_ char *rfc1738_unescape(char *s)
181 size_t i, j; /* i is write, j is read */
182 uint64_t x;
183 NTSTATUS status;
184 for (i = 0, j = 0; s[j] != '\0'; i++, j++) {
185 if (s[j] == '%') {
186 status = read_hex_bytes(&s[j + 1], 2, &x);
187 if (! NT_STATUS_IS_OK(status)) {
188 return NULL;
190 j += 2; /* OK; read_hex_bytes() has checked ahead */
191 s[i] = (unsigned char)x;
192 } else {
193 s[i] = s[j];
196 s[i] = '\0';
197 return s + i;