blob: f116964b78a0c9cc4f574832b462b047df4f02e7 [file] [log] [blame]
Denis Vlasenko4c7e5b62007-02-27 22:39:19 +00001/* vi: set sw=4 ts=4: */
2
3/* RFC1035 domain compression routines (C) 2007 Gabriel Somlo <somlo at cmu.edu>
4 *
5 * Loosely based on the isc-dhcpd implementation by dhankins@isc.org
6 *
7 * Licensed under GPLv2 or later, see file LICENSE in this tarball for details.
8 */
Denys Vlasenko3d9c69f2010-03-24 16:43:16 +01009#ifdef DNS_COMPR_TESTING
10# define FAST_FUNC /* nothing */
11# define xmalloc malloc
12# include <stdlib.h>
13# include <stdint.h>
14# include <string.h>
15# include <stdio.h>
16#else
17# include "common.h"
18#endif
Denis Vlasenko4c7e5b62007-02-27 22:39:19 +000019
/* Size limits and flag bits used by the RFC1035 name (de)compression code */
#define NS_MAXDNAME     1025    /* max domain name length */
#define NS_MAXCDNAME    255     /* max compressed domain name length */
#define NS_MAXLABEL     63      /* max label length */
#define NS_MAXDNSRCH    6       /* max domains in search path */
#define NS_CMPRSFLGS    0xc0    /* name compression pointer flag */
25
26
/* Expand an RFC1035-compressed list of domain names "cstr", of length "clen".
 *
 * Returns a newly allocated NUL-terminated string which consists of the
 * string "pre" followed by the expanded domain names, separated by single
 * spaces (e.g. "\4host\3com\0" with pre "x:" gives "x:host.com").
 * The caller owns the returned buffer.
 *
 * Returns NULL if:
 *  - clen is zero or negative,
 *  - a compression pointer or a label runs past the end of cstr,
 *  - more than NS_MAXDNSRCH pointers are followed before returning to
 *    the top level (assumed to be a pointer loop),
 *  - the expansion grows beyond NS_MAXDNAME * NS_MAXDNSRCH bytes,
 *  - nothing at all was expanded.
 */
char* FAST_FUNC dname_dec(const uint8_t *cstr, int clen, const char *pre)
{
	char *ret = NULL;
	char *dst = NULL;
	unsigned total;

	/* Positions below are unsigned. A negative clen would silently turn
	 * into a huge bound in every comparison and let us read far beyond
	 * the buffer, so reject it (and the empty input) right away.
	 */
	if (clen <= 0)
		return NULL;
	total = clen;

	/* We make two passes over the cstr string. First, we compute
	 * how long the resulting string would be. Then we allocate a
	 * new buffer of the required length, and fill it in with the
	 * expanded content. The advantage of this approach is not
	 * having to deal with requiring callers to supply their own
	 * buffer, then having to check if it's sufficiently large, etc.
	 */
	while (1) {
		/* note: every "return NULL" below is leak-safe: both passes
		 * walk cstr identically, so anything that fails does so in
		 * the first pass, before dst is allocated */
		unsigned crtpos = 0; /* current read offset within cstr */
		unsigned retpos = 0; /* offset to resume at after a pointer; 0 = toplevel */
		unsigned depth = 0;  /* pointers followed since last return to toplevel */
		unsigned len = 0;    /* number of output bytes produced so far */

		while (crtpos < total) {
			const uint8_t *c = cstr + crtpos;

			if ((*c & NS_CMPRSFLGS) == NS_CMPRSFLGS) {
				/* pointer */
				if (crtpos + 2 > total) /* no offset to jump to? abort */
					return NULL;
				if (retpos == 0) /* toplevel? save return spot */
					retpos = crtpos + 2;
				depth++;
				crtpos = ((c[0] & 0x3f) << 8) | c[1]; /* jump */
			} else if (*c) {
				/* label */
				if (crtpos + *c + 1 > total) /* label too long? abort */
					return NULL;
				if (dst) {
					/* \3com ---> "com." */
					memcpy(dst + len, c + 1, *c);
					dst[len + *c] = '.';
				}
				len += *c + 1;
				crtpos += *c + 1;
			} else {
				/* NUL: end of current domain name */
				if (retpos == 0) {
					/* toplevel? keep going */
					crtpos++;
				} else {
					/* return to toplevel saved spot */
					crtpos = retpos;
					retpos = depth = 0;
				}
				/* Turn the '.' after the last label into a name
				 * separator. If nothing has been written yet (cstr
				 * starts with NUL), there is no such '.': writing
				 * dst[len - 1] would land one byte before dst.
				 */
				if (dst && len != 0)
					dst[len - 1] = ' ';
			}

			if (depth > NS_MAXDNSRCH /* too many jumps? abort, it's a loop */
			 || len > NS_MAXDNAME * NS_MAXDNSRCH /* result too long? abort */
			) {
				return NULL;
			}
		}

		if (!len) /* expanded string has 0 length? abort */
			return NULL;

		if (dst) { /* second pass done */
			/* the trailing '.' or ' ' becomes the terminator */
			dst[len - 1] = '\0';
			break;
		}

		/* first pass done: allocate the buffer and copy pre into it */
		{
			unsigned plen = strlen(pre);
			ret = xmalloc(plen + len);
			memcpy(ret, pre, plen);
			dst = ret + plen;
		}
	}

	return ret;
}
109
/* Translate a human-readable domain name such as "foo.blah.com" into its
 * RFC1035 wire form "\003foo\004blah\003com\000". Uppercase ASCII letters
 * are folded to lowercase; a single trailing '.' is accepted.
 *
 * Returns a freshly allocated buffer, or NULL when a label is empty
 * (this covers "", "." and ".."), a label is longer than NS_MAXLABEL,
 * or the encoded name (terminating NUL included) exceeds NS_MAXCDNAME bytes.
 */
static uint8_t *convert_dname(const char *src)
{
	/* one length byte up front plus the terminating NUL: strlen + 2 */
	uint8_t *out = xmalloc(strlen(src) + 2);
	size_t lenpos = 0; /* index of the current label's length byte */
	size_t wr = 1;     /* index of the next byte to write */

	while (1) {
		uint8_t ch = (uint8_t)*src++;
		size_t lablen;

		if (ch != '.' && ch != '\0') {
			/* ordinary label character */
			if (ch >= 'A' && ch <= 'Z') /* uppercase? convert to lower */
				ch += ('a' - 'A');
			out[wr++] = ch;
			continue;
		}

		/* end of label: validate it and fill in its length byte */
		lablen = wr - lenpos - 1;
		if (lablen == 0 || lablen > NS_MAXLABEL)
			goto fail;
		if (ch == '.' && *src == '.') /* two '.'s in a row */
			goto fail;
		out[lenpos] = (uint8_t)lablen;

		if (ch == '\0' || *src == '\0') /* end of src (maybe after a final '.') */
			break;

		/* reserve the length byte of the next label */
		lenpos = wr++;
	}

	if (wr >= NS_MAXCDNAME) /* dname too long? abort */
		goto fail;

	out[wr] = 0;
	return out;

 fail:
	free(out);
	return NULL;
}
151
/* Search the compressed name buffer cstr (clen bytes) for dname, which must
 * be a complete uncompressed name: a sequence of labels ended by a NUL byte.
 *
 * A match may start at any label of cstr; while matching, a compression
 * pointer found after a label is followed. Returns the offset within cstr
 * at which the match starts, or -1 if there is none.
 *
 * All reads are kept inside cstr[0..clen-1]: a label or pointer that would
 * run past the end, or a pointer whose target lies outside the buffer,
 * simply ends the current match attempt.
 */
static int find_offset(const uint8_t *cstr, int clen, const uint8_t *dname)
{
	int off = 0;

	/* visit every label in cstr */
	while (off < clen) {
		const uint8_t *d;
		int pos;

		if ((cstr[off] & NS_CMPRSFLGS) == NS_CMPRSFLGS) { /* pointer, skip */
			off += 2;
			continue;
		}
		if (cstr[off] == 0) { /* NUL, skip */
			off++;
			continue;
		}

		/* label, try matching dname from here; invariant: pos < clen */
		pos = off;
		d = dname;
		while (1) {
			unsigned lab = cstr[pos];

			/* Compare the length bytes before touching the label
			 * bodies: only when they agree is d known to have
			 * lab more bytes (plus a following length byte).
			 */
			if (lab != *d)
				break;
			if (lab == 0) /* both at terminating NUL - match */
				return off;
			/* label body and the byte after it must lie inside cstr */
			if (pos + 1 + (int)lab >= clen)
				break;
			if (memcmp(cstr + pos + 1, d + 1, lab) != 0)
				break;
			d += lab + 1;
			pos += lab + 1;
			if ((cstr[pos] & NS_CMPRSFLGS) == NS_CMPRSFLGS) { /* pointer, jump */
				if (pos + 2 > clen) /* second pointer byte missing */
					break;
				pos = ((cstr[pos] & 0x3f) << 8) | cstr[pos + 1];
				if (pos >= clen) /* target outside cstr */
					break;
			}
		}
		off += cstr[off] + 1;
	}

	return -1;
}
190
191/* computes string to be appended to cstr so that src would be added to
192 * the compression (best case, it's a 2-byte pointer to some offset within
Denys Vlasenko702f7d62010-03-24 16:11:32 +0100193 * cstr; worst case, it's all of src, converted to <4>host<3>com<0> format).
Denis Vlasenko4c7e5b62007-02-27 22:39:19 +0000194 * The computed string is returned directly; its length is returned via retlen;
195 * NULL and 0, respectively, are returned if an error occurs.
196 */
Denis Vlasenkof1980f62008-09-26 09:34:59 +0000197uint8_t* FAST_FUNC dname_enc(const uint8_t *cstr, int clen, const char *src, int *retlen)
Denis Vlasenko4c7e5b62007-02-27 22:39:19 +0000198{
199 uint8_t *d, *dname;
200 int off;
201
202 dname = convert_dname(src);
203 if (dname == NULL) {
204 *retlen = 0;
205 return NULL;
206 }
207
Denys Vlasenko702f7d62010-03-24 16:11:32 +0100208 d = dname;
209 while (*d) {
210 if (cstr) {
211 off = find_offset(cstr, clen, d);
212 if (off >= 0) { /* found a match, add pointer and return */
213 *d++ = NS_CMPRSFLGS | (off >> 8);
214 *d = off;
215 break;
216 }
Denis Vlasenko4c7e5b62007-02-27 22:39:19 +0000217 }
Denys Vlasenko702f7d62010-03-24 16:11:32 +0100218 d += *d + 1;
Denis Vlasenko4c7e5b62007-02-27 22:39:19 +0000219 }
220
221 *retlen = d - dname + 1;
222 return dname;
Denis Vlasenko8e858e22007-03-07 09:35:43 +0000223}
Denys Vlasenko3d9c69f2010-03-24 16:43:16 +0100224
225#ifdef DNS_COMPR_TESTING
/* gcc -Wall -DDNS_COMPR_TESTING domain_codec.c -o domain_codec && ./domain_codec */
/* Self-test: prints the result of a few decode and encode+decode round trips.
 *
 * dname_dec() can return NULL (tests 7 and 8 decode a compression pointer
 * without the cache it refers to), so results are never handed to "%s"
 * unchecked. Every buffer returned by the codec is freed.
 */
int main(int argc, char **argv)
{
	int len;
	uint8_t *encoded;
	char *decoded;

	(void)argc;
	(void)argv;

/* sizeof(string literal) also counts the literal's implicit trailing NUL */
#define DNAME_DEC(encoded,pre) dname_dec((uint8_t*)(encoded), sizeof(encoded), (pre))
#define SHOW_DEC(fmt, bytes, pre) do { \
	decoded = DNAME_DEC(bytes, pre); \
	printf(fmt, decoded ? decoded : "(null)"); \
	free(decoded); \
} while (0)
	SHOW_DEC("'%s'\n", "\4host\3com\0", "test1:");
	SHOW_DEC("test2:'%s'\n", "\4host\3com\0\4host\3com\0", "");
	SHOW_DEC("test3:'%s'\n", "\4host\3com\0\xC0\0", "");
	SHOW_DEC("test4:'%s'\n", "\4host\3com\0\xC0\5", "");
	SHOW_DEC("test5:'%s'\n", "\4host\3com\0\xC0\5\1z\xC0\xA", "");

#define DNAME_ENC(cache,source,lenp) dname_enc((uint8_t*)(cache), sizeof(cache), (source), (lenp))
/* decodes and prints the current "encoded"/"len", then releases both buffers */
#define SHOW_ENC(fmt) do { \
	decoded = dname_dec(encoded, len, ""); \
	printf(fmt, decoded ? decoded : "(null)", len); \
	free(decoded); \
	free(encoded); \
} while (0)
	encoded = dname_enc(NULL, 0, "test.net", &len);
	SHOW_ENC("test6:'%s' len:%d\n");
	encoded = DNAME_ENC("\3net\0", "test.net", &len);
	SHOW_ENC("test7:'%s' len:%d\n");
	encoded = DNAME_ENC("\4test\3net\0", "test.net", &len);
	SHOW_ENC("test8:'%s' len:%d\n");
	return 0;
}
248#endif