2 * Copyright (c) 2021 Omar Polo <op@omarpolo.com>
4 * Permission to use, copy, modify, and distribute this software for any
5 * purpose with or without fee is hereby granted, provided that the above
6 * copyright notice and this permission notice appear in all copies.
8 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
9 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
10 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
11 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
12 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
13 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
14 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
32 adapt(int delta, int numpoints, int firsttime)
41 delta += (delta / numpoints);
44 while (delta > ((BASE - TMIN) * TMAX) / 2) {
45 delta = delta / (BASE - TMIN);
48 return k + (((BASE - TMIN + 1) * delta) / (delta + SKEW));
52 copy_until_delimiter(const char *s, char *out, size_t len)
56 end = strchr(s, '\0');
60 for (t = end; t >= s; --t)
67 for (; s < t; ++s, ++out) {
79 if ('A' <= c && c <= 'Z')
82 if ('a' <= c && c <= 'z')
85 if ('0' <= c && c <= '9')
92 insert(char *out, size_t len, int codepoint, size_t i)
98 if (codepoint <= 0x7F)
100 else if (codepoint <= 0x7FF)
102 else if (codepoint <= 0xFFFF)
104 else if (codepoint <= 0x10FFFF)
109 if ((t = utf8_nth(out, i)) == NULL)
111 if (t + l >= out + len)
114 memmove(t + l, t, strlen(t));
118 t[1] = ( codepoint & 0x3F) + 0x80;
119 t[0] = ((codepoint >> 6) & 0x1F) + 0xC0;
122 t[2] = ( codepoint & 0x3F) + 0x80;
123 t[1] = ((codepoint >> 6) & 0x3F) + 0x80;
124 t[0] = ((codepoint >> 12) & 0x0F) + 0xE0;
127 t[3] = ( codepoint & 0x3F) + 0x80;
128 t[2] = ((codepoint >> 6) & 0x3F) + 0x80;
129 t[1] = ((codepoint >> 12) & 0x3F) + 0x80;
130 t[0] = ((codepoint >> 18) & 0x07) + 0xF0;
137 decode(const char *str, char *out, size_t len)
141 unsigned int oldi, bias, w, k, digit, t;
142 unsigned int numpoints;
145 if (str == NULL || len <= 4)
148 /* todo: starts_with */
149 if (strstr(str, "xn--") != str) {
150 strncpy(out, str, len);
157 if (strchr(str, '-') != NULL) {
158 if ((s = copy_until_delimiter(str, out, len)) == NULL)
165 numpoints = strlen(out);
175 for (k = BASE; ; k += BASE) {
178 /* fail eventually? */
179 digit = digit_value(*s);
182 /* fail on overflow */
187 else if (k >= bias + TMAX)
197 bias = adapt(i - oldi, numpoints+1, oldi == 0);
198 n += i / (numpoints+1); /* fail on overflow */
199 i = i % (numpoints+1);
201 if (!insert(out, len, n, i))
211 end_of_component(const char *hostname)
213 for (; *hostname != '\0' && *hostname != '.'; ++hostname)
219 puny_decode(const char *hostname, char *out, size_t len)
221 char comp[DOMAIN_NAME_LEN];
229 end = end_of_component(s);
230 if (end - s >= sizeof(comp))
233 memcpy(comp, s, end - s);
234 comp[end - s] = '\0';
236 if (!decode(comp, out, len))
242 if (strlcat(out, ".", len) >= len)