mirror of
https://github.com/idolpx/libMeatloaf.git
synced 2025-12-06 04:38:49 -05:00
316 lines
7.1 KiB
C++
316 lines
7.1 KiB
C++
/**
|
|
* Copyright (C) 2011 by Ben Noordhuis <info@bnoordhuis.nl>
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
* in the Software without restriction, including without limitation the rights
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
* furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
* THE SOFTWARE.
|
|
*/
|
|
#include "punycode.h"
|
|
|
|
#include <assert.h>
|
|
#include <stdint.h>
|
|
#include <string.h>
|
|
#include <ctype.h>
|
|
|
|
#define min(a, b) ((a) < (b) ? (a) : (b))
|
|
|
|
/* punycode parameters, see http://tools.ietf.org/html/rfc3492#section-5 */
|
|
#define BASE 36
|
|
#define TMIN 1
|
|
#define TMAX 26
|
|
#define SKEW 38
|
|
#define DAMP 700
|
|
#define INITIAL_N 128
|
|
#define INITIAL_BIAS 72
|
|
|
|
static uint32_t adapt_bias (uint32_t delta, unsigned n_points, int is_first)
|
|
{
|
|
uint32_t k;
|
|
|
|
delta /= is_first ? DAMP : 2;
|
|
delta += delta / n_points;
|
|
|
|
/* while delta > 455: delta /= 35 */
|
|
for (k = 0; delta > ((BASE - TMIN) * TMAX) / 2; k += BASE)
|
|
{
|
|
delta /= (BASE - TMIN);
|
|
}
|
|
|
|
return k + (((BASE - TMIN + 1) * delta) / (delta + SKEW));
|
|
}
|
|
|
|
static char encode_digit (int c)
|
|
{
|
|
assert (c >= 0 && c <= BASE - TMIN);
|
|
if (c > 25)
|
|
{
|
|
return c + 22; /* '0'..'9' */
|
|
}
|
|
else
|
|
{
|
|
return c + 'a'; /* 'a'..'z' */
|
|
}
|
|
}
|
|
|
|
/* Encode as a generalized variable-length integer. Returns number of bytes written. */
|
|
static size_t encode_var_int (const size_t bias, const size_t delta, char *const dst, size_t dstlen)
|
|
{
|
|
size_t i, k, q, t;
|
|
|
|
i = 0;
|
|
k = BASE;
|
|
q = delta;
|
|
|
|
while (i < dstlen)
|
|
{
|
|
if (k <= bias)
|
|
{
|
|
t = TMIN;
|
|
}
|
|
else
|
|
if (k >= bias + TMAX)
|
|
{
|
|
t = TMAX;
|
|
}
|
|
else
|
|
{
|
|
t = k - bias;
|
|
}
|
|
|
|
if (q < t)
|
|
{
|
|
break;
|
|
}
|
|
|
|
dst[i++] = encode_digit (t + (q - t) % (BASE - t));
|
|
|
|
q = (q - t) / (BASE - t);
|
|
k += BASE;
|
|
}
|
|
|
|
if (i < dstlen)
|
|
{
|
|
dst[i++] = encode_digit (q);
|
|
}
|
|
|
|
return i;
|
|
}
|
|
|
|
static size_t decode_digit (uint32_t v)
|
|
{
|
|
if (isdigit (v))
|
|
{
|
|
return 22 + (v - '0');
|
|
}
|
|
if (islower (v))
|
|
{
|
|
return v - 'a';
|
|
}
|
|
if (isupper (v))
|
|
{
|
|
return v - 'A';
|
|
}
|
|
return SIZE_MAX;
|
|
}
|
|
|
|
size_t punycode_encode (const uint32_t *const src, const size_t srclen, char *const dst, size_t *const dstlen)
|
|
{
|
|
size_t b, h;
|
|
size_t delta, bias;
|
|
size_t m, n;
|
|
size_t si, di;
|
|
|
|
for (si = 0, di = 0; si < srclen && di < *dstlen; si++)
|
|
{
|
|
if (src[si] < 128)
|
|
{
|
|
dst[di++] = src[si];
|
|
}
|
|
}
|
|
|
|
b = h = di;
|
|
|
|
/* Write out delimiter if any basic code points were processed. */
|
|
if (di > 0 && di < *dstlen)
|
|
{
|
|
dst[di++] = '-';
|
|
}
|
|
|
|
n = INITIAL_N;
|
|
bias = INITIAL_BIAS;
|
|
delta = 0;
|
|
|
|
for (; h < srclen && di < *dstlen; n++, delta++)
|
|
{
|
|
/* Find next smallest non-basic code point. */
|
|
for (m = SIZE_MAX, si = 0; si < srclen; si++)
|
|
{
|
|
if (src[si] >= n && src[si] < m)
|
|
{
|
|
m = src[si];
|
|
}
|
|
}
|
|
|
|
if ((m - n) > (SIZE_MAX - delta) / (h + 1))
|
|
{
|
|
/* OVERFLOW */
|
|
assert (0 && "OVERFLOW");
|
|
goto fail;
|
|
}
|
|
|
|
delta += (m - n) * (h + 1);
|
|
n = m;
|
|
|
|
for (si = 0; si < srclen; si++)
|
|
{
|
|
if (src[si] < n)
|
|
{
|
|
if (++delta == 0)
|
|
{
|
|
/* OVERFLOW */
|
|
assert (0 && "OVERFLOW");
|
|
goto fail;
|
|
}
|
|
}
|
|
else
|
|
if (src[si] == n)
|
|
{
|
|
di += encode_var_int (bias, delta, &dst[di], *dstlen - di);
|
|
bias = adapt_bias (delta, h + 1, h == b);
|
|
delta = 0;
|
|
h++;
|
|
}
|
|
}
|
|
}
|
|
|
|
fail:
|
|
/* Tell the caller how many bytes were written to the output buffer. */
|
|
*dstlen = di;
|
|
|
|
/* Return how many Unicode code points were converted. */
|
|
return si;
|
|
}
|
|
|
|
size_t punycode_decode (const char *const src, const size_t srclen, uint32_t *const dst, size_t *const dstlen)
|
|
{
|
|
const char *p;
|
|
size_t b, n, t;
|
|
size_t i, k, w;
|
|
size_t si, di;
|
|
size_t digit;
|
|
size_t org_i;
|
|
size_t bias;
|
|
|
|
/* Ensure that the input contains only ASCII characters. */
|
|
for (si = 0; si < srclen; si++)
|
|
{
|
|
if (src[si] & 0x80)
|
|
{
|
|
*dstlen = 0;
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
/* Reverse-search for delimiter in input. */
|
|
for (p = src + srclen - 1; p > src && *p != '-'; p--);
|
|
b = p - src;
|
|
|
|
/* Copy basic code points to output. */
|
|
di = min (b, *dstlen);
|
|
|
|
for (i = 0; i < di; i++)
|
|
{
|
|
dst[i] = src[i];
|
|
}
|
|
|
|
i = 0;
|
|
n = INITIAL_N;
|
|
bias = INITIAL_BIAS;
|
|
|
|
for (si = b + (b > 0); si < srclen && di < *dstlen; di++)
|
|
{
|
|
org_i = i;
|
|
|
|
for (w = 1, k = BASE; di < *dstlen; k += BASE)
|
|
{
|
|
digit = decode_digit (src[si++]);
|
|
|
|
if (digit == SIZE_MAX)
|
|
{
|
|
goto fail;
|
|
}
|
|
|
|
if (digit > (SIZE_MAX - i) / w)
|
|
{
|
|
/* OVERFLOW */
|
|
assert (0 && "OVERFLOW");
|
|
goto fail;
|
|
}
|
|
|
|
i += digit * w;
|
|
|
|
if (k <= bias)
|
|
{
|
|
t = TMIN;
|
|
}
|
|
else
|
|
if (k >= bias + TMAX)
|
|
{
|
|
t = TMAX;
|
|
}
|
|
else
|
|
{
|
|
t = k - bias;
|
|
}
|
|
|
|
if (digit < t)
|
|
{
|
|
break;
|
|
}
|
|
|
|
if (w > SIZE_MAX / (BASE - t))
|
|
{
|
|
/* OVERFLOW */
|
|
assert (0 && "OVERFLOW");
|
|
goto fail;
|
|
}
|
|
|
|
w *= BASE - t;
|
|
}
|
|
|
|
bias = adapt_bias (i - org_i, di + 1, org_i == 0);
|
|
|
|
if (i / (di + 1) > SIZE_MAX - n)
|
|
{
|
|
/* OVERFLOW */
|
|
assert (0 && "OVERFLOW");
|
|
goto fail;
|
|
}
|
|
|
|
n += i / (di + 1);
|
|
i %= (di + 1);
|
|
|
|
memmove (dst + i + 1, dst + i, (di - i) * sizeof (uint32_t));
|
|
dst[i++] = n;
|
|
}
|
|
|
|
fail:
|
|
/* Tell the caller how many bytes were written to the output buffer. */
|
|
*dstlen = di;
|
|
|
|
return si;
|
|
} |