punycode_test.c 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294
  1. /*
  2. * Copyright 2022-2023 The OpenSSL Project Authors. All Rights Reserved.
  3. *
  4. * Licensed under the Apache License 2.0 (the "License"). You may not use
  5. * this file except in compliance with the License. You can obtain a copy
  6. * in the file LICENSE in the source distribution or at
  7. * https://www.openssl.org/source/license.html
  8. */
  9. #include <openssl/crypto.h>
  10. #include <string.h>
  11. #include "crypto/punycode.h"
  12. #include "internal/nelem.h"
  13. #include "internal/packet.h"
  14. #include "testutil.h"
  15. static const struct puny_test {
  16. unsigned int raw[50];
  17. const char *encoded;
  18. } puny_cases[] = {
  19. { /* Test of 4 byte codepoint using smileyface emoji */
  20. { 0x1F600
  21. },
  22. "e28h"
  23. },
  24. /* Test cases from RFC 3492 */
  25. { /* Arabic (Egyptian) */
  26. { 0x0644, 0x064A, 0x0647, 0x0645, 0x0627, 0x0628, 0x062A, 0x0643, 0x0644,
  27. 0x0645, 0x0648, 0x0634, 0x0639, 0x0631, 0x0628, 0x064A, 0x061F
  28. },
  29. "egbpdaj6bu4bxfgehfvwxn"
  30. },
  31. { /* Chinese (simplified) */
  32. { 0x4ED6, 0x4EEC, 0x4E3A, 0x4EC0, 0x4E48, 0x4E0D, 0x8BF4, 0x4E2D, 0x6587
  33. },
  34. "ihqwcrb4cv8a8dqg056pqjye"
  35. },
  36. { /* Chinese (traditional) */
  37. { 0x4ED6, 0x5011, 0x7232, 0x4EC0, 0x9EBD, 0x4E0D, 0x8AAA, 0x4E2D, 0x6587
  38. },
  39. "ihqwctvzc91f659drss3x8bo0yb"
  40. },
  41. { /* Czech: Pro<ccaron>prost<ecaron>nemluv<iacute><ccaron>esky */
  42. { 0x0050, 0x0072, 0x006F, 0x010D, 0x0070, 0x0072, 0x006F, 0x0073, 0x0074,
  43. 0x011B, 0x006E, 0x0065, 0x006D, 0x006C, 0x0075, 0x0076, 0x00ED, 0x010D,
  44. 0x0065, 0x0073, 0x006B, 0x0079
  45. },
  46. "Proprostnemluvesky-uyb24dma41a"
  47. },
  48. { /* Hebrew */
  49. { 0x05DC, 0x05DE, 0x05D4, 0x05D4, 0x05DD, 0x05E4, 0x05E9, 0x05D5, 0x05D8,
  50. 0x05DC, 0x05D0, 0x05DE, 0x05D3, 0x05D1, 0x05E8, 0x05D9, 0x05DD, 0x05E2,
  51. 0x05D1, 0x05E8, 0x05D9, 0x05EA
  52. },
  53. "4dbcagdahymbxekheh6e0a7fei0b"
  54. },
  55. { /* Hindi (Devanagari) */
  56. { 0x092F, 0x0939, 0x0932, 0x094B, 0x0917, 0x0939, 0x093F, 0x0928, 0x094D,
  57. 0x0926, 0x0940, 0x0915, 0x094D, 0x092F, 0x094B, 0x0902, 0x0928, 0x0939,
  58. 0x0940, 0x0902, 0x092C, 0x094B, 0x0932, 0x0938, 0x0915, 0x0924, 0x0947,
  59. 0x0939, 0x0948, 0x0902
  60. },
  61. "i1baa7eci9glrd9b2ae1bj0hfcgg6iyaf8o0a1dig0cd"
  62. },
  63. { /* Japanese (kanji and hiragana) */
  64. { 0x306A, 0x305C, 0x307F, 0x3093, 0x306A, 0x65E5, 0x672C, 0x8A9E, 0x3092,
  65. 0x8A71, 0x3057, 0x3066, 0x304F, 0x308C, 0x306A, 0x3044, 0x306E, 0x304B
  66. },
  67. "n8jok5ay5dzabd5bym9f0cm5685rrjetr6pdxa"
  68. },
  69. { /* Korean (Hangul syllables) */
  70. { 0xC138, 0xACC4, 0xC758, 0xBAA8, 0xB4E0, 0xC0AC, 0xB78C, 0xB4E4, 0xC774,
  71. 0xD55C, 0xAD6D, 0xC5B4, 0xB97C, 0xC774, 0xD574, 0xD55C, 0xB2E4, 0xBA74,
  72. 0xC5BC, 0xB9C8, 0xB098, 0xC88B, 0xC744, 0xAE4C
  73. },
  74. "989aomsvi5e83db1d2a355cv1e0vak1dwrv93d5xbh15a0dt30a5jpsd879ccm6fea98c"
  75. },
  76. { /* Russian (Cyrillic) */
  77. { 0x043F, 0x043E, 0x0447, 0x0435, 0x043C, 0x0443, 0x0436, 0x0435, 0x043E,
  78. 0x043D, 0x0438, 0x043D, 0x0435, 0x0433, 0x043E, 0x0432, 0x043E, 0x0440,
  79. 0x044F, 0x0442, 0x043F, 0x043E, 0x0440, 0x0443, 0x0441, 0x0441, 0x043A,
  80. 0x0438
  81. },
  82. "b1abfaaepdrnnbgefbaDotcwatmq2g4l"
  83. },
  84. { /* Spanish */
  85. { 0x0050, 0x006F, 0x0072, 0x0071, 0x0075, 0x00E9, 0x006E, 0x006F, 0x0070,
  86. 0x0075, 0x0065, 0x0064, 0x0065, 0x006E, 0x0073, 0x0069, 0x006D, 0x0070,
  87. 0x006C, 0x0065, 0x006D, 0x0065, 0x006E, 0x0074, 0x0065, 0x0068, 0x0061,
  88. 0x0062, 0x006C, 0x0061, 0x0072, 0x0065, 0x006E, 0x0045, 0x0073, 0x0070,
  89. 0x0061, 0x00F1, 0x006F, 0x006C
  90. },
  91. "PorqunopuedensimplementehablarenEspaol-fmd56a"
  92. },
  93. { /* Vietnamese */
  94. { 0x0054, 0x1EA1, 0x0069, 0x0073, 0x0061, 0x006F, 0x0068, 0x1ECD, 0x006B,
  95. 0x0068, 0x00F4, 0x006E, 0x0067, 0x0074, 0x0068, 0x1EC3, 0x0063, 0x0068,
  96. 0x1EC9, 0x006E, 0x00F3, 0x0069, 0x0074, 0x0069, 0x1EBF, 0x006E, 0x0067,
  97. 0x0056, 0x0069, 0x1EC7, 0x0074
  98. },
  99. "TisaohkhngthchnitingVit-kjcr8268qyxafd2f1b9g"
  100. },
  101. { /* Japanese: 3<nen>B<gumi><kinpachi><sensei> */
  102. { 0x0033, 0x5E74, 0x0042, 0x7D44, 0x91D1, 0x516B, 0x5148, 0x751F
  103. },
  104. "3B-ww4c5e180e575a65lsy2b"
  105. },
  106. { /* Japanese: <amuro><namie>-with-SUPER-MONKEYS */
  107. { 0x5B89, 0x5BA4, 0x5948, 0x7F8E, 0x6075, 0x002D, 0x0077, 0x0069, 0x0074,
  108. 0x0068, 0x002D, 0x0053, 0x0055, 0x0050, 0x0045, 0x0052, 0x002D, 0x004D,
  109. 0x004F, 0x004E, 0x004B, 0x0045, 0x0059, 0x0053
  110. },
  111. "-with-SUPER-MONKEYS-pc58ag80a8qai00g7n9n"
  112. },
  113. { /* Japanese: Hello-Another-Way-<sorezore><no><basho> */
  114. { 0x0048, 0x0065, 0x006C, 0x006C, 0x006F, 0x002D, 0x0041, 0x006E, 0x006F,
  115. 0x0074, 0x0068, 0x0065, 0x0072, 0x002D, 0x0057, 0x0061, 0x0079, 0x002D,
  116. 0x305D, 0x308C, 0x305E, 0x308C, 0x306E, 0x5834, 0x6240
  117. },
  118. "Hello-Another-Way--fc4qua05auwb3674vfr0b"
  119. },
  120. { /* Japanese: <hitotsu><yane><no><shita>2 */
  121. { 0x3072, 0x3068, 0x3064, 0x5C4B, 0x6839, 0x306E, 0x4E0B, 0x0032
  122. },
  123. "2-u9tlzr9756bt3uc0v"
  124. },
  125. { /* Japanese: Maji<de>Koi<suru>5<byou><mae> */
  126. { 0x004D, 0x0061, 0x006A, 0x0069, 0x3067, 0x004B, 0x006F, 0x0069, 0x3059,
  127. 0x308B, 0x0035, 0x79D2, 0x524D
  128. },
  129. "MajiKoi5-783gue6qz075azm5e"
  130. },
  131. { /* Japanese: <pafii>de<runba> */
  132. { 0x30D1, 0x30D5, 0x30A3, 0x30FC, 0x0064, 0x0065, 0x30EB, 0x30F3, 0x30D0
  133. },
  134. "de-jg4avhby1noc0d"
  135. },
  136. { /* Japanese: <sono><supiido><de> */
  137. { 0x305D, 0x306E, 0x30B9, 0x30D4, 0x30FC, 0x30C9, 0x3067
  138. },
  139. "d9juau41awczczp"
  140. },
  141. { /* -> $1.00 <- */
  142. { 0x002D, 0x003E, 0x0020, 0x0024, 0x0031, 0x002E, 0x0030, 0x0030, 0x0020,
  143. 0x003C, 0x002D
  144. },
  145. "-> $1.00 <--"
  146. }
  147. };
  148. static int test_punycode(int n)
  149. {
  150. const struct puny_test *tc = puny_cases + n;
  151. unsigned int buffer[50];
  152. unsigned int bsize = OSSL_NELEM(buffer);
  153. size_t i;
  154. if (!TEST_true(ossl_punycode_decode(tc->encoded, strlen(tc->encoded),
  155. buffer, &bsize)))
  156. return 0;
  157. for (i = 0; i < OSSL_NELEM(tc->raw); i++)
  158. if (tc->raw[i] == 0)
  159. break;
  160. if (!TEST_mem_eq(buffer, bsize * sizeof(*buffer),
  161. tc->raw, i * sizeof(*tc->raw)))
  162. return 0;
  163. return 1;
  164. }
  165. static const struct bad_decode_test {
  166. size_t outlen;
  167. const char input[20];
  168. } bad_decode_tests[] = {
  169. { 20, "xn--e-*" }, /* bad digit '*' */
  170. { 10, "xn--e-999" }, /* loop > enc_len */
  171. { 20, "xn--e-999999999" }, /* Too big */
  172. { 20, {'x', 'n', '-', '-', (char)0x80, '-' } }, /* Not basic */
  173. { 20, "xn--e-Oy65t" }, /* codepoint > 0x10FFFF */
  174. };
  175. static int test_a2ulabel_bad_decode(int tst)
  176. {
  177. char out[20];
  178. return TEST_int_eq(ossl_a2ulabel(bad_decode_tests[tst].input, out, bad_decode_tests[tst].outlen), -1);
  179. }
  180. static int test_a2ulabel(void)
  181. {
  182. char out[50];
  183. char in[530] = { 0 };
  184. /*
  185. * The punycode being passed in and parsed is malformed but we're not
  186. * verifying that behaviour here.
  187. */
  188. if (!TEST_int_eq(ossl_a2ulabel("xn--a.b.c", out, 1), 0)
  189. || !TEST_int_eq(ossl_a2ulabel("xn--a.b.c", out, 7), 1))
  190. return 0;
  191. /* Test for an off by one on the buffer size works */
  192. if (!TEST_int_eq(ossl_a2ulabel("xn--a.b.c", out, 6), 0)
  193. || !TEST_int_eq(ossl_a2ulabel("xn--a.b.c", out, 7), 1)
  194. || !TEST_str_eq(out,"\xc2\x80.b.c"))
  195. return 0;
  196. /* Test 4 byte smiley face */
  197. if (!TEST_int_eq(ossl_a2ulabel("xn--e28h.com", out, 10), 1))
  198. return 0;
  199. /* Test that we dont overflow the fixed internal buffer of 512 bytes when the starting bytes are copied */
  200. strcpy(in, "xn--");
  201. memset(in + 4, 'e', 513);
  202. memcpy(in + 517, "-3ya", 4);
  203. if (!TEST_int_eq(ossl_a2ulabel(in, out, 50), -1))
  204. return 0;
  205. return 1;
  206. }
  207. static int test_puny_overrun(void)
  208. {
  209. static const unsigned int out[] = {
  210. 0x0033, 0x5E74, 0x0042, 0x7D44, 0x91D1, 0x516B, 0x5148, 0x751F
  211. };
  212. static const char *in = "3B-ww4c5e180e575a65lsy2b";
  213. unsigned int buf[OSSL_NELEM(out)];
  214. unsigned int bsize = OSSL_NELEM(buf) - 1;
  215. if (!TEST_false(ossl_punycode_decode(in, strlen(in), buf, &bsize))) {
  216. if (TEST_mem_eq(buf, bsize * sizeof(*buf), out, sizeof(out)))
  217. TEST_error("CRITICAL: buffer overrun detected!");
  218. return 0;
  219. }
  220. return 1;
  221. }
  222. static int test_dotted_overflow(void)
  223. {
  224. static const char string[] = "a.a.a.a.a.a.a.a.a.a.a.a.a.a.a.a.a.a.a.a.a.a";
  225. const size_t num_reps = OSSL_NELEM(string) / 2;
  226. WPACKET p;
  227. BUF_MEM *in;
  228. char *out = NULL;
  229. size_t i;
  230. int res = 0;
  231. /* Create out input punycode string */
  232. if (!TEST_ptr(in = BUF_MEM_new()))
  233. return 0;
  234. if (!TEST_true(WPACKET_init_len(&p, in, 0))) {
  235. BUF_MEM_free(in);
  236. return 0;
  237. }
  238. for (i = 0; i < num_reps; i++) {
  239. if (i > 1 && !TEST_true(WPACKET_put_bytes_u8(&p, '.')))
  240. goto err;
  241. if (!TEST_true(WPACKET_memcpy(&p, "xn--a", sizeof("xn--a") - 1)))
  242. goto err;
  243. }
  244. if (!TEST_true(WPACKET_put_bytes_u8(&p, '\0')))
  245. goto err;
  246. if (!TEST_ptr(out = OPENSSL_malloc(in->length)))
  247. goto err;
  248. /* Test the decode into an undersized buffer */
  249. memset(out, 0x7f, in->length - 1);
  250. if (!TEST_int_le(ossl_a2ulabel(in->data, out, num_reps), 0)
  251. || !TEST_int_eq(out[num_reps], 0x7f))
  252. goto err;
  253. /* Test the decode works into a full size buffer */
  254. if (!TEST_int_gt(ossl_a2ulabel(in->data, out, in->length), 0)
  255. || !TEST_size_t_eq(strlen(out), num_reps * 3))
  256. goto err;
  257. res = 1;
  258. err:
  259. WPACKET_cleanup(&p);
  260. BUF_MEM_free(in);
  261. OPENSSL_free(out);
  262. return res;
  263. }
  264. int setup_tests(void)
  265. {
  266. ADD_ALL_TESTS(test_punycode, OSSL_NELEM(puny_cases));
  267. ADD_TEST(test_dotted_overflow);
  268. ADD_TEST(test_a2ulabel);
  269. ADD_TEST(test_puny_overrun);
  270. ADD_ALL_TESTS(test_a2ulabel_bad_decode, OSSL_NELEM(bad_decode_tests));
  271. return 1;
  272. }