test-strcmp.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523
  1. /* Test and measure strcmp and wcscmp functions.
  2. Copyright (C) 1999-2026 Free Software Foundation, Inc.
  3. This file is part of the GNU C Library.
  4. The GNU C Library is free software; you can redistribute it and/or
  5. modify it under the terms of the GNU Lesser General Public
  6. License as published by the Free Software Foundation; either
  7. version 2.1 of the License, or (at your option) any later version.
  8. The GNU C Library is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  11. Lesser General Public License for more details.
  12. You should have received a copy of the GNU Lesser General Public
  13. License along with the GNU C Library; if not, see
  14. <https://www.gnu.org/licenses/>. */
  /* Upper bound, in characters, for the page-crossing length sweep in
     test_main: three system pages.  */
  #define TEST_LEN (getpagesize () * 3)
  /* Defined before test-string.h is included; presumably read there to size
     the test buffers -- TODO confirm against test-string.h.  */
  #define MIN_PAGE_SIZE (TEST_LEN + 2 * getpagesize ())
  /* Defined before test-string.h is included; presumably selects the parts
     of that header meant for the main test file -- TODO confirm.  */
  #define TEST_MAIN
  /* Name of the function under test: wcscmp when built with WIDE defined,
     strcmp otherwise.  */
  #ifdef WIDE
  # define TEST_NAME "wcscmp"
  #else
  # define TEST_NAME "strcmp"
  #endif
  #include "test-string.h"
  #include <support/test-driver.h>
  #ifdef WIDE
  /* Wide-character build: map the generic names used by the tests below
     onto the wchar_t functions and types.  */
  # include <wchar.h>
  /* Turn a narrow string literal into a wide one.  */
  # define L(str) L##str
  # define STRCMP wcscmp
  # define STRCPY wcscpy
  # define STRLEN wcslen
  # define MEMCPY wmemcpy
  # define SIMPLE_STRCMP simple_wcscmp
  # define CHAR wchar_t
  # define UCHAR wchar_t
  /* Size of one character in bytes and its base-2 logarithm.
     NOTE(review): hard-codes a four-byte wchar_t -- confirm for the
     target.  */
  # define CHARBYTES 4
  # define CHARBYTESLOG 2
  # define CHARALIGN __alignof__ (CHAR)
  /* Values passed as the max_char argument of do_test.  */
  # define MIDCHAR 0x7fffffff
  # define LARGECHAR 0xfffffffe
  /* Extreme values of CHAR, stored into the strings by check.  */
  # define CHAR__MAX WCHAR_MAX
  # define CHAR__MIN WCHAR_MIN
  /* Reference wcscmp used to compute expected results.  Characters are
     compared as wchar_t values, i.e. with the signedness of wchar_t itself
     rather than after conversion to an unsigned type.  The result is always
     derived from relational comparisons and never from a subtraction: the
     difference of two wchar_t values can overflow, and when wchar_t is
     unsigned it cannot be converted to int without risking the wrong sign.
     Returns 0 if the strings are equal, -1 if S1 sorts before S2 and 1 if
     S1 sorts after S2.  */
  int
  simple_wcscmp (const wchar_t *s1, const wchar_t *s2)
  {
    wchar_t c1, c2;

    do
      {
        c1 = *s1++;
        c2 = *s2++;
        if (c2 == L'\0')
          /* S2 has ended: the strings are equal if S1 ended as well,
             otherwise C1 is ordered against the terminator.  */
          return (c1 > c2) - (c1 < c2);
      }
    while (c1 == c2);

    return c1 < c2 ? -1 : 1;
  }
  #else
  /* Narrow-character build: map the generic names used by the tests below
     onto the char functions and types.  */
  # include <limits.h>
  /* String literals are used unchanged.  */
  # define L(str) str
  # define STRCMP strcmp
  # define STRCPY strcpy
  # define STRLEN strlen
  # define MEMCPY memcpy
  # define SIMPLE_STRCMP simple_strcmp
  # define CHAR char
  # define UCHAR unsigned char
  /* Size of one character in bytes and its base-2 logarithm.  */
  # define CHARBYTES 1
  # define CHARBYTESLOG 0
  # define CHARALIGN 1
  /* Values passed as the max_char argument of do_test.  */
  # define MIDCHAR 0x7f
  # define LARGECHAR 0xfe
  /* Extreme values of CHAR, stored into the strings by check.  */
  # define CHAR__MAX CHAR_MAX
  # define CHAR__MIN CHAR_MIN
  /* Reference strcmp used to compute expected results.  Bytes are compared
     as unsigned char, which is the semantics strcmp uses.  Returns the
     difference between the first pair of differing bytes (the byte of S1
     minus the byte of S2), or 0 when both strings end without a
     difference.  */
  int
  simple_strcmp (const char *s1, const char *s2)
  {
    /* Keep the const qualifier when viewing the bytes as unsigned.  */
    const unsigned char *p1 = (const unsigned char *) s1;
    const unsigned char *p2 = (const unsigned char *) s2;

    for (;; ++p1, ++p2)
      {
        int diff = *p1 - *p2;

        /* Stop at the first mismatch, or at the common terminator, in
           which case DIFF is 0.  */
        if (diff != 0 || *p1 == '\0')
          return diff;
      }
  }
  #endif
  /* Signature shared by every implementation under test.  */
  typedef int (*proto_t) (const CHAR *, const CHAR *);
  /* Register the library function selected above (strcmp or wcscmp).  */
  IMPL (STRCMP, 1)
  /* Also check the default implementation.  */
  #undef STRCMP
  /* Redefine the symbol-management macros so that they expand to nothing
     while the implementation source is included below.  */
  #undef libc_hidden_builtin_def
  #define libc_hidden_builtin_def(a)
  #undef libc_hidden_def
  #define libc_hidden_def(a)
  #undef weak_alias
  #define weak_alias(a, b)
  #undef attribute_hidden
  #define attribute_hidden
  /* Include the C source of the function directly.  Presumably the included
     file defines its function under the name STRCMP (or WCSCMP), so that it
     is compiled here as __strcmp_default (or __wcscmp_default) -- TODO
     confirm against the included sources.  */
  #ifndef WIDE
  # define STRCMP __strcmp_default
  # include "string/strcmp.c"
  # define STRCMP_DEFAULT STRCMP
  #else
  # define WCSCMP __wcscmp_default
  # include "wcsmbs/wcscmp.c"
  # define STRCMP_DEFAULT WCSCMP
  #endif
  /* Register the copy included above as a second implementation.  */
  IMPL (STRCMP_DEFAULT, 1)
  106. static int
  107. check_result (impl_t *impl,
  108. const CHAR *s1, const CHAR *s2,
  109. int exp_result)
  110. {
  111. int result = CALL (impl, s1, s2);
  112. if ((exp_result == 0 && result != 0)
  113. || (exp_result < 0 && result >= 0)
  114. || (exp_result > 0 && result <= 0))
  115. {
  116. error (0, 0, "Wrong result in function %s %d %d", impl->name,
  117. result, exp_result);
  118. ret = 1;
  119. return -1;
  120. }
  121. return 0;
  122. }
  123. static void
  124. do_one_test (impl_t *impl,
  125. const CHAR *s1, const CHAR *s2,
  126. int exp_result)
  127. {
  128. if (check_result (impl, s1, s2, exp_result) < 0)
  129. return;
  130. }
  131. static void
  132. do_test (size_t align1, size_t align2, size_t len, int max_char,
  133. int exp_result)
  134. {
  135. size_t i;
  136. CHAR *s1, *s2;
  137. if (len == 0)
  138. return;
  139. align1 &= ~(CHARBYTES - 1);
  140. align2 &= ~(CHARBYTES - 1);
  141. align1 &= getpagesize () - 1;
  142. if (align1 + (len + 1) * CHARBYTES >= page_size)
  143. return;
  144. align2 &= getpagesize () - 1;
  145. if (align2 + (len + 1) * CHARBYTES >= page_size)
  146. return;
  147. /* Put them close to the end of page. */
  148. i = align1 + CHARBYTES * (len + 2);
  149. s1 = (CHAR *)(buf1 + ((page_size - i) / 16 * 16) + align1);
  150. i = align2 + CHARBYTES * (len + 2);
  151. s2 = (CHAR *)(buf2 + ((page_size - i) / 16 * 16) + align2);
  152. for (i = 0; i < len; i++)
  153. s1[i] = s2[i] = 1 + (23 << ((CHARBYTES - 1) * 8)) * i % max_char;
  154. s1[len] = s2[len] = 0;
  155. s1[len + 1] = 23;
  156. s2[len + 1] = 24 + exp_result;
  157. s2[len - 1] -= exp_result;
  158. FOR_EACH_IMPL (impl, 0)
  159. do_one_test (impl, s1, s2, exp_result);
  160. }
  161. static void
  162. do_random_tests (void)
  163. {
  164. UCHAR *p1 = (UCHAR *) (buf1 + page_size - 512 * CHARBYTES);
  165. UCHAR *p2 = (UCHAR *) (buf2 + page_size - 512 * CHARBYTES);
  166. for (size_t n = 0; n < ITERATIONS; n++)
  167. {
  168. /* for wcscmp case align1 and align2 mean here alignment
  169. in wchar_t symbols, it equal 4*k alignment in bytes, we
  170. don't check other alignments like for example
  171. p1 = (wchar_t *)(buf1 + 1)
  172. because it's wrong using of wchar_t type. */
  173. size_t align1 = random () & 31;
  174. size_t align2;
  175. if (random () & 1)
  176. align2 = random () & 31;
  177. else
  178. align2 = align1 + (random () & 24);
  179. size_t pos = random () & 511;
  180. size_t j = align1 > align2 ? align1 : align2;
  181. if (pos + j >= 511)
  182. pos = 510 - j - (random () & 7);
  183. size_t len1 = random () & 511;
  184. if (pos >= len1 && (random () & 1))
  185. len1 = pos + (random () & 7);
  186. if (len1 + j >= 512)
  187. len1 = 511 - j - (random () & 7);
  188. size_t len2;
  189. if (pos >= len1)
  190. len2 = len1;
  191. else
  192. len2 = len1 + (len1 != 511 - j ? random () % (511 - j - len1) : 0);
  193. j = (pos > len2 ? pos : len2) + align1 + 64;
  194. if (j > 512)
  195. j = 512;
  196. for (size_t i = 0; i < j; ++i)
  197. {
  198. p1[i] = random () & 255;
  199. if (i < len1 + align1 && !p1[i])
  200. {
  201. p1[i] = random () & 255;
  202. if (!p1[i])
  203. p1[i] = 1 + (random () & 127);
  204. }
  205. }
  206. for (size_t i = 0; i < j; ++i)
  207. {
  208. p2[i] = random () & 255;
  209. if (i < len2 + align2 && !p2[i])
  210. {
  211. p2[i] = random () & 255;
  212. if (!p2[i])
  213. p2[i] = 1 + (random () & 127);
  214. }
  215. }
  216. int result = 0;
  217. MEMCPY (p2 + align2, p1 + align1, pos);
  218. if (pos < len1)
  219. {
  220. if (p2[align2 + pos] == p1[align1 + pos])
  221. {
  222. p2[align2 + pos] = random () & 255;
  223. if (p2[align2 + pos] == p1[align1 + pos])
  224. p2[align2 + pos] = p1[align1 + pos] + 3 + (random () & 127);
  225. }
  226. if (p1[align1 + pos] < p2[align2 + pos])
  227. result = -1;
  228. else
  229. result = 1;
  230. }
  231. p1[len1 + align1] = 0;
  232. p2[len2 + align2] = 0;
  233. FOR_EACH_IMPL (impl, 1)
  234. {
  235. int r = CALL (impl, (CHAR *) (p1 + align1), (CHAR *) (p2 + align2));
  236. /* Test whether on 64-bit architectures where ABI requires
  237. callee to promote has the promotion been done. */
  238. asm ("" : "=g" (r) : "0" (r));
  239. if ((r == 0 && result)
  240. || (r < 0 && result >= 0)
  241. || (r > 0 && result <= 0))
  242. {
  243. error (0, 0, "Iteration %zd - wrong result in function %s (align in bytes: %zd, align in bytes: %zd, len1: %zd, len2: %zd, pos: %zd) %d != %d, p1 %p p2 %p",
  244. n, impl->name, (size_t) (p1 + align1) & 63, (size_t) (p1 + align2) & 63, len1, len2, pos, r, result, p1, p2);
  245. ret = 1;
  246. }
  247. }
  248. }
  249. }
  250. static void
  251. check (void)
  252. {
  253. CHAR *s1 = (CHAR *) (buf1 + 0xb2c);
  254. CHAR *s2 = (CHAR *) (buf1 + 0xfd8);
  255. STRCPY(s1, L("abcdefghijklmnopqrstuvwxyzabcdefghijklmnopqrstuvwxyzabcdefghijklmnopqrs"));
  256. STRCPY(s2, L("abcdefghijklmnopqrstuvwxyzabcdefghijklmnopqrstuvwxyzabcdefghijkLMNOPQRSTUV"));
  257. /* Check correct working for negatives values */
  258. s1[0] = 1;
  259. s2[0] = 1;
  260. s1[1] = 1;
  261. s2[1] = 1;
  262. s1[2] = -1;
  263. s2[2] = 3;
  264. s1[3] = 0;
  265. s2[3] = -1;
  266. /* Check possible overflow bug, actual more for wcscmp */
  267. s1[7] = CHAR__MIN;
  268. s2[7] = CHAR__MAX;
  269. size_t l1 = STRLEN (s1);
  270. size_t l2 = STRLEN (s2);
  271. for (size_t i1 = 0; i1 < l1; i1++)
  272. for (size_t i2 = 0; i2 < l2; i2++)
  273. {
  274. int exp_result = SIMPLE_STRCMP (s1 + i1, s2 + i2);
  275. FOR_EACH_IMPL (impl, 0)
  276. check_result (impl, s1 + i1, s2 + i2, exp_result);
  277. }
  278. /* Test cases where there are multiple zero bytes after the first. */
  279. for (size_t i = 0; i < 16 + 1; i++)
  280. {
  281. s1[i] = 0x00;
  282. s2[i] = 0x00;
  283. }
  284. for (size_t i = 0; i < 16; i++)
  285. {
  286. int exp_result;
  287. for (int val = 0x01; val < 0x100; val++)
  288. {
  289. for (size_t j = 0; j < i; j++)
  290. {
  291. s1[j] = val;
  292. s2[j] = val;
  293. }
  294. s2[i] = val;
  295. exp_result = SIMPLE_STRCMP (s1, s2);
  296. FOR_EACH_IMPL (impl, 0)
  297. check_result (impl, s1, s2, exp_result);
  298. }
  299. }
  300. }
  301. static void
  302. check2 (void)
  303. {
  304. /* To trigger bug 25933, we need a size that is equal to the vector
  305. length times 4. In the case of AVX2 for Intel, we need 32 * 4. We
  306. make this test generic and run it for all architectures as additional
  307. boundary testing for such related algorithms. */
  308. size_t size = 32 * 4;
  309. CHAR *s1 = (CHAR *) (buf1 + (BUF1PAGES - 1) * page_size);
  310. CHAR *s2 = (CHAR *) (buf2 + (BUF1PAGES - 1) * page_size);
  311. int exp_result;
  312. memset (s1, 'a', page_size);
  313. memset (s2, 'a', page_size);
  314. s1[(page_size / CHARBYTES) - 1] = (CHAR) 0;
  315. s2[(page_size / CHARBYTES) - 1] = (CHAR) 0;
  316. /* Iterate over a size that is just below where we expect the bug to
  317. trigger up to the size we expect will trigger the bug e.g. [99-128].
  318. Likewise iterate the start of two strings between 30 and 31 bytes
  319. away from the boundary to simulate alignment changes. */
  320. for (size_t s = 99; s <= size; s++)
  321. for (size_t s1a = 30; s1a < 32; s1a++)
  322. for (size_t s2a = 30; s2a < 32; s2a++)
  323. {
  324. CHAR *s1p = s1 + (page_size / CHARBYTES - s) - s1a;
  325. CHAR *s2p = s2 + (page_size / CHARBYTES - s) - s2a;
  326. exp_result = SIMPLE_STRCMP (s1p, s2p);
  327. FOR_EACH_IMPL (impl, 0)
  328. check_result (impl, s1p, s2p, exp_result);
  329. }
  330. }
  331. static void
  332. check3 (void)
  333. {
  334. size_t size = 0xd000 + 0x4000;
  335. CHAR *s1, *s2;
  336. CHAR *buffer1 = mmap (NULL, size, PROT_READ | PROT_WRITE,
  337. MAP_PRIVATE | MAP_ANON, -1, 0);
  338. CHAR *buffer2 = mmap (NULL, size, PROT_READ | PROT_WRITE,
  339. MAP_PRIVATE | MAP_ANON, -1, 0);
  340. if (buffer1 == MAP_FAILED || buffer1 == MAP_FAILED)
  341. error (EXIT_UNSUPPORTED, errno, "mmap failed");
  342. s1 = (CHAR *) (buffer1 + 0x8f8 / sizeof (CHAR));
  343. s2 = (CHAR *) (buffer2 + 0xcff3 / sizeof (CHAR));
  344. STRCPY(s1, L("/export/redhat/rpms/BUILD/java-1.8.0-openjdk-1.8.0.312.b07-2.fc35.x86_64/openjdk/langtools/src/share/classes/com/sun/tools/doclets/internal/toolkit/util/PathDocFileFactory.java"));
  345. STRCPY(s2, L("/export/redhat/rpms/BUILD/java-1.8.0-openjdk-1.8.0.312.b07-2.fc35.x86_64/openjdk/langtools/src/share/classes/com/sun/tools/doclets/internal/toolkit/taglets/ThrowsTaglet.java"));
  346. int exp_result = SIMPLE_STRCMP (s1, s2);
  347. FOR_EACH_IMPL (impl, 0)
  348. check_result (impl, s1, s2, exp_result);
  349. munmap ((void *) buffer1, size);
  350. munmap ((void *) buffer2, size);
  351. }
  352. int
  353. test_main (void)
  354. {
  355. size_t i, j, k;
  356. const size_t test_len = MIN(TEST_LEN, 3 * 4096);
  357. test_init ();
  358. check();
  359. check2 ();
  360. check3 ();
  361. printf ("%23s", "");
  362. FOR_EACH_IMPL (impl, 0)
  363. printf ("\t%s", impl->name);
  364. putchar ('\n');
  365. for (i = 1; i < 32; ++i)
  366. {
  367. do_test (CHARBYTES * i, CHARBYTES * i, i, MIDCHAR, 0);
  368. do_test (CHARBYTES * i, CHARBYTES * i, i, MIDCHAR, 1);
  369. do_test (CHARBYTES * i, CHARBYTES * i, i, MIDCHAR, -1);
  370. }
  371. for (i = 1; i < 10 + CHARBYTESLOG; ++i)
  372. {
  373. do_test (0, 0, 2 << i, MIDCHAR, 0);
  374. do_test (0, 0, 2 << i, LARGECHAR, 0);
  375. do_test (0, 0, 2 << i, MIDCHAR, 1);
  376. do_test (0, 0, 2 << i, LARGECHAR, 1);
  377. do_test (0, 0, 2 << i, MIDCHAR, -1);
  378. do_test (0, 0, 2 << i, LARGECHAR, -1);
  379. do_test (0, CHARBYTES * i, 2 << i, MIDCHAR, 1);
  380. do_test (CHARBYTES * i, CHARBYTES * (i + 1), 2 << i, LARGECHAR, 1);
  381. }
  382. for (i = 1; i < 8; ++i)
  383. {
  384. do_test (CHARBYTES * i, 2 * CHARBYTES * i, 8 << i, MIDCHAR, 0);
  385. do_test (2 * CHARBYTES * i, CHARBYTES * i, 8 << i, LARGECHAR, 0);
  386. do_test (CHARBYTES * i, 2 * CHARBYTES * i, 8 << i, MIDCHAR, 1);
  387. do_test (2 * CHARBYTES * i, CHARBYTES * i, 8 << i, LARGECHAR, 1);
  388. do_test (CHARBYTES * i, 2 * CHARBYTES * i, 8 << i, MIDCHAR, -1);
  389. do_test (2 * CHARBYTES * i, CHARBYTES * i, 8 << i, LARGECHAR, -1);
  390. }
  391. for (j = 0; j < 160; ++j)
  392. {
  393. for (i = 0; i < test_len;)
  394. {
  395. do_test (getpagesize () - j - 1, 0, i, 127, 0);
  396. do_test (getpagesize () - j - 1, 0, i, 127, 1);
  397. do_test (getpagesize () - j - 1, 0, i, 127, -1);
  398. do_test (getpagesize () - j - 1, j, i, 127, 0);
  399. do_test (getpagesize () - j - 1, j, i, 127, 1);
  400. do_test (getpagesize () - j - 1, j, i, 127, -1);
  401. do_test (0, getpagesize () - j - 1, i, 127, 0);
  402. do_test (0, getpagesize () - j - 1, i, 127, 1);
  403. do_test (0, getpagesize () - j - 1, i, 127, -1);
  404. do_test (j, getpagesize () - j - 1, i, 127, 0);
  405. do_test (j, getpagesize () - j - 1, i, 127, 1);
  406. do_test (j, getpagesize () - j - 1, i, 127, -1);
  407. for (k = 2; k <= 128; k += k)
  408. {
  409. do_test (getpagesize () - k, getpagesize () - j - 1, i, 127, 0);
  410. do_test (getpagesize () - k - 1, getpagesize () - j - 1, i, 127,
  411. 0);
  412. do_test (getpagesize () - k, getpagesize () - j - 1, i, 127, 1);
  413. do_test (getpagesize () - k - 1, getpagesize () - j - 1, i, 127,
  414. 1);
  415. do_test (getpagesize () - k, getpagesize () - j - 1, i, 127, -1);
  416. do_test (getpagesize () - k - 1, getpagesize () - j - 1, i, 127,
  417. -1);
  418. }
  419. if (i < 32)
  420. {
  421. i += 1;
  422. }
  423. else if (i < 161)
  424. {
  425. i += 7;
  426. }
  427. else if (i + 161 < test_len)
  428. {
  429. i += 31;
  430. i *= 17;
  431. i /= 16;
  432. if (i + 161 > test_len)
  433. {
  434. i = test_len - 160;
  435. }
  436. }
  437. else if (i + 32 < test_len)
  438. {
  439. i += 7;
  440. }
  441. else
  442. {
  443. i += 1;
  444. }
  445. }
  446. }
  447. do_random_tests ();
  448. return ret;
  449. }
  450. #include <support/test-driver.c>