root/maint/gnulib/tests/test-strstr.c

/* [previous][next][first][last][top][bottom][index][help] */

DEFINITIONS

This source file includes following definitions.
  1. main

   1 /*
   2  * Copyright (C) 2004, 2007-2021 Free Software Foundation, Inc.
   3  * Written by Bruno Haible and Eric Blake
   4  *
   5  * This program is free software: you can redistribute it and/or modify
   6  * it under the terms of the GNU General Public License as published by
   7  * the Free Software Foundation; either version 3 of the License, or
   8  * (at your option) any later version.
   9  *
  10  * This program is distributed in the hope that it will be useful,
  11  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  13  * GNU General Public License for more details.
  14  *
  15  * You should have received a copy of the GNU General Public License
  16  * along with this program.  If not, see <https://www.gnu.org/licenses/>.  */
  17 
  18 #include <config.h>
  19 
  20 #include <string.h>
  21 
  22 #include "signature.h"
  23 SIGNATURE_CHECK (strstr, char *, (char const *, char const *));
  24 
  25 #include <signal.h>
  26 #include <stdlib.h>
  27 #include <unistd.h>
  28 
  29 #include "zerosize-ptr.h"
  30 #include "macros.h"
  31 
  32 int
  33 main (int argc, char *argv[])
     /* [previous][next][first][last][top][bottom][index][help] */
  34 {
  35 #if HAVE_DECL_ALARM
  36   /* Declare failure if test takes too long, by using default abort
  37      caused by SIGALRM.  All known platforms that lack alarm also have
  38      a quadratic strstr, and the replacement strstr is known to not
  39      take too long.  */
  40   int alarm_value = 50;
  41   signal (SIGALRM, SIG_DFL);
  42   alarm (alarm_value);
  43 #endif
  44 
  45   {
  46     const char input[] = "foo";
  47     const char *result = strstr (input, "");
  48     ASSERT (result == input);
  49   }
  50 
  51   {
  52     const char input[] = "foo";
  53     const char *result = strstr (input, "o");
  54     ASSERT (result == input + 1);
  55   }
  56 
  57   {
  58     /* On some platforms, the memchr() functions reads past the first
  59        occurrence of the byte to be searched, leading to an out-of-bounds
  60        read access for strstr().
  61        See <https://bugs.debian.org/cgi-bin/bugreport.cgi?bug=521737>.
  62        This is a bug in memchr(), see the Austin Group's clarification
  63        <https://www.opengroup.org/austin/docs/austin_454.txt>.  */
  64     const char *fix = "aBaaaaaaaaaaax";
  65     char *page_boundary = (char *) zerosize_ptr ();
  66     size_t len = strlen (fix) + 1;
  67     char *input = page_boundary ? page_boundary - len : malloc (len);
  68     const char *result;
  69 
  70     strcpy (input, fix);
  71     result = strstr (input, "B1x");
  72     ASSERT (result == NULL);
  73     if (!page_boundary)
  74       free (input);
  75   }
  76 
  77   {
  78     const char input[] = "ABC ABCDAB ABCDABCDABDE";
  79     const char *result = strstr (input, "ABCDABD");
  80     ASSERT (result == input + 15);
  81   }
  82 
  83   {
  84     const char input[] = "ABC ABCDAB ABCDABCDABDE";
  85     const char *result = strstr (input, "ABCDABE");
  86     ASSERT (result == NULL);
  87   }
  88 
  89   {
  90     const char input[] = "ABC ABCDAB ABCDABCDABDE";
  91     const char *result = strstr (input, "ABCDABCD");
  92     ASSERT (result == input + 11);
  93   }
  94 
  95   /* Check that a long periodic needle does not cause false positives.  */
  96   {
  97     const char input[] = "F_BD_CE_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD"
  98                          "_C3_88_20_EF_BF_BD_EF_BF_BD_EF_BF_BD"
  99                          "_C3_A7_20_EF_BF_BD";
 100     const char need[] = "_EF_BF_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD";
 101     const char *result = strstr (input, need);
 102     ASSERT (result == NULL);
 103   }
 104   {
 105     const char input[] = "F_BD_CE_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD"
 106                          "_C3_88_20_EF_BF_BD_EF_BF_BD_EF_BF_BD"
 107                          "_C3_A7_20_EF_BF_BD_DA_B5_C2_A6_20"
 108                          "_EF_BF_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD";
 109     const char need[] = "_EF_BF_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD_EF_BF_BD";
 110     const char *result = strstr (input, need);
 111     ASSERT (result == input + 115);
 112   }
 113 
 114   /* Check that a very long haystack is handled quickly if the needle is
 115      short and occurs near the beginning.  */
 116   {
 117     size_t repeat = 10000;
 118     size_t m = 1000000;
 119     const char *needle =
 120       "AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA"
 121       "AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA";
 122     char *haystack = (char *) malloc (m + 1);
 123     if (haystack != NULL)
 124       {
 125         memset (haystack, 'A', m);
 126         haystack[0] = 'B';
 127         haystack[m] = '\0';
 128 
 129         for (; repeat > 0; repeat--)
 130           {
 131             ASSERT (strstr (haystack, needle) == haystack + 1);
 132           }
 133 
 134         free (haystack);
 135       }
 136   }
 137 
 138   /* Check that a very long needle is discarded quickly if the haystack is
 139      short.  */
 140   {
 141     size_t repeat = 10000;
 142     size_t m = 1000000;
 143     const char *haystack =
 144       "AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA"
 145       "ABABABABABABABABABABABABABABABABABABABABABABABABABABABABABABABABABAB";
 146     char *needle = (char *) malloc (m + 1);
 147     if (needle != NULL)
 148       {
 149         memset (needle, 'A', m);
 150         needle[m] = '\0';
 151 
 152         for (; repeat > 0; repeat--)
 153           {
 154             ASSERT (strstr (haystack, needle) == NULL);
 155           }
 156 
 157         free (needle);
 158       }
 159   }
 160 
 161   /* Check that the asymptotic worst-case complexity is not quadratic.  */
 162   {
 163     size_t m = 1000000;
 164     char *haystack = (char *) malloc (2 * m + 2);
 165     char *needle = (char *) malloc (m + 2);
 166     if (haystack != NULL && needle != NULL)
 167       {
 168         const char *result;
 169 
 170         memset (haystack, 'A', 2 * m);
 171         haystack[2 * m] = 'B';
 172         haystack[2 * m + 1] = '\0';
 173 
 174         memset (needle, 'A', m);
 175         needle[m] = 'B';
 176         needle[m + 1] = '\0';
 177 
 178         result = strstr (haystack, needle);
 179         ASSERT (result == haystack + m);
 180       }
 181     free (needle);
 182     free (haystack);
 183   }
 184 
 185   /* Sublinear speed is only possible in memmem; strstr must examine
 186      every character of haystack to find its length.  */
 187 
 188 
 189   {
 190     /* Ensure that with a barely periodic "short" needle, strstr's
 191        search does not mistakenly skip just past the match point.
 192        This use of strstr would mistakenly return NULL before
 193        gnulib v0.0-4927.  */
 194     const char *haystack =
 195       "\n"
 196       "with_build_libsubdir\n"
 197       "with_local_prefix\n"
 198       "with_gxx_include_dir\n"
 199       "with_cpp_install_dir\n"
 200       "enable_generated_files_in_srcdir\n"
 201       "with_gnu_ld\n"
 202       "with_ld\n"
 203       "with_demangler_in_ld\n"
 204       "with_gnu_as\n"
 205       "with_as\n"
 206       "enable_largefile\n"
 207       "enable_werror_always\n"
 208       "enable_checking\n"
 209       "enable_coverage\n"
 210       "enable_gather_detailed_mem_stats\n"
 211       "enable_build_with_cxx\n"
 212       "with_stabs\n"
 213       "enable_multilib\n"
 214       "enable___cxa_atexit\n"
 215       "enable_decimal_float\n"
 216       "enable_fixed_point\n"
 217       "enable_threads\n"
 218       "enable_tls\n"
 219       "enable_objc_gc\n"
 220       "with_dwarf2\n"
 221       "enable_shared\n"
 222       "with_build_sysroot\n"
 223       "with_sysroot\n"
 224       "with_specs\n"
 225       "with_pkgversion\n"
 226       "with_bugurl\n"
 227       "enable_languages\n"
 228       "with_multilib_list\n";
 229     const char *needle = "\n"
 230       "with_gnu_ld\n";
 231     const char* p = strstr (haystack, needle);
 232     ASSERT (p - haystack == 114);
 233   }
 234 
 235   {
 236     /* Same bug, shorter trigger.  */
 237     const char *haystack = "..wi.d.";
 238     const char *needle = ".d.";
 239     const char* p = strstr (haystack, needle);
 240     ASSERT (p - haystack == 4);
 241   }
 242 
 243   {
 244     /* Like the above, but trigger the flaw in two_way_long_needle
 245        by using a needle of length LONG_NEEDLE_THRESHOLD (32) or greater.
 246        Rather than trying to find the right alignment manually, I've
 247        arbitrarily chosen the following needle and template for the
 248        haystack, and ensure that for each placement of the needle in
 249        that haystack, strstr finds it.  */
 250     const char *needle = "\nwith_gnu_ld-extend-to-len-32-b\n";
 251     const char *h =
 252       "\n"
 253       "with_build_libsubdir\n"
 254       "with_local_prefix\n"
 255       "with_gxx_include_dir\n"
 256       "with_cpp_install_dir\n"
 257       "with_e_\n"
 258       "..............................\n"
 259       "with_FGHIJKLMNOPQRSTUVWXYZ\n"
 260       "with_567890123456789\n"
 261       "with_multilib_list\n";
 262     size_t h_len = strlen (h);
 263     char *haystack = malloc (h_len + 1);
 264     size_t i;
 265     ASSERT (haystack);
 266     for (i = 0; i < h_len - strlen (needle); i++)
 267       {
 268         const char *p;
 269         memcpy (haystack, h, h_len + 1);
 270         memcpy (haystack + i, needle, strlen (needle) + 1);
 271         p = strstr (haystack, needle);
 272         ASSERT (p);
 273         ASSERT (p - haystack == i);
 274       }
 275     free (haystack);
 276   }
 277 
 278   /* Test long needles.  */
 279   {
 280     size_t m = 1024;
 281     char *haystack = (char *) malloc (2 * m + 1);
 282     char *needle = (char *) malloc (m + 1);
 283     if (haystack != NULL && needle != NULL)
 284       {
 285         const char *p;
 286         haystack[0] = 'x';
 287         memset (haystack + 1, ' ', m - 1);
 288         memset (haystack + m, 'x', m);
 289         haystack[2 * m] = '\0';
 290         memset (needle, 'x', m);
 291         needle[m] = '\0';
 292         p = strstr (haystack, needle);
 293         ASSERT (p);
 294         ASSERT (p - haystack == m);
 295       }
 296     free (needle);
 297     free (haystack);
 298   }
 299 
 300   return 0;
 301 }

/* [previous][next][first][last][top][bottom][index][help] */