gnulib/import/memchr.c

/* Copyright (C) 1991, 1993, 1996-1997, 1999-2000, 2003-2004, 2006, 2008-2022
   Free Software Foundation, Inc.

   Based on strlen implementation by Torbjorn Granlund (tege@sics.se),
   with help from Dan Sahlin (dan@sics.se) and
   commentary by Jim Blandy (jimb@ai.mit.edu);
   adaptation to memchr suggested by Dick Karpinski (dick@cca.ucsf.edu),
   and implemented by Roland McGrath (roland@ai.mit.edu).

   NOTE: The canonical source of this file is maintained with the GNU C Library.
   Bugs can be reported to bug-glibc@prep.ai.mit.edu.

   This file is free software: you can redistribute it and/or modify
   it under the terms of the GNU Lesser General Public License as
   published by the Free Software Foundation; either version 2.1 of the
   License, or (at your option) any later version.

   This file is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public License
   along with this program.  If not, see <https://www.gnu.org/licenses/>.  */
8dffb485Schristos
8dffb485Schristos#ifndef _LIBC
8dffb485Schristos# include <config.h>
8dffb485Schristos#endif
8dffb485Schristos
8dffb485Schristos#include <string.h>
8dffb485Schristos
8dffb485Schristos#include <stddef.h>
8dffb485Schristos
8dffb485Schristos#if defined _LIBC
8dffb485Schristos# include <memcopy.h>
8dffb485Schristos#else
8dffb485Schristos# define reg_char char
8dffb485Schristos#endif
8dffb485Schristos
8dffb485Schristos#include <limits.h>
8dffb485Schristos
8dffb485Schristos#if HAVE_BP_SYM_H || defined _LIBC
8dffb485Schristos# include <bp-sym.h>
8dffb485Schristos#else
8dffb485Schristos# define BP_SYM(sym) sym
8dffb485Schristos#endif
8dffb485Schristos
8dffb485Schristos#undef __memchr
8dffb485Schristos#ifdef _LIBC
8dffb485Schristos# undef memchr
8dffb485Schristos#endif
8dffb485Schristos
8dffb485Schristos#ifndef weak_alias
8dffb485Schristos# define __memchr memchr
8dffb485Schristos#endif
8dffb485Schristos
/* Scan the first N bytes of the object at S for the byte value C_IN
   (converted to unsigned char).  Return a pointer to the first matching
   byte, or NULL if none of the N bytes matches.  */
void *
__memchr (void const *s, int c_in, size_t n)
{
  /* Unit of the word-at-a-time scan.  On 32-bit hardware a 32-bit
     unsigned long tends to perform better than a 64-bit uintmax_t; on
     64-bit hardware unsigned long is generally 64 bits wide already.
     Substitute another unsigned type here to experiment with
     performance.  */
  typedef unsigned long int longword;

  const unsigned char *byte_p = (const unsigned char *) s;
  const longword *word_p;
  longword ones;       /* 0x01 replicated into every byte.  */
  longword needle;     /* The wanted byte replicated into every byte.  */
  longword high_bits;  /* 0x80 replicated into every byte.  */
  unsigned reg_char c = (unsigned char) c_in;

  /* Prologue: compare one byte at a time until BYTE_P sits on a
     longword boundary, or until the N bytes are used up.  */
  while (n > 0 && (size_t) byte_p % sizeof (longword) != 0)
    {
      if (*byte_p == c)
        return (void *) byte_p;
      ++byte_p;
      --n;
    }

  /* Build the replicated constants.  Start with the 32-bit patterns,
     then keep doubling their width until the whole longword is filled.
     The "<< 31 << 1" spelling is used instead of "<< 32" so that the
     shift count stays below the type's width when longword has only
     32 bits (that branch is dead there, but must still be valid).  */
  ones = 0x01010101;
  needle = c | (c << 8);
  needle |= needle << 16;
  if (0xffffffffU < (longword) -1)
    {
      ones |= ones << 31 << 1;
      needle |= needle << 31 << 1;
      if (8 < sizeof (longword))
        {
          size_t shift;

          for (shift = 64; shift < sizeof (longword) * 8; shift *= 2)
            {
              ones |= ones << shift;
              needle |= needle << shift;
            }
        }
    }
  high_bits = ones << 7;

  /* Main scan, one longword per step.

     Let X = *WORD_P ^ NEEDLE.  A byte of X is zero exactly where the
     corresponding byte of *WORD_P equals C, so the question becomes
     "does X contain a zero byte?".  That is answered by

         (X - ONES) & ~X & HIGH_BITS

     which is nonzero if and only if X has a zero byte:

       - Take a nonzero byte of X whose lowest set bit is bit k
         (0 <= k <= 7), and suppose no borrow reaches it from below.
         Subtracting 1 clears bit k and sets bits 0..k-1; and-ing with
         the complement of the byte keeps only those k low bits, i.e.
         2^k - 1.  Bit 7 is therefore clear, the 0x80 mask yields 0,
         and the byte passes no borrow upwards.

       - Take the least significant zero byte of X.  All bytes below
         it are nonzero, so by the previous case no borrow arrives.
         Subtracting 1 gives 0xff, the complement of the byte is 0xff
         as well, and the mask leaves 0x80.

     Bytes above the least significant zero byte may be disturbed by
     the borrow it generates, but by then the result is already
     nonzero, so their contents do not matter.  */
  for (word_p = (const longword *) byte_p;
       sizeof (longword) <= n;
       ++word_p, n -= sizeof (longword))
    {
      longword x = *word_p ^ needle;

      if (((x - ones) & ~x & high_bits) != 0)
        break;
    }

  /* Epilogue.  Either fewer than sizeof (longword) bytes remain, or the
     longword at WORD_P contains a byte equal to C.  A little-endian
     machine could locate that byte from the mask computed above
     without touching memory again, but that shortcut is wrong on
     big-endian machines; a plain byte loop is correct on both.  */
  byte_p = (const unsigned char *) word_p;
  while (n > 0)
    {
      if (*byte_p == c)
        return (void *) byte_p;
      ++byte_p;
      --n;
    }

  return NULL;
}
#ifdef weak_alias
weak_alias (__memchr, BP_SYM (memchr))
#endif