1 /* Fast SSE2 rawmemchr with a 64-byte loop using the pmaxub instruction.
3 Copyright (C) 2011-2022 Free Software Foundation, Inc.
4 This file is part of the GNU C Library.
6 The GNU C Library is free software; you can redistribute it and/or
7 modify it under the terms of the GNU Lesser General Public
8 License as published by the Free Software Foundation; either
9 version 2.1 of the License, or (at your option) any later version.
11 The GNU C Library is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public
17 License along with the GNU C Library; if not, see
18 <https://www.gnu.org/licenses/>. */
/* Broadcast the low byte of %xmm1 to all 16 byte lanes: each punpcklbw
   interleaves the low bytes of %xmm1 with themselves, so after two of
   them the low dword holds four copies of byte 0, and the pshufd $0
   below replicates that dword into every dword lane.
   NOTE(review): presumably %xmm1 was seeded with the search character
   before this point -- confirm against the entry code.  */
27 punpcklbw %xmm1, %xmm1
28 punpcklbw %xmm1, %xmm1
31 pshufd $0, %xmm1, %xmm1
38 /* Check if there is a match. */
54 /* Check if there is a match. */
56 /* Remove the leading bytes. */
/* je branches when ZF is set; presumably that means no match bits were
   left after the leading bytes were removed -- confirm against the
   flag-setting instruction that precedes this jump.  */
59 je L(unaligned_no_match)
60 /* Check which byte is a match. */
68 L(unaligned_no_match):
/* Loads of the 16-byte chunks at offsets 16, 32 and 48 from %rdi.
   movdqa requires its memory operand to be 16-byte aligned, so %rdi
   must be 16-byte aligned wherever these are executed.  */
79 movdqa 16(%rdi), %xmm2
85 movdqa 32(%rdi), %xmm3
91 movdqa 48(%rdi), %xmm4
/* Second group of aligned chunk loads at the same offsets.
   NOTE(review): the 48-byte chunk is loaded into %xmm3 here, not
   %xmm4 as in the other groups; verify that the instructions that
   consume this load use %xmm3 as well.  */
107 movdqa 16(%rdi), %xmm2
113 movdqa 32(%rdi), %xmm3
119 movdqa 48(%rdi), %xmm3
/* Three back-to-back aligned loads covering bytes 16..63 relative to
   %rdi.  Presumably part of the 64-byte loop mentioned in the file
   header -- confirm.  */
132 movdqa 16(%rdi), %xmm2
133 movdqa 32(%rdi), %xmm3
134 movdqa 48(%rdi), %xmm4
161 movdqa 32(%rdi), %xmm3
/* pcmpeqb with a memory source: compares the 16 bytes at 48(%rdi)
   with %xmm1 and overwrites %xmm1 with the per-byte equality mask, so
   %xmm1 no longer holds the broadcast pattern after this point.  */
164 pcmpeqb 48(%rdi), %xmm1
/* Each lea below computes %rax = %rdi + %rax + displacement without
   modifying the flags.  Presumably %rax holds the index of the
   matching byte within one 16-byte chunk and the displacement selects
   which chunk matched -- confirm against the instructions that set
   %rax and that advance %rdi.  */
171 lea 48(%rdi, %rax), %rax
177 lea -16(%rax, %rdi), %rax
189 lea 16(%rax, %rdi), %rax
195 lea 32(%rax, %rdi), %rax
/* Make rawmemchr available as a weak alias for __rawmemchr.  */
200 weak_alias (__rawmemchr, rawmemchr)
/* glibc-internal macro applied to __rawmemchr; presumably it provides
   the hidden definition used for calls from inside libc -- see the
   macro's definition to confirm.  */
201 libc_hidden_builtin_def (__rawmemchr)