1 /* Optimized strncmp implementation for PowerPC64.
2 Copyright (C) 2003, 2011 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
5 The GNU C Library is free software; you can redistribute it and/or
6 modify it under the terms of the GNU Lesser General Public
7 License as published by the Free Software Foundation; either
8 version 2.1 of the License, or (at your option) any later version.
10 The GNU C Library is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 Lesser General Public License for more details.
15 You should have received a copy of the GNU Lesser General Public
16 License along with the GNU C Library; if not, see
17 <http://www.gnu.org/licenses/>. */
23 /* See strlen.s for comments on how the end-of-string testing works. */
25 /* int [r3] strncmp (const char *s1 [r3], const char *s2 [r4], size_t size [r5]) */
/* strncmp entry point: compares the string at s1 (r3) with the string at
   s2 (r4) over at most size (r5) bytes and leaves the int result in r3.  */
27 EALIGN (BP_SYM(strncmp), 4, 0)
/* Symbolic register names used by the code below.
   NOTE(review): rTMP and rRTN are also used below, but their define lines
   are not present in this section -- confirm their registers in the full
   file.  */
32 #define rSTR1 r3 /* first string arg */
33 #define rSTR2 r4 /* second string arg */
34 #define rN r5 /* max string length */
35 /* Note: The Bounded pointer support in this code is broken. This code
36 was inherited from PPC32 and that support was never completed.
37 Current PPC gcc does not support -fbounds-check or -fbounded-pointers. */
38 #define rWORD1 r6 /* current word in s1 */
39 #define rWORD2 r7 /* current word in s2 */
40 #define rFEFE r8 /* constant 0xfefefefefefefeff (-0x0101010101010101) */
41 #define r7F7F r9 /* constant 0x7f7f7f7f7f7f7f7f */
42 #define rNEG r10 /* ~(word in s1 | 0x7f7f7f7f7f7f7f7f) */
43 #define rBITDIF r11 /* bits that differ in s1 & s2 words */
/* Keep only the low three bits of rTMP (the record form also sets cr0).
   NOTE(review): rTMP presumably holds s1 OR s2 at this point, so a zero
   result would mean both pointers are doubleword aligned -- the instruction
   that computes it is not visible here, confirm.  */
49 clrldi. rTMP, rTMP, 61
53 /* We are doubleword aligned so set up for two loops. First a doubleword
54 loop, then fall into the byte loop if any residual. */
/* Add the low-halfword parts of the two constants.
   NOTE(review): assumes the upper halfwords were set up earlier -- not
   visible in this section.  */
57 addi rFEFE, rFEFE, -0x101
58 addi r7F7F, r7F7F, 0x7f7f
/* CTR <- rTMP.  NOTE(review): presumably the number of doublewords to
   compare -- confirm against the instruction that sets rTMP.  */
62 mtctr rTMP /* Power4 wants mtctr 1st in dispatch group. */
/* Copy the low 32 bits of r7F7F into its high 32 bits.  */
66 insrdi r7F7F, r7F7F, 32, 0
/* rFEFE += rTMP.  NOTE(review): presumably rTMP holds the low half of
   rFEFE shifted into the high half, widening the constant to 64 bits --
   confirm.  */
67 add rFEFE, rFEFE, rTMP
/* Go to L(different) when cr1 holds a not-equal result (the minus suffix
   hints that the branch is unlikely).  */
72 bne- cr1, L(different)
/* L(g1): begin the end-of-string test on the s1 word:
   rTMP = rWORD1 + rFEFE and rNEG = NOT (rWORD1 OR r7F7F).  */
74 L(g1): add rTMP, rFEFE, rWORD1
75 nor rNEG, r7F7F, rWORD1
/* cr1 <- signed doubleword comparison of the two current words.  */
78 cmpd cr1, rWORD1, rWORD2
81 /* OK. We've hit the end of the string. We need to be careful that
82 we don't compare two strings as different because of gunk beyond
83 the end of the strings... */
/* rTMP = s1 word with the top bit of every byte cleared.  */
86 and rTMP, r7F7F, rWORD1
/* rBITDIF = bits that differ between the two words, cr0 set from it.  */
89 xor. rBITDIF, rWORD1, rWORD2
/* Replace rBITDIF with its count of leading zero bits, i.e. the position
   of the most significant differing bit.  */
93 cntlzd rBITDIF, rBITDIF
/* cr1 <- rNEG compared with that position.  NOTE(review): rNEG presumably
   holds the bit position of the terminator here -- the instructions that
   derive it are not visible, confirm.  */
96 cmpd cr1, rNEG, rBITDIF
/* rRTN = rWORD1 - rWORD2.  */
97 sub rRTN, rWORD1, rWORD2
/* Load the doubleword at rSTR1 - 8 into rWORD1 and move rSTR1 back to that
   address (update form), then recompute the differing bits and the
   difference.  */
107 ldu rWORD1, -8(rSTR1)
108 xor. rBITDIF, rWORD1, rWORD2
109 sub rRTN, rWORD1, rWORD2
/* Shift both words right by 56 so only the most significant byte of each
   remains, then subtract those bytes into rRTN.  */
115 srdi rWORD2, rWORD2, 56
116 srdi rWORD1, rWORD1, 56
117 sub rRTN, rWORD1, rWORD2
121 /* Oh well. In this case, we just do a byte-by-byte comparison. */
/* rTMP = rTMP AND rNEG, setting cr0.  NOTE(review): presumably nonzero when
   the s1 word contains a zero byte, per the strlen.s technique cited in
   the file header -- confirm.  */
124 and. rTMP, rTMP, rNEG
/* cr1 <- comparison of the two words, then go to L(different) on a
   mismatch.  */
125 cmpd cr1, rWORD1, rWORD2
128 bne- cr1, L(different)
/* CTR <- rN, the length count held in rN.  */
132 mtctr rN /* Power4 wants mtctr 1st in dispatch group */
/* Byte loads: each lbzu advances the pointer by one and loads the byte at
   the new address, zero-extended.  */
144 lbzu rWORD2, 1(rSTR2)
150 lbzu rWORD1, 1(rSTR1)
152 lbzu rWORD2, 1(rSTR2)
157 lbzu rWORD1, 1(rSTR1)
/* L(u2): step rSTR1 back one byte and reload that byte into rWORD1.  */
160 L(u2): lbzu rWORD1, -1(rSTR1)
/* L(u3): rRTN = rWORD1 - rWORD2.  */
161 L(u3): sub rRTN, rWORD1, rWORD2
163 END (BP_SYM (strncmp))
164 libc_hidden_builtin_def (strncmp)