1 /* Optimized strncmp implementation for PowerPC64.
2 Copyright (C) 2003-2020 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
5 The GNU C Library is free software; you can redistribute it and/or
6 modify it under the terms of the GNU Lesser General Public
7 License as published by the Free Software Foundation; either
8 version 2.1 of the License, or (at your option) any later version.
10 The GNU C Library is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 Lesser General Public License for more details.
15 You should have received a copy of the GNU Lesser General Public
16 License along with the GNU C Library; if not, see
17 <https://www.gnu.org/licenses/>. */
21 /* See strlen.s for comments on how the end-of-string testing works. */
23 /* int [r3] strncmp (const char *s1 [r3], const char *s2 [r4], size_t size [r5]) */
26 # define STRNCMP strncmp /* symbol name handed to ENTRY_TOCLESS below */
29 ENTRY_TOCLESS (STRNCMP, 4) /* Entry point of strncmp: compares the strings
   at rSTR1 and rSTR2, bounded by rN, and leaves the result in rRTN.
   NOTE(review): rRTN, rTMP and rTMP2 are used below but their #defines
   are not visible in this excerpt -- confirm their register assignments. */
34 #define rSTR1 r3 /* first string arg (s1) */
35 #define rSTR2 r4 /* second string arg (s2) */
36 #define rN r5 /* max string length (the size argument) */
37 #define rWORD1 r6 /* current word in s1 (a single byte in the byte loop) */
38 #define rWORD2 r7 /* current word in s2 (a single byte in the byte loop) */
39 #define rFEFE r8 /* constant 0xfefefefefefefeff (-0x0101010101010101) */
40 #define r7F7F r9 /* constant 0x7f7f7f7f7f7f7f7f */
41 #define rNEG r10 /* ~(word in s1 | 0x7f7f7f7f7f7f7f7f) */
42 #define rBITDIF r11 /* bits that differ in s1 & s2 words */
49 clrldi. rTMP, rTMP, 61 /* keep only the low 3 bits and set cr0; presumably rTMP combines both pointers, so nonzero means not doubleword aligned -- TODO confirm */
53 /* We are doubleword aligned so set up for two loops. First a doubleword
54 loop, then fall into the byte loop if there is any residual. */
57 addi rFEFE, rFEFE, -0x101 /* presumably completes the low 32 bits of the 0xfefe... pattern; the high-half load is not visible here -- TODO confirm */
58 addi r7F7F, r7F7F, 0x7f7f /* likewise for the low 32 bits of the 0x7f7f... pattern -- TODO confirm */
62 mtctr rTMP /* CTR = rTMP, the loop count. Power4 wants mtctr 1st in dispatch group. */
66 insrdi r7F7F, r7F7F, 32, 0 /* copy the low 32 bits into the high 32 bits */
67 add rFEFE, rFEFE, rTMP /* presumably rTMP holds rFEFE << 32 here, widening the constant to 64 bits -- TODO confirm */
72 bne- cr1, L(different) /* cr1 (from a cmpd of the two words) says they differ; hinted as unlikely */
74 L(g1): add rTMP, rFEFE, rWORD1 /* rTMP = rWORD1 - 0x0101010101010101 */
75 nor rNEG, r7F7F, rWORD1 /* rNEG = ~(rWORD1 | 0x7f7f7f7f7f7f7f7f) */
78 cmpd cr1, rWORD1, rWORD2 /* cr1 = comparison of the two doublewords */
81 /* OK. We've hit the end of the string. We need to be careful that
82 we don't compare two strings as different because of gunk beyond
83 the end of the strings... */
85 #ifdef __LITTLE_ENDIAN__
89 andc rTMP2, rTMP2, rTMP /* rTMP2 &= ~rTMP; NOTE(review): the instruction that seeds rTMP2 is not visible here */
90 rldimi rTMP2, rTMP2, 1, 0 /* rTMP2 = (rTMP2 << 1) | (rTMP2 & 1); for a low-bit mask this extends it by one bit */
91 and rWORD2, rWORD2, rTMP2 /* Mask off gunk. */
92 and rWORD1, rWORD1, rTMP2 /* same mask applied to the s1 word */
93 cmpd cr1, rWORD1, rWORD2 /* compare again now that the gunk is masked off */
95 xor rBITDIF, rWORD1, rWORD2 /* rBITDIF has bits that differ. */
97 and rNEG, rNEG, rBITDIF /* rNEG has LS bit that differs. */
98 cntlzd rNEG, rNEG /* bitcount of the bit. */
99 andi. rNEG, rNEG, 56 /* bitcount to LS byte that differs (keeps bits 3-5: a multiple of 8). */
100 sld rWORD1, rWORD1, rNEG /* shift left to clear MS bytes. */
101 sld rWORD2, rWORD2, rNEG /* identical shift so both words stay aligned with each other */
102 xor. rBITDIF, rWORD1, rWORD2 /* record form: cr0 is LT when the top bits of the shifted words differ */
103 sub rRTN, rWORD1, rWORD2 /* rRTN = rWORD1 - rWORD2 */
105 sradi rRTN, rRTN, 63 /* must return an int: sign-fill leaves 0 or -1. */
114 xor rBITDIF, rWORD1, rWORD2 /* rBITDIF has bits that differ. */
116 and rNEG, rNEG, rBITDIF /* rNEG has LS bit that differs. */
117 cntlzd rNEG, rNEG /* bitcount of the bit. */
118 andi. rNEG, rNEG, 56 /* bitcount to LS byte that differs (keeps bits 3-5: a multiple of 8). */
119 sld rWORD1, rWORD1, rNEG /* shift left to clear MS bytes. */
120 sld rWORD2, rWORD2, rNEG /* identical shift so both words stay aligned with each other */
121 xor. rBITDIF, rWORD1, rWORD2 /* record form: cr0 is LT when the top bits of the shifted words differ */
122 sub rRTN, rWORD1, rWORD2 /* rRTN = rWORD1 - rWORD2 */
128 sradi rRTN, rWORD2, 63 /* 0 or -1, taken from the sign bit of rWORD2 */
134 and rTMP, r7F7F, rWORD1 /* rTMP = rWORD1 & 0x7f7f7f7f7f7f7f7f. NOTE(review): no #else/#endif is visible in this excerpt; this sequence looks like the non-little-endian variant -- confirm */
136 add rTMP, rTMP, r7F7F /* rTMP += 0x7f7f7f7f7f7f7f7f */
137 xor. rBITDIF, rWORD1, rWORD2 /* bits that differ; cr0 is LT when the top bits differ */
138 andc rNEG, rNEG, rTMP /* rNEG &= ~rTMP */
140 cntlzd rBITDIF, rBITDIF /* leading-zero count: position of the first differing bit from the MS end */
143 cmpd cr1, rNEG, rBITDIF /* rNEG is presumably a bit position computed on lines not visible here -- TODO confirm */
144 sub rRTN, rWORD1, rWORD2 /* rRTN = rWORD1 - rWORD2 */
146 sradi rRTN, rRTN, 63 /* must return an int: sign-fill leaves 0 or -1. */
155 xor. rBITDIF, rWORD1, rWORD2 /* bits that differ; cr0 is LT when the top bits differ */
156 sub rRTN, rWORD1, rWORD2 /* rRTN = rWORD1 - rWORD2 */
162 sradi rRTN, rWORD2, 63 /* 0 or -1, taken from the sign bit of rWORD2 */
167 /* Oh well. In this case, we just do a byte-by-byte comparison. */
170 and. rTMP, rTMP, rNEG /* assuming rTMP/rNEG come from L(g1): (w - 0x01..01) & ~(w | 0x7f..7f), nonzero when w contains a zero byte */
171 cmpd cr1, rWORD1, rWORD2 /* cr1 = comparison of the two doublewords */
174 bne- cr1, L(different) /* words differ; hinted as unlikely */
178 mtctr rN /* CTR = rN for the byte loop. Power4 wants mtctr 1st in dispatch group */
190 lbzu rWORD2, 1(rSTR2) /* advance rSTR2 by one and load that byte */
196 lbzu rWORD1, 1(rSTR1) /* advance rSTR1 by one and load that byte */
198 lbzu rWORD2, 1(rSTR2) /* advance rSTR2 by one and load that byte */
203 lbzu rWORD1, 1(rSTR1) /* advance rSTR1 by one and load that byte */
206 L(u2): lbzu rWORD1, -1(rSTR1) /* step rSTR1 back one byte and reload it */
207 L(u3): sub rRTN, rWORD1, rWORD2 /* result = rWORD1 - rWORD2 */
210 libc_hidden_builtin_def (strncmp) /* macro applied to the strncmp symbol; its definition is not in this file */