]>
Commit | Line | Data |
---|---|---|
53f770e0 | 1 | /* memset/bzero -- set memory area to CH/0 |
cc3fa755 | 2 | Highly optimized version for ix86, x>=5. |
2b778ceb | 3 | Copyright (C) 1996-2021 Free Software Foundation, Inc. |
5929563f UD |
4 | This file is part of the GNU C Library. |
5 | Contributed by Torbjorn Granlund, <tege@matematik.su.se> | |
6 | ||
7 | The GNU C Library is free software; you can redistribute it and/or | |
41bdb6e2 AJ |
8 | modify it under the terms of the GNU Lesser General Public |
9 | License as published by the Free Software Foundation; either | |
10 | version 2.1 of the License, or (at your option) any later version. | |
5929563f UD |
11 | |
12 | The GNU C Library is distributed in the hope that it will be useful, | |
13 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
41bdb6e2 | 15 | Lesser General Public License for more details. |
5929563f | 16 | |
41bdb6e2 | 17 | You should have received a copy of the GNU Lesser General Public |
59ba27a6 | 18 | License along with the GNU C Library; if not, see |
5a82c748 | 19 | <https://www.gnu.org/licenses/>. */ |
53f770e0 RM |
20 | |
21 | #include <sysdep.h> | |
5929563f | 22 | #include "asm-syntax.h" |
53f770e0 | 23 | |
2366713d | 24 | #define PARMS 4+4 /* space for 1 saved reg */ |
3f02f778 | 25 | #define RTN PARMS |
2366713d | 26 | #define DEST RTN |
f6b71ead | 27 | #ifdef USE_AS_BZERO |
2366713d | 28 | # define LEN DEST+4 |
3f02f778 | 29 | #else |
2366713d | 30 | # define CHR DEST+4 |
3f02f778 GM |
31 | # define LEN CHR+4 |
32 | #endif | |
53f770e0 RM |
33 | |
34 | .text | |
f6b71ead | 35 | #if defined SHARED && IS_IN (libc) && !defined USE_AS_BZERO |
9bdfff60 UD |
36 | ENTRY (__memset_chk) |
37 | movl 12(%esp), %eax | |
38 | cmpl %eax, 16(%esp) | |
39 | jb HIDDEN_JUMPTARGET (__chk_fail) | |
40 | END (__memset_chk) | |
41 | #endif | |
2366713d | 42 | ENTRY (memset) |
3f02f778 | 43 | |
53f770e0 | 44 | pushl %edi |
1ad9da69 | 45 | cfi_adjust_cfa_offset (4) |
53f770e0 | 46 | |
3f02f778 | 47 | movl DEST(%esp), %edi |
1ad9da69 | 48 | cfi_rel_offset (edi, 0) |
3f02f778 | 49 | movl LEN(%esp), %edx |
f6b71ead | 50 | #ifdef USE_AS_BZERO |
53f770e0 | 51 | xorl %eax, %eax /* we fill with 0 */ |
53f770e0 | 52 | #else |
3f02f778 | 53 | movb CHR(%esp), %al |
53f770e0 RM |
54 | movb %al, %ah |
55 | movl %eax, %ecx | |
56 | shll $16, %eax | |
57 | movw %cx, %ax | |
58 | #endif | |
59 | cld | |
60 | ||
61 | /* If less than 36 bytes to write, skip tricky code (it wouldn't work). */ | |
62 | cmpl $36, %edx | |
63 | movl %edx, %ecx /* needed when branch is taken! */ | |
5929563f | 64 | jl L(2) |
53f770e0 RM |
65 | |
66 | /* First write 0-3 bytes to make the pointer 32-bit aligned. */ | |
67 | movl %edi, %ecx /* Copy ptr to ecx... */ | |
68 | negl %ecx /* ...and negate that and... */ | |
69 | andl $3, %ecx /* ...mask to get byte count. */ | |
70 | subl %ecx, %edx /* adjust global byte count */ | |
71 | rep | |
72 | stosb | |
73 | ||
74 | subl $32, %edx /* offset count for unrolled loop */ | |
75 | movl (%edi), %ecx /* Fetch destination cache line */ | |
76 | ||
77 | .align 2, 0x90 /* supply 0x90 for broken assemblers */ | |
5929563f | 78 | L(1): movl 28(%edi), %ecx /* allocate cache line for destination */ |
53f770e0 RM |
79 | subl $32, %edx /* decr loop count */ |
80 | movl %eax, 0(%edi) /* store words pairwise */ | |
81 | movl %eax, 4(%edi) | |
82 | movl %eax, 8(%edi) | |
83 | movl %eax, 12(%edi) | |
84 | movl %eax, 16(%edi) | |
85 | movl %eax, 20(%edi) | |
86 | movl %eax, 24(%edi) | |
87 | movl %eax, 28(%edi) | |
88 | leal 32(%edi), %edi /* update destination pointer */ | |
5929563f | 89 | jge L(1) |
53f770e0 RM |
90 | |
91 | leal 32(%edx), %ecx /* reset offset count */ | |
92 | ||
93 | /* Write last 0-7 full 32-bit words (up to 8 words if loop was skipped). */ | |
5929563f | 94 | L(2): shrl $2, %ecx /* convert byte count to longword count */ |
53f770e0 RM |
95 | rep |
96 | stosl | |
97 | ||
98 | /* Finally write the last 0-3 bytes. */ | |
99 | movl %edx, %ecx | |
100 | andl $3, %ecx | |
101 | rep | |
102 | stosb | |
103 | ||
f6b71ead | 104 | #ifndef USE_AS_BZERO |
53f770e0 | 105 | /* Load result (only if used as memset). */ |
2fc08826 | 106 | movl DEST(%esp), %eax /* start address of destination is result */ |
53f770e0 RM |
107 | #endif |
108 | popl %edi | |
1ad9da69 UD |
109 | cfi_adjust_cfa_offset (-4) |
110 | cfi_restore (edi) | |
53f770e0 | 111 | |
2366713d | 112 | ret |
2366713d | 113 | END (memset) |
85dd1003 | 114 | libc_hidden_builtin_def (memset) |