mirror of
				https://sourceware.org/git/glibc.git
				synced 2025-11-03 20:53:13 +03:00 
			
		
		
		
	* sysdeps/i386/fpu/ftestexcept.c: Also check SSE status word. * include/signal.h: Use libc_hidden_proto for sigaddset and sigdelset. * signal/sigaddset.c: Add libc_hidden_def. * signal/sigdelset.c: Likewise. 2003-04-29 Jakub Jelinek <jakub@redhat.com> * sysdeps/i386/i486/string-inlines.c (__memcpy_g, __strchr_g): Move to the end of the file. * configure.in: Change __oline__ to $LINENO. (HAVE_BUILTIN_REDIRECTION): New check. * config.h.in (HAVE_BUILTIN_REDIRECTION): Add. * include/libc-symbols.h (libc_hidden_builtin_proto, libc_hidden_builtin_def, libc_hidden_builtin_weak, libc_hidden_builtin_ver): Define. * include/string.h (memchr, memcpy, memmove, memset, strcat, strchr, strcmp, strcpy, strcspn, strlen, strncmp, strncpy, strpbrk, strrchr, strspn, strstr): Add libc_hidden_builtin_proto. * intl/plural.y: Include string.h. * sysdeps/alpha/alphaev6/memchr.S (memchr): Add libc_hidden_builtin_def. * sysdeps/alpha/alphaev6/memcpy.S (memcpy): Likewise. * sysdeps/alpha/alphaev6/memset.S (memset): Likewise. * sysdeps/alpha/alphaev67/strcat.S (strcat): Likewise. * sysdeps/alpha/alphaev67/strchr.S (strchr): Likewise. * sysdeps/alpha/alphaev67/strlen.S (strlen): Likewise. * sysdeps/alpha/alphaev67/strrchr.S (strrchr): Likewise. * sysdeps/alpha/memchr.S (memchr): Likewise. * sysdeps/alpha/memset.S (memset): Likewise. * sysdeps/alpha/strcat.S (strcat): Likewise. * sysdeps/alpha/strchr.S (strchr): Likewise. * sysdeps/alpha/strcmp.S (strcmp): Likewise. * sysdeps/alpha/strcpy.S (strcpy): Likewise. * sysdeps/alpha/strlen.S (strlen): Likewise. * sysdeps/alpha/strncmp.S (strncmp): Likewise. * sysdeps/alpha/strncpy.S (strncpy): Likewise. * sysdeps/alpha/strrchr.S (strrchr): Likewise. * sysdeps/arm/memset.S (memset): Likewise. * sysdeps/arm/strlen.S (strlen): Likewise. * sysdeps/generic/memchr.c (memchr): Likewise. * sysdeps/generic/memcpy.c (memcpy): Likewise. * sysdeps/generic/memmove.c (memmove): Likewise. * sysdeps/generic/memset.c (memset): Likewise. * sysdeps/generic/strcat.c (strcat): Likewise. * sysdeps/generic/strchr.c (strchr): Likewise. * sysdeps/generic/strcmp.c (strcmp): Likewise. * sysdeps/generic/strcpy.c (strcpy): Likewise. * sysdeps/generic/strcspn.c (strcspn): Likewise. * sysdeps/generic/strlen.c (strlen): Likewise. * sysdeps/generic/strncmp.c (strncmp): Likewise. * sysdeps/generic/strncpy.c (strncpy): Likewise. * sysdeps/generic/strpbrk.c (strpbrk): Likewise. * sysdeps/generic/strrchr.c (strrchr): Likewise. * sysdeps/generic/strspn.c (strspn): Likewise. * sysdeps/generic/strstr.c (strstr): Likewise. * sysdeps/i386/i486/strcat.S (strcat): Likewise. * sysdeps/i386/i486/strlen.S (strlen): Likewise. * sysdeps/i386/i586/memcpy.S (memcpy): Likewise. * sysdeps/i386/i586/memset.S (memset): Likewise. * sysdeps/i386/i586/strchr.S (strchr): Likewise. * sysdeps/i386/i586/strcpy.S (strcpy): Likewise. * sysdeps/i386/i586/strlen.S (strlen): Likewise. * sysdeps/i386/i686/memcpy.S (memcpy): Likewise. * sysdeps/i386/i686/memmove.S (memmove): Likewise. * sysdeps/i386/i686/memset.S (memset): Likewise. * sysdeps/i386/i686/strcmp.S (strcmp): Likewise. * sysdeps/i386/memchr.S (memchr): Likewise. * sysdeps/i386/memset.c (memset): Likewise. * sysdeps/i386/strchr.S (strchr): Likewise. * sysdeps/i386/strcspn.S (strcspn): Likewise. * sysdeps/i386/strlen.c (strlen): Likewise. * sysdeps/i386/strpbrk.S (strpbrk): Likewise. * sysdeps/i386/strrchr.S (strrchr): Likewise. * sysdeps/i386/strspn.S (strspn): Likewise. * sysdeps/ia64/memchr.S (memchr): Likewise. * sysdeps/ia64/memcpy.S (memcpy): Likewise. * sysdeps/ia64/memmove.S (memmove): Likewise. * sysdeps/ia64/memset.S (memset): Likewise. * sysdeps/ia64/strcat.S (strcat): Likewise. * sysdeps/ia64/strchr.S (strchr): Likewise. * sysdeps/ia64/strcmp.S (strcmp): Likewise. * sysdeps/ia64/strcpy.S (strcpy): Likewise. * sysdeps/ia64/strlen.S (strlen): Likewise. * sysdeps/ia64/strncmp.S (strncmp): Likewise. * sysdeps/ia64/strncpy.S (strncpy): Likewise. * sysdeps/m68k/memchr.S (memchr): Likewise. * sysdeps/m68k/strchr.S (strchr): Likewise. * sysdeps/mips/mips64/memcpy.S (memcpy): Likewise. * sysdeps/mips/mips64/memset.S (memset): Likewise. * sysdeps/mips/memcpy.S (memcpy): Likewise. * sysdeps/mips/memset.S (memset): Likewise. * sysdeps/powerpc/powerpc32/memset.S (memset): Likewise. * sysdeps/powerpc/powerpc32/strchr.S (strchr): Likewise. * sysdeps/powerpc/powerpc32/strcmp.S (strcmp): Likewise. * sysdeps/powerpc/powerpc32/strcpy.S (strcpy): Likewise. * sysdeps/powerpc/powerpc32/strlen.S (strlen): Likewise. * sysdeps/powerpc/powerpc64/memcpy.S (memcpy): Likewise. * sysdeps/powerpc/powerpc64/memset.S (memset): Likewise. * sysdeps/powerpc/powerpc64/strchr.S (strchr): Likewise. * sysdeps/powerpc/powerpc64/strcmp.S (strcmp): Likewise. * sysdeps/powerpc/powerpc64/strcpy.S (strcpy): Likewise. * sysdeps/powerpc/powerpc64/strlen.S (strlen): Likewise. * sysdeps/powerpc/strcat.c (strcat): Likewise. * sysdeps/sparc/sparc32/memchr.S (memchr): Likewise. * sysdeps/sparc/sparc32/memcpy.S (memcpy): Likewise. * sysdeps/sparc/sparc32/memset.S (memset): Likewise. * sysdeps/sparc/sparc32/strcat.S (strcat): Likewise. * sysdeps/sparc/sparc32/strchr.S (strchr, strrchr): Likewise. * sysdeps/sparc/sparc32/strcmp.S (strcmp): Likewise. * sysdeps/sparc/sparc32/strcpy.S (strcpy): Likewise. * sysdeps/sparc/sparc32/strlen.S (strlen): Likewise. * sysdeps/sparc/sparc64/sparcv9b/memcpy.S (memcpy, memmove): Likewise. * sysdeps/sparc/sparc64/memchr.S (memchr): Likewise. * sysdeps/sparc/sparc64/memcpy.S (memcpy, memmove): Likewise. * sysdeps/sparc/sparc64/memset.S (memset): Likewise. * sysdeps/sparc/sparc64/strcat.S (strcat): Likewise. * sysdeps/sparc/sparc64/strchr.S (strchr, strrchr): Likewise. * sysdeps/sparc/sparc64/strcmp.S (strcmp): Likewise. * sysdeps/sparc/sparc64/strcpy.S (strcpy): Likewise. * sysdeps/sparc/sparc64/strcspn.S (strcspn): Likewise. * sysdeps/sparc/sparc64/strlen.S (strlen): Likewise. * sysdeps/sparc/sparc64/strncmp.S (strncmp): Likewise. * sysdeps/sparc/sparc64/strncpy.S (strncpy): Likewise. * sysdeps/sparc/sparc64/strpbrk.S (strpbrk): Likewise. * sysdeps/sparc/sparc64/strspn.S (strspn): Likewise. * sysdeps/sh/memcpy.S (memcpy): Likewise. * sysdeps/sh/memset.S (memset): Likewise. * sysdeps/sh/strlen.S (strlen): Likewise. * sysdeps/s390/s390-32/memchr.S (memchr): Likewise. * sysdeps/s390/s390-32/memcpy.S (memcpy): Likewise. * sysdeps/s390/s390-32/memset.S (memset): Likewise. * sysdeps/s390/s390-32/strcmp.S (strcmp): Likewise. * sysdeps/s390/s390-32/strcpy.S (strcpy): Likewise. * sysdeps/s390/s390-32/strncpy.S (strncpy): Likewise. * sysdeps/s390/s390-64/memchr.S (memchr): Likewise. * sysdeps/s390/s390-64/memcpy.S (memcpy): Likewise. * sysdeps/s390/s390-64/memset.S (memset): Likewise. * sysdeps/s390/s390-64/strcmp.S (strcmp): Likewise. * sysdeps/s390/s390-64/strcpy.S (strcpy): Likewise. * sysdeps/s390/s390-64/strncpy.S (strncpy): Likewise. * sysdeps/x86_64/memcpy.S (memcpy): Likewise. * sysdeps/x86_64/memset.S (memset): Likewise. * sysdeps/x86_64/strcat.S (strcat): Likewise. * sysdeps/x86_64/strchr.S (strchr): Likewise. * sysdeps/x86_64/strcmp.S (strcmp): Likewise. * sysdeps/x86_64/strcpy.S (strcpy): Likewise. * sysdeps/x86_64/strcspn.S (strcspn): Likewise. * sysdeps/x86_64/strlen.S (strlen): Likewise. * sysdeps/x86_64/strspn.S (strspn): Likewise. * string/string-inlines.c: Move... * sysdeps/generic/string-inlines.c: ...here. (__memcpy_g, __strchr_g): Remove. (__NO_INLINE__): Define before including <string.h>, undefine after. Include bits/string.h and bits/string2.h. * sysdeps/i386/i486/string-inlines.c: New file. * sysdeps/i386/string-inlines.c: New file. * sysdeps/i386/i486/Versions: Remove. All GLIBC_2.1.1 symbols moved... * sysdeps/i386/Versions (libc): ...here. 2003-04-29 Ulrich Drepper <drepper@redhat.com>
		
			
				
	
	
		
			212 lines
		
	
	
		
			5.4 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
			
		
		
	
	
			212 lines
		
	
	
		
			5.4 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
/* Optimized memcpy implementation for PowerPC64.
 | 
						|
   Copyright (C) 2003 Free Software Foundation, Inc.
 | 
						|
   This file is part of the GNU C Library.
 | 
						|
 | 
						|
   The GNU C Library is free software; you can redistribute it and/or
 | 
						|
   modify it under the terms of the GNU Lesser General Public
 | 
						|
   License as published by the Free Software Foundation; either
 | 
						|
   version 2.1 of the License, or (at your option) any later version.
 | 
						|
 | 
						|
   The GNU C Library is distributed in the hope that it will be useful,
 | 
						|
   but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | 
						|
   Lesser General Public License for more details.
 | 
						|
 | 
						|
   You should have received a copy of the GNU Lesser General Public
 | 
						|
   License along with the GNU C Library; if not, write to the Free
 | 
						|
   Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
 | 
						|
   02111-1307 USA.  */
 | 
						|
 | 
						|
#include <sysdep.h>
 | 
						|
#include <bp-sym.h>
 | 
						|
#include <bp-asm.h>
 | 
						|
 | 
						|
/* __ptr_t [r3] memcpy (__ptr_t dst [r3], __ptr_t src [r4], size_t len [r5]);
 | 
						|
   Returns 'dst'.
 | 
						|
 | 
						|
   Memcpy handles short copies (< 32-bytes) using an unaligned
 | 
						|
   word lwz/stw loop.  The tail (remaining 1-3) bytes is handled with the
 | 
						|
   appropriate combination of byte and halfword load/stores. There is no
 | 
						|
   attempt to optimize the alignment of short moves.  The 64-bit
 | 
						|
   implementations of POWER3 and POWER4 do a reasonable job of handling
 | 
						|
   unligned load/stores that do not cross 32-byte boundries.
 | 
						|
 | 
						|
   Longer moves (>= 32-bytes) justify the effort to get at least the
 | 
						|
   destination doubleword (8-byte) aligned.  Further optimization is
 | 
						|
   posible when both source and destination are doubleword aligned.
 | 
						|
   Each case has a optimized unrolled loop.   */
 | 
						|
 | 
						|
EALIGN (BP_SYM (memcpy), 5, 0)
 | 
						|
    cmpldi cr1,5,31
 | 
						|
    neg   0,3
 | 
						|
    std   30,-16(1)
 | 
						|
    std   31,-8(1)
 | 
						|
    rldicl. 0,0,0,61
 | 
						|
    mr    12,4
 | 
						|
    mr    31,5
 | 
						|
    mr    30,3
 | 
						|
    ble-  cr1,.L2
 | 
						|
    subf  31,0,5
 | 
						|
 | 
						|
  /* Move 0-7 bytes as needed to get the destination doubleword alligned.  */
 | 
						|
    beq   0f
 | 
						|
    mtcrf 0x01,0
 | 
						|
1:  bf    31,2f
 | 
						|
    lbz   6,0(12)
 | 
						|
    addi  12,12,1
 | 
						|
    stb   6,0(3)
 | 
						|
    addi  3,3,1
 | 
						|
2:  bf    30,4f
 | 
						|
    lhz   6,0(12)
 | 
						|
    addi  12,12,2
 | 
						|
    sth   6,0(3)
 | 
						|
    addi  3,3,2
 | 
						|
4:  bf    29,0f
 | 
						|
    lwz   6,0(12)
 | 
						|
    addi  12,12,4
 | 
						|
    stw   6,0(3)
 | 
						|
    addi  3,3,4
 | 
						|
0:
 | 
						|
  /* Copy doublewords from source to destination, assumpting the
 | 
						|
     destination is aligned on a doubleword boundary.
 | 
						|
 | 
						|
     First verify that there is > 7 bytes to copy and check if the source
 | 
						|
     is also doubleword aligned.  If there are < 8 bytes to copy fall
 | 
						|
     through to the tail byte copy code.  Otherwise if the source and
 | 
						|
     destination are both doubleword aligned use an optimized doubleword
 | 
						|
     copy loop.  Otherwise the source has a different alignment and we use
 | 
						|
     a load, shift, store strategy.  */
 | 
						|
    rldicl. 0,12,0,61
 | 
						|
    cmpldi cr6,31,7
 | 
						|
    ble-  cr6,.L2  /* less than 8 bytes left.  */
 | 
						|
    bne-  0,.L6   /* Source is not DW aligned.  */
 | 
						|
    srdi. 9,31,3
 | 
						|
    mr    10,3
 | 
						|
    mr    11,12
 | 
						|
 | 
						|
  /* Move doublewords where destination and source are aligned.
 | 
						|
     Use a unrolled loop to copy 4 doubleword (32-bytes) per iteration.
 | 
						|
     If the remainder is >0 and < 32 bytes copy 1-3 doublewords.  */
 | 
						|
    cmpldi	cr1,9,4
 | 
						|
    beq   0f
 | 
						|
    mtcrf 0x01,9
 | 
						|
    blt   cr1,2f
 | 
						|
    ld    6,0(11)
 | 
						|
    .align  4
 | 
						|
4:
 | 
						|
    ld    7,8(11)
 | 
						|
    addi  9,9,-4
 | 
						|
    std   6,0(10)
 | 
						|
    ld    6,16(11)
 | 
						|
    std   7,8(10)
 | 
						|
    ld    7,24(11)
 | 
						|
    addi  11,11,32
 | 
						|
    cmpldi	cr1,9,4
 | 
						|
    std   6,16(10)
 | 
						|
    blt   cr1,3f
 | 
						|
    ld    6,0(11)
 | 
						|
    std   7,24(10)
 | 
						|
    addi  10,10,32
 | 
						|
    b     4b
 | 
						|
3:  std   7,24(10)
 | 
						|
    addi  10,10,32
 | 
						|
2:  bf    30,1f
 | 
						|
    ld    6,0(11)
 | 
						|
    ld    7,8(11)
 | 
						|
    addi  11,11,16
 | 
						|
    std   6,0(10)
 | 
						|
    std   7,8(10)
 | 
						|
    addi  10,10,16
 | 
						|
1:  bf    31,0f
 | 
						|
    ld    6,0(11)
 | 
						|
    addi  11,11,8
 | 
						|
    std   6,0(10)
 | 
						|
    addi  10,10,8
 | 
						|
0:
 | 
						|
 | 
						|
.L8:
 | 
						|
    rldicr 0,31,0,60
 | 
						|
    rldicl 31,31,0,61
 | 
						|
    add   3,3,0
 | 
						|
    add   12,12,0
 | 
						|
 | 
						|
	/* Copy the tail for up to 31 bytes.  If this is the tail of a longer
 | 
						|
	   copy then the destination will be aligned and the length will be
 | 
						|
	   less than 8.  So it is normally not worth the set-up overhead to
 | 
						|
	   get doubleword aligned and do doubleword load/store.  */
 | 
						|
.L2:
 | 
						|
    mr.   10,31
 | 
						|
    cmpldi	cr1,31,4
 | 
						|
    beq   0f
 | 
						|
    mtcrf 0x01,31
 | 
						|
    blt   cr1,2f
 | 
						|
4:  lwz   6,0(12)
 | 
						|
    addi  12,12,4
 | 
						|
    addi  10,10,-4
 | 
						|
    stw   6,0(3)
 | 
						|
    cmpldi	cr1,10,4
 | 
						|
    addi  3,3,4
 | 
						|
    bge   cr1,4b
 | 
						|
2:  bf    30,1f
 | 
						|
    lhz   6,0(12)
 | 
						|
    addi  12,12,2
 | 
						|
    sth   6,0(3)
 | 
						|
    addi  3,3,2
 | 
						|
1:  bf    31,0f
 | 
						|
    lbz   6,0(12)
 | 
						|
    addi  12,12,1
 | 
						|
    stb   6,0(3)
 | 
						|
    addi  3,3,1
 | 
						|
0:
 | 
						|
  /* Return original dst pointer.  */
 | 
						|
    ld 31,-8(1)
 | 
						|
    mr 3,30
 | 
						|
    ld 30,-16(1)
 | 
						|
    blr
 | 
						|
 | 
						|
.L6:
 | 
						|
    srdi 11,31,3
 | 
						|
    mr 4,3
 | 
						|
    mr 5,12
 | 
						|
 | 
						|
  /* Copy doublewords where the destination is aligned but the source is
 | 
						|
     not.  Use aligned doubleword loads from the source, shifted to realign
 | 
						|
     the data, to allow aligned destination stores.  */
 | 
						|
    andi. 10,5,7
 | 
						|
    andi. 0,11,1
 | 
						|
    subf  5,10,5
 | 
						|
    ld    6,0(5)
 | 
						|
    sldi  10,10,3
 | 
						|
    ld    7,8(5)
 | 
						|
    subfic  9,10,64
 | 
						|
    beq   2f
 | 
						|
    sld   0,6,10
 | 
						|
    addi  11,11,-1
 | 
						|
    mr    6,7
 | 
						|
    addi  4,4,-8
 | 
						|
    cmpldi  11,0
 | 
						|
    b     1f
 | 
						|
2:  addi  5,5,8
 | 
						|
    .align  4
 | 
						|
0:  sld   0,6,10
 | 
						|
    srd   8,7,9
 | 
						|
    addi  11,11,-2
 | 
						|
    ld    6,8(5)
 | 
						|
    or    0,0,8
 | 
						|
    cmpldi  11,0
 | 
						|
    std   0,0(4)
 | 
						|
    sld   0,7,10
 | 
						|
1:  srd   8,6,9
 | 
						|
    or    0,0,8
 | 
						|
    beq   8f
 | 
						|
    ld    7,16(5)
 | 
						|
    std   0,8(4)
 | 
						|
    addi  5,5,16
 | 
						|
    addi  4,4,16
 | 
						|
    b     0b
 | 
						|
8:
 | 
						|
    std   0,8(4)
 | 
						|
    b .L8
 | 
						|
END_GEN_TB (BP_SYM (memcpy),TB_TOCLESS)
 | 
						|
libc_hidden_builtin_def (memcpy)
 |