mirror of git://sourceware.org/git/glibc.git
				
				
				
			
		
			
				
	
	
		
			352 lines
		
	
	
		
			6.6 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
			
		
		
	
	
			352 lines
		
	
	
		
			6.6 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
| /* strcat (dest, src) -- Append SRC on the end of DEST.
 | |
|    For SPARC v7.
 | |
|    Copyright (C) 1996-2024 Free Software Foundation, Inc.
 | |
|    This file is part of the GNU C Library.
 | |
| 
 | |
|    The GNU C Library is free software; you can redistribute it and/or
 | |
|    modify it under the terms of the GNU Lesser General Public
 | |
|    License as published by the Free Software Foundation; either
 | |
|    version 2.1 of the License, or (at your option) any later version.
 | |
| 
 | |
|    The GNU C Library is distributed in the hope that it will be useful,
 | |
|    but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|    Lesser General Public License for more details.
 | |
| 
 | |
|    You should have received a copy of the GNU Lesser General Public
 | |
|    License along with the GNU C Library; if not, see
 | |
|    <https://www.gnu.org/licenses/>.  */
 | |
| 
 | |
| #include <sysdep.h>
 | |
| 
 | |
| 	/* Normally, this uses ((xword - 0x01010101) & 0x80808080) test
 | |
| 	   to find out if any byte in xword could be zero. This is fast, but
 | |
| 	   also gives false alarm for any byte in range 0x81-0xff. It does
 | |
| 	   not matter for correctness, as if this test tells us there could
 | |
| 	   be some zero byte, we check it byte by byte, but if bytes with
 | |
| 	   high bits set are common in the strings, then this will give poor
 | |
| 	   performance. You can #define EIGHTBIT_NOT_RARE and the algorithm
 | |
| 	   will use one tick slower, but more precise test
 | |
| 	   ((xword - 0x01010101) & (~xword) & 0x80808080),
 | |
| 	   which does not give any false alarms (but if some bits are set,
 | |
| 	   one cannot assume from it which bytes are zero and which are not).
 | |
| 	   It has yet to be measured which default is right for glibc
 | |
| 	   for an average user these days.
 | |
| 	 */
 | |
| 
 | |
| 	.text
 | |
| 	.align		4
 | |
| 
 | |
| ENTRY(strcat)	/* In: %o0 = dest, %o1 = src.  Out: %o0 = original dest.  */
 | |
| 	mov		%o0, %g2	/* %g2 keeps the original dest; every exit returns it.  */
 | |
| 	andcc		%o0, 3, %g0
 | |
| 	be		30f	/* dest is already word aligned.  */
 | |
| 	 sethi		%hi(0x80808080), %o4	/* Delay slot: begin building the 0x80808080 mask.  */
 | |
| 
 | |
| 	ldub		[%o0], %o5	/* Unaligned dest: test up to three leading bytes for NUL.  */
 | |
| 	cmp		%o5, 0
 | |
| 	be		1f
 | |
| 	 add		%o0, 1, %o0	/* Non-annulled delay slot: advances even when NUL was found.  */
 | |
| 	andcc		%o0, 3, %g0
 | |
| 	be		7f
 | |
| 	 or		%o4, %lo(0x80808080), %o3	/* %o3 = 0x80808080.  */
 | |
| 	ldub		[%o0], %o5
 | |
| 	cmp		%o5, 0
 | |
| 	be		2f
 | |
| 	 add		%o0, 1, %o0
 | |
| 	andcc		%o0, 3, %g0
 | |
| 	be		8f
 | |
| 	 sethi		%hi(0x01010101), %o4
 | |
| 	ldub		[%o0], %o5
 | |
| 	cmp		%o5, 0
 | |
| 	be		3f
 | |
| 	 add		%o0, 1, %o0
 | |
| 	b		9f
 | |
| 	 or		%o4, %lo(0x01010101), %o2	/* %o2 = 0x01010101.  */
 | |
| 1:	or		%o4, %lo(0x80808080), %o3	/* NUL found bytewise: 1:/2:/3: finish the remaining mask setup.  */
 | |
| 2:	sethi		%hi(0x01010101), %o4
 | |
| 3:	or		%o4, %lo(0x01010101), %o2
 | |
| 	b		3f	/* Forward to the src alignment code.  */
 | |
| 	 sub		%o0, 1, %o0	/* Undo the delay-slot increment so %o0 points at dest's NUL.  */
 | |
| 
 | |
| 30:	or		%o4, %lo(0x80808080), %o3	/* 30:/7:/8: finish the mask setup for the word loop.  */
 | |
| 7:	sethi		%hi(0x01010101), %o4
 | |
| 8:	or		%o4, %lo(0x01010101), %o2
 | |
| 9:	ld		[%o0], %o5	/* Scan dest one word at a time for its terminating NUL.  */
 | |
| 7:	sub		%o5, %o2, %o4	/* %o4 = word - 0x01010101.  */
 | |
| #ifdef EIGHTBIT_NOT_RARE
 | |
| 	andn		%o4, %o5, %o4
 | |
| #endif
 | |
| 	andcc		%o4, %o3, %g0
 | |
| 	be		9b	/* No byte can be zero: next word.  */
 | |
| 	 add		%o0, 4, %o0
 | |
| 
 | |
| 	srl		%o5, 24, %g5	/* Possible NUL: check bytes, lowest address (bits 31..24) first.  */
 | |
| 	andcc		%g5, 0xff, %g0
 | |
| 	be		3f
 | |
| 	 add		%o0, -4, %o0	/* Step back to the first byte of the word just tested.  */
 | |
| 	srl		%o5, 16, %g5
 | |
| 	andcc		%g5, 0xff, %g0
 | |
| 	be		3f
 | |
| 	 add		%o0, 1, %o0
 | |
| 	srl		%o5, 8, %g5
 | |
| 	andcc		%g5, 0xff, %g0
 | |
| 	be		3f
 | |
| 	 add		%o0, 1, %o0
 | |
| 	andcc		%o5, 0xff, %g0
 | |
| 	add		%o0, 2, %o0	/* Plain add leaves the condition codes alone; %o0 = next word.  */
 | |
| 	bne,a		7b	/* False alarm, no byte was zero: resume the scan.  */
 | |
| 	 ld		[%o0], %o5	/* Annulled slot: the load happens only when the branch is taken.  */
 | |
| 	sub		%o0, 1, %o0	/* The last byte of the word is the NUL.  */
 | |
| 3:	andcc		%o1, 3, %o4	/* %o0 -> dest's NUL.  Now bring src up to word alignment.  */
 | |
| 	be		4f
 | |
| 	 nop
 | |
| 
 | |
| 	cmp		%o4, 2
 | |
| 	be		11f	/* src & 3 == 2: one halfword copy aligns it.  */
 | |
| 	 cmp		%o4, 3	/* Flags are consumed by the "be 13f" below.  */
 | |
| 	ldub		[%o1], %o5	/* src & 3 is 1 or 3: copy one byte.  */
 | |
| 	add		%o1, 1, %o1
 | |
| 	stb		%o5, [%o0]
 | |
| 	be		13f	/* src & 3 was 3: src is word aligned after this byte.  */
 | |
| 	 cmp		%o5, 0
 | |
| 	be		0f	/* The copied byte was the NUL: finished.  */
 | |
| 	 add		%o0, 1, %o0
 | |
| 11:	lduh		[%o1], %o5	/* Copy two bytes from the halfword-aligned src.  */
 | |
| 	add		%o1, 2, %o1
 | |
| 	srl		%o5, 8, %o4	/* %o4 = first (lower-address) byte.  */
 | |
| 	cmp		%o4, 0
 | |
| 	stb		%o4, [%o0]
 | |
| 	bne,a		12f
 | |
| 	 stb		%o5, [%o0 + 1]	/* Second byte is stored only when the first was not NUL.  */
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 12:	andcc		%o5, 0xff, %o5
 | |
| 	bne		4f
 | |
| 	 add		%o0, 2, %o0
 | |
| 	retl
 | |
| 	 mov 		%g2, %o0
 | |
| 13:	bne		4f	/* Flags come from "cmp %o5, 0" in the delay slot above.  */
 | |
| 	 add		%o0, 1, %o0
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 4:	andcc		%o0, 3, %g3	/* src is word aligned; %g3 = dest & 3 selects the copy loop.  */
 | |
| 	bne		12f	/* dest misaligned: use the shift-and-merge loops.  */
 | |
| 1:	ld		[%o1], %o5	/* Also the delay slot of the bne above: runs on both paths.  */
 | |
| 	add		%o1, 4, %o1
 | |
| 	sub		%o5, %o2, %o4
 | |
| #ifdef EIGHTBIT_NOT_RARE
 | |
| 	andn		%o4, %o5, %o4
 | |
| #endif
 | |
| 	add		%o0, 4, %o0
 | |
| 	andcc		%o4, %o3, %g0
 | |
| 	be,a		1b	/* No possible NUL: store the whole word and continue.  */
 | |
| 	 st		%o5, [%o0 - 4]
 | |
| 
 | |
| 	srl		%o5, 24, %g5	/* Possible NUL: find the first zero byte in the word.  */
 | |
| 	andcc		%g5, 0xff, %g0
 | |
| 	be		1f
 | |
| 	 srl		%o5, 16, %g5
 | |
| 	andcc		%g5, 0xff, %g0
 | |
| 	be		2f
 | |
| 	 srl		%o5, 8, %g5
 | |
| 	andcc		%g5, 0xff, %g0
 | |
| 	be		3f
 | |
| 	 andcc		%o5, 0xff, %g0
 | |
| 	bne		1b	/* False alarm: keep copying.  */
 | |
| 	 st		%o5, [%o0 - 4]	/* Non-annulled: also stores the final word ending in NUL.  */
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 3:	srl		%o5, 16, %o5	/* Third byte is NUL: store two bytes, then the NUL.  */
 | |
| 	sth		%o5, [%o0 - 4]
 | |
| 	stb		%g0, [%o0 - 2]
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 2:	srl		%o5, 16, %o5	/* Second byte is NUL: the upper halfword holds byte + NUL.  */
 | |
| 	sth		%o5, [%o0 - 4]
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 1:	stb		%g0, [%o0 - 4]	/* First byte is NUL: store only the terminator.  */
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 12:	add		%o1, 4, %o1	/* Misaligned dest; %o5 already holds the first src word.  */
 | |
| 	sub		%o5, %o2, %o4
 | |
| 	cmp		%g3, 2
 | |
| 	be		2f	/* dest & 3 == 2.  */
 | |
| 	 cmp		%g3, 3
 | |
| 	be		3f	/* dest & 3 == 3.  */
 | |
| 	 andcc		%o4, %o3, %g0	/* Possible-NUL test; flags are used at 3: or just below.  */
 | |
| 	bne		5f	/* dest & 3 == 1 and the first word may hold a NUL.  */
 | |
| 	 srl		%o5, 24, %g5
 | |
| 	stb		%g5, [%o0]	/* Store 1 byte + 2 bytes so that dest becomes word aligned.  */
 | |
| 	sub		%o0, 1, %o0
 | |
| 	srl		%o5, 8, %g5
 | |
| 	sth		%g5, [%o0 + 2]
 | |
| 1:	add		%o0, 4, %o0
 | |
| 4:	sll		%o5, 24, %g6	/* Carry the last byte of the previous word into the top byte.  */
 | |
| 	ld		[%o1], %o5
 | |
| 	add		%o1, 4, %o1
 | |
| 	srl		%o5, 8, %g5
 | |
| 	sub		%o5, %o2, %o4
 | |
| #ifdef EIGHTBIT_NOT_RARE
 | |
| 	andn		%o4, %o5, %o4
 | |
| #endif
 | |
| 	or		%g5, %g6, %g5	/* %g5 = carried byte followed by the first 3 bytes of the new word.  */
 | |
| 	andcc		%o4, %o3, %g0
 | |
| 	be,a		1b
 | |
| 	 st		%g5, [%o0]
 | |
| 	srl		%o5, 24, %o4
 | |
| 	andcc		%o4, 0xff, %g0
 | |
| 	be		6f	/* First byte of the new word is NUL.  */
 | |
| 	 srl		%o5, 16, %o4
 | |
| 	andcc		%o4, 0xff, %g0
 | |
| 	be		7f	/* Second byte of the new word is NUL.  */
 | |
| 	 srl		%o5, 8, %o4
 | |
| 	st		%g5, [%o0]
 | |
| 	andcc		%o4, 0xff, %g0
 | |
| 	be		0f	/* Third byte is NUL and was stored as part of the word.  */
 | |
| 	 andcc		%o5, 0xff, %g0
 | |
| 1:	bne		4b	/* Last byte non-zero: false alarm, continue the loop.  */
 | |
| 	 add		%o0, 4, %o0
 | |
| 9:	stb		%g0, [%o0]	/* Write the terminating NUL.  */
 | |
| 0:	retl	/* Shared exit.  */
 | |
| 	 mov		%g2, %o0	/* Delay slot: return value = original dest.  */
 | |
| 
 | |
| 6:	srl		%g5, 16, %g5	/* Store the carried byte followed by the NUL.  */
 | |
| 	sth		%g5, [%o0]
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 7:	srl		%g5, 16, %g5	/* Store the carried byte, one new byte, then the NUL.  */
 | |
| 	sth		%g5, [%o0]
 | |
| 	stb		%g0, [%o0 + 2]
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 5:	andcc		%g5, 0xff, %g4	/* dest & 3 == 1, first word may hold a NUL; %g4 = first byte.  */
 | |
| 	be		9b
 | |
| 	 srl		%o5, 16, %g5
 | |
| 	andcc		%g5, 0xff, %g0
 | |
| 	be		7f
 | |
| 	 srl		%o5, 8, %g5
 | |
| 	andcc		%g5, 0xff, %g0	/* Third-byte test; flags survive the stores and the sub below.  */
 | |
| 	stb		%g4, [%o0]
 | |
| 	sth		%g5, [%o0 + 1]
 | |
| 	sub		%o0, 1, %o0
 | |
| 	bne		1b	/* Third byte non-zero: rejoin the loop at its last-byte test.  */
 | |
| 	 andcc		%o5, 0xff, %g0
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 7:	stb		%g4, [%o0]	/* Second byte is NUL: store the first byte, then the NUL.  */
 | |
| 	stb		%g0, [%o0 + 1]
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 2:	andcc		%o4, %o3, %g0	/* dest & 3 == 2.  */
 | |
| 	bne		5f
 | |
| 	 srl		%o5, 16, %g5
 | |
| 	sth		%g5, [%o0]	/* Store the upper halfword so that dest becomes word aligned.  */
 | |
| 	sub		%o0, 2, %o0
 | |
| 1:	add		%o0, 4, %o0
 | |
| 4:	sll		%o5, 16, %g6	/* Carry the lower halfword of the previous word upward.  */
 | |
| 	ld		[%o1], %o5
 | |
| 	add		%o1, 4, %o1
 | |
| 	srl		%o5, 16, %g5
 | |
| 	sub		%o5, %o2, %o4
 | |
| #ifdef EIGHTBIT_NOT_RARE
 | |
| 	andn		%o4, %o5, %o4
 | |
| #endif
 | |
| 	or		%g5, %g6, %g5	/* %g5 = 2 carried bytes followed by the first 2 bytes of the new word.  */
 | |
| 	andcc		%o4, %o3, %g0
 | |
| 	be,a		1b
 | |
| 	 st		%g5, [%o0]
 | |
| 	srl		%o5, 24, %o4
 | |
| 	andcc		%o4, 0xff, %g0
 | |
| 	be		7f	/* First byte of the new word is NUL.  */
 | |
| 	 srl		%o5, 16, %o4
 | |
| 	st		%g5, [%o0]
 | |
| 	andcc		%o4, 0xff, %g0
 | |
| 	be		0b	/* Second byte is NUL and was stored as part of the word.  */
 | |
| 	 srl		%o5, 8, %o4
 | |
| 1:	andcc		%o4, 0xff, %g0
 | |
| 	be		8f	/* Third byte is NUL: it belongs at %o0 + 4.  */
 | |
| 	 andcc		%o5, 0xff, %g0
 | |
| 	bne		4b
 | |
| 	 add		%o0, 4, %o0
 | |
| 	sth		%o5, [%o0]	/* Lower halfword = third byte followed by the NUL.  */
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 7:	srl		%g5, 16, %g5	/* Store the 2 carried bytes, then the NUL.  */
 | |
| 	sth		%g5, [%o0]
 | |
| 	stb		%g0, [%o0 + 2]
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 8:	stb		%g0, [%o0 + 4]	/* NUL goes right after the 4 bytes already written at %o0.  */
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 5:	srl		%o5, 24, %g5	/* dest & 3 == 2, first word may hold a NUL.  */
 | |
| 	andcc		%g5, 0xff, %g0
 | |
| 	be		9b
 | |
| 	 srl		%o5, 16, %g5
 | |
| 	andcc		%g5, 0xff, %g0	/* Second-byte test; flags survive the sth and the sub below.  */
 | |
| 	sth		%g5, [%o0]
 | |
| 	sub		%o0, 2, %o0
 | |
| 	bne		1b	/* Second byte non-zero: rejoin the loop at its third-byte test.  */
 | |
| 	 srl		%o5, 8, %o4
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 
 | |
| 3:	bne		5f	/* dest & 3 == 3; flags come from the andcc in the delay slot of "be 3f".  */
 | |
| 	 srl		%o5, 24, %g5
 | |
| 	stb		%g5, [%o0]	/* Store one byte so that dest becomes word aligned.  */
 | |
| 	sub		%o0, 3, %o0
 | |
| 1:	add		%o0, 4, %o0
 | |
| 4:	sll		%o5, 8, %g6	/* Carry the last 3 bytes of the previous word upward.  */
 | |
| 	ld		[%o1], %o5
 | |
| 	add		%o1, 4, %o1
 | |
| 	srl		%o5, 24, %g5
 | |
| 	sub		%o5, %o2, %o4
 | |
| #ifdef EIGHTBIT_NOT_RARE
 | |
| 	andn		%o4, %o5, %o4
 | |
| #endif
 | |
| 	or		%g5, %g6, %g5	/* %g5 = 3 carried bytes followed by the first byte of the new word.  */
 | |
| 	andcc		%o4, %o3, %g0
 | |
| 	be		1b
 | |
| 	 st		%g5, [%o0]	/* Not annulled: the merged word is stored on both paths.  */
 | |
| 	srl		%o5, 24, %o4
 | |
| 	andcc		%o4, 0xff, %g0
 | |
| 	be		0b	/* First byte is NUL and was stored as part of the word.  */
 | |
| 	 srl		%o5, 16, %o4
 | |
| 1:	andcc		%o4, 0xff, %g0
 | |
| 	be		8b	/* Second byte is NUL: it belongs at %o0 + 4.  */
 | |
| 	 srl		%o5, 8, %o4
 | |
| 	andcc		%o4, 0xff, %g0
 | |
| 	be		9f
 | |
| 	 andcc		%o5, 0xff, %g0
 | |
| 	bne		4b
 | |
| 	 add		%o0, 4, %o0
 | |
| 	srl		%o5, 8, %o5	/* Last byte is NUL: store bytes 2 and 3, then the NUL.  */
 | |
| 	sth		%o5, [%o0]
 | |
| 	stb		%g0, [%o0 + 2]
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 9:	srl		%o5, 8, %o5	/* Third byte is NUL: store the second byte followed by the NUL.  */
 | |
| 	sth		%o5, [%o0 + 4]
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| 5:	andcc		%g5, 0xff, %g0	/* dest & 3 == 3, first word may hold a NUL; %g5 = first byte.  */
 | |
| 	stb		%g5, [%o0]
 | |
| 	sub		%o0, 3, %o0
 | |
| 	bne		1b	/* First byte non-zero: rejoin the loop at its second-byte test.  */
 | |
| 	 srl		%o5, 16, %o4
 | |
| 	retl
 | |
| 	 mov		%g2, %o0
 | |
| END(strcat)
 | |
| libc_hidden_builtin_def (strcat)
 |