Subject: ARM bswap optimizations
To: None <port-arm@netbsd.org>
From: Jason R Thorpe <thorpej@wasabisystems.com>
List: port-arm
Date: 08/13/2002 13:51:43
--6c2NcOVqGQ03X4Wi
Content-Type: text/plain; charset=us-ascii
Content-Disposition: inline

Hi folks...

I'm wanting to shave some cycles out of the TCP/IP code on ARM.  hton*()
and ntoh*() is low-hanging fruit.  The issues:

	* Constants are not byte-swapped at compile-time.

	* A function must be called to do the byte-swap.  This costs
	  3 cycles to call the function (one to branch, 2 for the
	  pipeline flush), and 3 cycles to return.  This is significant
	  overhead if you consider that it's 4 insns to byte-swap an int,
	  and 3 insns to byte-swap a short.

The following patch addresses these issues.  I'd appreciate it if people
would read it over to make sure that I didn't screw up the asm (mostly
the constraints :-)  I've booted it multi-user on an XScale.

-- 
        -- Jason R. Thorpe <thorpej@wasabisystems.com>

--6c2NcOVqGQ03X4Wi
Content-Type: text/plain; charset=us-ascii
Content-Disposition: attachment; filename=bswap-diff

Index: Makefile
===================================================================
RCS file: /cvsroot/syssrc/sys/arch/arm/include/Makefile,v
retrieving revision 1.25
diff -c -r1.25 Makefile
*** Makefile	2002/08/07 05:14:58	1.25
--- Makefile	2002/08/13 20:34:20
***************
*** 4,10 ****
  INCSDIR= /usr/include/arm
  
  INCS=	ansi.h aout_machdep.h armreg.h asm.h \
! 	bswap.h bus.h \
  	cdefs.h cpu.h \
  	db_machdep.h disklabel.h \
  	elf_machdep.h endian.h endian_machdep.h \
--- 4,10 ----
  INCSDIR= /usr/include/arm
  
  INCS=	ansi.h aout_machdep.h armreg.h asm.h \
! 	bswap.h byte_swap.h bus.h \
  	cdefs.h cpu.h \
  	db_machdep.h disklabel.h \
  	elf_machdep.h endian.h endian_machdep.h \
Index: bswap.h
===================================================================
RCS file: /cvsroot/syssrc/sys/arch/arm/include/bswap.h,v
retrieving revision 1.1
diff -c -r1.1 bswap.h
*** bswap.h	2001/01/10 19:02:05	1.1
--- bswap.h	2002/08/13 20:34:20
***************
*** 6,9 ****
--- 6,17 ----
  #define __BSWAP_RENAME
  #include <sys/bswap.h>
  
+ #ifdef __GNUC__
+ /* With GCC, route bswap16()/bswap32() to the <arm/byte_swap.h> macros. */
+ #include <arm/byte_swap.h>
+ #define	bswap16(x)	__byte_swap_word(x)
+ #define	bswap32(x)	__byte_swap_long(x)
+ 
+ #endif /* __GNUC__ */
+ 
  #endif /* !_MACHINE_BSWAP_H_ */
Index: byte_swap.h
===================================================================
RCS file: byte_swap.h
diff -N byte_swap.h
*** /dev/null	Tue Aug 13 23:34:08 2002
--- byte_swap.h	Tue Aug 13 23:34:20 2002
***************
*** 0 ****
--- 1,102 ----
+ /*	$NetBSD$	*/
+ 
+ /*-
+  * Copyright (c) 1997, 1999, 2002 The NetBSD Foundation, Inc.
+  * All rights reserved.
+  *
+  * This code is derived from software contributed to The NetBSD Foundation
+  * by Charles M. Hannum, Neil A. Carson, and Jason R. Thorpe.
+  *
+  * Redistribution and use in source and binary forms, with or without
+  * modification, are permitted provided that the following conditions
+  * are met:
+  * 1. Redistributions of source code must retain the above copyright
+  *    notice, this list of conditions and the following disclaimer.
+  * 2. Redistributions in binary form must reproduce the above copyright
+  *    notice, this list of conditions and the following disclaimer in the
+  *    documentation and/or other materials provided with the distribution.
+  * 3. All advertising materials mentioning features or use of this software
+  *    must display the following acknowledgement:
+  *	This product includes software developed by the NetBSD
+  *	Foundation, Inc. and its contributors.
+  * 4. Neither the name of The NetBSD Foundation nor the names of its
+  *    contributors may be used to endorse or promote products derived
+  *    from this software without specific prior written permission.
+  *
+  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
+  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
+  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
+  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
+  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
+  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
+  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
+  * POSSIBILITY OF SUCH DAMAGE.
+  */
+ 
+ #ifndef _ARM_BYTE_SWAP_H_
+ #define	_ARM_BYTE_SWAP_H_
+ 
+ #include <sys/types.h>
+ 
+ static __inline u_int32_t
+ __byte_swap_long_variable(u_int32_t v)
+ {
+ 	int tmp;	/* scratch register for the byte-fixup mask */
+ 	/* Return v with its four bytes reversed (ABCD -> DCBA), in four insns. */
+ 	__asm __volatile(
+ 		"eor	%1, %2, %2, ror #16\n"	/* tmp = v ^ ror(v, 16) */
+ 		"bic	%1, %1, #0x00ff0000\n"	/* clear bits 16-23 of tmp */
+ 		"mov	%0, %2, ror #8\n"	/* result = ror(v, 8) */
+ 		"eor	%0, %0, %1, lsr #8"	/* result ^= tmp >> 8 */
+ 	: "=r" (v), "=&r" (tmp)	/* '&': tmp is written before the last read of %2 */
+ 	: "r" (v));
+ 
+ 	return (v);
+ }
+ 
+ static __inline u_int16_t
+ __byte_swap_word_variable(u_int16_t v)
+ {
+ 	int tmp;	/* scratch register holding the low byte */
+ 	/* Return v with its two bytes exchanged (AB -> BA), in three insns. */
+ 	__asm __volatile(
+ 		"and	%1, %2, #0xff\n"	/* tmp = v & 0xff */
+ 		"mov	%0, %2, lsr #8\n"	/* result = v >> 8 */
+ 		"orr	%0, %0, %1, lsl #8"	/* result |= tmp << 8 */
+ 	: "=r" (v), "=&r" (tmp)	/* '&': tmp is written before the last read of %2 */
+ 	: "r" (v));	/* NOTE(review): assumes bits 16-31 of %2 are zero - confirm */
+ 
+ 	return (v);
+ }
+ 
+ #ifdef __OPTIMIZE__
+ /* Swap constant arguments with plain C expressions, others with the asm. */
+ #define	__byte_swap_long_constant(x)	\
+ 	((((x) & 0xff000000U) >> 24) |	\
+ 	 (((x) & 0x00ff0000U) >>  8) |	\
+ 	 (((x) & 0x0000ff00U) <<  8) |	\
+ 	 (((x) & 0x000000ffU) << 24))	/* unsigned masks: no shift into the sign bit */
+ 
+ #define	__byte_swap_word_constant(x)	\
+ 	((((x) & 0xff00) >> 8) |	\
+ 	 (((x) & 0x00ff) << 8))
+ 
+ #define	__byte_swap_long(x)		\
+ 	(__builtin_constant_p((x)) ?	\
+ 	 __byte_swap_long_constant(x) :	__byte_swap_long_variable(x))
+ 
+ #define	__byte_swap_word(x)		\
+ 	(__builtin_constant_p((x)) ?	\
+ 	 __byte_swap_word_constant(x) : __byte_swap_word_variable(x))
+ 
+ #else
+ /* Not optimizing: always go through the inline asm versions. */
+ #define	__byte_swap_long(x)	__byte_swap_long_variable(x)
+ #define	__byte_swap_word(x)	__byte_swap_word_variable(x)
+ 
+ #endif /* __OPTIMIZE__ */
+ 
+ #endif /* _ARM_BYTE_SWAP_H_ */
Index: endian_machdep.h
===================================================================
RCS file: /cvsroot/syssrc/sys/arch/arm/include/endian_machdep.h,v
retrieving revision 1.3
diff -c -r1.3 endian_machdep.h
*** endian_machdep.h	2001/02/17 14:55:44	1.3
--- endian_machdep.h	2002/08/13 20:34:20
***************
*** 6,8 ****
--- 6,19 ----
  #else
  #define _BYTE_ORDER _LITTLE_ENDIAN
  #endif
+ 
+ #ifdef __GNUC__
+ /* Inline host/network conversions; a swap is only right on little-endian. */
+ #include <arm/byte_swap.h>
+ #if _BYTE_ORDER == _LITTLE_ENDIAN	/* NOTE(review): relies on the includer defining _LITTLE_ENDIAN - confirm */
+ #define	ntohl(x)	((in_addr_t)__byte_swap_long((in_addr_t)(x)))
+ #define	ntohs(x)	((in_port_t)__byte_swap_word((in_port_t)(x)))
+ #define	htonl(x)	((in_addr_t)__byte_swap_long((in_addr_t)(x)))
+ #define	htons(x)	((in_port_t)__byte_swap_word((in_port_t)(x)))
+ #endif /* _BYTE_ORDER == _LITTLE_ENDIAN */
+ #endif

--6c2NcOVqGQ03X4Wi--