From: "Bryan O'Sullivan"

This assembly version is measurably faster than the generic version in
lib/iomap_copy.c.

Signed-off-by: Bryan O'Sullivan
Cc: Andi Kleen
Signed-off-by: Andrew Morton
---

 arch/x86_64/lib/Makefile     |    2 +-
 arch/x86_64/lib/iomap_copy.S |   37 +++++++++++++++++++++++++++++++++++++
 2 files changed, 38 insertions(+), 1 deletion(-)

diff -puN /dev/null arch/x86_64/lib/iomap_copy.S
--- /dev/null	Thu Apr 11 07:25:15 2002
+++ 25-akpm/arch/x86_64/lib/iomap_copy.S	Thu Jan 12 16:43:17 2006
@@ -0,0 +1,37 @@
+/*
+ * Copyright 2006 PathScale, Inc. All Rights Reserved.
+ *
+ * This file is free software; you can redistribute it and/or modify
+ * it under the terms of version 2 of the GNU General Public License
+ * as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software Foundation,
+ * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA.
+ */
+
+/*
+ * __iowrite32_copy - copy 32-bit units using a single "rep movsl"
+ *
+ * Overrides the generic version in lib/iomap_copy.c.
+ *
+ * In:    %rdi = destination, %rsi = source, %edx = count of 32-bit units
+ * Clobb: %rcx, %rsi, %rdi
+ *
+ * Only the low 32 bits of the count register are read.  The direction
+ * flag is not touched here, so the copy direction is whatever the
+ * caller left in DF.
+ */
+	.globl __iowrite32_copy
+	.type __iowrite32_copy, @function
+	.p2align 4
+__iowrite32_copy:
+	movl %edx,%ecx		/* %rcx = count, upper 32 bits zeroed */
+	rep movsl		/* AT&T spelling; "movsd" doubles as an SSE2 mnemonic */
+	ret
+	.size __iowrite32_copy, .-__iowrite32_copy
diff -puN arch/x86_64/lib/Makefile~add-faster-__iowrite32_copy-routine-for-x86_64 arch/x86_64/lib/Makefile
--- 25/arch/x86_64/lib/Makefile~add-faster-__iowrite32_copy-routine-for-x86_64	Thu Jan 12 16:43:17 2006
+++ 25-akpm/arch/x86_64/lib/Makefile	Thu Jan 12 16:43:17 2006
@@ -4,7 +4,7 @@
 
 CFLAGS_csum-partial.o := -funroll-loops
 
-obj-y := io.o
+obj-y := io.o iomap_copy.o
 
 lib-y := csum-partial.o csum-copy.o csum-wrappers.o delay.o \
 	usercopy.o getuser.o putuser.o \
_