[patch 2.6.16-rc5-mm2] i386 memcpy: optimal memcpy for IO

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



From: H. Peter Anvin <[email protected]>

Optimal memcpy for moves to/from IO space.  Does as few moves as
possible while keeping transfers optimally aligned.

Signed-off-by: Chuck Ebbert <[email protected]>

---

Andrew, remove i386-memcpy-use-as-few-moves-as.patch from -mm
and replace it with this, please.

 arch/i386/lib/memcpy.c |   57 +++++++++++++++++++++++++++++++++++++++++++++++++
 include/asm-i386/io.h  |   11 ++-------
 2 files changed, 60 insertions(+), 8 deletions(-)

--- 2.6.17-rc5-32.orig/arch/i386/lib/memcpy.c
+++ 2.6.17-rc5-32/arch/i386/lib/memcpy.c
@@ -42,3 +42,60 @@ void *memmove(void *dest, const void *sr
 	return dest;
 }
 EXPORT_SYMBOL(memmove);
+
+/*
+ * The most general form of memory copy to/from I/O space, used for
+ * devices which can handle arbitrary transactions with appropriate
+ * handling of byte enables.  The goal is to produce the minimum
+ * number of naturally aligned transactions on the bus.
+ */
+
+#define build_memcpy_io(dst, src, count, align_reg)	\
+({							\
+unsigned long d0, d1, d2, d3;				\
+asm volatile(						\
+	"jecxz	1f\n\t"					\
+							\
+	"testl	$1, " align_reg "\n\t"			\
+	"jz	2f\n\t"					\
+	"movsb\n\t"					\
+	"decl	%2\n"					\
+"2:\n\t"						\
+	"cmpl	$2, %2\n\t"				\
+	"jb	3f\n\t"					\
+	"testl	$2, " align_reg "\n\t"			\
+	"jz	4f\n\t"					\
+	"movsw\n\t"					\
+	"decl	%2\n\t"					\
+	"decl	%2\n"					\
+"4:\n\t"						\
+	"movl	%2, %3\n\t"				\
+	"shrl	$2, %2\n\t"				\
+	"jz	5f\n\t"					\
+	"rep ; movsl\n"					\
+"5:\n\t"						\
+	"movl	%3, %2\n\t"				\
+	"testb	$2, %b2\n\t"				\
+	"jz	3f\n\t"					\
+	"movsw\n"					\
+"3:\n\t"						\
+	"testb	$1, %b2\n\t"				\
+	"jz	1f\n\t"					\
+	"movsb\n"					\
+"1:"							\
+	: "=&D" (d0), "=&S" (d1), "=&c" (d2), "=&g" (d3)\
+	: "0" (dst), "1" (src), "2" (count)		\
+	: "memory");					\
+})
+
+void memcpy_fromio(void *dst, const volatile void __iomem *src, int count)
+{
+	build_memcpy_io(dst, src, count, "%%esi");
+}
+EXPORT_SYMBOL(memcpy_fromio)
+
+void memcpy_toio(volatile void __iomem *dst, const void *src, int count)
+{
+	build_memcpy_io(dst, src, count, "%%edi");
+}
+EXPORT_SYMBOL(memcpy_toio)
--- 2.6.17-rc5-32.orig/include/asm-i386/io.h
+++ 2.6.17-rc5-32/include/asm-i386/io.h
@@ -200,14 +200,9 @@ static inline void memset_io(volatile vo
 {
 	memset((void __force *) addr, val, count);
 }
-static inline void memcpy_fromio(void *dst, const volatile void __iomem *src, int count)
-{
-	__memcpy(dst, (void __force *) src, count);
-}
-static inline void memcpy_toio(volatile void __iomem *dst, const void *src, int count)
-{
-	__memcpy((void __force *) dst, src, count);
-}
+
+extern void memcpy_fromio(void *dst, const volatile void __iomem *src, int count);
+extern void memcpy_toio(volatile void __iomem *dst, const void *src, int count);
 
 /*
  * ISA space is 'always mapped' on a typical x86 system, no need to
-- 
Chuck
-
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to [email protected]
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/

[Index of Archives]     [Kernel Newbies]     [Netfilter]     [Bugtraq]     [Photo]     [Stuff]     [Gimp]     [Yosemite News]     [MIPS Linux]     [ARM Linux]     [Linux Security]     [Linux RAID]     [Video 4 Linux]     [Linux for the blind]     [Linux Resources]
  Powered by Linux