| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* | 
 | 2 |  *  linux/include/asm-arm/xor.h | 
 | 3 |  * | 
 | 4 |  *  Copyright (C) 2001 Russell King | 
 | 5 |  * | 
 | 6 |  * This program is free software; you can redistribute it and/or modify | 
 | 7 |  * it under the terms of the GNU General Public License version 2 as | 
 | 8 |  * published by the Free Software Foundation. | 
 | 9 |  */ | 
 | 10 | #include <asm-generic/xor.h> | 
 | 11 |  | 
 | 12 | #define __XOR(a1, a2) a1 ^= a2 | 
 | 13 |  | 
 | 14 | #define GET_BLOCK_2(dst) \ | 
 | 15 | 	__asm__("ldmia	%0, {%1, %2}" \ | 
 | 16 | 		: "=r" (dst), "=r" (a1), "=r" (a2) \ | 
 | 17 | 		: "0" (dst)) | 
 | 18 |  | 
 | 19 | #define GET_BLOCK_4(dst) \ | 
 | 20 | 	__asm__("ldmia	%0, {%1, %2, %3, %4}" \ | 
 | 21 | 		: "=r" (dst), "=r" (a1), "=r" (a2), "=r" (a3), "=r" (a4) \ | 
 | 22 | 		: "0" (dst)) | 
 | 23 |  | 
 | 24 | #define XOR_BLOCK_2(src) \ | 
 | 25 | 	__asm__("ldmia	%0!, {%1, %2}" \ | 
 | 26 | 		: "=r" (src), "=r" (b1), "=r" (b2) \ | 
 | 27 | 		: "0" (src)); \ | 
 | 28 | 	__XOR(a1, b1); __XOR(a2, b2); | 
 | 29 |  | 
 | 30 | #define XOR_BLOCK_4(src) \ | 
 | 31 | 	__asm__("ldmia	%0!, {%1, %2, %3, %4}" \ | 
 | 32 | 		: "=r" (src), "=r" (b1), "=r" (b2), "=r" (b3), "=r" (b4) \ | 
 | 33 | 		: "0" (src)); \ | 
 | 34 | 	__XOR(a1, b1); __XOR(a2, b2); __XOR(a3, b3); __XOR(a4, b4) | 
 | 35 |  | 
 | 36 | #define PUT_BLOCK_2(dst) \ | 
 | 37 | 	__asm__ __volatile__("stmia	%0!, {%2, %3}" \ | 
 | 38 | 		: "=r" (dst) \ | 
 | 39 | 		: "0" (dst), "r" (a1), "r" (a2)) | 
 | 40 |  | 
 | 41 | #define PUT_BLOCK_4(dst) \ | 
 | 42 | 	__asm__ __volatile__("stmia	%0!, {%2, %3, %4, %5}" \ | 
 | 43 | 		: "=r" (dst) \ | 
 | 44 | 		: "0" (dst), "r" (a1), "r" (a2), "r" (a3), "r" (a4)) | 
 | 45 |  | 
 | 46 | static void | 
 | 47 | xor_arm4regs_2(unsigned long bytes, unsigned long *p1, unsigned long *p2) | 
 | 48 | { | 
 | 49 | 	unsigned int lines = bytes / sizeof(unsigned long) / 4; | 
 | 50 | 	register unsigned int a1 __asm__("r4"); | 
 | 51 | 	register unsigned int a2 __asm__("r5"); | 
 | 52 | 	register unsigned int a3 __asm__("r6"); | 
 | 53 | 	register unsigned int a4 __asm__("r7"); | 
 | 54 | 	register unsigned int b1 __asm__("r8"); | 
 | 55 | 	register unsigned int b2 __asm__("r9"); | 
 | 56 | 	register unsigned int b3 __asm__("ip"); | 
 | 57 | 	register unsigned int b4 __asm__("lr"); | 
 | 58 |  | 
 | 59 | 	do { | 
 | 60 | 		GET_BLOCK_4(p1); | 
 | 61 | 		XOR_BLOCK_4(p2); | 
 | 62 | 		PUT_BLOCK_4(p1); | 
 | 63 | 	} while (--lines); | 
 | 64 | } | 
 | 65 |  | 
 | 66 | static void | 
 | 67 | xor_arm4regs_3(unsigned long bytes, unsigned long *p1, unsigned long *p2, | 
 | 68 | 		unsigned long *p3) | 
 | 69 | { | 
 | 70 | 	unsigned int lines = bytes / sizeof(unsigned long) / 4; | 
 | 71 | 	register unsigned int a1 __asm__("r4"); | 
 | 72 | 	register unsigned int a2 __asm__("r5"); | 
 | 73 | 	register unsigned int a3 __asm__("r6"); | 
 | 74 | 	register unsigned int a4 __asm__("r7"); | 
 | 75 | 	register unsigned int b1 __asm__("r8"); | 
 | 76 | 	register unsigned int b2 __asm__("r9"); | 
 | 77 | 	register unsigned int b3 __asm__("ip"); | 
 | 78 | 	register unsigned int b4 __asm__("lr"); | 
 | 79 |  | 
 | 80 | 	do { | 
 | 81 | 		GET_BLOCK_4(p1); | 
 | 82 | 		XOR_BLOCK_4(p2); | 
 | 83 | 		XOR_BLOCK_4(p3); | 
 | 84 | 		PUT_BLOCK_4(p1); | 
 | 85 | 	} while (--lines); | 
 | 86 | } | 
 | 87 |  | 
 | 88 | static void | 
 | 89 | xor_arm4regs_4(unsigned long bytes, unsigned long *p1, unsigned long *p2, | 
 | 90 | 		unsigned long *p3, unsigned long *p4) | 
 | 91 | { | 
 | 92 | 	unsigned int lines = bytes / sizeof(unsigned long) / 2; | 
 | 93 | 	register unsigned int a1 __asm__("r8"); | 
 | 94 | 	register unsigned int a2 __asm__("r9"); | 
 | 95 | 	register unsigned int b1 __asm__("ip"); | 
 | 96 | 	register unsigned int b2 __asm__("lr"); | 
 | 97 |  | 
 | 98 | 	do { | 
 | 99 | 		GET_BLOCK_2(p1); | 
 | 100 | 		XOR_BLOCK_2(p2); | 
 | 101 | 		XOR_BLOCK_2(p3); | 
 | 102 | 		XOR_BLOCK_2(p4); | 
 | 103 | 		PUT_BLOCK_2(p1); | 
 | 104 | 	} while (--lines); | 
 | 105 | } | 
 | 106 |  | 
 | 107 | static void | 
 | 108 | xor_arm4regs_5(unsigned long bytes, unsigned long *p1, unsigned long *p2, | 
 | 109 | 		unsigned long *p3, unsigned long *p4, unsigned long *p5) | 
 | 110 | { | 
 | 111 | 	unsigned int lines = bytes / sizeof(unsigned long) / 2; | 
 | 112 | 	register unsigned int a1 __asm__("r8"); | 
 | 113 | 	register unsigned int a2 __asm__("r9"); | 
 | 114 | 	register unsigned int b1 __asm__("ip"); | 
 | 115 | 	register unsigned int b2 __asm__("lr"); | 
 | 116 |  | 
 | 117 | 	do { | 
 | 118 | 		GET_BLOCK_2(p1); | 
 | 119 | 		XOR_BLOCK_2(p2); | 
 | 120 | 		XOR_BLOCK_2(p3); | 
 | 121 | 		XOR_BLOCK_2(p4); | 
 | 122 | 		XOR_BLOCK_2(p5); | 
 | 123 | 		PUT_BLOCK_2(p1); | 
 | 124 | 	} while (--lines); | 
 | 125 | } | 
 | 126 |  | 
 | 127 | static struct xor_block_template xor_block_arm4regs = { | 
 | 128 | 	.name	= "arm4regs", | 
 | 129 | 	.do_2	= xor_arm4regs_2, | 
 | 130 | 	.do_3	= xor_arm4regs_3, | 
 | 131 | 	.do_4	= xor_arm4regs_4, | 
 | 132 | 	.do_5	= xor_arm4regs_5, | 
 | 133 | }; | 
 | 134 |  | 
 | 135 | #undef XOR_TRY_TEMPLATES | 
 | 136 | #define XOR_TRY_TEMPLATES			\ | 
 | 137 | 	do {					\ | 
 | 138 | 		xor_speed(&xor_block_arm4regs);	\ | 
 | 139 | 		xor_speed(&xor_block_8regs);	\ | 
 | 140 | 		xor_speed(&xor_block_32regs);	\ | 
 | 141 | 	} while (0) |