| /* | 
 |  *  Generic fillrect for frame buffers with packed pixels of any depth. | 
 |  * | 
 |  *      Copyright (C)  2000 James Simmons (jsimmons@linux-fbdev.org) | 
 |  * | 
 |  *  This file is subject to the terms and conditions of the GNU General Public | 
 |  *  License.  See the file COPYING in the main directory of this archive for | 
 |  *  more details. | 
 |  * | 
 |  * NOTES: | 
 |  * | 
 |  *  The code for depths like 24 that don't have integer number of pixels per | 
 |  *  long is broken and needs to be fixed. For now I turned these types of | 
 |  *  mode off. | 
 |  * | 
 *  Also need to add code to deal with cards whose endianness differs from
 *  the native CPU endianness. The MSB position in the word must be handled too.
 |  * | 
 |  */ | 
 | #include <linux/config.h> | 
 | #include <linux/module.h> | 
 | #include <linux/string.h> | 
 | #include <linux/fb.h> | 
 | #include <asm/types.h> | 
 |  | 
/*
 *  The fill routines in this file access the frame buffer through
 *  unsigned long pointers.  Pick the accessor pair used for those accesses:
 *  fb_writel/fb_readl when BITS_PER_LONG is 32, fb_writeq/fb_readq otherwise.
 */
#if BITS_PER_LONG == 32
#  define FB_WRITEL fb_writel
#  define FB_READL  fb_readl
#else
#  define FB_WRITEL fb_writeq
#  define FB_READL  fb_readq
#endif
 |  | 
 |     /* | 
 |      *  Compose two values, using a bitmask as decision value | 
 |      *  This is equivalent to (a & mask) | (b & ~mask) | 
 |      */ | 
 |  | 
 | static inline unsigned long | 
 | comp(unsigned long a, unsigned long b, unsigned long mask) | 
 | { | 
 |     return ((a ^ b) & mask) ^ b; | 
 | } | 
 |  | 
 |     /* | 
 |      *  Create a pattern with the given pixel's color | 
 |      */ | 
 |  | 
 | #if BITS_PER_LONG == 64 | 
 | static inline unsigned long | 
 | pixel_to_pat( u32 bpp, u32 pixel) | 
 | { | 
 | 	switch (bpp) { | 
 | 	case 1: | 
 | 		return 0xfffffffffffffffful*pixel; | 
 | 	case 2: | 
 | 		return 0x5555555555555555ul*pixel; | 
 | 	case 4: | 
 | 		return 0x1111111111111111ul*pixel; | 
 | 	case 8: | 
 | 		return 0x0101010101010101ul*pixel; | 
 | 	case 12: | 
 | 		return 0x0001001001001001ul*pixel; | 
 | 	case 16: | 
 | 		return 0x0001000100010001ul*pixel; | 
 | 	case 24: | 
 | 		return 0x0000000001000001ul*pixel; | 
 | 	case 32: | 
 | 		return 0x0000000100000001ul*pixel; | 
 | 	default: | 
 | 		panic("pixel_to_pat(): unsupported pixelformat\n"); | 
 |     } | 
 | } | 
 | #else | 
 | static inline unsigned long | 
 | pixel_to_pat( u32 bpp, u32 pixel) | 
 | { | 
 | 	switch (bpp) { | 
 | 	case 1: | 
 | 		return 0xfffffffful*pixel; | 
 | 	case 2: | 
 | 		return 0x55555555ul*pixel; | 
 | 	case 4: | 
 | 		return 0x11111111ul*pixel; | 
 | 	case 8: | 
 | 		return 0x01010101ul*pixel; | 
 | 	case 12: | 
 | 		return 0x00001001ul*pixel; | 
 | 	case 16: | 
 | 		return 0x00010001ul*pixel; | 
 | 	case 24: | 
 | 		return 0x00000001ul*pixel; | 
 | 	case 32: | 
 | 		return 0x00000001ul*pixel; | 
 | 	default: | 
 | 		panic("pixel_to_pat(): unsupported pixelformat\n"); | 
 |     } | 
 | } | 
 | #endif | 
 |  | 
 |     /* | 
 |      *  Aligned pattern fill using 32/64-bit memory accesses | 
 |      */ | 
 |  | 
 | static void | 
 | bitfill_aligned(unsigned long __iomem *dst, int dst_idx, unsigned long pat, unsigned n, int bits) | 
 | { | 
 | 	unsigned long first, last; | 
 |  | 
 | 	if (!n) | 
 | 		return; | 
 |  | 
 | 	first = ~0UL >> dst_idx; | 
 | 	last = ~(~0UL >> ((dst_idx+n) % bits)); | 
 |  | 
 | 	if (dst_idx+n <= bits) { | 
 | 		// Single word | 
 | 		if (last) | 
 | 			first &= last; | 
 | 		FB_WRITEL(comp(pat, FB_READL(dst), first), dst); | 
 | 	} else { | 
 | 		// Multiple destination words | 
 |  | 
 | 		// Leading bits | 
 | 		if (first!= ~0UL) { | 
 | 			FB_WRITEL(comp(pat, FB_READL(dst), first), dst); | 
 | 			dst++; | 
 | 			n -= bits - dst_idx; | 
 | 		} | 
 |  | 
 | 		// Main chunk | 
 | 		n /= bits; | 
 | 		while (n >= 8) { | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			n -= 8; | 
 | 		} | 
 | 		while (n--) | 
 | 			FB_WRITEL(pat, dst++); | 
 |  | 
 | 		// Trailing bits | 
 | 		if (last) | 
 | 			FB_WRITEL(comp(pat, FB_READL(dst), last), dst); | 
 | 	} | 
 | } | 
 |  | 
 |  | 
 |     /* | 
 |      *  Unaligned generic pattern fill using 32/64-bit memory accesses | 
 |      *  The pattern must have been expanded to a full 32/64-bit value | 
 |      *  Left/right are the appropriate shifts to convert to the pattern to be | 
 |      *  used for the next 32/64-bit word | 
 |      */ | 
 |  | 
 | static void | 
 | bitfill_unaligned(unsigned long __iomem *dst, int dst_idx, unsigned long pat, | 
 | 			int left, int right, unsigned n, int bits) | 
 | { | 
 | 	unsigned long first, last; | 
 |  | 
 | 	if (!n) | 
 | 		return; | 
 |  | 
 | 	first = ~0UL >> dst_idx; | 
 | 	last = ~(~0UL >> ((dst_idx+n) % bits)); | 
 |  | 
 | 	if (dst_idx+n <= bits) { | 
 | 		// Single word | 
 | 		if (last) | 
 | 			first &= last; | 
 | 		FB_WRITEL(comp(pat, FB_READL(dst), first), dst); | 
 | 	} else { | 
 | 		// Multiple destination words | 
 | 		// Leading bits | 
 | 		if (first) { | 
 | 			FB_WRITEL(comp(pat, FB_READL(dst), first), dst); | 
 | 			dst++; | 
 | 			pat = pat << left | pat >> right; | 
 | 			n -= bits - dst_idx; | 
 | 		} | 
 |  | 
 | 		// Main chunk | 
 | 		n /= bits; | 
 | 		while (n >= 4) { | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			pat = pat << left | pat >> right; | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			pat = pat << left | pat >> right; | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			pat = pat << left | pat >> right; | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			pat = pat << left | pat >> right; | 
 | 			n -= 4; | 
 | 		} | 
 | 		while (n--) { | 
 | 			FB_WRITEL(pat, dst++); | 
 | 			pat = pat << left | pat >> right; | 
 | 		} | 
 |  | 
 | 		// Trailing bits | 
 | 		if (last) | 
 | 			FB_WRITEL(comp(pat, FB_READL(dst), first), dst); | 
 | 	} | 
 | } | 
 |  | 
 |     /* | 
 |      *  Aligned pattern invert using 32/64-bit memory accesses | 
 |      */ | 
 | static void | 
 | bitfill_aligned_rev(unsigned long __iomem *dst, int dst_idx, unsigned long pat, unsigned n, int bits) | 
 | { | 
 | 	unsigned long val = pat, dat; | 
 | 	unsigned long first, last; | 
 |  | 
 | 	if (!n) | 
 | 		return; | 
 |  | 
 | 	first = ~0UL >> dst_idx; | 
 | 	last = ~(~0UL >> ((dst_idx+n) % bits)); | 
 |  | 
 | 	if (dst_idx+n <= bits) { | 
 | 		// Single word | 
 | 		if (last) | 
 | 			first &= last; | 
 | 		dat = FB_READL(dst); | 
 | 		FB_WRITEL(comp(dat ^ val, dat, first), dst); | 
 | 	} else { | 
 | 		// Multiple destination words | 
 | 		// Leading bits | 
 | 		if (first!=0UL) { | 
 | 			dat = FB_READL(dst); | 
 | 			FB_WRITEL(comp(dat ^ val, dat, first), dst); | 
 | 			dst++; | 
 | 			n -= bits - dst_idx; | 
 | 		} | 
 |  | 
 | 		// Main chunk | 
 | 		n /= bits; | 
 | 		while (n >= 8) { | 
 | 			FB_WRITEL(FB_READL(dst) ^ val, dst); | 
 | 			dst++; | 
 | 			FB_WRITEL(FB_READL(dst) ^ val, dst); | 
 | 			dst++; | 
 | 			FB_WRITEL(FB_READL(dst) ^ val, dst); | 
 | 			dst++; | 
 | 			FB_WRITEL(FB_READL(dst) ^ val, dst); | 
 | 			dst++; | 
 | 			FB_WRITEL(FB_READL(dst) ^ val, dst); | 
 | 			dst++; | 
 | 			FB_WRITEL(FB_READL(dst) ^ val, dst); | 
 | 			dst++; | 
 | 			FB_WRITEL(FB_READL(dst) ^ val, dst); | 
 | 			dst++; | 
 | 			FB_WRITEL(FB_READL(dst) ^ val, dst); | 
 | 			dst++; | 
 | 			n -= 8; | 
 | 		} | 
 | 		while (n--) { | 
 | 			FB_WRITEL(FB_READL(dst) ^ val, dst); | 
 | 			dst++; | 
 | 		} | 
 | 		// Trailing bits | 
 | 		if (last) { | 
 | 			dat = FB_READL(dst); | 
 | 			FB_WRITEL(comp(dat ^ val, dat, last), dst); | 
 | 		} | 
 | 	} | 
 | } | 
 |  | 
 |  | 
 |     /* | 
 |      *  Unaligned generic pattern invert using 32/64-bit memory accesses | 
 |      *  The pattern must have been expanded to a full 32/64-bit value | 
 |      *  Left/right are the appropriate shifts to convert to the pattern to be | 
 |      *  used for the next 32/64-bit word | 
 |      */ | 
 |  | 
 | static void | 
 | bitfill_unaligned_rev(unsigned long __iomem *dst, int dst_idx, unsigned long pat, | 
 | 			int left, int right, unsigned n, int bits) | 
 | { | 
 | 	unsigned long first, last, dat; | 
 |  | 
 | 	if (!n) | 
 | 		return; | 
 |  | 
 | 	first = ~0UL >> dst_idx; | 
 | 	last = ~(~0UL >> ((dst_idx+n) % bits)); | 
 |  | 
 | 	if (dst_idx+n <= bits) { | 
 | 		// Single word | 
 | 		if (last) | 
 | 			first &= last; | 
 | 		dat = FB_READL(dst); | 
 | 		FB_WRITEL(comp(dat ^ pat, dat, first), dst); | 
 | 	} else { | 
 | 		// Multiple destination words | 
 |  | 
 | 		// Leading bits | 
 | 		if (first != 0UL) { | 
 | 			dat = FB_READL(dst); | 
 | 			FB_WRITEL(comp(dat ^ pat, dat, first), dst); | 
 | 			dst++; | 
 | 			pat = pat << left | pat >> right; | 
 | 			n -= bits - dst_idx; | 
 | 		} | 
 |  | 
 | 		// Main chunk | 
 | 		n /= bits; | 
 | 		while (n >= 4) { | 
 | 			FB_WRITEL(FB_READL(dst) ^ pat, dst); | 
 | 			dst++; | 
 | 			pat = pat << left | pat >> right; | 
 | 			FB_WRITEL(FB_READL(dst) ^ pat, dst); | 
 | 			dst++; | 
 | 			pat = pat << left | pat >> right; | 
 | 			FB_WRITEL(FB_READL(dst) ^ pat, dst); | 
 | 			dst++; | 
 | 			pat = pat << left | pat >> right; | 
 | 			FB_WRITEL(FB_READL(dst) ^ pat, dst); | 
 | 			dst++; | 
 | 			pat = pat << left | pat >> right; | 
 | 			n -= 4; | 
 | 		} | 
 | 		while (n--) { | 
 | 			FB_WRITEL(FB_READL(dst) ^ pat, dst); | 
 | 			dst++; | 
 | 			pat = pat << left | pat >> right; | 
 | 		} | 
 |  | 
 | 		// Trailing bits | 
 | 		if (last) { | 
 | 			dat = FB_READL(dst); | 
 | 			FB_WRITEL(comp(dat ^ pat, dat, last), dst); | 
 | 		} | 
 | 	} | 
 | } | 
 |  | 
 | void cfb_fillrect(struct fb_info *p, const struct fb_fillrect *rect) | 
 | { | 
 | 	unsigned long x2, y2, vxres, vyres, height, width, pat, fg; | 
 | 	int bits = BITS_PER_LONG, bytes = bits >> 3; | 
 | 	u32 bpp = p->var.bits_per_pixel; | 
 | 	unsigned long __iomem *dst; | 
 | 	int dst_idx, left; | 
 |  | 
 | 	if (p->state != FBINFO_STATE_RUNNING) | 
 | 		return; | 
 |  | 
 | 	/* We want rotation but lack hardware to do it for us. */ | 
 | 	if (!p->fbops->fb_rotate && p->var.rotate) { | 
 | 	} | 
 |  | 
 | 	vxres = p->var.xres_virtual; | 
 | 	vyres = p->var.yres_virtual; | 
 |  | 
 | 	if (!rect->width || !rect->height || | 
 | 	    rect->dx > vxres || rect->dy > vyres) | 
 | 		return; | 
 |  | 
 | 	/* We could use hardware clipping but on many cards you get around | 
 | 	 * hardware clipping by writing to framebuffer directly. */ | 
 |  | 
 | 	x2 = rect->dx + rect->width; | 
 | 	y2 = rect->dy + rect->height; | 
 | 	x2 = x2 < vxres ? x2 : vxres; | 
 | 	y2 = y2 < vyres ? y2 : vyres; | 
 | 	width = x2 - rect->dx; | 
 | 	height = y2 - rect->dy; | 
 |  | 
 | 	if (p->fix.visual == FB_VISUAL_TRUECOLOR || | 
 | 	    p->fix.visual == FB_VISUAL_DIRECTCOLOR ) | 
 | 		fg = ((u32 *) (p->pseudo_palette))[rect->color]; | 
 | 	else | 
 | 		fg = rect->color; | 
 |  | 
 | 	pat = pixel_to_pat( bpp, fg); | 
 |  | 
 | 	dst = (unsigned long __iomem *)((unsigned long)p->screen_base & ~(bytes-1)); | 
 | 	dst_idx = ((unsigned long)p->screen_base & (bytes - 1))*8; | 
 | 	dst_idx += rect->dy*p->fix.line_length*8+rect->dx*bpp; | 
 | 	/* FIXME For now we support 1-32 bpp only */ | 
 | 	left = bits % bpp; | 
 | 	if (p->fbops->fb_sync) | 
 | 		p->fbops->fb_sync(p); | 
 | 	if (!left) { | 
 | 		void (*fill_op32)(unsigned long __iomem *dst, int dst_idx, | 
 | 		                  unsigned long pat, unsigned n, int bits) = NULL; | 
 |  | 
 | 		switch (rect->rop) { | 
 | 		case ROP_XOR: | 
 | 			fill_op32 = bitfill_aligned_rev; | 
 | 			break; | 
 | 		case ROP_COPY: | 
 | 			fill_op32 = bitfill_aligned; | 
 | 			break; | 
 | 		default: | 
 | 			printk( KERN_ERR "cfb_fillrect(): unknown rop, defaulting to ROP_COPY\n"); | 
 | 			fill_op32 = bitfill_aligned; | 
 | 			break; | 
 | 		} | 
 | 		while (height--) { | 
 | 			dst += dst_idx >> (ffs(bits) - 1); | 
 | 			dst_idx &= (bits - 1); | 
 | 			fill_op32(dst, dst_idx, pat, width*bpp, bits); | 
 | 			dst_idx += p->fix.line_length*8; | 
 | 		} | 
 | 	} else { | 
 | 		int right; | 
 | 		int r; | 
 | 		int rot = (left-dst_idx) % bpp; | 
 | 		void (*fill_op)(unsigned long __iomem *dst, int dst_idx, | 
 | 		                unsigned long pat, int left, int right, | 
 | 		                unsigned n, int bits) = NULL; | 
 |  | 
 | 		/* rotate pattern to correct start position */ | 
 | 		pat = pat << rot | pat >> (bpp-rot); | 
 |  | 
 | 		right = bpp-left; | 
 | 		switch (rect->rop) { | 
 | 		case ROP_XOR: | 
 | 			fill_op = bitfill_unaligned_rev; | 
 | 			break; | 
 | 		case ROP_COPY: | 
 | 			fill_op = bitfill_unaligned; | 
 | 			break; | 
 | 		default: | 
 | 			printk( KERN_ERR "cfb_fillrect(): unknown rop, defaulting to ROP_COPY\n"); | 
 | 			fill_op = bitfill_unaligned; | 
 | 			break; | 
 | 		} | 
 | 		while (height--) { | 
 | 			dst += dst_idx >> (ffs(bits) - 1); | 
 | 			dst_idx &= (bits - 1); | 
 | 			fill_op(dst, dst_idx, pat, left, right, | 
 | 				width*bpp, bits); | 
 | 			r = (p->fix.line_length*8) % bpp; | 
 | 			pat = pat << (bpp-r) | pat >> r; | 
 | 			dst_idx += p->fix.line_length*8; | 
 | 		} | 
 | 	} | 
 | } | 
 |  | 
/* Make cfb_fillrect() available to other kernel modules. */
EXPORT_SYMBOL(cfb_fillrect);

/* Module metadata */
MODULE_AUTHOR("James Simmons <jsimmons@users.sf.net>");
MODULE_DESCRIPTION("Generic software accelerated fill rectangle");
MODULE_LICENSE("GPL");