n_tty: Reduce branching in canon_copy_from_read_buf()
[linux/fpc-iii.git] / drivers / video / fbdev / core / cfbcopyarea.c
blob6d4bfeecee35088f86d257d871c40ad934f79737
1 /*
2 * Generic function for frame buffer with packed pixels of any depth.
4 * Copyright (C) 1999-2005 James Simmons <jsimmons@www.infradead.org>
6 * This file is subject to the terms and conditions of the GNU General Public
7 * License. See the file COPYING in the main directory of this archive for
8 * more details.
10 * NOTES:
12 * This is for cfb packed pixels. Iplan and such are incorporated in the
13 * drivers that need them.
15 * FIXME
17 * Also need to add code to deal with cards endians that are different than
18 * the native cpu endians. I also need to deal with MSB position in the word.
20 * The two functions or copying forward and backward could be split up like
21 * the ones for filling, i.e. in aligned and unaligned versions. This would
22 * help moving some redundant computations and branches out of the loop, too.
25 #include <linux/module.h>
26 #include <linux/kernel.h>
27 #include <linux/string.h>
28 #include <linux/fb.h>
29 #include <asm/types.h>
30 #include <asm/io.h>
31 #include "fb_draw.h"
33 #if BITS_PER_LONG == 32
34 # define FB_WRITEL fb_writel
35 # define FB_READL fb_readl
36 #else
37 # define FB_WRITEL fb_writeq
38 # define FB_READL fb_readq
39 #endif
42 * Generic bitwise copy algorithm
45 static void
46 bitcpy(struct fb_info *p, unsigned long __iomem *dst, unsigned dst_idx,
47 const unsigned long __iomem *src, unsigned src_idx, int bits,
48 unsigned n, u32 bswapmask)
50 unsigned long first, last;
51 int const shift = dst_idx-src_idx;
53 #if 0
55 * If you suspect bug in this function, compare it with this simple
56 * memmove implementation.
58 memmove((char *)dst + ((dst_idx & (bits - 1))) / 8,
59 (char *)src + ((src_idx & (bits - 1))) / 8, n / 8);
60 return;
61 #endif
63 first = fb_shifted_pixels_mask_long(p, dst_idx, bswapmask);
64 last = ~fb_shifted_pixels_mask_long(p, (dst_idx+n) % bits, bswapmask);
66 if (!shift) {
67 // Same alignment for source and dest
69 if (dst_idx+n <= bits) {
70 // Single word
71 if (last)
72 first &= last;
73 FB_WRITEL( comp( FB_READL(src), FB_READL(dst), first), dst);
74 } else {
75 // Multiple destination words
77 // Leading bits
78 if (first != ~0UL) {
79 FB_WRITEL( comp( FB_READL(src), FB_READL(dst), first), dst);
80 dst++;
81 src++;
82 n -= bits - dst_idx;
85 // Main chunk
86 n /= bits;
87 while (n >= 8) {
88 FB_WRITEL(FB_READL(src++), dst++);
89 FB_WRITEL(FB_READL(src++), dst++);
90 FB_WRITEL(FB_READL(src++), dst++);
91 FB_WRITEL(FB_READL(src++), dst++);
92 FB_WRITEL(FB_READL(src++), dst++);
93 FB_WRITEL(FB_READL(src++), dst++);
94 FB_WRITEL(FB_READL(src++), dst++);
95 FB_WRITEL(FB_READL(src++), dst++);
96 n -= 8;
98 while (n--)
99 FB_WRITEL(FB_READL(src++), dst++);
101 // Trailing bits
102 if (last)
103 FB_WRITEL( comp( FB_READL(src), FB_READL(dst), last), dst);
105 } else {
106 /* Different alignment for source and dest */
107 unsigned long d0, d1;
108 int m;
110 int const left = shift & (bits - 1);
111 int const right = -shift & (bits - 1);
113 if (dst_idx+n <= bits) {
114 // Single destination word
115 if (last)
116 first &= last;
117 d0 = FB_READL(src);
118 d0 = fb_rev_pixels_in_long(d0, bswapmask);
119 if (shift > 0) {
120 // Single source word
121 d0 <<= left;
122 } else if (src_idx+n <= bits) {
123 // Single source word
124 d0 >>= right;
125 } else {
126 // 2 source words
127 d1 = FB_READL(src + 1);
128 d1 = fb_rev_pixels_in_long(d1, bswapmask);
129 d0 = d0 >> right | d1 << left;
131 d0 = fb_rev_pixels_in_long(d0, bswapmask);
132 FB_WRITEL(comp(d0, FB_READL(dst), first), dst);
133 } else {
134 // Multiple destination words
135 /** We must always remember the last value read, because in case
136 SRC and DST overlap bitwise (e.g. when moving just one pixel in
137 1bpp), we always collect one full long for DST and that might
138 overlap with the current long from SRC. We store this value in
139 'd0'. */
140 d0 = FB_READL(src++);
141 d0 = fb_rev_pixels_in_long(d0, bswapmask);
142 // Leading bits
143 if (shift > 0) {
144 // Single source word
145 d1 = d0;
146 d0 <<= left;
147 n -= bits - dst_idx;
148 } else {
149 // 2 source words
150 d1 = FB_READL(src++);
151 d1 = fb_rev_pixels_in_long(d1, bswapmask);
153 d0 = d0 >> right | d1 << left;
154 n -= bits - dst_idx;
156 d0 = fb_rev_pixels_in_long(d0, bswapmask);
157 FB_WRITEL(comp(d0, FB_READL(dst), first), dst);
158 d0 = d1;
159 dst++;
161 // Main chunk
162 m = n % bits;
163 n /= bits;
164 while ((n >= 4) && !bswapmask) {
165 d1 = FB_READL(src++);
166 FB_WRITEL(d0 >> right | d1 << left, dst++);
167 d0 = d1;
168 d1 = FB_READL(src++);
169 FB_WRITEL(d0 >> right | d1 << left, dst++);
170 d0 = d1;
171 d1 = FB_READL(src++);
172 FB_WRITEL(d0 >> right | d1 << left, dst++);
173 d0 = d1;
174 d1 = FB_READL(src++);
175 FB_WRITEL(d0 >> right | d1 << left, dst++);
176 d0 = d1;
177 n -= 4;
179 while (n--) {
180 d1 = FB_READL(src++);
181 d1 = fb_rev_pixels_in_long(d1, bswapmask);
182 d0 = d0 >> right | d1 << left;
183 d0 = fb_rev_pixels_in_long(d0, bswapmask);
184 FB_WRITEL(d0, dst++);
185 d0 = d1;
188 // Trailing bits
189 if (m) {
190 if (m <= bits - right) {
191 // Single source word
192 d0 >>= right;
193 } else {
194 // 2 source words
195 d1 = FB_READL(src);
196 d1 = fb_rev_pixels_in_long(d1,
197 bswapmask);
198 d0 = d0 >> right | d1 << left;
200 d0 = fb_rev_pixels_in_long(d0, bswapmask);
201 FB_WRITEL(comp(d0, FB_READL(dst), last), dst);
208 * Generic bitwise copy algorithm, operating backward
211 static void
212 bitcpy_rev(struct fb_info *p, unsigned long __iomem *dst, unsigned dst_idx,
213 const unsigned long __iomem *src, unsigned src_idx, int bits,
214 unsigned n, u32 bswapmask)
216 unsigned long first, last;
217 int shift;
219 #if 0
221 * If you suspect bug in this function, compare it with this simple
222 * memmove implementation.
224 memmove((char *)dst + ((dst_idx & (bits - 1))) / 8,
225 (char *)src + ((src_idx & (bits - 1))) / 8, n / 8);
226 return;
227 #endif
229 dst += (dst_idx + n - 1) / bits;
230 src += (src_idx + n - 1) / bits;
231 dst_idx = (dst_idx + n - 1) % bits;
232 src_idx = (src_idx + n - 1) % bits;
234 shift = dst_idx-src_idx;
236 first = ~fb_shifted_pixels_mask_long(p, (dst_idx + 1) % bits, bswapmask);
237 last = fb_shifted_pixels_mask_long(p, (bits + dst_idx + 1 - n) % bits, bswapmask);
239 if (!shift) {
240 // Same alignment for source and dest
242 if ((unsigned long)dst_idx+1 >= n) {
243 // Single word
244 if (first)
245 last &= first;
246 FB_WRITEL( comp( FB_READL(src), FB_READL(dst), last), dst);
247 } else {
248 // Multiple destination words
250 // Leading bits
251 if (first) {
252 FB_WRITEL( comp( FB_READL(src), FB_READL(dst), first), dst);
253 dst--;
254 src--;
255 n -= dst_idx+1;
258 // Main chunk
259 n /= bits;
260 while (n >= 8) {
261 FB_WRITEL(FB_READL(src--), dst--);
262 FB_WRITEL(FB_READL(src--), dst--);
263 FB_WRITEL(FB_READL(src--), dst--);
264 FB_WRITEL(FB_READL(src--), dst--);
265 FB_WRITEL(FB_READL(src--), dst--);
266 FB_WRITEL(FB_READL(src--), dst--);
267 FB_WRITEL(FB_READL(src--), dst--);
268 FB_WRITEL(FB_READL(src--), dst--);
269 n -= 8;
271 while (n--)
272 FB_WRITEL(FB_READL(src--), dst--);
274 // Trailing bits
275 if (last != -1UL)
276 FB_WRITEL( comp( FB_READL(src), FB_READL(dst), last), dst);
278 } else {
279 // Different alignment for source and dest
280 unsigned long d0, d1;
281 int m;
283 int const left = shift & (bits-1);
284 int const right = -shift & (bits-1);
286 if ((unsigned long)dst_idx+1 >= n) {
287 // Single destination word
288 if (first)
289 last &= first;
290 d0 = FB_READL(src);
291 if (shift < 0) {
292 // Single source word
293 d0 >>= right;
294 } else if (1+(unsigned long)src_idx >= n) {
295 // Single source word
296 d0 <<= left;
297 } else {
298 // 2 source words
299 d1 = FB_READL(src - 1);
300 d1 = fb_rev_pixels_in_long(d1, bswapmask);
301 d0 = d0 << left | d1 >> right;
303 d0 = fb_rev_pixels_in_long(d0, bswapmask);
304 FB_WRITEL(comp(d0, FB_READL(dst), last), dst);
305 } else {
306 // Multiple destination words
307 /** We must always remember the last value read, because in case
308 SRC and DST overlap bitwise (e.g. when moving just one pixel in
309 1bpp), we always collect one full long for DST and that might
310 overlap with the current long from SRC. We store this value in
311 'd0'. */
313 d0 = FB_READL(src--);
314 d0 = fb_rev_pixels_in_long(d0, bswapmask);
315 // Leading bits
316 if (shift < 0) {
317 // Single source word
318 d1 = d0;
319 d0 >>= right;
320 } else {
321 // 2 source words
322 d1 = FB_READL(src--);
323 d1 = fb_rev_pixels_in_long(d1, bswapmask);
324 d0 = d0 << left | d1 >> right;
326 d0 = fb_rev_pixels_in_long(d0, bswapmask);
327 if (!first)
328 FB_WRITEL(d0, dst);
329 else
330 FB_WRITEL(comp(d0, FB_READL(dst), first), dst);
331 d0 = d1;
332 dst--;
333 n -= dst_idx+1;
335 // Main chunk
336 m = n % bits;
337 n /= bits;
338 while ((n >= 4) && !bswapmask) {
339 d1 = FB_READL(src--);
340 FB_WRITEL(d0 << left | d1 >> right, dst--);
341 d0 = d1;
342 d1 = FB_READL(src--);
343 FB_WRITEL(d0 << left | d1 >> right, dst--);
344 d0 = d1;
345 d1 = FB_READL(src--);
346 FB_WRITEL(d0 << left | d1 >> right, dst--);
347 d0 = d1;
348 d1 = FB_READL(src--);
349 FB_WRITEL(d0 << left | d1 >> right, dst--);
350 d0 = d1;
351 n -= 4;
353 while (n--) {
354 d1 = FB_READL(src--);
355 d1 = fb_rev_pixels_in_long(d1, bswapmask);
356 d0 = d0 << left | d1 >> right;
357 d0 = fb_rev_pixels_in_long(d0, bswapmask);
358 FB_WRITEL(d0, dst--);
359 d0 = d1;
362 // Trailing bits
363 if (m) {
364 if (m <= bits - left) {
365 // Single source word
366 d0 <<= left;
367 } else {
368 // 2 source words
369 d1 = FB_READL(src);
370 d1 = fb_rev_pixels_in_long(d1,
371 bswapmask);
372 d0 = d0 << left | d1 >> right;
374 d0 = fb_rev_pixels_in_long(d0, bswapmask);
375 FB_WRITEL(comp(d0, FB_READL(dst), last), dst);
381 void cfb_copyarea(struct fb_info *p, const struct fb_copyarea *area)
383 u32 dx = area->dx, dy = area->dy, sx = area->sx, sy = area->sy;
384 u32 height = area->height, width = area->width;
385 unsigned long const bits_per_line = p->fix.line_length*8u;
386 unsigned long __iomem *base = NULL;
387 int bits = BITS_PER_LONG, bytes = bits >> 3;
388 unsigned dst_idx = 0, src_idx = 0, rev_copy = 0;
389 u32 bswapmask = fb_compute_bswapmask(p);
391 if (p->state != FBINFO_STATE_RUNNING)
392 return;
394 /* if the beginning of the target area might overlap with the end of
395 the source area, be have to copy the area reverse. */
396 if ((dy == sy && dx > sx) || (dy > sy)) {
397 dy += height;
398 sy += height;
399 rev_copy = 1;
402 // split the base of the framebuffer into a long-aligned address and the
403 // index of the first bit
404 base = (unsigned long __iomem *)((unsigned long)p->screen_base & ~(bytes-1));
405 dst_idx = src_idx = 8*((unsigned long)p->screen_base & (bytes-1));
406 // add offset of source and target area
407 dst_idx += dy*bits_per_line + dx*p->var.bits_per_pixel;
408 src_idx += sy*bits_per_line + sx*p->var.bits_per_pixel;
410 if (p->fbops->fb_sync)
411 p->fbops->fb_sync(p);
413 if (rev_copy) {
414 while (height--) {
415 dst_idx -= bits_per_line;
416 src_idx -= bits_per_line;
417 bitcpy_rev(p, base + (dst_idx / bits), dst_idx % bits,
418 base + (src_idx / bits), src_idx % bits, bits,
419 width*p->var.bits_per_pixel, bswapmask);
421 } else {
422 while (height--) {
423 bitcpy(p, base + (dst_idx / bits), dst_idx % bits,
424 base + (src_idx / bits), src_idx % bits, bits,
425 width*p->var.bits_per_pixel, bswapmask);
426 dst_idx += bits_per_line;
427 src_idx += bits_per_line;
432 EXPORT_SYMBOL(cfb_copyarea);
434 MODULE_AUTHOR("James Simmons <jsimmons@users.sf.net>");
435 MODULE_DESCRIPTION("Generic software accelerated copyarea");
436 MODULE_LICENSE("GPL");