/* $NetBSD: rasops.c,v 1.44 2003/11/08 22:49:28 uwe Exp $ */ /*- * Copyright (c) 1999 The NetBSD Foundation, Inc. * All rights reserved. * * This code is derived from software contributed to The NetBSD Foundation * by Andrew Doran. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * 3. All advertising materials mentioning features or use of this software * must display the following acknowledgement: * This product includes software developed by the NetBSD * Foundation, Inc. and its contributors. * 4. Neither the name of The NetBSD Foundation nor the names of its * contributors may be used to endorse or promote products derived * from this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE * POSSIBILITY OF SUCH DAMAGE. */ #include __KERNEL_RCSID(0, "$NetBSD: rasops.c,v 1.44 2003/11/08 22:49:28 uwe Exp $"); #include "opt_rasops.h" #include "rasops_glue.h" #include #include #include #include #include #include #include #include #include #ifndef _KERNEL #include #endif /* ANSI colormap (R,G,B). Upper 8 are high-intensity */ const u_char rasops_cmap[256*3] = { 0x00, 0x00, 0x00, /* black */ 0x7f, 0x00, 0x00, /* red */ 0x00, 0x7f, 0x00, /* green */ 0x7f, 0x7f, 0x00, /* brown */ 0x00, 0x00, 0x7f, /* blue */ 0x7f, 0x00, 0x7f, /* magenta */ 0x00, 0x7f, 0x7f, /* cyan */ 0xc7, 0xc7, 0xc7, /* white - XXX too dim? */ 0x7f, 0x7f, 0x7f, /* black */ 0xff, 0x00, 0x00, /* red */ 0x00, 0xff, 0x00, /* green */ 0xff, 0xff, 0x00, /* brown */ 0x00, 0x00, 0xff, /* blue */ 0xff, 0x00, 0xff, /* magenta */ 0x00, 0xff, 0xff, /* cyan */ 0xff, 0xff, 0xff, /* white */ /* * For the cursor, we need at least the last (255th) * color to be white. Fill up white completely for * simplicity. */ #define _CMWHITE 0xff, 0xff, 0xff, #define _CMWHITE16 _CMWHITE _CMWHITE _CMWHITE _CMWHITE \ _CMWHITE _CMWHITE _CMWHITE _CMWHITE \ _CMWHITE _CMWHITE _CMWHITE _CMWHITE \ _CMWHITE _CMWHITE _CMWHITE _CMWHITE _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 _CMWHITE16 /* but not the last one */ #undef _CMWHITE16 #undef _CMWHITE /* * For the cursor the fg/bg indices are bit inverted, so * provide complimentary colors in the upper 16 entries. */ 0x7f, 0x7f, 0x7f, /* black */ 0xff, 0x00, 0x00, /* red */ 0x00, 0xff, 0x00, /* green */ 0xff, 0xff, 0x00, /* brown */ 0x00, 0x00, 0xff, /* blue */ 0xff, 0x00, 0xff, /* magenta */ 0x00, 0xff, 0xff, /* cyan */ 0xff, 0xff, 0xff, /* white */ 0x00, 0x00, 0x00, /* black */ 0x7f, 0x00, 0x00, /* red */ 0x00, 0x7f, 0x00, /* green */ 0x7f, 0x7f, 0x00, /* brown */ 0x00, 0x00, 0x7f, /* blue */ 0x7f, 0x00, 0x7f, /* magenta */ 0x00, 0x7f, 0x7f, /* cyan */ 0xc7, 0xc7, 0xc7, /* white - XXX too dim? */ }; /* True if color is gray */ const u_char rasops_isgray[16] = { 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1 }; /* Generic functions */ static void rasops_copyrows __P((void *, int, int, int)); static int rasops_mapchar __P((void *, int, u_int *)); static void rasops_cursor __P((void *, int, int, int)); static int rasops_allocattr_color __P((void *, int, int, int, long *)); static int rasops_allocattr_mono __P((void *, int, int, int, long *)); static void rasops_do_cursor __P((struct rasops_info *)); static void rasops_init_devcmap __P((struct rasops_info *)); /* * Initialize a 'rasops_info' descriptor. */ int rasops_init(ri, wantrows, wantcols) struct rasops_info *ri; int wantrows, wantcols; { #ifdef _KERNEL /* Select a font if the caller doesn't care */ if (ri->ri_font == NULL) { int cookie; wsfont_init(); /* Want 8 pixel wide, don't care about aestethics */ cookie = wsfont_find(NULL, 8, 0, 0, WSDISPLAY_FONTORDER_L2R, WSDISPLAY_FONTORDER_L2R); if (cookie <= 0) cookie = wsfont_find(NULL, 0, 0, 0, WSDISPLAY_FONTORDER_L2R, WSDISPLAY_FONTORDER_L2R); if (cookie <= 0) { printf("rasops_init: font table is empty\n"); return (-1); } if (wsfont_lock(cookie, &ri->ri_font)) { printf("rasops_init: couldn't lock font\n"); return (-1); } ri->ri_wsfcookie = cookie; } #endif /* This should never happen in reality... */ #ifdef DEBUG if ((long)ri->ri_bits & 3) { printf("rasops_init: bits not aligned on 32-bit boundary\n"); return (-1); } if ((int)ri->ri_stride & 3) { printf("rasops_init: stride not aligned on 32-bit boundary\n"); return (-1); } #endif if (rasops_reconfig(ri, wantrows, wantcols)) return (-1); rasops_init_devcmap(ri); return (0); } /* * Reconfigure (because parameters have changed in some way). */ int rasops_reconfig(ri, wantrows, wantcols) struct rasops_info *ri; int wantrows, wantcols; { int bpp, s; s = splhigh(); if (ri->ri_font->fontwidth > 32 || ri->ri_font->fontwidth < 4) panic("rasops_init: fontwidth assumptions botched!"); /* Need this to frob the setup below */ bpp = (ri->ri_depth == 15 ? 16 : ri->ri_depth); if ((ri->ri_flg & RI_CFGDONE) != 0) ri->ri_bits = ri->ri_origbits; /* Don't care if the caller wants a hideously small console */ if (wantrows < 10) wantrows = 10; if (wantcols < 20) wantcols = 20; /* Now constrain what they get */ ri->ri_emuwidth = ri->ri_font->fontwidth * wantcols; ri->ri_emuheight = ri->ri_font->fontheight * wantrows; if (ri->ri_emuwidth > ri->ri_width) ri->ri_emuwidth = ri->ri_width; if (ri->ri_emuheight > ri->ri_height) ri->ri_emuheight = ri->ri_height; /* Reduce width until aligned on a 32-bit boundary */ while ((ri->ri_emuwidth * bpp & 31) != 0) ri->ri_emuwidth--; ri->ri_cols = ri->ri_emuwidth / ri->ri_font->fontwidth; ri->ri_rows = ri->ri_emuheight / ri->ri_font->fontheight; ri->ri_emustride = ri->ri_emuwidth * bpp >> 3; ri->ri_delta = ri->ri_stride - ri->ri_emustride; ri->ri_ccol = 0; ri->ri_crow = 0; ri->ri_pelbytes = bpp >> 3; ri->ri_xscale = (ri->ri_font->fontwidth * bpp) >> 3; ri->ri_yscale = ri->ri_font->fontheight * ri->ri_stride; ri->ri_fontscale = ri->ri_font->fontheight * ri->ri_font->stride; #ifdef DEBUG if ((ri->ri_delta & 3) != 0) panic("rasops_init: ri_delta not aligned on 32-bit boundary"); #endif /* Clear the entire display */ if ((ri->ri_flg & RI_CLEAR) != 0) memset(ri->ri_bits, 0, ri->ri_stride * ri->ri_height); /* Now centre our window if needs be */ ri->ri_origbits = ri->ri_bits; if ((ri->ri_flg & RI_CENTER) != 0) { ri->ri_bits += (((ri->ri_width * bpp >> 3) - ri->ri_emustride) >> 1) & ~3; ri->ri_bits += ((ri->ri_height - ri->ri_emuheight) >> 1) * ri->ri_stride; ri->ri_yorigin = (int)(ri->ri_bits - ri->ri_origbits) / ri->ri_stride; ri->ri_xorigin = (((int)(ri->ri_bits - ri->ri_origbits) % ri->ri_stride) * 8 / bpp); } else ri->ri_xorigin = ri->ri_yorigin = 0; /* * Fill in defaults for operations set. XXX this nukes private * routines used by accelerated fb drivers. */ ri->ri_ops.mapchar = rasops_mapchar; ri->ri_ops.copyrows = rasops_copyrows; ri->ri_ops.copycols = rasops_copycols; ri->ri_ops.erasecols = rasops_erasecols; ri->ri_ops.eraserows = rasops_eraserows; ri->ri_ops.cursor = rasops_cursor; ri->ri_do_cursor = rasops_do_cursor; if (ri->ri_depth < 8 || (ri->ri_flg & RI_FORCEMONO) != 0) { ri->ri_ops.allocattr = rasops_allocattr_mono; ri->ri_caps = WSSCREEN_UNDERLINE | WSSCREEN_REVERSE; } else { ri->ri_ops.allocattr = rasops_allocattr_color; ri->ri_caps = WSSCREEN_UNDERLINE | WSSCREEN_HILIT | WSSCREEN_WSCOLORS | WSSCREEN_REVERSE; } switch (ri->ri_depth) { #if NRASOPS1 > 0 case 1: rasops1_init(ri); break; #endif #if NRASOPS2 > 0 case 2: rasops2_init(ri); break; #endif #if NRASOPS4 > 0 case 4: rasops4_init(ri); break; #endif #if NRASOPS8 > 0 case 8: rasops8_init(ri); break; #endif #if NRASOPS15 > 0 || NRASOPS16 > 0 case 15: case 16: rasops15_init(ri); break; #endif #if NRASOPS24 > 0 case 24: rasops24_init(ri); break; #endif #if NRASOPS32 > 0 case 32: rasops32_init(ri); break; #endif default: ri->ri_flg &= ~RI_CFGDONE; splx(s); return (-1); } ri->ri_flg |= RI_CFGDONE; splx(s); return (0); } /* * Map a character. */ static int rasops_mapchar(cookie, c, cp) void *cookie; int c; u_int *cp; { struct rasops_info *ri; ri = (struct rasops_info *)cookie; #ifdef DIAGNOSTIC if (ri->ri_font == NULL) panic("rasops_mapchar: no font selected"); #endif if (ri->ri_font->encoding != WSDISPLAY_FONTENC_ISO) { if ( (c = wsfont_map_unichar(ri->ri_font, c)) < 0) { *cp = ' '; return (0); } } if (c < ri->ri_font->firstchar) { *cp = ' '; return (0); } if (c - ri->ri_font->firstchar >= ri->ri_font->numchars) { *cp = ' '; return (0); } *cp = c; return (5); } /* * Allocate a color attribute. */ static int rasops_allocattr_color(cookie, fg, bg, flg, attr) void *cookie; int fg, bg, flg; long *attr; { int swap; #ifdef RASOPS_CLIPPING fg &= 7; bg &= 7; #endif if ((flg & WSATTR_BLINK) != 0) return (EINVAL); if ((flg & WSATTR_WSCOLORS) == 0) { fg = WSCOL_WHITE; bg = WSCOL_BLACK; } if ((flg & WSATTR_REVERSE) != 0) { swap = fg; fg = bg; bg = swap; } if ((flg & WSATTR_HILIT) != 0) fg += 8; flg = ((flg & WSATTR_UNDERLINE) ? 1 : 0); if (rasops_isgray[fg]) flg |= 2; if (rasops_isgray[bg]) flg |= 4; *attr = (bg << 16) | (fg << 24) | flg; return (0); } /* * Allocate a mono attribute. */ static int rasops_allocattr_mono(cookie, fg, bg, flg, attr) void *cookie; int fg, bg, flg; long *attr; { int swap; if ((flg & (WSATTR_BLINK | WSATTR_HILIT | WSATTR_WSCOLORS)) != 0) return (EINVAL); fg = 1; bg = 0; if ((flg & WSATTR_REVERSE) != 0) { swap = fg; fg = bg; bg = swap; } *attr = (bg << 16) | (fg << 24) | ((flg & WSATTR_UNDERLINE) ? 7 : 6); return (0); } /* * Copy rows. */ static void rasops_copyrows(cookie, src, dst, num) void *cookie; int src, dst, num; { int32_t *sp, *dp, *srp, *drp; struct rasops_info *ri; int n8, n1, cnt, delta; ri = (struct rasops_info *)cookie; #ifdef RASOPS_CLIPPING if (dst == src) return; if (src < 0) { num += src; src = 0; } if ((src + num) > ri->ri_rows) num = ri->ri_rows - src; if (dst < 0) { num += dst; dst = 0; } if ((dst + num) > ri->ri_rows) num = ri->ri_rows - dst; if (num <= 0) return; #endif num *= ri->ri_font->fontheight; n8 = ri->ri_emustride >> 5; n1 = (ri->ri_emustride >> 2) & 7; if (dst < src) { srp = (int32_t *)(ri->ri_bits + src * ri->ri_yscale); drp = (int32_t *)(ri->ri_bits + dst * ri->ri_yscale); delta = ri->ri_stride; } else { src = ri->ri_font->fontheight * src + num - 1; dst = ri->ri_font->fontheight * dst + num - 1; srp = (int32_t *)(ri->ri_bits + src * ri->ri_stride); drp = (int32_t *)(ri->ri_bits + dst * ri->ri_stride); delta = -ri->ri_stride; } while (num--) { dp = drp; sp = srp; DELTA(drp, delta, int32_t *); DELTA(srp, delta, int32_t *); for (cnt = n8; cnt; cnt--) { dp[0] = sp[0]; dp[1] = sp[1]; dp[2] = sp[2]; dp[3] = sp[3]; dp[4] = sp[4]; dp[5] = sp[5]; dp[6] = sp[6]; dp[7] = sp[7]; dp += 8; sp += 8; } for (cnt = n1; cnt; cnt--) *dp++ = *sp++; } } /* * Copy columns. This is slow, and hard to optimize due to alignment, * and the fact that we have to copy both left->right and right->left. * We simply cop-out here and use memmove(), since it handles all of * these cases anyway. */ void rasops_copycols(cookie, row, src, dst, num) void *cookie; int row, src, dst, num; { struct rasops_info *ri; u_char *sp, *dp; int height; ri = (struct rasops_info *)cookie; #ifdef RASOPS_CLIPPING if (dst == src) return; /* Catches < 0 case too */ if ((unsigned)row >= (unsigned)ri->ri_rows) return; if (src < 0) { num += src; src = 0; } if ((src + num) > ri->ri_cols) num = ri->ri_cols - src; if (dst < 0) { num += dst; dst = 0; } if ((dst + num) > ri->ri_cols) num = ri->ri_cols - dst; if (num <= 0) return; #endif num *= ri->ri_xscale; row *= ri->ri_yscale; height = ri->ri_font->fontheight; sp = ri->ri_bits + row + src * ri->ri_xscale; dp = ri->ri_bits + row + dst * ri->ri_xscale; while (height--) { memmove(dp, sp, num); dp += ri->ri_stride; sp += ri->ri_stride; } } /* * Turn cursor off/on. */ static void rasops_cursor(cookie, on, row, col) void *cookie; int on, row, col; { struct rasops_info *ri; ri = (struct rasops_info *)cookie; /* Turn old cursor off */ if ((ri->ri_flg & RI_CURSOR) != 0) #ifdef RASOPS_CLIPPING if ((ri->ri_flg & RI_CURSORCLIP) == 0) #endif ri->ri_do_cursor(ri); /* Select new cursor */ #ifdef RASOPS_CLIPPING ri->ri_flg &= ~RI_CURSORCLIP; if (row < 0 || row >= ri->ri_rows) ri->ri_flg |= RI_CURSORCLIP; else if (col < 0 || col >= ri->ri_cols) ri->ri_flg |= RI_CURSORCLIP; #endif ri->ri_crow = row; ri->ri_ccol = col; if (on) { ri->ri_flg |= RI_CURSOR; #ifdef RASOPS_CLIPPING if ((ri->ri_flg & RI_CURSORCLIP) == 0) #endif ri->ri_do_cursor(ri); } else ri->ri_flg &= ~RI_CURSOR; } /* * Make the device colormap */ static void rasops_init_devcmap(ri) struct rasops_info *ri; { const u_char *p; int i, c; switch (ri->ri_depth) { case 1: ri->ri_devcmap[0] = 0; for (i = 1; i < 16; i++) ri->ri_devcmap[i] = -1; return; case 2: for (i = 1; i < 15; i++) ri->ri_devcmap[i] = 0xaaaaaaaa; ri->ri_devcmap[0] = 0; ri->ri_devcmap[8] = 0x55555555; ri->ri_devcmap[15] = -1; return; case 8: for (i = 0; i < 16; i++) ri->ri_devcmap[i] = i | (i<<8) | (i<<16) | (i<<24); return; } p = rasops_cmap; for (i = 0; i < 16; i++) { if (ri->ri_rnum <= 8) c = (*p >> (8 - ri->ri_rnum)) << ri->ri_rpos; else c = (*p << (ri->ri_rnum - 8)) << ri->ri_rpos; p++; if (ri->ri_gnum <= 8) c |= (*p >> (8 - ri->ri_gnum)) << ri->ri_gpos; else c |= (*p << (ri->ri_gnum - 8)) << ri->ri_gpos; p++; if (ri->ri_bnum <= 8) c |= (*p >> (8 - ri->ri_bnum)) << ri->ri_bpos; else c |= (*p << (ri->ri_bnum - 8)) << ri->ri_bpos; p++; /* Fill the word for generic routines, which want this */ if (ri->ri_depth == 24) c = c | ((c & 0xff) << 24); else if (ri->ri_depth <= 16) c = c | (c << 16); /* 24bpp does bswap on the fly. {32,16,15}bpp do it here. */ if ((ri->ri_flg & RI_BSWAP) == 0) ri->ri_devcmap[i] = c; else if (ri->ri_depth == 32) ri->ri_devcmap[i] = bswap32(c); else if (ri->ri_depth == 16 || ri->ri_depth == 15) ri->ri_devcmap[i] = bswap16(c); else ri->ri_devcmap[i] = c; } } /* * Unpack a rasops attribute */ void rasops_unpack_attr(attr, fg, bg, underline) long attr; int *fg, *bg, *underline; { *fg = ((u_int)attr >> 24) & 0xf; *bg = ((u_int)attr >> 16) & 0xf; if (underline != NULL) *underline = (u_int)attr & 1; } /* * Erase rows. This isn't static, since 24-bpp uses it in special cases. */ void rasops_eraserows(cookie, row, num, attr) void *cookie; int row, num; long attr; { struct rasops_info *ri; int np, nw, cnt, delta; int32_t *dp, clr; ri = (struct rasops_info *)cookie; #ifdef RASOPS_CLIPPING if (row < 0) { num += row; row = 0; } if ((row + num) > ri->ri_rows) num = ri->ri_rows - row; if (num <= 0) return; #endif clr = ri->ri_devcmap[(attr >> 16) & 0xf]; /* * XXX The wsdisplay_emulops interface seems a little deficient in * that there is no way to clear the *entire* screen. We provide a * workaround here: if the entire console area is being cleared, and * the RI_FULLCLEAR flag is set, clear the entire display. */ if (num == ri->ri_rows && (ri->ri_flg & RI_FULLCLEAR) != 0) { np = ri->ri_stride >> 5; nw = (ri->ri_stride >> 2) & 7; num = ri->ri_height; dp = (int32_t *)ri->ri_origbits; delta = 0; } else { np = ri->ri_emustride >> 5; nw = (ri->ri_emustride >> 2) & 7; num *= ri->ri_font->fontheight; dp = (int32_t *)(ri->ri_bits + row * ri->ri_yscale); delta = ri->ri_delta; } while (num--) { for (cnt = np; cnt; cnt--) { dp[0] = clr; dp[1] = clr; dp[2] = clr; dp[3] = clr; dp[4] = clr; dp[5] = clr; dp[6] = clr; dp[7] = clr; dp += 8; } for (cnt = nw; cnt; cnt--) { *(int32_t *)dp = clr; DELTA(dp, 4, int32_t *); } DELTA(dp, delta, int32_t *); } } /* * Actually turn the cursor on or off. This does the dirty work for * rasops_cursor(). */ static void rasops_do_cursor(ri) struct rasops_info *ri; { int full1, height, cnt, slop1, slop2, row, col; u_char *dp, *rp; row = ri->ri_crow; col = ri->ri_ccol; rp = ri->ri_bits + row * ri->ri_yscale + col * ri->ri_xscale; height = ri->ri_font->fontheight; slop1 = (4 - ((long)rp & 3)) & 3; if (slop1 > ri->ri_xscale) slop1 = ri->ri_xscale; slop2 = (ri->ri_xscale - slop1) & 3; full1 = (ri->ri_xscale - slop1 - slop2) >> 2; if ((slop1 | slop2) == 0) { /* A common case */ while (height--) { dp = rp; rp += ri->ri_stride; for (cnt = full1; cnt; cnt--) { *(int32_t *)dp ^= ~0; dp += 4; } } } else { /* XXX this is stupid.. use masks instead */ while (height--) { dp = rp; rp += ri->ri_stride; if (slop1 & 1) *dp++ ^= ~0; if (slop1 & 2) { *(int16_t *)dp ^= ~0; dp += 2; } for (cnt = full1; cnt; cnt--) { *(int32_t *)dp ^= ~0; dp += 4; } if (slop2 & 1) *dp++ ^= ~0; if (slop2 & 2) *(int16_t *)dp ^= ~0; } } } /* * Erase columns. */ void rasops_erasecols(cookie, row, col, num, attr) void *cookie; int row, col, num; long attr; { int n8, height, cnt, slop1, slop2, clr; struct rasops_info *ri; int32_t *rp, *dp; ri = (struct rasops_info *)cookie; #ifdef RASOPS_CLIPPING if ((unsigned)row >= (unsigned)ri->ri_rows) return; if (col < 0) { num += col; col = 0; } if ((col + num) > ri->ri_cols) num = ri->ri_cols - col; if (num <= 0) return; #endif num = num * ri->ri_xscale; rp = (int32_t *)(ri->ri_bits + row*ri->ri_yscale + col*ri->ri_xscale); height = ri->ri_font->fontheight; clr = ri->ri_devcmap[(attr >> 16) & 0xf]; /* Don't bother using the full loop for <= 32 pels */ if (num <= 32) { if (((num | ri->ri_xscale) & 3) == 0) { /* Word aligned blt */ num >>= 2; while (height--) { dp = rp; DELTA(rp, ri->ri_stride, int32_t *); for (cnt = num; cnt; cnt--) *dp++ = clr; } } else if (((num | ri->ri_xscale) & 1) == 0) { /* * Halfword aligned blt. This is needed so the * 15/16 bit ops can use this function. */ num >>= 1; while (height--) { dp = rp; DELTA(rp, ri->ri_stride, int32_t *); for (cnt = num; cnt; cnt--) { *(int16_t *)dp = clr; DELTA(dp, 2, int32_t *); } } } else { while (height--) { dp = rp; DELTA(rp, ri->ri_stride, int32_t *); for (cnt = num; cnt; cnt--) { *(u_char *)dp = clr; DELTA(dp, 1, int32_t *); } } } return; } slop1 = (4 - ((long)rp & 3)) & 3; slop2 = (num - slop1) & 3; num -= slop1 + slop2; n8 = num >> 5; num = (num >> 2) & 7; while (height--) { dp = rp; DELTA(rp, ri->ri_stride, int32_t *); /* Align span to 4 bytes */ if (slop1 & 1) { *(u_char *)dp = clr; DELTA(dp, 1, int32_t *); } if (slop1 & 2) { *(int16_t *)dp = clr; DELTA(dp, 2, int32_t *); } /* Write 32 bytes per loop */ for (cnt = n8; cnt; cnt--) { dp[0] = clr; dp[1] = clr; dp[2] = clr; dp[3] = clr; dp[4] = clr; dp[5] = clr; dp[6] = clr; dp[7] = clr; dp += 8; } /* Write 4 bytes per loop */ for (cnt = num; cnt; cnt--) *dp++ = clr; /* Write unaligned trailing slop */ if (slop2 & 1) { *(u_char *)dp = clr; DELTA(dp, 1, int32_t *); } if (slop2 & 2) *(int16_t *)dp = clr; } }