Bochs/bochs/iodev/display/voodoo_data.h
Volker Ruppert 3cee1f74ee Now using WIN32 event / wait functions in the Voodoo2 thread. I noticed a speed
improvement of around 10 % (tested with donut demo only).
TODO: Use similar functions of the pthread library for improvements on other
platforms.
2017-08-08 18:23:12 +00:00

3660 lines
191 KiB
C

/////////////////////////////////////////////////////////////////////////
// $Id$
/////////////////////////////////////////////////////////////////////////
/*
* Portion of this software comes with the following license
*/
/***************************************************************************
Copyright Aaron Giles
All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are
met:
* Redistributions of source code must retain the above copyright
notice, this list of conditions and the following disclaimer.
* Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in
the documentation and/or other materials provided with the
distribution.
* Neither the name 'MAME' nor the names of its contributors may be
used to endorse or promote products derived from this software
without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY AARON GILES ''AS IS'' AND ANY EXPRESS OR
IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL AARON GILES BE LIABLE FOR ANY DIRECT,
INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
POSSIBILITY OF SUCH DAMAGE.
***************************************************************************/
/*************************************************************************
3dfx Voodoo Graphics SST-1/2 emulator
emulator by Aaron Giles
**************************************************************************/
/*************************************
*
* Misc. constants
*
*************************************/
/* enumeration describing reasons we might be stalled */
enum
{
NOT_STALLED = 0,
STALLED_UNTIL_FIFO_LWM,
STALLED_UNTIL_FIFO_EMPTY
};
/* maximum number of TMUs */
#define MAX_TMU 2
/* accumulate operations less than this number of clocks */
#define ACCUMULATE_THRESHOLD 0
/* number of clocks to set up a triangle (just a guess) */
#define TRIANGLE_SETUP_CLOCKS 100
/* maximum number of rasterizers */
#define MAX_RASTERIZERS 1024
/* size of the rasterizer hash table */
#define RASTER_HASH_SIZE 97
/* flags for LFB writes */
#define LFB_RGB_PRESENT 1
#define LFB_ALPHA_PRESENT 2
#define LFB_DEPTH_PRESENT 4
#define LFB_DEPTH_PRESENT_MSW 8
/* flags for the register access array */
#define REGISTER_READ 0x01 /* reads are allowed */
#define REGISTER_WRITE 0x02 /* writes are allowed */
#define REGISTER_PIPELINED 0x04 /* writes are pipelined */
#define REGISTER_FIFO 0x08 /* writes go to FIFO */
#define REGISTER_WRITETHRU 0x10 /* writes are valid even for CMDFIFO */
/* shorter combinations to make the table smaller */
#define REG_R (REGISTER_READ)
#define REG_W (REGISTER_WRITE)
#define REG_WT (REGISTER_WRITE | REGISTER_WRITETHRU)
#define REG_RW (REGISTER_READ | REGISTER_WRITE)
#define REG_RWT (REGISTER_READ | REGISTER_WRITE | REGISTER_WRITETHRU)
#define REG_RP (REGISTER_READ | REGISTER_PIPELINED)
#define REG_WP (REGISTER_WRITE | REGISTER_PIPELINED)
#define REG_RWP (REGISTER_READ | REGISTER_WRITE | REGISTER_PIPELINED)
#define REG_RWPT (REGISTER_READ | REGISTER_WRITE | REGISTER_PIPELINED | REGISTER_WRITETHRU)
#define REG_RF (REGISTER_READ | REGISTER_FIFO)
#define REG_WF (REGISTER_WRITE | REGISTER_FIFO)
#define REG_RWF (REGISTER_READ | REGISTER_WRITE | REGISTER_FIFO)
#define REG_RPF (REGISTER_READ | REGISTER_PIPELINED | REGISTER_FIFO)
#define REG_WPF (REGISTER_WRITE | REGISTER_PIPELINED | REGISTER_FIFO)
#define REG_RWPF (REGISTER_READ | REGISTER_WRITE | REGISTER_PIPELINED | REGISTER_FIFO)
/* lookup bits is the log2 of the size of the reciprocal/log table */
#define RECIPLOG_LOOKUP_BITS 9
/* input precision is how many fraction bits the input value has; this is a 64-bit number */
#define RECIPLOG_INPUT_PREC 32
/* lookup precision is how many fraction bits each table entry contains */
#define RECIPLOG_LOOKUP_PREC 22
/* output precision is how many fraction bits the result should have */
#define RECIP_OUTPUT_PREC 15
#define LOG_OUTPUT_PREC 8
/*************************************
*
* Register constants
*
*************************************/
/* Codes to the right:
R = readable
W = writeable
P = pipelined
F = goes to FIFO
*/
/* 0x000 */
#define status (0x000/4) /* R P */
#define intrCtrl (0x004/4) /* RW P -- Voodoo2/Banshee only */
#define vertexAx (0x008/4) /* W PF */
#define vertexAy (0x00c/4) /* W PF */
#define vertexBx (0x010/4) /* W PF */
#define vertexBy (0x014/4) /* W PF */
#define vertexCx (0x018/4) /* W PF */
#define vertexCy (0x01c/4) /* W PF */
#define startR (0x020/4) /* W PF */
#define startG (0x024/4) /* W PF */
#define startB (0x028/4) /* W PF */
#define startZ (0x02c/4) /* W PF */
#define startA (0x030/4) /* W PF */
#define startS (0x034/4) /* W PF */
#define startT (0x038/4) /* W PF */
#define startW (0x03c/4) /* W PF */
/* 0x040 */
#define dRdX (0x040/4) /* W PF */
#define dGdX (0x044/4) /* W PF */
#define dBdX (0x048/4) /* W PF */
#define dZdX (0x04c/4) /* W PF */
#define dAdX (0x050/4) /* W PF */
#define dSdX (0x054/4) /* W PF */
#define dTdX (0x058/4) /* W PF */
#define dWdX (0x05c/4) /* W PF */
#define dRdY (0x060/4) /* W PF */
#define dGdY (0x064/4) /* W PF */
#define dBdY (0x068/4) /* W PF */
#define dZdY (0x06c/4) /* W PF */
#define dAdY (0x070/4) /* W PF */
#define dSdY (0x074/4) /* W PF */
#define dTdY (0x078/4) /* W PF */
#define dWdY (0x07c/4) /* W PF */
/* 0x080 */
#define triangleCMD (0x080/4) /* W PF */
#define fvertexAx (0x088/4) /* W PF */
#define fvertexAy (0x08c/4) /* W PF */
#define fvertexBx (0x090/4) /* W PF */
#define fvertexBy (0x094/4) /* W PF */
#define fvertexCx (0x098/4) /* W PF */
#define fvertexCy (0x09c/4) /* W PF */
#define fstartR (0x0a0/4) /* W PF */
#define fstartG (0x0a4/4) /* W PF */
#define fstartB (0x0a8/4) /* W PF */
#define fstartZ (0x0ac/4) /* W PF */
#define fstartA (0x0b0/4) /* W PF */
#define fstartS (0x0b4/4) /* W PF */
#define fstartT (0x0b8/4) /* W PF */
#define fstartW (0x0bc/4) /* W PF */
/* 0x0c0 */
#define fdRdX (0x0c0/4) /* W PF */
#define fdGdX (0x0c4/4) /* W PF */
#define fdBdX (0x0c8/4) /* W PF */
#define fdZdX (0x0cc/4) /* W PF */
#define fdAdX (0x0d0/4) /* W PF */
#define fdSdX (0x0d4/4) /* W PF */
#define fdTdX (0x0d8/4) /* W PF */
#define fdWdX (0x0dc/4) /* W PF */
#define fdRdY (0x0e0/4) /* W PF */
#define fdGdY (0x0e4/4) /* W PF */
#define fdBdY (0x0e8/4) /* W PF */
#define fdZdY (0x0ec/4) /* W PF */
#define fdAdY (0x0f0/4) /* W PF */
#define fdSdY (0x0f4/4) /* W PF */
#define fdTdY (0x0f8/4) /* W PF */
#define fdWdY (0x0fc/4) /* W PF */
/* 0x100 */
#define ftriangleCMD (0x100/4) /* W PF */
#define fbzColorPath (0x104/4) /* RW PF */
#define fogMode (0x108/4) /* RW PF */
#define alphaMode (0x10c/4) /* RW PF */
#define fbzMode (0x110/4) /* RW F */
#define lfbMode (0x114/4) /* RW F */
#define clipLeftRight (0x118/4) /* RW F */
#define clipLowYHighY (0x11c/4) /* RW F */
#define nopCMD (0x120/4) /* W F */
#define fastfillCMD (0x124/4) /* W F */
#define swapbufferCMD (0x128/4) /* W F */
#define fogColor (0x12c/4) /* W F */
#define zaColor (0x130/4) /* W F */
#define chromaKey (0x134/4) /* W F */
#define chromaRange (0x138/4) /* W F -- Voodoo2/Banshee only */
#define userIntrCMD (0x13c/4) /* W F -- Voodoo2/Banshee only */
/* 0x140 */
#define stipple (0x140/4) /* RW F */
#define color0 (0x144/4) /* RW F */
#define color1 (0x148/4) /* RW F */
#define fbiPixelsIn (0x14c/4) /* R */
#define fbiChromaFail (0x150/4) /* R */
#define fbiZfuncFail (0x154/4) /* R */
#define fbiAfuncFail (0x158/4) /* R */
#define fbiPixelsOut (0x15c/4) /* R */
#define fogTable (0x160/4) /* W F */
/* 0x1c0 */
#define cmdFifoBaseAddr (0x1e0/4) /* RW -- Voodoo2 only */
#define cmdFifoBump (0x1e4/4) /* RW -- Voodoo2 only */
#define cmdFifoRdPtr (0x1e8/4) /* RW -- Voodoo2 only */
#define cmdFifoAMin (0x1ec/4) /* RW -- Voodoo2 only */
#define colBufferAddr (0x1ec/4) /* RW -- Banshee only */
#define cmdFifoAMax (0x1f0/4) /* RW -- Voodoo2 only */
#define colBufferStride (0x1f0/4) /* RW -- Banshee only */
#define cmdFifoDepth (0x1f4/4) /* RW -- Voodoo2 only */
#define auxBufferAddr (0x1f4/4) /* RW -- Banshee only */
#define cmdFifoHoles (0x1f8/4) /* RW -- Voodoo2 only */
#define auxBufferStride (0x1f8/4) /* RW -- Banshee only */
/* 0x200 */
#define fbiInit4 (0x200/4) /* RW -- Voodoo/Voodoo2 only */
#define clipLeftRight1 (0x200/4) /* RW -- Banshee only */
#define vRetrace (0x204/4) /* R -- Voodoo/Voodoo2 only */
#define clipTopBottom1 (0x204/4) /* RW -- Banshee only */
#define backPorch (0x208/4) /* RW -- Voodoo/Voodoo2 only */
#define videoDimensions (0x20c/4) /* RW -- Voodoo/Voodoo2 only */
#define fbiInit0 (0x210/4) /* RW -- Voodoo/Voodoo2 only */
#define fbiInit1 (0x214/4) /* RW -- Voodoo/Voodoo2 only */
#define fbiInit2 (0x218/4) /* RW -- Voodoo/Voodoo2 only */
#define fbiInit3 (0x21c/4) /* RW -- Voodoo/Voodoo2 only */
#define hSync (0x220/4) /* W -- Voodoo/Voodoo2 only */
#define vSync (0x224/4) /* W -- Voodoo/Voodoo2 only */
#define clutData (0x228/4) /* W F -- Voodoo/Voodoo2 only */
#define dacData (0x22c/4) /* W -- Voodoo/Voodoo2 only */
#define maxRgbDelta (0x230/4) /* W -- Voodoo/Voodoo2 only */
#define hBorder (0x234/4) /* W -- Voodoo2 only */
#define vBorder (0x238/4) /* W -- Voodoo2 only */
#define borderColor (0x23c/4) /* W -- Voodoo2 only */
/* 0x240 */
#define hvRetrace (0x240/4) /* R -- Voodoo2 only */
#define fbiInit5 (0x244/4) /* RW -- Voodoo2 only */
#define fbiInit6 (0x248/4) /* RW -- Voodoo2 only */
#define fbiInit7 (0x24c/4) /* RW -- Voodoo2 only */
#define swapPending (0x24c/4) /* W -- Banshee only */
#define leftOverlayBuf (0x250/4) /* W -- Banshee only */
#define rightOverlayBuf (0x254/4) /* W -- Banshee only */
#define fbiSwapHistory (0x258/4) /* R -- Voodoo2/Banshee only */
#define fbiTrianglesOut (0x25c/4) /* R -- Voodoo2/Banshee only */
#define sSetupMode (0x260/4) /* W PF -- Voodoo2/Banshee only */
#define sVx (0x264/4) /* W PF -- Voodoo2/Banshee only */
#define sVy (0x268/4) /* W PF -- Voodoo2/Banshee only */
#define sARGB (0x26c/4) /* W PF -- Voodoo2/Banshee only */
#define sRed (0x270/4) /* W PF -- Voodoo2/Banshee only */
#define sGreen (0x274/4) /* W PF -- Voodoo2/Banshee only */
#define sBlue (0x278/4) /* W PF -- Voodoo2/Banshee only */
#define sAlpha (0x27c/4) /* W PF -- Voodoo2/Banshee only */
/* 0x280 */
#define sVz (0x280/4) /* W PF -- Voodoo2/Banshee only */
#define sWb (0x284/4) /* W PF -- Voodoo2/Banshee only */
#define sWtmu0 (0x288/4) /* W PF -- Voodoo2/Banshee only */
#define sS_W0 (0x28c/4) /* W PF -- Voodoo2/Banshee only */
#define sT_W0 (0x290/4) /* W PF -- Voodoo2/Banshee only */
#define sWtmu1 (0x294/4) /* W PF -- Voodoo2/Banshee only */
#define sS_Wtmu1 (0x298/4) /* W PF -- Voodoo2/Banshee only */
#define sT_Wtmu1 (0x29c/4) /* W PF -- Voodoo2/Banshee only */
#define sDrawTriCMD (0x2a0/4) /* W PF -- Voodoo2/Banshee only */
#define sBeginTriCMD (0x2a4/4) /* W PF -- Voodoo2/Banshee only */
/* 0x2c0 */
#define bltSrcBaseAddr (0x2c0/4) /* RW PF -- Voodoo2 only */
#define bltDstBaseAddr (0x2c4/4) /* RW PF -- Voodoo2 only */
#define bltXYStrides (0x2c8/4) /* RW PF -- Voodoo2 only */
#define bltSrcChromaRange (0x2cc/4) /* RW PF -- Voodoo2 only */
#define bltDstChromaRange (0x2d0/4) /* RW PF -- Voodoo2 only */
#define bltClipX (0x2d4/4) /* RW PF -- Voodoo2 only */
#define bltClipY (0x2d8/4) /* RW PF -- Voodoo2 only */
#define bltSrcXY (0x2e0/4) /* RW PF -- Voodoo2 only */
#define bltDstXY (0x2e4/4) /* RW PF -- Voodoo2 only */
#define bltSize (0x2e8/4) /* RW PF -- Voodoo2 only */
#define bltRop (0x2ec/4) /* RW PF -- Voodoo2 only */
#define bltColor (0x2f0/4) /* RW PF -- Voodoo2 only */
#define bltCommand (0x2f8/4) /* RW PF -- Voodoo2 only */
#define bltData (0x2fc/4) /* W PF -- Voodoo2 only */
/* 0x300 */
#define textureMode (0x300/4) /* W PF */
#define tLOD (0x304/4) /* W PF */
#define tDetail (0x308/4) /* W PF */
#define texBaseAddr (0x30c/4) /* W PF */
#define texBaseAddr_1 (0x310/4) /* W PF */
#define texBaseAddr_2 (0x314/4) /* W PF */
#define texBaseAddr_3_8 (0x318/4) /* W PF */
#define trexInit0 (0x31c/4) /* W F -- Voodoo/Voodoo2 only */
#define trexInit1 (0x320/4) /* W F */
#define nccTable (0x324/4) /* W F */
/*************************************
*
* Alias map of the first 64
* registers when remapped
*
*************************************/
static const Bit8u register_alias_map[0x40] =
{
status, 0x004/4, vertexAx, vertexAy,
vertexBx, vertexBy, vertexCx, vertexCy,
startR, dRdX, dRdY, startG,
dGdX, dGdY, startB, dBdX,
dBdY, startZ, dZdX, dZdY,
startA, dAdX, dAdY, startS,
dSdX, dSdY, startT, dTdX,
dTdY, startW, dWdX, dWdY,
triangleCMD,0x084/4, fvertexAx, fvertexAy,
fvertexBx, fvertexBy, fvertexCx, fvertexCy,
fstartR, fdRdX, fdRdY, fstartG,
fdGdX, fdGdY, fstartB, fdBdX,
fdBdY, fstartZ, fdZdX, fdZdY,
fstartA, fdAdX, fdAdY, fstartS,
fdSdX, fdSdY, fstartT, fdTdX,
fdTdY, fstartW, fdWdX, fdWdY
};
/*************************************
*
* Table of per-register access rights
*
*************************************/
static const Bit8u voodoo_register_access[0x100] =
{
/* 0x000 */
REG_RP, 0, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x040 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x080 */
REG_WPF, 0, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x0c0 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x100 */
REG_WPF, REG_RWPF, REG_RWPF, REG_RWPF,
REG_RWF, REG_RWF, REG_RWF, REG_RWF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, 0, 0,
/* 0x140 */
REG_RWF, REG_RWF, REG_RWF, REG_R,
REG_R, REG_R, REG_R, REG_R,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x180 */
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x1c0 */
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
0, 0, 0, 0,
0, 0, 0, 0,
/* 0x200 */
REG_RW, REG_R, REG_RW, REG_RW,
REG_RW, REG_RW, REG_RW, REG_RW,
REG_W, REG_W, REG_W, REG_W,
REG_W, 0, 0, 0,
/* 0x240 */
0, 0, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
/* 0x280 */
0, 0, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
/* 0x2c0 */
0, 0, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
/* 0x300 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x340 */
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x380 */
REG_WF
};
static const Bit8u voodoo2_register_access[0x100] =
{
/* 0x000 */
REG_RP, REG_RWPT, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x040 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x080 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x0c0 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x100 */
REG_WPF, REG_RWPF, REG_RWPF, REG_RWPF,
REG_RWF, REG_RWF, REG_RWF, REG_RWF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x140 */
REG_RWF, REG_RWF, REG_RWF, REG_R,
REG_R, REG_R, REG_R, REG_R,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x180 */
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x1c0 */
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_RWT, REG_RWT, REG_RWT, REG_RWT,
REG_RWT, REG_RWT, REG_RWT, REG_RW,
/* 0x200 */
REG_RWT, REG_R, REG_RWT, REG_RWT,
REG_RWT, REG_RWT, REG_RWT, REG_RWT,
REG_WT, REG_WT, REG_WF, REG_WT,
REG_WT, REG_WT, REG_WT, REG_WT,
/* 0x240 */
REG_R, REG_RWT, REG_RWT, REG_RWT,
0, 0, REG_R, REG_R,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x280 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, 0, 0,
0, 0, 0, 0,
/* 0x2c0 */
REG_RWPF, REG_RWPF, REG_RWPF, REG_RWPF,
REG_RWPF, REG_RWPF, REG_RWPF, REG_RWPF,
REG_RWPF, REG_RWPF, REG_RWPF, REG_RWPF,
REG_RWPF, REG_RWPF, REG_RWPF, REG_WPF,
/* 0x300 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x340 */
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x380 */
REG_WF
};
static const Bit8u banshee_register_access[0x100] =
{
/* 0x000 */
REG_RP, REG_RWPT, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x040 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x080 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x0c0 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x100 */
REG_WPF, REG_RWPF, REG_RWPF, REG_RWPF,
REG_RWF, REG_RWF, REG_RWF, REG_RWF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x140 */
REG_RWF, REG_RWF, REG_RWF, REG_R,
REG_R, REG_R, REG_R, REG_R,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x180 */
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x1c0 */
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
0, 0, 0, REG_RWF,
REG_RWF, REG_RWF, REG_RWF, 0,
/* 0x200 */
REG_RWF, REG_RWF, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
/* 0x240 */
0, 0, 0, REG_WT,
REG_RWF, REG_RWF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_R, REG_R,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
/* 0x280 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, 0, 0,
0, 0, 0, 0,
/* 0x2c0 */
0, 0, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
0, 0, 0, 0,
/* 0x300 */
REG_WPF, REG_WPF, REG_WPF, REG_WPF,
REG_WPF, REG_WPF, REG_WPF, 0,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x340 */
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
REG_WF, REG_WF, REG_WF, REG_WF,
/* 0x380 */
REG_WF
};
/*************************************
*
* Register string table for debug
*
*************************************/
static const char *const voodoo_reg_name[0x100] =
{
/* 0x000 */
"status", "{intrCtrl}", "vertexAx", "vertexAy",
"vertexBx", "vertexBy", "vertexCx", "vertexCy",
"startR", "startG", "startB", "startZ",
"startA", "startS", "startT", "startW",
/* 0x040 */
"dRdX", "dGdX", "dBdX", "dZdX",
"dAdX", "dSdX", "dTdX", "dWdX",
"dRdY", "dGdY", "dBdY", "dZdY",
"dAdY", "dSdY", "dTdY", "dWdY",
/* 0x080 */
"triangleCMD", "reserved084", "fvertexAx", "fvertexAy",
"fvertexBx", "fvertexBy", "fvertexCx", "fvertexCy",
"fstartR", "fstartG", "fstartB", "fstartZ",
"fstartA", "fstartS", "fstartT", "fstartW",
/* 0x0c0 */
"fdRdX", "fdGdX", "fdBdX", "fdZdX",
"fdAdX", "fdSdX", "fdTdX", "fdWdX",
"fdRdY", "fdGdY", "fdBdY", "fdZdY",
"fdAdY", "fdSdY", "fdTdY", "fdWdY",
/* 0x100 */
"ftriangleCMD", "fbzColorPath", "fogMode", "alphaMode",
"fbzMode", "lfbMode", "clipLeftRight","clipLowYHighY",
"nopCMD", "fastfillCMD", "swapbufferCMD","fogColor",
"zaColor", "chromaKey", "{chromaRange}","{userIntrCMD}",
/* 0x140 */
"stipple", "color0", "color1", "fbiPixelsIn",
"fbiChromaFail","fbiZfuncFail", "fbiAfuncFail", "fbiPixelsOut",
"fogTable160", "fogTable164", "fogTable168", "fogTable16c",
"fogTable170", "fogTable174", "fogTable178", "fogTable17c",
/* 0x180 */
"fogTable180", "fogTable184", "fogTable188", "fogTable18c",
"fogTable190", "fogTable194", "fogTable198", "fogTable19c",
"fogTable1a0", "fogTable1a4", "fogTable1a8", "fogTable1ac",
"fogTable1b0", "fogTable1b4", "fogTable1b8", "fogTable1bc",
/* 0x1c0 */
"fogTable1c0", "fogTable1c4", "fogTable1c8", "fogTable1cc",
"fogTable1d0", "fogTable1d4", "fogTable1d8", "fogTable1dc",
"{cmdFifoBaseAddr}","{cmdFifoBump}","{cmdFifoRdPtr}","{cmdFifoAMin}",
"{cmdFifoAMax}","{cmdFifoDepth}","{cmdFifoHoles}","reserved1fc",
/* 0x200 */
"fbiInit4", "vRetrace", "backPorch", "videoDimensions",
"fbiInit0", "fbiInit1", "fbiInit2", "fbiInit3",
"hSync", "vSync", "clutData", "dacData",
"maxRgbDelta", "{hBorder}", "{vBorder}", "{borderColor}",
/* 0x240 */
"{hvRetrace}", "{fbiInit5}", "{fbiInit6}", "{fbiInit7}",
"reserved250", "reserved254", "{fbiSwapHistory}","{fbiTrianglesOut}",
"{sSetupMode}", "{sVx}", "{sVy}", "{sARGB}",
"{sRed}", "{sGreen}", "{sBlue}", "{sAlpha}",
/* 0x280 */
"{sVz}", "{sWb}", "{sWtmu0}", "{sS/Wtmu0}",
"{sT/Wtmu0}", "{sWtmu1}", "{sS/Wtmu1}", "{sT/Wtmu1}",
"{sDrawTriCMD}","{sBeginTriCMD}","reserved2a8", "reserved2ac",
"reserved2b0", "reserved2b4", "reserved2b8", "reserved2bc",
/* 0x2c0 */
"{bltSrcBaseAddr}","{bltDstBaseAddr}","{bltXYStrides}","{bltSrcChromaRange}",
"{bltDstChromaRange}","{bltClipX}","{bltClipY}","reserved2dc",
"{bltSrcXY}", "{bltDstXY}", "{bltSize}", "{bltRop}",
"{bltColor}", "reserved2f4", "{bltCommand}", "{bltData}",
/* 0x300 */
"textureMode", "tLOD", "tDetail", "texBaseAddr",
"texBaseAddr_1","texBaseAddr_2","texBaseAddr_3_8","trexInit0",
"trexInit1", "nccTable0.0", "nccTable0.1", "nccTable0.2",
"nccTable0.3", "nccTable0.4", "nccTable0.5", "nccTable0.6",
/* 0x340 */
"nccTable0.7", "nccTable0.8", "nccTable0.9", "nccTable0.A",
"nccTable0.B", "nccTable1.0", "nccTable1.1", "nccTable1.2",
"nccTable1.3", "nccTable1.4", "nccTable1.5", "nccTable1.6",
"nccTable1.7", "nccTable1.8", "nccTable1.9", "nccTable1.A",
/* 0x380 */
"nccTable1.B", "reserved384", "reserved388", "reserved38c"
};
static const char *const banshee_reg_name[] =
{
/* 0x000 */
"status", "intrCtrl", "vertexAx", "vertexAy",
"vertexBx", "vertexBy", "vertexCx", "vertexCy",
"startR", "startG", "startB", "startZ",
"startA", "startS", "startT", "startW",
/* 0x040 */
"dRdX", "dGdX", "dBdX", "dZdX",
"dAdX", "dSdX", "dTdX", "dWdX",
"dRdY", "dGdY", "dBdY", "dZdY",
"dAdY", "dSdY", "dTdY", "dWdY",
/* 0x080 */
"triangleCMD", "reserved084", "fvertexAx", "fvertexAy",
"fvertexBx", "fvertexBy", "fvertexCx", "fvertexCy",
"fstartR", "fstartG", "fstartB", "fstartZ",
"fstartA", "fstartS", "fstartT", "fstartW",
/* 0x0c0 */
"fdRdX", "fdGdX", "fdBdX", "fdZdX",
"fdAdX", "fdSdX", "fdTdX", "fdWdX",
"fdRdY", "fdGdY", "fdBdY", "fdZdY",
"fdAdY", "fdSdY", "fdTdY", "fdWdY",
/* 0x100 */
"ftriangleCMD", "fbzColorPath", "fogMode", "alphaMode",
"fbzMode", "lfbMode", "clipLeftRight","clipLowYHighY",
"nopCMD", "fastfillCMD", "swapbufferCMD","fogColor",
"zaColor", "chromaKey", "chromaRange", "userIntrCMD",
/* 0x140 */
"stipple", "color0", "color1", "fbiPixelsIn",
"fbiChromaFail","fbiZfuncFail", "fbiAfuncFail", "fbiPixelsOut",
"fogTable160", "fogTable164", "fogTable168", "fogTable16c",
"fogTable170", "fogTable174", "fogTable178", "fogTable17c",
/* 0x180 */
"fogTable180", "fogTable184", "fogTable188", "fogTable18c",
"fogTable190", "fogTable194", "fogTable198", "fogTable19c",
"fogTable1a0", "fogTable1a4", "fogTable1a8", "fogTable1ac",
"fogTable1b0", "fogTable1b4", "fogTable1b8", "fogTable1bc",
/* 0x1c0 */
"fogTable1c0", "fogTable1c4", "fogTable1c8", "fogTable1cc",
"fogTable1d0", "fogTable1d4", "fogTable1d8", "fogTable1dc",
"reserved1e0", "reserved1e4", "reserved1e8", "colBufferAddr",
"colBufferStride","auxBufferAddr","auxBufferStride","reserved1fc",
/* 0x200 */
"clipLeftRight1","clipTopBottom1","reserved208","reserved20c",
"reserved210", "reserved214", "reserved218", "reserved21c",
"reserved220", "reserved224", "reserved228", "reserved22c",
"reserved230", "reserved234", "reserved238", "reserved23c",
/* 0x240 */
"reserved240", "reserved244", "reserved248", "swapPending",
"leftOverlayBuf","rightOverlayBuf","fbiSwapHistory","fbiTrianglesOut",
"sSetupMode", "sVx", "sVy", "sARGB",
"sRed", "sGreen", "sBlue", "sAlpha",
/* 0x280 */
"sVz", "sWb", "sWtmu0", "sS/Wtmu0",
"sT/Wtmu0", "sWtmu1", "sS/Wtmu1", "sT/Wtmu1",
"sDrawTriCMD", "sBeginTriCMD", "reserved2a8", "reserved2ac",
"reserved2b0", "reserved2b4", "reserved2b8", "reserved2bc",
/* 0x2c0 */
"reserved2c0", "reserved2c4", "reserved2c8", "reserved2cc",
"reserved2d0", "reserved2d4", "reserved2d8", "reserved2dc",
"reserved2e0", "reserved2e4", "reserved2e8", "reserved2ec",
"reserved2f0", "reserved2f4", "reserved2f8", "reserved2fc",
/* 0x300 */
"textureMode", "tLOD", "tDetail", "texBaseAddr",
"texBaseAddr_1","texBaseAddr_2","texBaseAddr_3_8","reserved31c",
"trexInit1", "nccTable0.0", "nccTable0.1", "nccTable0.2",
"nccTable0.3", "nccTable0.4", "nccTable0.5", "nccTable0.6",
/* 0x340 */
"nccTable0.7", "nccTable0.8", "nccTable0.9", "nccTable0.A",
"nccTable0.B", "nccTable1.0", "nccTable1.1", "nccTable1.2",
"nccTable1.3", "nccTable1.4", "nccTable1.5", "nccTable1.6",
"nccTable1.7", "nccTable1.8", "nccTable1.9", "nccTable1.A",
/* 0x380 */
"nccTable1.B"
};
/*************************************
*
* Voodoo Banshee I/O space registers
*
*************************************/
/* 0x000 */
#define io_status (0x000/4) /* */
#define io_pciInit0 (0x004/4) /* */
#define io_sipMonitor (0x008/4) /* */
#define io_lfbMemoryConfig (0x00c/4) /* */
#define io_miscInit0 (0x010/4) /* */
#define io_miscInit1 (0x014/4) /* */
#define io_dramInit0 (0x018/4) /* */
#define io_dramInit1 (0x01c/4) /* */
#define io_agpInit (0x020/4) /* */
#define io_tmuGbeInit (0x024/4) /* */
#define io_vgaInit0 (0x028/4) /* */
#define io_vgaInit1 (0x02c/4) /* */
#define io_dramCommand (0x030/4) /* */
#define io_dramData (0x034/4) /* */
/* 0x040 */
#define io_pllCtrl0 (0x040/4) /* */
#define io_pllCtrl1 (0x044/4) /* */
#define io_pllCtrl2 (0x048/4) /* */
#define io_dacMode (0x04c/4) /* */
#define io_dacAddr (0x050/4) /* */
#define io_dacData (0x054/4) /* */
#define io_rgbMaxDelta (0x058/4) /* */
#define io_vidProcCfg (0x05c/4) /* */
#define io_hwCurPatAddr (0x060/4) /* */
#define io_hwCurLoc (0x064/4) /* */
#define io_hwCurC0 (0x068/4) /* */
#define io_hwCurC1 (0x06c/4) /* */
#define io_vidInFormat (0x070/4) /* */
#define io_vidInStatus (0x074/4) /* */
#define io_vidSerialParallelPort (0x078/4) /* */
#define io_vidInXDecimDeltas (0x07c/4) /* */
/* 0x080 */
#define io_vidInDecimInitErrs (0x080/4) /* */
#define io_vidInYDecimDeltas (0x084/4) /* */
#define io_vidPixelBufThold (0x088/4) /* */
#define io_vidChromaMin (0x08c/4) /* */
#define io_vidChromaMax (0x090/4) /* */
#define io_vidCurrentLine (0x094/4) /* */
#define io_vidScreenSize (0x098/4) /* */
#define io_vidOverlayStartCoords (0x09c/4) /* */
#define io_vidOverlayEndScreenCoord (0x0a0/4) /* */
#define io_vidOverlayDudx (0x0a4/4) /* */
#define io_vidOverlayDudxOffsetSrcWidth (0x0a8/4) /* */
#define io_vidOverlayDvdy (0x0ac/4) /* */
#define io_vgab0 (0x0b0/4) /* */
#define io_vgab4 (0x0b4/4) /* */
#define io_vgab8 (0x0b8/4) /* */
#define io_vgabc (0x0bc/4) /* */
/* 0x0c0 */
#define io_vgac0 (0x0c0/4) /* */
#define io_vgac4 (0x0c4/4) /* */
#define io_vgac8 (0x0c8/4) /* */
#define io_vgacc (0x0cc/4) /* */
#define io_vgad0 (0x0d0/4) /* */
#define io_vgad4 (0x0d4/4) /* */
#define io_vgad8 (0x0d8/4) /* */
#define io_vgadc (0x0dc/4) /* */
#define io_vidOverlayDvdyOffset (0x0e0/4) /* */
#define io_vidDesktopStartAddr (0x0e4/4) /* */
#define io_vidDesktopOverlayStride (0x0e8/4) /* */
#define io_vidInAddr0 (0x0ec/4) /* */
#define io_vidInAddr1 (0x0f0/4) /* */
#define io_vidInAddr2 (0x0f4/4) /* */
#define io_vidInStride (0x0f8/4) /* */
#define io_vidCurrOverlayStartAddr (0x0fc/4) /* */
/*************************************
*
* Register string table for debug
*
*************************************/
static const char *const banshee_io_reg_name[] =
{
/* 0x000 */
"status", "pciInit0", "sipMonitor", "lfbMemoryConfig",
"miscInit0", "miscInit1", "dramInit0", "dramInit1",
"agpInit", "tmuGbeInit", "vgaInit0", "vgaInit1",
"dramCommand", "dramData", "reserved38", "reserved3c",
/* 0x040 */
"pllCtrl0", "pllCtrl1", "pllCtrl2", "dacMode",
"dacAddr", "dacData", "rgbMaxDelta", "vidProcCfg",
"hwCurPatAddr", "hwCurLoc", "hwCurC0", "hwCurC1",
"vidInFormat", "vidInStatus", "vidSerialParallelPort","vidInXDecimDeltas",
/* 0x080 */
"vidInDecimInitErrs","vidInYDecimDeltas","vidPixelBufThold","vidChromaMin",
"vidChromaMax", "vidCurrentLine","vidScreenSize","vidOverlayStartCoords",
"vidOverlayEndScreenCoord","vidOverlayDudx","vidOverlayDudxOffsetSrcWidth","vidOverlayDvdy",
"vga[b0]", "vga[b4]", "vga[b8]", "vga[bc]",
/* 0x0c0 */
"vga[c0]", "vga[c4]", "vga[c8]", "vga[cc]",
"vga[d0]", "vga[d4]", "vga[d8]", "vga[dc]",
"vidOverlayDvdyOffset","vidDesktopStartAddr","vidDesktopOverlayStride","vidInAddr0",
"vidInAddr1", "vidInAddr2", "vidInStride", "vidCurrOverlayStartAddr"
};
/*************************************
*
* Voodoo Banshee AGP space registers
*
*************************************/
/* 0x000 */
#define agpReqSize (0x000/4) /* */
#define agpHostAddressLow (0x004/4) /* */
#define agpHostAddressHigh (0x008/4) /* */
#define agpGraphicsAddress (0x00c/4) /* */
#define agpGraphicsStride (0x010/4) /* */
#define agpMoveCMD (0x014/4) /* */
#define cmdBaseAddr0 (0x020/4) /* */
#define cmdBaseSize0 (0x024/4) /* */
#define cmdBump0 (0x028/4) /* */
#define cmdRdPtrL0 (0x02c/4) /* */
#define cmdRdPtrH0 (0x030/4) /* */
#define cmdAMin0 (0x034/4) /* */
#define cmdAMax0 (0x03c/4) /* */
/* 0x040 */
#define cmdFifoDepth0 (0x044/4) /* */
#define cmdHoleCnt0 (0x048/4) /* */
#define cmdBaseAddr1 (0x050/4) /* */
#define cmdBaseSize1 (0x054/4) /* */
#define cmdBump1 (0x058/4) /* */
#define cmdRdPtrL1 (0x05c/4) /* */
#define cmdRdPtrH1 (0x060/4) /* */
#define cmdAMin1 (0x064/4) /* */
#define cmdAMax1 (0x06c/4) /* */
#define cmdFifoDepth1 (0x074/4) /* */
#define cmdHoleCnt1 (0x078/4) /* */
/* 0x080 */
#define cmdFifoThresh (0x080/4) /* */
#define cmdHoleInt (0x084/4) /* */
/* 0x100 */
#define yuvBaseAddress (0x100/4) /* */
#define yuvStride (0x104/4) /* */
#define crc1 (0x120/4) /* */
#define crc2 (0x130/4) /* */
/*************************************
*
* Register string table for debug
*
*************************************/
static const char *const banshee_agp_reg_name[] =
{
/* 0x000 */
"agpReqSize", "agpHostAddressLow","agpHostAddressHigh","agpGraphicsAddress",
"agpGraphicsStride","agpMoveCMD","reserved18", "reserved1c",
"cmdBaseAddr0", "cmdBaseSize0", "cmdBump0", "cmdRdPtrL0",
"cmdRdPtrH0", "cmdAMin0", "reserved38", "cmdAMax0",
/* 0x040 */
"reserved40", "cmdFifoDepth0","cmdHoleCnt0", "reserved4c",
"cmdBaseAddr1", "cmdBaseSize1", "cmdBump1", "cmdRdPtrL1",
"cmdRdPtrH1", "cmdAMin1", "reserved68", "cmdAMax1",
"reserved70", "cmdFifoDepth1","cmdHoleCnt1", "reserved7c",
/* 0x080 */
"cmdFifoThresh","cmdHoleInt", "reserved88", "reserved8c",
"reserved90", "reserved94", "reserved98", "reserved9c",
"reserveda0", "reserveda4", "reserveda8", "reservedac",
"reservedb0", "reservedb4", "reservedb8", "reservedbc",
/* 0x0c0 */
"reservedc0", "reservedc4", "reservedc8", "reservedcc",
"reservedd0", "reservedd4", "reservedd8", "reserveddc",
"reservede0", "reservede4", "reservede8", "reservedec",
"reservedf0", "reservedf4", "reservedf8", "reservedfc",
/* 0x100 */
"yuvBaseAddress","yuvStride", "reserved108", "reserved10c",
"reserved110", "reserved114", "reserved118", "reserved11c",
"crc1", "reserved124", "reserved128", "reserved12c",
"crc2", "reserved134", "reserved138", "reserved13c"
};
/*************************************
*
* Dithering tables
*
*************************************/
static const Bit8u dither_matrix_4x4[16] =
{
0, 8, 2, 10,
12, 4, 14, 6,
3, 11, 1, 9,
15, 7, 13, 5
};
static const Bit8u dither_matrix_2x2[16] =
{
2, 10, 2, 10,
14, 6, 14, 6,
2, 10, 2, 10,
14, 6, 14, 6
};
/*************************************
*
* Macros for extracting pixels
*
*************************************/
#define EXTRACT_565_TO_888(val, a, b, c) \
(a) = (((val) >> 8) & 0xf8) | (((val) >> 13) & 0x07); \
(b) = (((val) >> 3) & 0xfc) | (((val) >> 9) & 0x03); \
(c) = (((val) << 3) & 0xf8) | (((val) >> 2) & 0x07); \
#define EXTRACT_x555_TO_888(val, a, b, c) \
(a) = (((val) >> 7) & 0xf8) | (((val) >> 12) & 0x07); \
(b) = (((val) >> 2) & 0xf8) | (((val) >> 7) & 0x07); \
(c) = (((val) << 3) & 0xf8) | (((val) >> 2) & 0x07); \
#define EXTRACT_555x_TO_888(val, a, b, c) \
(a) = (((val) >> 8) & 0xf8) | (((val) >> 13) & 0x07); \
(b) = (((val) >> 3) & 0xf8) | (((val) >> 8) & 0x07); \
(c) = (((val) << 2) & 0xf8) | (((val) >> 3) & 0x07); \
#define EXTRACT_1555_TO_8888(val, a, b, c, d) \
(a) = ((Bit16s)(val) >> 15) & 0xff; \
EXTRACT_x555_TO_888(val, b, c, d) \
#define EXTRACT_5551_TO_8888(val, a, b, c, d) \
EXTRACT_555x_TO_888(val, a, b, c) \
(d) = ((val) & 0x0001) ? 0xff : 0x00; \
#define EXTRACT_x888_TO_888(val, a, b, c) \
(a) = ((val) >> 16) & 0xff; \
(b) = ((val) >> 8) & 0xff; \
(c) = ((val) >> 0) & 0xff; \
#define EXTRACT_888x_TO_888(val, a, b, c) \
(a) = ((val) >> 24) & 0xff; \
(b) = ((val) >> 16) & 0xff; \
(c) = ((val) >> 8) & 0xff; \
#define EXTRACT_8888_TO_8888(val, a, b, c, d) \
(a) = ((val) >> 24) & 0xff; \
(b) = ((val) >> 16) & 0xff; \
(c) = ((val) >> 8) & 0xff; \
(d) = ((val) >> 0) & 0xff; \
#define EXTRACT_4444_TO_8888(val, a, b, c, d) \
(a) = (((val) >> 8) & 0xf0) | (((val) >> 12) & 0x0f); \
(b) = (((val) >> 4) & 0xf0) | (((val) >> 8) & 0x0f); \
(c) = (((val) >> 0) & 0xf0) | (((val) >> 4) & 0x0f); \
(d) = (((val) << 4) & 0xf0) | (((val) >> 0) & 0x0f); \
#define EXTRACT_332_TO_888(val, a, b, c) \
(a) = (((val) >> 0) & 0xe0) | (((val) >> 3) & 0x1c) | (((val) >> 6) & 0x03); \
(b) = (((val) << 3) & 0xe0) | (((val) >> 0) & 0x1c) | (((val) >> 3) & 0x03); \
(c) = (((val) << 6) & 0xc0) | (((val) << 4) & 0x30) | (((val) << 2) & 0xc0) | (((val) << 0) & 0x03); \
/*************************************
*
* Misc. macros
*
*************************************/
/* macro for clamping a value between minimum and maximum values */
#define CLAMP(val,min,max) do { if ((val) < (min)) { (val) = (min); } else if ((val) > (max)) { (val) = (max); } } while (0)
/* macro to compute the base 2 log for LOD calculations */
#define LOGB2(x) (log((double)(x)) / log(2.0))
/*************************************
*
* Macros for extracting bitfields
*
*************************************/
#define INITEN_ENABLE_HW_INIT(val) (((val) >> 0) & 1)
#define INITEN_ENABLE_PCI_FIFO(val) (((val) >> 1) & 1)
#define INITEN_REMAP_INIT_TO_DAC(val) (((val) >> 2) & 1)
#define INITEN_ENABLE_SNOOP0(val) (((val) >> 4) & 1)
#define INITEN_SNOOP0_MEMORY_MATCH(val) (((val) >> 5) & 1)
#define INITEN_SNOOP0_READWRITE_MATCH(val) (((val) >> 6) & 1)
#define INITEN_ENABLE_SNOOP1(val) (((val) >> 7) & 1)
#define INITEN_SNOOP1_MEMORY_MATCH(val) (((val) >> 8) & 1)
#define INITEN_SNOOP1_READWRITE_MATCH(val) (((val) >> 9) & 1)
#define INITEN_SLI_BUS_OWNER(val) (((val) >> 10) & 1)
#define INITEN_SLI_ODD_EVEN(val) (((val) >> 11) & 1)
#define INITEN_SECONDARY_REV_ID(val) (((val) >> 12) & 0xf) /* voodoo 2 only */
#define INITEN_MFCTR_FAB_ID(val) (((val) >> 16) & 0xf) /* voodoo 2 only */
#define INITEN_ENABLE_PCI_INTERRUPT(val) (((val) >> 20) & 1) /* voodoo 2 only */
#define INITEN_PCI_INTERRUPT_TIMEOUT(val) (((val) >> 21) & 1) /* voodoo 2 only */
#define INITEN_ENABLE_NAND_TREE_TEST(val) (((val) >> 22) & 1) /* voodoo 2 only */
#define INITEN_ENABLE_SLI_ADDRESS_SNOOP(val) (((val) >> 23) & 1) /* voodoo 2 only */
#define INITEN_SLI_SNOOP_ADDRESS(val) (((val) >> 24) & 0xff) /* voodoo 2 only */
#define FBZCP_CC_RGBSELECT(val) (((val) >> 0) & 3)
#define FBZCP_CC_ASELECT(val) (((val) >> 2) & 3)
#define FBZCP_CC_LOCALSELECT(val) (((val) >> 4) & 1)
#define FBZCP_CCA_LOCALSELECT(val) (((val) >> 5) & 3)
#define FBZCP_CC_LOCALSELECT_OVERRIDE(val) (((val) >> 7) & 1)
#define FBZCP_CC_ZERO_OTHER(val) (((val) >> 8) & 1)
#define FBZCP_CC_SUB_CLOCAL(val) (((val) >> 9) & 1)
#define FBZCP_CC_MSELECT(val) (((val) >> 10) & 7)
#define FBZCP_CC_REVERSE_BLEND(val) (((val) >> 13) & 1)
#define FBZCP_CC_ADD_ACLOCAL(val) (((val) >> 14) & 3)
#define FBZCP_CC_INVERT_OUTPUT(val) (((val) >> 16) & 1)
#define FBZCP_CCA_ZERO_OTHER(val) (((val) >> 17) & 1)
#define FBZCP_CCA_SUB_CLOCAL(val) (((val) >> 18) & 1)
#define FBZCP_CCA_MSELECT(val) (((val) >> 19) & 7)
#define FBZCP_CCA_REVERSE_BLEND(val) (((val) >> 22) & 1)
#define FBZCP_CCA_ADD_ACLOCAL(val) (((val) >> 23) & 3)
#define FBZCP_CCA_INVERT_OUTPUT(val) (((val) >> 25) & 1)
#define FBZCP_CCA_SUBPIXEL_ADJUST(val) (((val) >> 26) & 1)
#define FBZCP_TEXTURE_ENABLE(val) (((val) >> 27) & 1)
#define FBZCP_RGBZW_CLAMP(val) (((val) >> 28) & 1) /* voodoo 2 only */
#define FBZCP_ANTI_ALIAS(val) (((val) >> 29) & 1) /* voodoo 2 only */
#define ALPHAMODE_ALPHATEST(val) (((val) >> 0) & 1)
#define ALPHAMODE_ALPHAFUNCTION(val) (((val) >> 1) & 7)
#define ALPHAMODE_ALPHABLEND(val) (((val) >> 4) & 1)
#define ALPHAMODE_ANTIALIAS(val) (((val) >> 5) & 1)
#define ALPHAMODE_SRCRGBBLEND(val) (((val) >> 8) & 15)
#define ALPHAMODE_DSTRGBBLEND(val) (((val) >> 12) & 15)
#define ALPHAMODE_SRCALPHABLEND(val) (((val) >> 16) & 15)
#define ALPHAMODE_DSTALPHABLEND(val) (((val) >> 20) & 15)
#define ALPHAMODE_ALPHAREF(val) (((val) >> 24) & 0xff)
#define FOGMODE_ENABLE_FOG(val) (((val) >> 0) & 1)
#define FOGMODE_FOG_ADD(val) (((val) >> 1) & 1)
#define FOGMODE_FOG_MULT(val) (((val) >> 2) & 1)
#define FOGMODE_FOG_ZALPHA(val) (((val) >> 3) & 3)
#define FOGMODE_FOG_CONSTANT(val) (((val) >> 5) & 1)
#define FOGMODE_FOG_DITHER(val) (((val) >> 6) & 1) /* voodoo 2 only */
#define FOGMODE_FOG_ZONES(val) (((val) >> 7) & 1) /* voodoo 2 only */
#define FBZMODE_ENABLE_CLIPPING(val) (((val) >> 0) & 1)
#define FBZMODE_ENABLE_CHROMAKEY(val) (((val) >> 1) & 1)
#define FBZMODE_ENABLE_STIPPLE(val) (((val) >> 2) & 1)
#define FBZMODE_WBUFFER_SELECT(val) (((val) >> 3) & 1)
#define FBZMODE_ENABLE_DEPTHBUF(val) (((val) >> 4) & 1)
#define FBZMODE_DEPTH_FUNCTION(val) (((val) >> 5) & 7)
#define FBZMODE_ENABLE_DITHERING(val) (((val) >> 8) & 1)
#define FBZMODE_RGB_BUFFER_MASK(val) (((val) >> 9) & 1)
#define FBZMODE_AUX_BUFFER_MASK(val) (((val) >> 10) & 1)
#define FBZMODE_DITHER_TYPE(val) (((val) >> 11) & 1)
#define FBZMODE_STIPPLE_PATTERN(val) (((val) >> 12) & 1)
#define FBZMODE_ENABLE_ALPHA_MASK(val) (((val) >> 13) & 1)
#define FBZMODE_DRAW_BUFFER(val) (((val) >> 14) & 3)
#define FBZMODE_ENABLE_DEPTH_BIAS(val) (((val) >> 16) & 1)
#define FBZMODE_Y_ORIGIN(val) (((val) >> 17) & 1)
#define FBZMODE_ENABLE_ALPHA_PLANES(val) (((val) >> 18) & 1)
#define FBZMODE_ALPHA_DITHER_SUBTRACT(val) (((val) >> 19) & 1)
#define FBZMODE_DEPTH_SOURCE_COMPARE(val) (((val) >> 20) & 1)
#define FBZMODE_DEPTH_FLOAT_SELECT(val) (((val) >> 21) & 1) /* voodoo 2 only */
#define LFBMODE_WRITE_FORMAT(val) (((val) >> 0) & 0xf)
#define LFBMODE_WRITE_BUFFER_SELECT(val) (((val) >> 4) & 3)
#define LFBMODE_READ_BUFFER_SELECT(val) (((val) >> 6) & 3)
#define LFBMODE_ENABLE_PIXEL_PIPELINE(val) (((val) >> 8) & 1)
#define LFBMODE_RGBA_LANES(val) (((val) >> 9) & 3)
#define LFBMODE_WORD_SWAP_WRITES(val) (((val) >> 11) & 1)
#define LFBMODE_BYTE_SWIZZLE_WRITES(val) (((val) >> 12) & 1)
#define LFBMODE_Y_ORIGIN(val) (((val) >> 13) & 1)
#define LFBMODE_WRITE_W_SELECT(val) (((val) >> 14) & 1)
#define LFBMODE_WORD_SWAP_READS(val) (((val) >> 15) & 1)
#define LFBMODE_BYTE_SWIZZLE_READS(val) (((val) >> 16) & 1)
#define CHROMARANGE_BLUE_EXCLUSIVE(val) (((val) >> 24) & 1)
#define CHROMARANGE_GREEN_EXCLUSIVE(val) (((val) >> 25) & 1)
#define CHROMARANGE_RED_EXCLUSIVE(val) (((val) >> 26) & 1)
#define CHROMARANGE_UNION_MODE(val) (((val) >> 27) & 1)
#define CHROMARANGE_ENABLE(val) (((val) >> 28) & 1)
#define FBIINIT0_VGA_PASSTHRU(val) (((val) >> 0) & 1)
#define FBIINIT0_GRAPHICS_RESET(val) (((val) >> 1) & 1)
#define FBIINIT0_FIFO_RESET(val) (((val) >> 2) & 1)
#define FBIINIT0_SWIZZLE_REG_WRITES(val) (((val) >> 3) & 1)
#define FBIINIT0_STALL_PCIE_FOR_HWM(val) (((val) >> 4) & 1)
#define FBIINIT0_PCI_FIFO_LWM(val) (((val) >> 6) & 0x1f)
#define FBIINIT0_LFB_TO_MEMORY_FIFO(val) (((val) >> 11) & 1)
#define FBIINIT0_TEXMEM_TO_MEMORY_FIFO(val) (((val) >> 12) & 1)
#define FBIINIT0_ENABLE_MEMORY_FIFO(val) (((val) >> 13) & 1)
#define FBIINIT0_MEMORY_FIFO_HWM(val) (((val) >> 14) & 0x7ff)
#define FBIINIT0_MEMORY_FIFO_BURST(val) (((val) >> 25) & 0x3f)
#define FBIINIT1_PCI_DEV_FUNCTION(val) (((val) >> 0) & 1)
#define FBIINIT1_PCI_WRITE_WAIT_STATES(val) (((val) >> 1) & 1)
#define FBIINIT1_MULTI_SST1(val) (((val) >> 2) & 1) /* not on voodoo 2 */
#define FBIINIT1_ENABLE_LFB(val) (((val) >> 3) & 1)
#define FBIINIT1_X_VIDEO_TILES(val) (((val) >> 4) & 0xf)
#define FBIINIT1_VIDEO_TIMING_RESET(val) (((val) >> 8) & 1)
#define FBIINIT1_SOFTWARE_OVERRIDE(val) (((val) >> 9) & 1)
#define FBIINIT1_SOFTWARE_HSYNC(val) (((val) >> 10) & 1)
#define FBIINIT1_SOFTWARE_VSYNC(val) (((val) >> 11) & 1)
#define FBIINIT1_SOFTWARE_BLANK(val) (((val) >> 12) & 1)
#define FBIINIT1_DRIVE_VIDEO_TIMING(val) (((val) >> 13) & 1)
#define FBIINIT1_DRIVE_VIDEO_BLANK(val) (((val) >> 14) & 1)
#define FBIINIT1_DRIVE_VIDEO_SYNC(val) (((val) >> 15) & 1)
#define FBIINIT1_DRIVE_VIDEO_DCLK(val) (((val) >> 16) & 1)
#define FBIINIT1_VIDEO_TIMING_VCLK(val) (((val) >> 17) & 1)
#define FBIINIT1_VIDEO_CLK_2X_DELAY(val) (((val) >> 18) & 3)
#define FBIINIT1_VIDEO_TIMING_SOURCE(val) (((val) >> 20) & 3)
#define FBIINIT1_ENABLE_24BPP_OUTPUT(val) (((val) >> 22) & 1)
#define FBIINIT1_ENABLE_SLI(val) (((val) >> 23) & 1)
#define FBIINIT1_X_VIDEO_TILES_BIT5(val) (((val) >> 24) & 1) /* voodoo 2 only */
#define FBIINIT1_ENABLE_EDGE_FILTER(val) (((val) >> 25) & 1)
#define FBIINIT1_INVERT_VID_CLK_2X(val) (((val) >> 26) & 1)
#define FBIINIT1_VID_CLK_2X_SEL_DELAY(val) (((val) >> 27) & 3)
#define FBIINIT1_VID_CLK_DELAY(val) (((val) >> 29) & 3)
#define FBIINIT1_DISABLE_FAST_READAHEAD(val) (((val) >> 31) & 1)
#define FBIINIT2_DISABLE_DITHER_SUB(val) (((val) >> 0) & 1)
#define FBIINIT2_DRAM_BANKING(val) (((val) >> 1) & 1)
#define FBIINIT2_ENABLE_TRIPLE_BUF(val) (((val) >> 4) & 1)
#define FBIINIT2_ENABLE_FAST_RAS_READ(val) (((val) >> 5) & 1)
#define FBIINIT2_ENABLE_GEN_DRAM_OE(val) (((val) >> 6) & 1)
#define FBIINIT2_ENABLE_FAST_READWRITE(val) (((val) >> 7) & 1)
#define FBIINIT2_ENABLE_PASSTHRU_DITHER(val) (((val) >> 8) & 1)
#define FBIINIT2_SWAP_BUFFER_ALGORITHM(val) (((val) >> 9) & 3)
#define FBIINIT2_VIDEO_BUFFER_OFFSET(val) (((val) >> 11) & 0x1ff)
#define FBIINIT2_ENABLE_DRAM_BANKING(val) (((val) >> 20) & 1)
#define FBIINIT2_ENABLE_DRAM_READ_FIFO(val) (((val) >> 21) & 1)
#define FBIINIT2_ENABLE_DRAM_REFRESH(val) (((val) >> 22) & 1)
#define FBIINIT2_REFRESH_LOAD_VALUE(val) (((val) >> 23) & 0x1ff)
#define FBIINIT3_TRI_REGISTER_REMAP(val) (((val) >> 0) & 1)
#define FBIINIT3_VIDEO_FIFO_THRESH(val) (((val) >> 1) & 0x1f)
#define FBIINIT3_DISABLE_TMUS(val) (((val) >> 6) & 1)
#define FBIINIT3_FBI_MEMORY_TYPE(val) (((val) >> 8) & 7)
#define FBIINIT3_VGA_PASS_RESET_VAL(val) (((val) >> 11) & 1)
#define FBIINIT3_HARDCODE_PCI_BASE(val) (((val) >> 12) & 1)
#define FBIINIT3_FBI2TREX_DELAY(val) (((val) >> 13) & 0xf)
#define FBIINIT3_TREX2FBI_DELAY(val) (((val) >> 17) & 0x1f)
#define FBIINIT3_YORIGIN_SUBTRACT(val) (((val) >> 22) & 0x3ff)
#define FBIINIT4_PCI_READ_WAITS(val) (((val) >> 0) & 1)
#define FBIINIT4_ENABLE_LFB_READAHEAD(val) (((val) >> 1) & 1)
#define FBIINIT4_MEMORY_FIFO_LWM(val) (((val) >> 2) & 0x3f)
#define FBIINIT4_MEMORY_FIFO_START_ROW(val) (((val) >> 8) & 0x3ff)
#define FBIINIT4_MEMORY_FIFO_STOP_ROW(val) (((val) >> 18) & 0x3ff)
#define FBIINIT4_VIDEO_CLOCKING_DELAY(val) (((val) >> 29) & 7) /* voodoo 2 only */
#define FBIINIT5_DISABLE_PCI_STOP(val) (((val) >> 0) & 1) /* voodoo 2 only */
#define FBIINIT5_PCI_SLAVE_SPEED(val) (((val) >> 1) & 1) /* voodoo 2 only */
#define FBIINIT5_DAC_DATA_OUTPUT_WIDTH(val) (((val) >> 2) & 1) /* voodoo 2 only */
#define FBIINIT5_DAC_DATA_17_OUTPUT(val) (((val) >> 3) & 1) /* voodoo 2 only */
#define FBIINIT5_DAC_DATA_18_OUTPUT(val) (((val) >> 4) & 1) /* voodoo 2 only */
#define FBIINIT5_GENERIC_STRAPPING(val) (((val) >> 5) & 0xf) /* voodoo 2 only */
#define FBIINIT5_BUFFER_ALLOCATION(val) (((val) >> 9) & 3) /* voodoo 2 only */
#define FBIINIT5_DRIVE_VID_CLK_SLAVE(val) (((val) >> 11) & 1) /* voodoo 2 only */
#define FBIINIT5_DRIVE_DAC_DATA_16(val) (((val) >> 12) & 1) /* voodoo 2 only */
#define FBIINIT5_VCLK_INPUT_SELECT(val) (((val) >> 13) & 1) /* voodoo 2 only */
#define FBIINIT5_MULTI_CVG_DETECT(val) (((val) >> 14) & 1) /* voodoo 2 only */
#define FBIINIT5_SYNC_RETRACE_READS(val) (((val) >> 15) & 1) /* voodoo 2 only */
#define FBIINIT5_ENABLE_RHBORDER_COLOR(val) (((val) >> 16) & 1) /* voodoo 2 only */
#define FBIINIT5_ENABLE_LHBORDER_COLOR(val) (((val) >> 17) & 1) /* voodoo 2 only */
#define FBIINIT5_ENABLE_BVBORDER_COLOR(val) (((val) >> 18) & 1) /* voodoo 2 only */
#define FBIINIT5_ENABLE_TVBORDER_COLOR(val) (((val) >> 19) & 1) /* voodoo 2 only */
#define FBIINIT5_DOUBLE_HORIZ(val) (((val) >> 20) & 1) /* voodoo 2 only */
#define FBIINIT5_DOUBLE_VERT(val) (((val) >> 21) & 1) /* voodoo 2 only */
#define FBIINIT5_ENABLE_16BIT_GAMMA(val) (((val) >> 22) & 1) /* voodoo 2 only */
#define FBIINIT5_INVERT_DAC_HSYNC(val) (((val) >> 23) & 1) /* voodoo 2 only */
#define FBIINIT5_INVERT_DAC_VSYNC(val) (((val) >> 24) & 1) /* voodoo 2 only */
#define FBIINIT5_ENABLE_24BIT_DACDATA(val) (((val) >> 25) & 1) /* voodoo 2 only */
#define FBIINIT5_ENABLE_INTERLACING(val) (((val) >> 26) & 1) /* voodoo 2 only */
#define FBIINIT5_DAC_DATA_18_CONTROL(val) (((val) >> 27) & 1) /* voodoo 2 only */
#define FBIINIT5_RASTERIZER_UNIT_MODE(val) (((val) >> 30) & 3) /* voodoo 2 only */
#define FBIINIT6_WINDOW_ACTIVE_COUNTER(val) (((val) >> 0) & 7) /* voodoo 2 only */
#define FBIINIT6_WINDOW_DRAG_COUNTER(val) (((val) >> 3) & 0x1f) /* voodoo 2 only */
#define FBIINIT6_SLI_SYNC_MASTER(val) (((val) >> 8) & 1) /* voodoo 2 only */
#define FBIINIT6_DAC_DATA_22_OUTPUT(val) (((val) >> 9) & 3) /* voodoo 2 only */
#define FBIINIT6_DAC_DATA_23_OUTPUT(val) (((val) >> 11) & 3) /* voodoo 2 only */
#define FBIINIT6_SLI_SYNCIN_OUTPUT(val) (((val) >> 13) & 3) /* voodoo 2 only */
#define FBIINIT6_SLI_SYNCOUT_OUTPUT(val) (((val) >> 15) & 3) /* voodoo 2 only */
#define FBIINIT6_DAC_RD_OUTPUT(val) (((val) >> 17) & 3) /* voodoo 2 only */
#define FBIINIT6_DAC_WR_OUTPUT(val) (((val) >> 19) & 3) /* voodoo 2 only */
#define FBIINIT6_PCI_FIFO_LWM_RDY(val) (((val) >> 21) & 0x7f) /* voodoo 2 only */
#define FBIINIT6_VGA_PASS_N_OUTPUT(val) (((val) >> 28) & 3) /* voodoo 2 only */
#define FBIINIT6_X_VIDEO_TILES_BIT0(val) (((val) >> 30) & 1) /* voodoo 2 only */
#define FBIINIT7_GENERIC_STRAPPING(val) (((val) >> 0) & 0xff) /* voodoo 2 only */
#define FBIINIT7_CMDFIFO_ENABLE(val) (((val) >> 8) & 1) /* voodoo 2 only */
#define FBIINIT7_CMDFIFO_MEMORY_STORE(val) (((val) >> 9) & 1) /* voodoo 2 only */
#define FBIINIT7_DISABLE_CMDFIFO_HOLES(val) (((val) >> 10) & 1) /* voodoo 2 only */
#define FBIINIT7_CMDFIFO_READ_THRESH(val) (((val) >> 11) & 0x1f) /* voodoo 2 only */
#define FBIINIT7_SYNC_CMDFIFO_WRITES(val) (((val) >> 16) & 1) /* voodoo 2 only */
#define FBIINIT7_SYNC_CMDFIFO_READS(val) (((val) >> 17) & 1) /* voodoo 2 only */
#define FBIINIT7_RESET_PCI_PACKER(val) (((val) >> 18) & 1) /* voodoo 2 only */
#define FBIINIT7_ENABLE_CHROMA_STUFF(val) (((val) >> 19) & 1) /* voodoo 2 only */
#define FBIINIT7_CMDFIFO_PCI_TIMEOUT(val) (((val) >> 20) & 0x7f) /* voodoo 2 only */
#define FBIINIT7_ENABLE_TEXTURE_BURST(val) (((val) >> 27) & 1) /* voodoo 2 only */
#define TEXMODE_ENABLE_PERSPECTIVE(val) (((val) >> 0) & 1)
#define TEXMODE_MINIFICATION_FILTER(val) (((val) >> 1) & 1)
#define TEXMODE_MAGNIFICATION_FILTER(val) (((val) >> 2) & 1)
#define TEXMODE_CLAMP_NEG_W(val) (((val) >> 3) & 1)
#define TEXMODE_ENABLE_LOD_DITHER(val) (((val) >> 4) & 1)
#define TEXMODE_NCC_TABLE_SELECT(val) (((val) >> 5) & 1)
#define TEXMODE_CLAMP_S(val) (((val) >> 6) & 1)
#define TEXMODE_CLAMP_T(val) (((val) >> 7) & 1)
#define TEXMODE_FORMAT(val) (((val) >> 8) & 0xf)
#define TEXMODE_TC_ZERO_OTHER(val) (((val) >> 12) & 1)
#define TEXMODE_TC_SUB_CLOCAL(val) (((val) >> 13) & 1)
#define TEXMODE_TC_MSELECT(val) (((val) >> 14) & 7)
#define TEXMODE_TC_REVERSE_BLEND(val) (((val) >> 17) & 1)
#define TEXMODE_TC_ADD_ACLOCAL(val) (((val) >> 18) & 3)
#define TEXMODE_TC_INVERT_OUTPUT(val) (((val) >> 20) & 1)
#define TEXMODE_TCA_ZERO_OTHER(val) (((val) >> 21) & 1)
#define TEXMODE_TCA_SUB_CLOCAL(val) (((val) >> 22) & 1)
#define TEXMODE_TCA_MSELECT(val) (((val) >> 23) & 7)
#define TEXMODE_TCA_REVERSE_BLEND(val) (((val) >> 26) & 1)
#define TEXMODE_TCA_ADD_ACLOCAL(val) (((val) >> 27) & 3)
#define TEXMODE_TCA_INVERT_OUTPUT(val) (((val) >> 29) & 1)
#define TEXMODE_TRILINEAR(val) (((val) >> 30) & 1)
#define TEXMODE_SEQ_8_DOWNLD(val) (((val) >> 31) & 1)
#define TEXLOD_LODMIN(val) (((val) >> 0) & 0x3f)
#define TEXLOD_LODMAX(val) (((val) >> 6) & 0x3f)
#define TEXLOD_LODBIAS(val) (((val) >> 12) & 0x3f)
#define TEXLOD_LOD_ODD(val) (((val) >> 18) & 1)
#define TEXLOD_LOD_TSPLIT(val) (((val) >> 19) & 1)
#define TEXLOD_LOD_S_IS_WIDER(val) (((val) >> 20) & 1)
#define TEXLOD_LOD_ASPECT(val) (((val) >> 21) & 3)
#define TEXLOD_LOD_ZEROFRAC(val) (((val) >> 23) & 1)
#define TEXLOD_TMULTIBASEADDR(val) (((val) >> 24) & 1)
#define TEXLOD_TDATA_SWIZZLE(val) (((val) >> 25) & 1)
#define TEXLOD_TDATA_SWAP(val) (((val) >> 26) & 1)
#define TEXLOD_TDIRECT_WRITE(val) (((val) >> 27) & 1) /* Voodoo 2 only */
#define TEXDETAIL_DETAIL_MAX(val) (((val) >> 0) & 0xff)
#define TEXDETAIL_DETAIL_BIAS(val) (((val) >> 8) & 0x3f)
#define TEXDETAIL_DETAIL_SCALE(val) (((val) >> 14) & 7)
#define TEXDETAIL_RGB_MIN_FILTER(val) (((val) >> 17) & 1) /* Voodoo 2 only */
#define TEXDETAIL_RGB_MAG_FILTER(val) (((val) >> 18) & 1) /* Voodoo 2 only */
#define TEXDETAIL_ALPHA_MIN_FILTER(val) (((val) >> 19) & 1) /* Voodoo 2 only */
#define TEXDETAIL_ALPHA_MAG_FILTER(val) (((val) >> 20) & 1) /* Voodoo 2 only */
#define TEXDETAIL_SEPARATE_RGBA_FILTER(val) (((val) >> 21) & 1) /* Voodoo 2 only */
#define TREXINIT_SEND_TMU_CONFIG(val) (((val) >> 18) & 1)
/*************************************
*
* Core types
*
*************************************/
typedef struct _voodoo_state voodoo_state;
typedef struct _poly_extra_data poly_extra_data;
typedef Bit32u rgb_t;
typedef struct _rgba rgba;
#define LSB_FIRST
struct _rgba
{
#ifdef LSB_FIRST
Bit8u b, g, r, a;
#else
Bit8u a, r, g, b;
#endif
};
typedef union _voodoo_reg voodoo_reg;
union _voodoo_reg
{
Bit32s i;
Bit32u u;
float f;
rgba rgb;
};
typedef voodoo_reg rgb_union;
/* note that this structure is an even 64 bytes long */
typedef struct _stats_block stats_block;
struct _stats_block
{
Bit32s pixels_in; /* pixels in statistic */
Bit32s pixels_out; /* pixels out statistic */
Bit32s chroma_fail; /* chroma test fail statistic */
Bit32s zfunc_fail; /* z function test fail statistic */
Bit32s afunc_fail; /* alpha function test fail statistic */
Bit32s clip_fail; /* clipping fail statistic */
Bit32s stipple_count; /* stipple statistic */
Bit32s filler[64/4 - 7]; /* pad this structure to 64 bytes */
};
typedef struct _fifo_state fifo_state;
struct _fifo_state
{
Bit32u* base; /* base of the FIFO */
Bit32s size; /* size of the FIFO */
Bit32s in; /* input pointer */
Bit32s out; /* output pointer */
};
typedef struct _cmdfifo_info cmdfifo_info;
struct _cmdfifo_info
{
bx_bool enable; /* enabled? */
Bit8u count_holes; /* count holes? */
Bit32u base; /* base address in framebuffer RAM */
Bit32u end; /* end address in framebuffer RAM */
Bit32u rdptr; /* current read pointer */
Bit32u amin; /* minimum address */
Bit32u amax; /* maximum address */
Bit32u depth; /* current depth */
Bit32u depth_needed; /* depth needed for command */
Bit32u holes; /* number of holes */
#ifdef WIN32
HANDLE event;
#endif
};
typedef struct _pci_state pci_state;
struct _pci_state
{
fifo_state fifo; /* PCI FIFO */
Bit32u init_enable; /* initEnable value */
Bit8u stall_state; /* state of the system if we're stalled */
Bit8u op_pending; /* true if an operation is pending */
Bit32u fifo_mem[64*2]; /* memory backing the PCI FIFO */
};
typedef struct _ncc_table ncc_table;
struct _ncc_table
{
bx_bool dirty; /* is the texel lookup dirty? */
voodoo_reg* reg; /* pointer to our registers */
Bit32s ir[4], ig[4], ib[4]; /* I values for R,G,B */
Bit32s qr[4], qg[4], qb[4]; /* Q values for R,G,B */
Bit32s y[16]; /* Y values */
rgb_t * palette; /* pointer to associated RGB palette */
rgb_t * palettea; /* pointer to associated ARGB palette */
rgb_t texel[256]; /* texel lookup */
};
typedef struct _tmu_state tmu_state;
struct _tmu_state
{
Bit8u* ram; /* pointer to our RAM */
Bit32u mask; /* mask to apply to pointers */
voodoo_reg* reg; /* pointer to our register base */
bx_bool regdirty; /* true if the LOD/mode/base registers have changed */
Bit32u texaddr_mask; /* mask for texture address */
Bit8u texaddr_shift; /* shift for texture address */
Bit64s starts, startt; /* starting S,T (14.18) */
Bit64s startw; /* starting W (2.30) */
Bit64s dsdx, dtdx; /* delta S,T per X */
Bit64s dwdx; /* delta W per X */
Bit64s dsdy, dtdy; /* delta S,T per Y */
Bit64s dwdy; /* delta W per Y */
Bit32s lodmin, lodmax; /* min, max LOD values */
Bit32s lodbias; /* LOD bias */
Bit32u lodmask; /* mask of available LODs */
Bit32u lodoffset[9]; /* offset of texture base for each LOD */
Bit32s detailmax; /* detail clamp */
Bit32s detailbias; /* detail bias */
Bit8u detailscale; /* detail scale */
Bit32u wmask; /* mask for the current texture width */
Bit32u hmask; /* mask for the current texture height */
Bit32u bilinear_mask; /* mask for bilinear resolution (0xf0 for V1, 0xff for V2) */
ncc_table ncc[2]; /* two NCC tables */
rgb_t * lookup; /* currently selected lookup */
rgb_t * texel[16]; /* texel lookups for each format */
rgb_t palette[256]; /* palette lookup table */
rgb_t palettea[256]; /* palette+alpha lookup table */
};
typedef struct _tmu_shared_state tmu_shared_state;
struct _tmu_shared_state
{
rgb_t rgb332[256]; /* RGB 3-3-2 lookup table */
rgb_t alpha8[256]; /* alpha 8-bit lookup table */
rgb_t int8[256]; /* intensity 8-bit lookup table */
rgb_t ai44[256]; /* alpha, intensity 4-4 lookup table */
rgb_t rgb565[65536]; /* RGB 5-6-5 lookup table */
rgb_t argb1555[65536]; /* ARGB 1-5-5-5 lookup table */
rgb_t argb4444[65536]; /* ARGB 4-4-4-4 lookup table */
};
typedef struct _setup_vertex setup_vertex;
struct _setup_vertex
{
float x, y; /* X, Y coordinates */
float a, r, g, b; /* A, R, G, B values */
float z, wb; /* Z and broadcast W values */
float w0, s0, t0; /* W, S, T for TMU 0 */
float w1, s1, t1; /* W, S, T for TMU 1 */
};
typedef struct _fbi_state fbi_state;
struct _fbi_state
{
Bit8u * ram; /* pointer to frame buffer RAM */
Bit32u mask; /* mask to apply to pointers */
Bit32u rgboffs[3]; /* word offset to 3 RGB buffers */
Bit32u auxoffs; /* word offset to 1 aux buffer */
Bit8u frontbuf; /* front buffer index */
Bit8u backbuf; /* back buffer index */
Bit8u swaps_pending; /* number of pending swaps */
bx_bool video_changed; /* did the frontbuffer video change? */
Bit32u yorigin; /* Y origin subtract value */
Bit32u lfb_base; /* base of LFB in memory */
Bit8u lfb_stride; /* stride of LFB accesses in bits */
Bit32u width; /* width of current frame buffer */
Bit32u height; /* height of current frame buffer */
Bit32u xoffs; /* horizontal offset (back porch) */
Bit32u yoffs; /* vertical offset (back porch) */
Bit32u vsyncscan; /* vertical sync scanline */
Bit32u rowpixels; /* pixels per row */
Bit32u tile_width; /* width of video tiles */
Bit32u tile_height; /* height of video tiles */
Bit32u x_tiles; /* number of tiles in the X direction */
Bit8u vblank; /* VBLANK state */
Bit8u vblank_count; /* number of VBLANKs since last swap */
bx_bool vblank_swap_pending; /* a swap is pending, waiting for a vblank */
Bit8u vblank_swap; /* swap when we hit this count */
Bit8u vblank_dont_swap; /* don't actually swap when we hit this point */
/* triangle setup info */
bx_bool cheating_allowed; /* allow cheating? */
Bit32s sign; /* triangle sign */
Bit16s ax, ay; /* vertex A x,y (12.4) */
Bit16s bx, by; /* vertex B x,y (12.4) */
Bit16s cx, cy; /* vertex C x,y (12.4) */
Bit32s startr, startg, startb, starta; /* starting R,G,B,A (12.12) */
Bit32s startz; /* starting Z (20.12) */
Bit64s startw; /* starting W (16.32) */
Bit32s drdx, dgdx, dbdx, dadx; /* delta R,G,B,A per X */
Bit32s dzdx; /* delta Z per X */
Bit64s dwdx; /* delta W per X */
Bit32s drdy, dgdy, dbdy, dady; /* delta R,G,B,A per Y */
Bit32s dzdy; /* delta Z per Y */
Bit64s dwdy; /* delta W per Y */
stats_block lfb_stats; /* LFB-access statistics */
Bit8u sverts; /* number of vertices ready */
setup_vertex svert[3]; /* 3 setup vertices */
fifo_state fifo; /* framebuffer memory fifo */
cmdfifo_info cmdfifo[2]; /* command FIFOs */
Bit8u fogblend[64]; /* 64-entry fog table */
Bit8u fogdelta[64]; /* 64-entry fog table */
Bit8u fogdelta_mask; /* mask for for delta (0xff for V1, 0xfc for V2) */
rgb_t pen[65536]; /* mapping from pixels to pens */
rgb_t clut[512]; /* clut gamma data */
bx_bool clut_dirty; /* do we need to recompute? */
};
typedef struct _dac_state dac_state;
struct _dac_state
{
Bit8u reg[8]; /* 8 registers */
Bit8u read_result; /* pending read result */
Bit8u data_size;
Bit8u clk0_m;
Bit8u clk0_n;
Bit8u clk0_p;
Bit32u clk0_freq;
};
typedef struct _raster_info raster_info;
struct _raster_info
{
struct _raster_info *next; /* pointer to next entry with the same hash */
poly_draw_scanline_func callback; /* callback pointer */
Bit8u is_generic; /* true if this is one of the generic rasterizers */
Bit8u display; /* display index */
Bit32u hits; /* how many hits (pixels) we've used this for */
Bit32u polys; /* how many polys we've used this for */
Bit32u eff_color_path; /* effective fbzColorPath value */
Bit32u eff_alpha_mode; /* effective alphaMode value */
Bit32u eff_fog_mode; /* effective fogMode value */
Bit32u eff_fbz_mode; /* effective fbzMode value */
Bit32u eff_tex_mode_0; /* effective textureMode value for TMU #0 */
Bit32u eff_tex_mode_1; /* effective textureMode value for TMU #1 */
};
struct _poly_extra_data
{
voodoo_state* state; /* pointer back to the voodoo state */
raster_info* info; /* pointer to rasterizer information */
Bit16s ax, ay; /* vertex A x,y (12.4) */
Bit32s startr, startg, startb, starta; /* starting R,G,B,A (12.12) */
Bit32s startz; /* starting Z (20.12) */
Bit64s startw; /* starting W (16.32) */
Bit32s drdx, dgdx, dbdx, dadx; /* delta R,G,B,A per X */
Bit32s dzdx; /* delta Z per X */
Bit64s dwdx; /* delta W per X */
Bit32s drdy, dgdy, dbdy, dady; /* delta R,G,B,A per Y */
Bit32s dzdy; /* delta Z per Y */
Bit64s dwdy; /* delta W per Y */
Bit64s starts0, startt0; /* starting S,T (14.18) */
Bit64s startw0; /* starting W (2.30) */
Bit64s ds0dx, dt0dx; /* delta S,T per X */
Bit64s dw0dx; /* delta W per X */
Bit64s ds0dy, dt0dy; /* delta S,T per Y */
Bit64s dw0dy; /* delta W per Y */
Bit32s lodbase0; /* used during rasterization */
Bit64s starts1, startt1; /* starting S,T (14.18) */
Bit64s startw1; /* starting W (2.30) */
Bit64s ds1dx, dt1dx; /* delta S,T per X */
Bit64s dw1dx; /* delta W per X */
Bit64s ds1dy, dt1dy; /* delta S,T per Y */
Bit64s dw1dy; /* delta W per Y */
Bit32s lodbase1; /* used during rasterization */
Bit16u dither[16]; /* dither matrix, for fastfill */
};
typedef struct _banshee_info banshee_info;
struct _banshee_info
{
Bit32u io[0x40]; /* I/O registers */
Bit32u agp[0x80]; /* AGP registers */
Bit8u vga[0x20]; /* VGA registers */
Bit8u crtc[0x27]; /* VGA CRTC registers */
Bit8u seq[0x05]; /* VGA sequencer registers */
Bit8u gc[0x05]; /* VGA graphics controller registers */
Bit8u att[0x15]; /* VGA attribute registers */
Bit8u attff; /* VGA attribute flip-flop */
};
/* typedef struct _voodoo_state voodoo_state; -- declared above */
struct _voodoo_state
{
Bit8u index; /* index of board */
Bit8u type; /* type of system */
Bit8u chipmask; /* mask for which chips are available */
Bit32u freq; /* operating frequency */
Bit32u extra_cycles; /* extra cycles not yet accounted for */
int trigger; /* trigger used for stalling */
voodoo_reg reg[0x400]; /* raw registers */
const Bit8u *regaccess; /* register access array */
const char *const *regnames; /* register names array */
Bit8u alt_regmap; /* enable alternate register map? */
pci_state pci; /* PCI state */
dac_state dac; /* DAC state */
fbi_state fbi; /* FBI states */
tmu_state tmu[MAX_TMU]; /* TMU states */
tmu_shared_state tmushare; /* TMU shared state */
banshee_info banshee; /* Banshee state */
Bit32u send_config;
Bit32u tmu_config;
stats_block * thread_stats; /* per-thread statistics */
Bit32u last_status_pc; /* PC of last status description (for logging) */
Bit32u last_status_value; /* value of last status read (for logging) */
int next_rasterizer; /* next rasterizer index */
raster_info rasterizer[MAX_RASTERIZERS]; /* array of rasterizers */
raster_info * raster_hash[RASTER_HASH_SIZE]; /* hash table of rasterizers */
};
/*************************************
*
* Inline FIFO management
*
*************************************/
BX_CPP_INLINE void fifo_reset(fifo_state *f)
{
f->in = f->out = 0;
}
BX_CPP_INLINE void fifo_add(fifo_state *f, Bit32u data)
{
Bit32s next_in;
/* compute the value of 'in' after we add this item */
next_in = f->in + 1;
if (next_in >= f->size)
next_in = 0;
/* as long as it's not equal to the output pointer, we can do it */
if (next_in != f->out)
{
f->base[f->in] = data;
f->in = next_in;
}
}
BX_CPP_INLINE Bit32u fifo_remove(fifo_state *f)
{
Bit32u data = 0xffffffff;
/* as long as we have data, we can do it */
if (f->out != f->in)
{
Bit32s next_out;
/* fetch the data */
data = f->base[f->out];
/* advance the output pointer */
next_out = f->out + 1;
if (next_out >= f->size)
next_out = 0;
f->out = next_out;
}
return data;
}
BX_CPP_INLINE Bit32u fifo_peek(fifo_state *f)
{
return f->base[f->out];
}
BX_CPP_INLINE int fifo_empty(fifo_state *f)
{
return (f->in == f->out);
}
BX_CPP_INLINE int fifo_full(fifo_state *f)
{
return (f->in + 1 == f->out || (f->in == f->size - 1 && f->out == 0));
}
BX_CPP_INLINE Bit32s fifo_items(fifo_state *f)
{
Bit32s items = f->in - f->out;
if (items < 0)
items += f->size;
return items;
}
BX_CPP_INLINE Bit32s fifo_space(fifo_state *f)
{
Bit32s items = f->in - f->out;
if (items < 0)
items += f->size;
return f->size - 1 - items;
}
#ifndef PTR64
#define count_leading_zeros _count_leading_zeros
BX_CPP_INLINE Bit8u _count_leading_zeros(Bit32u value)
{
Bit32s result = 32;
while(value > 0) {
result--;
value >>= 1;
}
return result;
}
#endif
/*************************************
*
* Computes a fast 16.16 reciprocal
* of a 16.32 value; used for
* computing 1/w in the rasterizer.
*
* Since it is trivial to also
* compute log2(1/w) = -log2(w) at
* the same time, we do that as well
* to 16.8 precision for LOD
* calculations.
*
* On a Pentium M, this routine is
* 20% faster than a 64-bit integer
* divide and also produces the log
* for free.
*
*************************************/
BX_CPP_INLINE Bit32s fast_reciplog(Bit64s value, Bit32s *log2)
{
extern Bit32u voodoo_reciplog[];
Bit32u temp, recip, rlog;
Bit32u interp;
Bit32u *table;
int neg = false;
int lz, exp = 0;
/* always work with unsigned numbers */
if (value < 0)
{
value = -value;
neg = true;
}
/* if we've spilled out of 32 bits, push it down under 32 */
if (value & BX_CONST64(0xffff00000000))
{
temp = (Bit32u)(value >> 16);
exp -= 16;
}
else
temp = (Bit32u)value;
/* if the resulting value is 0, the reciprocal is infinite */
if ((temp == 0))
{
*log2 = 1000 << LOG_OUTPUT_PREC;
return neg ? 0x80000000 : 0x7fffffff;
}
/* determine how many leading zeros in the value and shift it up high */
lz = count_leading_zeros(temp);
temp <<= lz;
exp += lz;
/* compute a pointer to the table entries we want */
/* math is a bit funny here because we shift one less than we need to in order */
/* to account for the fact that there are two Bit32u's per table entry */
table = &voodoo_reciplog[(temp >> (31 - RECIPLOG_LOOKUP_BITS - 1)) & ((2 << RECIPLOG_LOOKUP_BITS) - 2)];
/* compute the interpolation value */
interp = (temp >> (31 - RECIPLOG_LOOKUP_BITS - 8)) & 0xff;
/* do a linear interpolatation between the two nearest table values */
/* for both the log and the reciprocal */
rlog = (table[1] * (0x100 - interp) + table[3] * interp) >> 8;
recip = (table[0] * (0x100 - interp) + table[2] * interp) >> 8;
/* the log result is the fractional part of the log; round it to the output precision */
rlog = (rlog + (1 << (RECIPLOG_LOOKUP_PREC - LOG_OUTPUT_PREC - 1))) >> (RECIPLOG_LOOKUP_PREC - LOG_OUTPUT_PREC);
/* the exponent is the non-fractional part of the log; normally, we would subtract it from rlog */
/* but since we want the log(1/value) = -log(value), we subtract rlog from the exponent */
*log2 = ((exp - (31 - RECIPLOG_INPUT_PREC)) << LOG_OUTPUT_PREC) - rlog;
/* adjust the exponent to account for all the reciprocal-related parameters to arrive at a final shift amount */
exp += (RECIP_OUTPUT_PREC - RECIPLOG_LOOKUP_PREC) - (31 - RECIPLOG_INPUT_PREC);
/* shift by the exponent */
if (exp < 0)
recip >>= -exp;
else
recip <<= exp;
/* on the way out, apply the original sign to the reciprocal */
return neg ? -((Bit32s)recip) : recip;
}
/*************************************
*
* Float-to-int conversions
*
*************************************/
BX_CPP_INLINE Bit32s float_to_Bit32s(Bit32u data, int fixedbits)
{
int exponent = ((data >> 23) & 0xff) - 127 - 23 + fixedbits;
Bit32s result = (data & 0x7fffff) | 0x800000;
if (exponent < 0)
{
if (exponent > -32)
result >>= -exponent;
else
result = 0;
}
else
{
if (exponent < 32)
result <<= exponent;
else
result = 0x7fffffff;
}
if (data & 0x80000000)
result = -result;
return result;
}
BX_CPP_INLINE Bit64s float_to_Bit64s(Bit32u data, int fixedbits)
{
int exponent = ((data >> 23) & 0xff) - 127 - 23 + fixedbits;
Bit64s result = (data & 0x7fffff) | 0x800000;
if (exponent < 0)
{
if (exponent > -64)
result >>= -exponent;
else
result = 0;
}
else
{
if (exponent < 64)
result <<= exponent;
else
result = BX_CONST64(0x7fffffffffffffff);
}
if (data & 0x80000000)
result = -result;
return result;
}
/*************************************
*
* Rasterizer inlines
*
*************************************/
BX_CPP_INLINE Bit32u normalize_color_path(Bit32u eff_color_path)
{
/* ignore the subpixel adjust and texture enable flags */
eff_color_path &= ~((1 << 26) | (1 << 27));
return eff_color_path;
}
BX_CPP_INLINE Bit32u normalize_alpha_mode(Bit32u eff_alpha_mode)
{
/* always ignore alpha ref value */
eff_alpha_mode &= ~(0xff << 24);
/* if not doing alpha testing, ignore the alpha function and ref value */
if (!ALPHAMODE_ALPHATEST(eff_alpha_mode))
eff_alpha_mode &= ~(7 << 1);
/* if not doing alpha blending, ignore the source and dest blending factors */
if (!ALPHAMODE_ALPHABLEND(eff_alpha_mode))
eff_alpha_mode &= ~((15 << 8) | (15 << 12) | (15 << 16) | (15 << 20));
return eff_alpha_mode;
}
BX_CPP_INLINE Bit32u normalize_fog_mode(Bit32u eff_fog_mode)
{
/* if not doing fogging, ignore all the other fog bits */
if (!FOGMODE_ENABLE_FOG(eff_fog_mode))
eff_fog_mode = 0;
return eff_fog_mode;
}
BX_CPP_INLINE Bit32u normalize_fbz_mode(Bit32u eff_fbz_mode)
{
/* ignore the draw buffer */
eff_fbz_mode &= ~(3 << 14);
return eff_fbz_mode;
}
BX_CPP_INLINE Bit32u normalize_tex_mode(Bit32u eff_tex_mode)
{
/* ignore the NCC table and seq_8_downld flags */
eff_tex_mode &= ~((1 << 5) | (1 << 31));
/* classify texture formats into 3 format categories */
if (TEXMODE_FORMAT(eff_tex_mode) < 8)
eff_tex_mode = (eff_tex_mode & ~(0xf << 8)) | (0 << 8);
else if (TEXMODE_FORMAT(eff_tex_mode) >= 10 && TEXMODE_FORMAT(eff_tex_mode) <= 12)
eff_tex_mode = (eff_tex_mode & ~(0xf << 8)) | (10 << 8);
else
eff_tex_mode = (eff_tex_mode & ~(0xf << 8)) | (8 << 8);
return eff_tex_mode;
}
BX_CPP_INLINE Bit32u compute_raster_hash(const raster_info *info)
{
Bit32u hash;
/* make a hash */
hash = info->eff_color_path;
hash = (hash << 1) | (hash >> 31);
hash ^= info->eff_fbz_mode;
hash = (hash << 1) | (hash >> 31);
hash ^= info->eff_alpha_mode;
hash = (hash << 1) | (hash >> 31);
hash ^= info->eff_fog_mode;
hash = (hash << 1) | (hash >> 31);
hash ^= info->eff_tex_mode_0;
hash = (hash << 1) | (hash >> 31);
hash ^= info->eff_tex_mode_1;
return hash % RASTER_HASH_SIZE;
}
/*************************************
*
* Dithering macros
*
*************************************/
/* note that these equations and the dither matrixes have
been confirmed to be exact matches to the real hardware */
#define DITHER_RB(val,dith) ((((val) << 1) - ((val) >> 4) + ((val) >> 7) + (dith)) >> 1)
#define DITHER_G(val,dith) ((((val) << 2) - ((val) >> 4) + ((val) >> 6) + (dith)) >> 2)
#define DECLARE_DITHER_POINTERS \
const Bit8u *dither_lookup = NULL; \
const Bit8u *dither4 = NULL; \
const Bit8u *dither = NULL \
#define COMPUTE_DITHER_POINTERS(FBZMODE, YY) \
do \
{ \
/* compute the dithering pointers */ \
if (FBZMODE_ENABLE_DITHERING(FBZMODE)) \
{ \
dither4 = &dither_matrix_4x4[((YY) & 3) * 4]; \
if (FBZMODE_DITHER_TYPE(FBZMODE) == 0) \
{ \
dither = dither4; \
dither_lookup = &dither4_lookup[(YY & 3) << 11]; \
} \
else \
{ \
dither = &dither_matrix_2x2[((YY) & 3) * 4]; \
dither_lookup = &dither2_lookup[(YY & 3) << 11]; \
} \
} \
} \
while (0)
#define APPLY_DITHER(FBZMODE, XX, DITHER_LOOKUP, RR, GG, BB) \
do \
{ \
/* apply dithering */ \
if (FBZMODE_ENABLE_DITHERING(FBZMODE)) \
{ \
/* look up the dither value from the appropriate matrix */ \
const Bit8u *dith = &DITHER_LOOKUP[((XX) & 3) << 1]; \
\
/* apply dithering to R,G,B */ \
(RR) = dith[((RR) << 3) + 0]; \
(GG) = dith[((GG) << 3) + 1]; \
(BB) = dith[((BB) << 3) + 0]; \
} \
else \
{ \
(RR) >>= 3; \
(GG) >>= 2; \
(BB) >>= 3; \
} \
} \
while (0)
/*************************************
*
* Clamping macros
*
*************************************/
#define CLAMPED_ARGB(ITERR, ITERG, ITERB, ITERA, FBZCP, RESULT) \
do \
{ \
Bit32s r = (Bit32s)(ITERR) >> 12; \
Bit32s g = (Bit32s)(ITERG) >> 12; \
Bit32s b = (Bit32s)(ITERB) >> 12; \
Bit32s a = (Bit32s)(ITERA) >> 12; \
\
if (FBZCP_RGBZW_CLAMP(FBZCP) == 0) \
{ \
r &= 0xfff; \
RESULT.rgb.r = r; \
if (r == 0xfff) \
RESULT.rgb.r = 0; \
else if (r == 0x100) \
RESULT.rgb.r = 0xff; \
\
g &= 0xfff; \
RESULT.rgb.g = g; \
if (g == 0xfff) \
RESULT.rgb.g = 0; \
else if (g == 0x100) \
RESULT.rgb.g = 0xff; \
\
b &= 0xfff; \
RESULT.rgb.b = b; \
if (b == 0xfff) \
RESULT.rgb.b = 0; \
else if (b == 0x100) \
RESULT.rgb.b = 0xff; \
\
a &= 0xfff; \
RESULT.rgb.a = a; \
if (a == 0xfff) \
RESULT.rgb.a = 0; \
else if (a == 0x100) \
RESULT.rgb.a = 0xff; \
} \
else \
{ \
RESULT.rgb.r = (r < 0) ? 0 : (r > 0xff) ? 0xff : r; \
RESULT.rgb.g = (g < 0) ? 0 : (g > 0xff) ? 0xff : g; \
RESULT.rgb.b = (b < 0) ? 0 : (b > 0xff) ? 0xff : b; \
RESULT.rgb.a = (a < 0) ? 0 : (a > 0xff) ? 0xff : a; \
} \
} \
while (0)
#define CLAMPED_Z(ITERZ, FBZCP, RESULT) \
do \
{ \
(RESULT) = (Bit32s)(ITERZ) >> 12; \
if (FBZCP_RGBZW_CLAMP(FBZCP) == 0) \
{ \
(RESULT) &= 0xfffff; \
if ((RESULT) == 0xfffff) \
(RESULT) = 0; \
else if ((RESULT) == 0x10000) \
(RESULT) = 0xffff; \
else \
(RESULT) &= 0xffff; \
} \
else \
{ \
CLAMP((RESULT), 0, 0xffff); \
} \
} \
while (0)
#define CLAMPED_W(ITERW, FBZCP, RESULT) \
do \
{ \
(RESULT) = (Bit16s)((ITERW) >> 32); \
if (FBZCP_RGBZW_CLAMP(FBZCP) == 0) \
{ \
(RESULT) &= 0xffff; \
if ((RESULT) == 0xffff) \
(RESULT) = 0; \
else if ((RESULT) == 0x100) \
(RESULT) = 0xff; \
(RESULT) &= 0xff; \
} \
else \
{ \
CLAMP((RESULT), 0, 0xff); \
} \
} \
while (0)
/*************************************
*
* Chroma keying macro
*
*************************************/
#define APPLY_CHROMAKEY(VV, STATS, FBZMODE, COLOR) \
do \
{ \
if (FBZMODE_ENABLE_CHROMAKEY(FBZMODE)) \
{ \
/* non-range version */ \
if (!CHROMARANGE_ENABLE((VV)->reg[chromaRange].u)) \
{ \
if (((COLOR.u ^ (VV)->reg[chromaKey].u) & 0xffffff) == 0) \
{ \
(STATS)->chroma_fail++; \
goto skipdrawdepth; \
} \
} \
\
/* tricky range version */ \
else \
{ \
Bit32s low, high, test; \
int results = 0; \
\
/* check blue */ \
low = (VV)->reg[chromaKey].rgb.b; \
high = (VV)->reg[chromaRange].rgb.b; \
test = COLOR.rgb.b; \
results = (test >= low && test <= high); \
results ^= CHROMARANGE_BLUE_EXCLUSIVE((VV)->reg[chromaRange].u); \
results <<= 1; \
\
/* check green */ \
low = (VV)->reg[chromaKey].rgb.g; \
high = (VV)->reg[chromaRange].rgb.g; \
test = COLOR.rgb.g; \
results |= (test >= low && test <= high); \
results ^= CHROMARANGE_GREEN_EXCLUSIVE((VV)->reg[chromaRange].u); \
results <<= 1; \
\
/* check red */ \
low = (VV)->reg[chromaKey].rgb.r; \
high = (VV)->reg[chromaRange].rgb.r; \
test = COLOR.rgb.r; \
results |= (test >= low && test <= high); \
results ^= CHROMARANGE_RED_EXCLUSIVE((VV)->reg[chromaRange].u); \
\
/* final result */ \
if (CHROMARANGE_UNION_MODE((VV)->reg[chromaRange].u)) \
{ \
if (results != 0) \
{ \
(STATS)->chroma_fail++; \
goto skipdrawdepth; \
} \
} \
else \
{ \
if (results == 7) \
{ \
(STATS)->chroma_fail++; \
goto skipdrawdepth; \
} \
} \
} \
} \
} \
while (0)
/*************************************
*
* Alpha masking macro
*
*************************************/
#define APPLY_ALPHAMASK(VV, STATS, FBZMODE, AA) \
do \
{ \
if (FBZMODE_ENABLE_ALPHA_MASK(FBZMODE)) \
{ \
if (((AA) & 1) == 0) \
{ \
(STATS)->afunc_fail++; \
goto skipdrawdepth; \
} \
} \
} \
while (0)
/*************************************
*
* Alpha testing macro
*
*************************************/
#define APPLY_ALPHATEST(VV, STATS, ALPHAMODE, AA) \
do \
{ \
if (ALPHAMODE_ALPHATEST(ALPHAMODE)) \
{ \
Bit8u alpharef = (VV)->reg[alphaMode].rgb.a; \
switch (ALPHAMODE_ALPHAFUNCTION(ALPHAMODE)) \
{ \
case 0: /* alphaOP = never */ \
(STATS)->afunc_fail++; \
goto skipdrawdepth; \
\
case 1: /* alphaOP = less than */ \
if ((AA) >= alpharef) \
{ \
(STATS)->afunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 2: /* alphaOP = equal */ \
if ((AA) != alpharef) \
{ \
(STATS)->afunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 3: /* alphaOP = less than or equal */ \
if ((AA) > alpharef) \
{ \
(STATS)->afunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 4: /* alphaOP = greater than */ \
if ((AA) <= alpharef) \
{ \
(STATS)->afunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 5: /* alphaOP = not equal */ \
if ((AA) == alpharef) \
{ \
(STATS)->afunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 6: /* alphaOP = greater than or equal */ \
if ((AA) < alpharef) \
{ \
(STATS)->afunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 7: /* alphaOP = always */ \
break; \
} \
} \
} \
while (0)
/*************************************
*
* Alpha blending macro
*
*************************************/
#define APPLY_ALPHA_BLEND(FBZMODE, ALPHAMODE, XX, DITHER, RR, GG, BB, AA) \
do \
{ \
if (ALPHAMODE_ALPHABLEND(ALPHAMODE)) \
{ \
int dpix = dest[XX]; \
int dr = (dpix >> 8) & 0xf8; \
int dg = (dpix >> 3) & 0xfc; \
int db = (dpix << 3) & 0xf8; \
int da = FBZMODE_ENABLE_ALPHA_PLANES(FBZMODE) ? depth[XX] : 0xff; \
int sr = (RR); \
int sg = (GG); \
int sb = (BB); \
int sa = (AA); \
int ta; \
\
/* apply dither subtraction */ \
if (FBZMODE_ALPHA_DITHER_SUBTRACT(FBZMODE)) \
{ \
/* look up the dither value from the appropriate matrix */ \
int dith = DITHER[(XX) & 3]; \
\
/* subtract the dither value */ \
dr = ((dr << 1) + 15 - dith) >> 1; \
dg = ((dg << 2) + 15 - dith) >> 2; \
db = ((db << 1) + 15 - dith) >> 1; \
} \
\
/* compute source portion */ \
switch (ALPHAMODE_SRCRGBBLEND(ALPHAMODE)) \
{ \
default: /* reserved */ \
case 0: /* AZERO */ \
(RR) = (GG) = (BB) = 0; \
break; \
\
case 1: /* ASRC_ALPHA */ \
(RR) = (sr * (sa + 1)) >> 8; \
(GG) = (sg * (sa + 1)) >> 8; \
(BB) = (sb * (sa + 1)) >> 8; \
break; \
\
case 2: /* A_COLOR */ \
(RR) = (sr * (dr + 1)) >> 8; \
(GG) = (sg * (dg + 1)) >> 8; \
(BB) = (sb * (db + 1)) >> 8; \
break; \
\
case 3: /* ADST_ALPHA */ \
(RR) = (sr * (da + 1)) >> 8; \
(GG) = (sg * (da + 1)) >> 8; \
(BB) = (sb * (da + 1)) >> 8; \
break; \
\
case 4: /* AONE */ \
break; \
\
case 5: /* AOMSRC_ALPHA */ \
(RR) = (sr * (0x100 - sa)) >> 8; \
(GG) = (sg * (0x100 - sa)) >> 8; \
(BB) = (sb * (0x100 - sa)) >> 8; \
break; \
\
case 6: /* AOM_COLOR */ \
(RR) = (sr * (0x100 - dr)) >> 8; \
(GG) = (sg * (0x100 - dg)) >> 8; \
(BB) = (sb * (0x100 - db)) >> 8; \
break; \
\
case 7: /* AOMDST_ALPHA */ \
(RR) = (sr * (0x100 - da)) >> 8; \
(GG) = (sg * (0x100 - da)) >> 8; \
(BB) = (sb * (0x100 - da)) >> 8; \
break; \
\
case 15: /* ASATURATE */ \
ta = (sa < (0x100 - da)) ? sa : (0x100 - da); \
(RR) = (sr * (ta + 1)) >> 8; \
(GG) = (sg * (ta + 1)) >> 8; \
(BB) = (sb * (ta + 1)) >> 8; \
break; \
} \
\
/* add in dest portion */ \
switch (ALPHAMODE_DSTRGBBLEND(ALPHAMODE)) \
{ \
default: /* reserved */ \
case 0: /* AZERO */ \
break; \
\
case 1: /* ASRC_ALPHA */ \
(RR) += (dr * (sa + 1)) >> 8; \
(GG) += (dg * (sa + 1)) >> 8; \
(BB) += (db * (sa + 1)) >> 8; \
break; \
\
case 2: /* A_COLOR */ \
(RR) += (dr * (sr + 1)) >> 8; \
(GG) += (dg * (sg + 1)) >> 8; \
(BB) += (db * (sb + 1)) >> 8; \
break; \
\
case 3: /* ADST_ALPHA */ \
(RR) += (dr * (da + 1)) >> 8; \
(GG) += (dg * (da + 1)) >> 8; \
(BB) += (db * (da + 1)) >> 8; \
break; \
\
case 4: /* AONE */ \
(RR) += dr; \
(GG) += dg; \
(BB) += db; \
break; \
\
case 5: /* AOMSRC_ALPHA */ \
(RR) += (dr * (0x100 - sa)) >> 8; \
(GG) += (dg * (0x100 - sa)) >> 8; \
(BB) += (db * (0x100 - sa)) >> 8; \
break; \
\
case 6: /* AOM_COLOR */ \
(RR) += (dr * (0x100 - sr)) >> 8; \
(GG) += (dg * (0x100 - sg)) >> 8; \
(BB) += (db * (0x100 - sb)) >> 8; \
break; \
\
case 7: /* AOMDST_ALPHA */ \
(RR) += (dr * (0x100 - da)) >> 8; \
(GG) += (dg * (0x100 - da)) >> 8; \
(BB) += (db * (0x100 - da)) >> 8; \
break; \
\
case 15: /* A_COLORBEFOREFOG */ \
(RR) += (dr * (prefogr + 1)) >> 8; \
(GG) += (dg * (prefogg + 1)) >> 8; \
(BB) += (db * (prefogb + 1)) >> 8; \
break; \
} \
\
/* blend the source alpha */ \
(AA) = 0; \
if (ALPHAMODE_SRCALPHABLEND(ALPHAMODE) == 4) \
(AA) = sa; \
\
/* blend the dest alpha */ \
if (ALPHAMODE_DSTALPHABLEND(ALPHAMODE) == 4) \
(AA) += da; \
\
/* clamp */ \
CLAMP((RR), 0x00, 0xff); \
CLAMP((GG), 0x00, 0xff); \
CLAMP((BB), 0x00, 0xff); \
CLAMP((AA), 0x00, 0xff); \
} \
} \
while (0)
/*************************************
*
* Fogging macro
*
*************************************/
#define APPLY_FOGGING(VV, FOGMODE, FBZCP, XX, DITHER4, RR, GG, BB, ITERZ, ITERW, ITERAXXX) \
do \
{ \
if (FOGMODE_ENABLE_FOG(FOGMODE)) \
{ \
rgb_union fogcolor = (VV)->reg[fogColor]; \
Bit32s fr, fg, fb; \
\
/* constant fog bypasses everything else */ \
if (FOGMODE_FOG_CONSTANT(FOGMODE)) \
{ \
fr = fogcolor.rgb.r; \
fg = fogcolor.rgb.g; \
fb = fogcolor.rgb.b; \
} \
/* non-constant fog comes from several sources */ \
else \
{ \
Bit32s fogblend = 0; \
\
/* if fog_add is zero, we start with the fog color */ \
if (FOGMODE_FOG_ADD(FOGMODE) == 0) \
{ \
fr = fogcolor.rgb.r; \
fg = fogcolor.rgb.g; \
fb = fogcolor.rgb.b; \
} \
else \
fr = fg = fb = 0; \
\
/* if fog_mult is zero, we subtract the incoming color */ \
if (FOGMODE_FOG_MULT(FOGMODE) == 0) \
{ \
fr -= (RR); \
fg -= (GG); \
fb -= (BB); \
} \
\
/* fog blending mode */ \
switch (FOGMODE_FOG_ZALPHA(FOGMODE)) \
{ \
case 0: /* fog table */ \
{ \
Bit32s delta = (VV)->fbi.fogdelta[wfloat >> 10]; \
Bit32s deltaval; \
\
/* perform the multiply against lower 8 bits of wfloat */ \
deltaval = (delta & (VV)->fbi.fogdelta_mask) * \
((wfloat >> 2) & 0xff); \
\
/* fog zones allow for negating this value */ \
if (FOGMODE_FOG_ZONES(FOGMODE) && (delta & 2)) \
deltaval = -deltaval; \
deltaval >>= 6; \
\
/* apply dither */ \
if (FOGMODE_FOG_DITHER(FOGMODE)) \
deltaval += DITHER4[(XX) & 3]; \
deltaval >>= 4; \
\
/* add to the blending factor */ \
fogblend = (VV)->fbi.fogblend[wfloat >> 10] + deltaval; \
break; \
} \
\
case 1: /* iterated A */ \
fogblend = ITERAXXX.rgb.a; \
break; \
\
case 2: /* iterated Z */ \
CLAMPED_Z((ITERZ), FBZCP, fogblend); \
fogblend >>= 8; \
break; \
\
case 3: /* iterated W - Voodoo 2 only */ \
CLAMPED_W((ITERW), FBZCP, fogblend); \
break; \
} \
\
/* perform the blend */ \
fogblend++; \
fr = (fr * fogblend) >> 8; \
fg = (fg * fogblend) >> 8; \
fb = (fb * fogblend) >> 8; \
} \
\
/* if fog_mult is 0, we add this to the original color */ \
if (FOGMODE_FOG_MULT(FOGMODE) == 0) \
{ \
(RR) += fr; \
(GG) += fg; \
(BB) += fb; \
} \
/* otherwise this just becomes the new color */ \
else \
{ \
(RR) = fr; \
(GG) = fg; \
(BB) = fb; \
} \
\
/* clamp */ \
CLAMP((RR), 0x00, 0xff); \
CLAMP((GG), 0x00, 0xff); \
CLAMP((BB), 0x00, 0xff); \
} \
} \
while (0)
/*************************************
*
* Texture pipeline macro
*
*************************************/
#define TEXTURE_PIPELINE(TT, XX, DITHER4, TEXMODE, COTHER, LOOKUP, LODBASE, ITERS, ITERT, ITERW, RESULT) \
do \
{ \
Bit32s blendr, blendg, blendb, blenda; \
Bit32s tr, tg, tb, ta; \
Bit32s oow, s, t, lod, ilod; \
Bit32s smax, tmax; \
Bit32u texbase; \
rgb_union c_local; \
\
/* determine the S/T/LOD values for this texture */ \
if (TEXMODE_ENABLE_PERSPECTIVE(TEXMODE)) \
{ \
oow = fast_reciplog((ITERW), &lod); \
s = (Bit32s)((Bit64s)oow * (ITERS) >> 29); \
t = (Bit32s)((Bit64s)oow * (ITERT) >> 29); \
lod += (LODBASE); \
} \
else \
{ \
s = (Bit32s)((ITERS) >> 14); \
t = (Bit32s)((ITERT) >> 14); \
lod = (LODBASE); \
} \
\
/* clamp W */ \
if (TEXMODE_CLAMP_NEG_W(TEXMODE) && (ITERW) < 0) \
s = t = 0; \
\
/* clamp the LOD */ \
lod += (TT)->lodbias; \
if (TEXMODE_ENABLE_LOD_DITHER(TEXMODE)) \
lod += DITHER4[(XX) & 3] << 4; \
if (lod < (TT)->lodmin) \
lod = (TT)->lodmin; \
if (lod > (TT)->lodmax) \
lod = (TT)->lodmax; \
\
/* now the LOD is in range; if we don't own this LOD, take the next one */ \
ilod = lod >> 8; \
if (!(((TT)->lodmask >> ilod) & 1)) \
ilod++; \
\
/* fetch the texture base */ \
texbase = (TT)->lodoffset[ilod]; \
\
/* compute the maximum s and t values at this LOD */ \
smax = (TT)->wmask >> ilod; \
tmax = (TT)->hmask >> ilod; \
\
/* determine whether we are point-sampled or bilinear */ \
if ((lod == (TT)->lodmin && !TEXMODE_MAGNIFICATION_FILTER(TEXMODE)) || \
(lod != (TT)->lodmin && !TEXMODE_MINIFICATION_FILTER(TEXMODE))) \
{ \
/* point sampled */ \
\
Bit32u texel0; \
\
/* adjust S/T for the LOD and strip off the fractions */ \
s >>= ilod + 18; \
t >>= ilod + 18; \
\
/* clamp/wrap S/T if necessary */ \
if (TEXMODE_CLAMP_S(TEXMODE)) \
CLAMP(s, 0, smax); \
if (TEXMODE_CLAMP_T(TEXMODE)) \
CLAMP(t, 0, tmax); \
s &= smax; \
t &= tmax; \
t *= smax + 1; \
\
/* fetch texel data */ \
if (TEXMODE_FORMAT(TEXMODE) < 8) \
{ \
texel0 = *(Bit8u *)&(TT)->ram[(texbase + t + s) & (TT)->mask]; \
c_local.u = (LOOKUP)[texel0]; \
} \
else \
{ \
texel0 = *(Bit16u *)&(TT)->ram[(texbase + 2*(t + s)) & (TT)->mask]; \
if (TEXMODE_FORMAT(TEXMODE) >= 10 && TEXMODE_FORMAT(TEXMODE) <= 12) \
c_local.u = (LOOKUP)[texel0]; \
else \
c_local.u = ((LOOKUP)[texel0 & 0xff] & 0xffffff) | \
((texel0 & 0xff00) << 16); \
} \
} \
else \
{ \
/* bilinear filtered */ \
\
Bit32u texel0, texel1, texel2, texel3; \
Bit32u sfrac, tfrac; \
Bit32s s1, t1; \
\
/* adjust S/T for the LOD and strip off all but the low 8 bits of */ \
/* the fraction */ \
s >>= ilod + 10; \
t >>= ilod + 10; \
\
/* also subtract 1/2 texel so that (0.5,0.5) = a full (0,0) texel */ \
s -= 0x80; \
t -= 0x80; \
\
/* extract the fractions */ \
sfrac = s & (TT)->bilinear_mask; \
tfrac = t & (TT)->bilinear_mask; \
\
/* now toss the rest */ \
s >>= 8; \
t >>= 8; \
s1 = s + 1; \
t1 = t + 1; \
\
/* clamp/wrap S/T if necessary */ \
if (TEXMODE_CLAMP_S(TEXMODE)) \
{ \
CLAMP(s, 0, smax); \
CLAMP(s1, 0, smax); \
} \
if (TEXMODE_CLAMP_T(TEXMODE)) \
{ \
CLAMP(t, 0, tmax); \
CLAMP(t1, 0, tmax); \
} \
s &= smax; \
s1 &= smax; \
t &= tmax; \
t1 &= tmax; \
t *= smax + 1; \
t1 *= smax + 1; \
\
/* fetch texel data */ \
if (TEXMODE_FORMAT(TEXMODE) < 8) \
{ \
texel0 = *(Bit8u *)&(TT)->ram[(texbase + t + s) & (TT)->mask]; \
texel1 = *(Bit8u *)&(TT)->ram[(texbase + t + s1) & (TT)->mask]; \
texel2 = *(Bit8u *)&(TT)->ram[(texbase + t1 + s) & (TT)->mask]; \
texel3 = *(Bit8u *)&(TT)->ram[(texbase + t1 + s1) & (TT)->mask]; \
texel0 = (LOOKUP)[texel0]; \
texel1 = (LOOKUP)[texel1]; \
texel2 = (LOOKUP)[texel2]; \
texel3 = (LOOKUP)[texel3]; \
} \
else \
{ \
texel0 = *(Bit16u *)&(TT)->ram[(texbase + 2*(t + s)) & (TT)->mask]; \
texel1 = *(Bit16u *)&(TT)->ram[(texbase + 2*(t + s1)) & (TT)->mask]; \
texel2 = *(Bit16u *)&(TT)->ram[(texbase + 2*(t1 + s)) & (TT)->mask]; \
texel3 = *(Bit16u *)&(TT)->ram[(texbase + 2*(t1 + s1)) & (TT)->mask]; \
if (TEXMODE_FORMAT(TEXMODE) >= 10 && TEXMODE_FORMAT(TEXMODE) <= 12) \
{ \
texel0 = (LOOKUP)[texel0]; \
texel1 = (LOOKUP)[texel1]; \
texel2 = (LOOKUP)[texel2]; \
texel3 = (LOOKUP)[texel3]; \
} \
else \
{ \
texel0 = ((LOOKUP)[texel0 & 0xff] & 0xffffff) | \
((texel0 & 0xff00) << 16); \
texel1 = ((LOOKUP)[texel1 & 0xff] & 0xffffff) | \
((texel1 & 0xff00) << 16); \
texel2 = ((LOOKUP)[texel2 & 0xff] & 0xffffff) | \
((texel2 & 0xff00) << 16); \
texel3 = ((LOOKUP)[texel3 & 0xff] & 0xffffff) | \
((texel3 & 0xff00) << 16); \
} \
} \
\
/* weigh in each texel */ \
c_local.u = rgba_bilinear_filter(texel0, texel1, texel2, texel3, sfrac, tfrac); \
} \
\
/* select zero/other for RGB */ \
if (!TEXMODE_TC_ZERO_OTHER(TEXMODE)) \
{ \
tr = COTHER.rgb.r; \
tg = COTHER.rgb.g; \
tb = COTHER.rgb.b; \
} \
else \
tr = tg = tb = 0; \
\
/* select zero/other for alpha */ \
if (!TEXMODE_TCA_ZERO_OTHER(TEXMODE)) \
ta = COTHER.rgb.a; \
else \
ta = 0; \
\
/* potentially subtract c_local */ \
if (TEXMODE_TC_SUB_CLOCAL(TEXMODE)) \
{ \
tr -= c_local.rgb.r; \
tg -= c_local.rgb.g; \
tb -= c_local.rgb.b; \
} \
if (TEXMODE_TCA_SUB_CLOCAL(TEXMODE)) \
ta -= c_local.rgb.a; \
\
/* blend RGB */ \
switch (TEXMODE_TC_MSELECT(TEXMODE)) \
{ \
default: /* reserved */ \
case 0: /* zero */ \
blendr = blendg = blendb = 0; \
break; \
\
case 1: /* c_local */ \
blendr = c_local.rgb.r; \
blendg = c_local.rgb.g; \
blendb = c_local.rgb.b; \
break; \
\
case 2: /* a_other */ \
blendr = blendg = blendb = COTHER.rgb.a; \
break; \
\
case 3: /* a_local */ \
blendr = blendg = blendb = c_local.rgb.a; \
break; \
\
case 4: /* LOD (detail factor) */ \
if ((TT)->detailbias <= lod) \
blendr = blendg = blendb = 0; \
else \
{ \
blendr = ((((TT)->detailbias - lod) << (TT)->detailscale) >> 8); \
if (blendr > (TT)->detailmax) \
blendr = (TT)->detailmax; \
blendg = blendb = blendr; \
} \
break; \
\
case 5: /* LOD fraction */ \
blendr = blendg = blendb = lod & 0xff; \
break; \
} \
\
/* blend alpha */ \
switch (TEXMODE_TCA_MSELECT(TEXMODE)) \
{ \
default: /* reserved */ \
case 0: /* zero */ \
blenda = 0; \
break; \
\
case 1: /* c_local */ \
blenda = c_local.rgb.a; \
break; \
\
case 2: /* a_other */ \
blenda = COTHER.rgb.a; \
break; \
\
case 3: /* a_local */ \
blenda = c_local.rgb.a; \
break; \
\
case 4: /* LOD (detail factor) */ \
if ((TT)->detailbias <= lod) \
blenda = 0; \
else \
{ \
blenda = ((((TT)->detailbias - lod) << (TT)->detailscale) >> 8); \
if (blenda > (TT)->detailmax) \
blenda = (TT)->detailmax; \
} \
break; \
\
case 5: /* LOD fraction */ \
blenda = lod & 0xff; \
break; \
} \
\
/* reverse the RGB blend */ \
if (!TEXMODE_TC_REVERSE_BLEND(TEXMODE)) \
{ \
blendr ^= 0xff; \
blendg ^= 0xff; \
blendb ^= 0xff; \
} \
\
/* reverse the alpha blend */ \
if (!TEXMODE_TCA_REVERSE_BLEND(TEXMODE)) \
blenda ^= 0xff; \
\
/* do the blend */ \
tr = (tr * (blendr + 1)) >> 8; \
tg = (tg * (blendg + 1)) >> 8; \
tb = (tb * (blendb + 1)) >> 8; \
ta = (ta * (blenda + 1)) >> 8; \
\
/* add clocal or alocal to RGB */ \
switch (TEXMODE_TC_ADD_ACLOCAL(TEXMODE)) \
{ \
case 3: /* reserved */ \
case 0: /* nothing */ \
break; \
\
case 1: /* add c_local */ \
tr += c_local.rgb.r; \
tg += c_local.rgb.g; \
tb += c_local.rgb.b; \
break; \
\
case 2: /* add_alocal */ \
tr += c_local.rgb.a; \
tg += c_local.rgb.a; \
tb += c_local.rgb.a; \
break; \
} \
\
/* add clocal or alocal to alpha */ \
if (TEXMODE_TCA_ADD_ACLOCAL(TEXMODE)) \
ta += c_local.rgb.a; \
\
/* clamp */ \
RESULT.rgb.r = (tr < 0) ? 0 : (tr > 0xff) ? 0xff : tr; \
RESULT.rgb.g = (tg < 0) ? 0 : (tg > 0xff) ? 0xff : tg; \
RESULT.rgb.b = (tb < 0) ? 0 : (tb > 0xff) ? 0xff : tb; \
RESULT.rgb.a = (ta < 0) ? 0 : (ta > 0xff) ? 0xff : ta; \
\
/* invert */ \
if (TEXMODE_TC_INVERT_OUTPUT(TEXMODE)) \
RESULT.u ^= 0x00ffffff; \
if (TEXMODE_TCA_INVERT_OUTPUT(TEXMODE)) \
RESULT.rgb.a ^= 0xff; \
} \
while (0)
/*************************************
*
* Pixel pipeline macros
*
*************************************/
#define PIXEL_PIPELINE_BEGIN(VV, STATS, XX, YY, FBZCOLORPATH, FBZMODE, ITERZ, ITERW) \
do \
{ \
Bit32s depthval, wfloat; \
Bit32s prefogr, prefogg, prefogb; \
Bit32s r, g, b, a; \
\
(STATS)->pixels_in++; \
\
/* apply clipping */ \
/* note that for perf reasons, we assume the caller has done clipping */ \
\
/* handle stippling */ \
if (FBZMODE_ENABLE_STIPPLE(FBZMODE)) \
{ \
/* rotate mode */ \
if (FBZMODE_STIPPLE_PATTERN(FBZMODE) == 0) \
{ \
(VV)->reg[stipple].u = ((VV)->reg[stipple].u << 1) | ((VV)->reg[stipple].u >> 31); \
if (((VV)->reg[stipple].u & 0x80000000) == 0) \
{ \
goto skipdrawdepth; \
} \
} \
\
/* pattern mode */ \
else \
{ \
int stipple_index = (((YY) & 3) << 3) | (~(XX) & 7); \
if ((((VV)->reg[stipple].u >> stipple_index) & 1) == 0) \
{ \
goto skipdrawdepth; \
} \
} \
} \
\
/* compute "floating point" W value (used for depth and fog) */ \
if ((ITERW) & BX_CONST64(0xffff00000000)) \
wfloat = 0x0000; \
else \
{ \
Bit32u temp = (Bit32u)(ITERW); \
if ((temp & 0xffff0000) == 0) \
wfloat = 0xffff; \
else \
{ \
int exp = count_leading_zeros(temp); \
wfloat = ((exp << 12) | ((~temp >> (19 - exp)) & 0xfff)) + 1; \
} \
} \
\
/* compute depth value (W or Z) for this pixel */ \
if (FBZMODE_WBUFFER_SELECT(FBZMODE) == 0) \
CLAMPED_Z(ITERZ, FBZCOLORPATH, depthval); \
else if (FBZMODE_DEPTH_FLOAT_SELECT(FBZMODE) == 0) \
depthval = wfloat; \
else \
{ \
if ((ITERZ) & 0xf0000000) \
depthval = 0x0000; \
else \
{ \
Bit32u temp = (ITERZ) << 4; \
if ((temp & 0xffff0000) == 0) \
depthval = 0xffff; \
else \
{ \
int exp = count_leading_zeros(temp); \
depthval = ((exp << 12) | ((~temp >> (19 - exp)) & 0xfff)) + 1; \
} \
} \
} \
\
/* add the bias */ \
if (FBZMODE_ENABLE_DEPTH_BIAS(FBZMODE)) \
{ \
depthval += (Bit16s)(VV)->reg[zaColor].u; \
CLAMP(depthval, 0, 0xffff); \
} \
\
/* handle depth buffer testing */ \
if (FBZMODE_ENABLE_DEPTHBUF(FBZMODE)) \
{ \
Bit32s depthsource; \
\
/* the source depth is either the iterated W/Z+bias or a */ \
/* constant value */ \
if (FBZMODE_DEPTH_SOURCE_COMPARE(FBZMODE) == 0) \
depthsource = depthval; \
else \
depthsource = (Bit16u)(VV)->reg[zaColor].u; \
\
/* test against the depth buffer */ \
switch (FBZMODE_DEPTH_FUNCTION(FBZMODE)) \
{ \
case 0: /* depthOP = never */ \
(STATS)->zfunc_fail++; \
goto skipdrawdepth; \
\
case 1: /* depthOP = less than */ \
if (depthsource >= depth[XX]) \
{ \
(STATS)->zfunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 2: /* depthOP = equal */ \
if (depthsource != depth[XX]) \
{ \
(STATS)->zfunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 3: /* depthOP = less than or equal */ \
if (depthsource > depth[XX]) \
{ \
(STATS)->zfunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 4: /* depthOP = greater than */ \
if (depthsource <= depth[XX]) \
{ \
(STATS)->zfunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 5: /* depthOP = not equal */ \
if (depthsource == depth[XX]) \
{ \
(STATS)->zfunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 6: /* depthOP = greater than or equal */ \
if (depthsource < depth[XX]) \
{ \
(STATS)->zfunc_fail++; \
goto skipdrawdepth; \
} \
break; \
\
case 7: /* depthOP = always */ \
break; \
} \
}
#define PIXEL_PIPELINE_END(VV, STATS, DITHER, DITHER4, DITHER_LOOKUP, XX, dest, depth, FBZMODE, FBZCOLORPATH, ALPHAMODE, FOGMODE, ITERZ, ITERW, ITERAXXX) \
\
/* perform fogging */ \
prefogr = r; \
prefogg = g; \
prefogb = b; \
APPLY_FOGGING(VV, FOGMODE, FBZCOLORPATH, XX, DITHER4, r, g, b, \
ITERZ, ITERW, ITERAXXX); \
\
/* perform alpha blending */ \
APPLY_ALPHA_BLEND(FBZMODE, ALPHAMODE, XX, DITHER, r, g, b, a); \
\
/* modify the pixel for debugging purposes */ \
MODIFY_PIXEL(VV); \
\
/* write to framebuffer */ \
if (FBZMODE_RGB_BUFFER_MASK(FBZMODE)) \
{ \
/* apply dithering */ \
APPLY_DITHER(FBZMODE, XX, DITHER_LOOKUP, r, g, b); \
dest[XX] = (r << 11) | (g << 5) | b; \
} \
\
/* write to aux buffer */ \
if (depth && FBZMODE_AUX_BUFFER_MASK(FBZMODE)) \
{ \
if (FBZMODE_ENABLE_ALPHA_PLANES(FBZMODE) == 0) \
depth[XX] = depthval; \
else \
depth[XX] = a; \
} \
\
/* track pixel writes to the frame buffer regardless of mask */ \
(STATS)->pixels_out++; \
\
skipdrawdepth: \
; \
} \
while (0)
/*************************************
*
* Colorpath pipeline macro
*
*************************************/
/*
c_other_is_used:
if (FBZMODE_ENABLE_CHROMAKEY(FBZMODE) ||
FBZCP_CC_ZERO_OTHER(FBZCOLORPATH) == 0)
c_local_is_used:
if (FBZCP_CC_SUB_CLOCAL(FBZCOLORPATH) ||
FBZCP_CC_MSELECT(FBZCOLORPATH) == 1 ||
FBZCP_CC_ADD_ACLOCAL(FBZCOLORPATH) == 1)
NEEDS_ITER_RGB:
if ((c_other_is_used && FBZCP_CC_RGBSELECT(FBZCOLORPATH) == 0) ||
(c_local_is_used && (FBZCP_CC_LOCALSELECT_OVERRIDE(FBZCOLORPATH) != 0 || FBZCP_CC_LOCALSELECT(FBZCOLORPATH) == 0))
NEEDS_ITER_A:
if ((a_other_is_used && FBZCP_CC_ASELECT(FBZCOLORPATH) == 0) ||
(a_local_is_used && FBZCP_CCA_LOCALSELECT(FBZCOLORPATH) == 0))
NEEDS_ITER_Z:
if (FBZMODE_WBUFFER_SELECT(FBZMODE) == 0 ||
FBZMODE_DEPTH_FLOAT_SELECT(FBZMODE) != 0 ||
FBZCP_CCA_LOCALSELECT(FBZCOLORPATH) == 2)
*/
/*
Expects the following declarations to be outside of this scope:
Bit32s r, g, b, a;
*/
#define COLORPATH_PIPELINE(VV, STATS, FBZCOLORPATH, FBZMODE, ALPHAMODE, TEXELARGB, ITERZ, ITERW, ITERARGB) \
do \
{ \
Bit32s blendr, blendg, blendb, blenda; \
rgb_union c_other; \
rgb_union c_local; \
\
/* compute c_other */ \
switch (FBZCP_CC_RGBSELECT(FBZCOLORPATH)) \
{ \
case 0: /* iterated RGB */ \
c_other.u = ITERARGB.u; \
break; \
\
case 1: /* texture RGB */ \
c_other.u = TEXELARGB.u; \
break; \
\
case 2: /* color1 RGB */ \
c_other.u = (VV)->reg[color1].u; \
break; \
\
default: /* reserved */ \
c_other.u = 0; \
break; \
} \
\
/* handle chroma key */ \
APPLY_CHROMAKEY(VV, STATS, FBZMODE, c_other); \
\
/* compute a_other */ \
switch (FBZCP_CC_ASELECT(FBZCOLORPATH)) \
{ \
case 0: /* iterated alpha */ \
c_other.rgb.a = ITERARGB.rgb.a; \
break; \
\
case 1: /* texture alpha */ \
c_other.rgb.a = TEXELARGB.rgb.a; \
break; \
\
case 2: /* color1 alpha */ \
c_other.rgb.a = (VV)->reg[color1].rgb.a; \
break; \
\
default: /* reserved */ \
c_other.rgb.a = 0; \
break; \
} \
\
/* handle alpha mask */ \
APPLY_ALPHAMASK(VV, STATS, FBZMODE, c_other.rgb.a); \
\
/* handle alpha test */ \
APPLY_ALPHATEST(VV, STATS, ALPHAMODE, c_other.rgb.a); \
\
/* compute c_local */ \
if (FBZCP_CC_LOCALSELECT_OVERRIDE(FBZCOLORPATH) == 0) \
{ \
if (FBZCP_CC_LOCALSELECT(FBZCOLORPATH) == 0) /* iterated RGB */ \
c_local.u = ITERARGB.u; \
else /* color0 RGB */ \
c_local.u = (VV)->reg[color0].u; \
} \
else \
{ \
if (!(TEXELARGB.rgb.a & 0x80)) /* iterated RGB */ \
c_local.u = ITERARGB.u; \
else /* color0 RGB */ \
c_local.u = (VV)->reg[color0].u; \
} \
\
/* compute a_local */ \
switch (FBZCP_CCA_LOCALSELECT(FBZCOLORPATH)) \
{ \
default: \
case 0: /* iterated alpha */ \
c_local.rgb.a = ITERARGB.rgb.a; \
break; \
\
case 1: /* color0 alpha */ \
c_local.rgb.a = (VV)->reg[color0].rgb.a; \
break; \
\
case 2: /* clamped iterated Z[27:20] */ \
{ \
int temp; \
CLAMPED_Z(ITERZ, FBZCOLORPATH, temp); \
c_local.rgb.a = (Bit8u)temp; \
break; \
} \
\
case 3: /* clamped iterated W[39:32] */ \
{ \
int temp; \
CLAMPED_W(ITERW, FBZCOLORPATH, temp); /* Voodoo 2 only */ \
c_local.rgb.a = (Bit8u)temp; \
break; \
} \
} \
\
/* select zero or c_other */ \
if (FBZCP_CC_ZERO_OTHER(FBZCOLORPATH) == 0) \
{ \
r = c_other.rgb.r; \
g = c_other.rgb.g; \
b = c_other.rgb.b; \
} \
else \
r = g = b = 0; \
\
/* select zero or a_other */ \
if (FBZCP_CCA_ZERO_OTHER(FBZCOLORPATH) == 0) \
a = c_other.rgb.a; \
else \
a = 0; \
\
/* subtract c_local */ \
if (FBZCP_CC_SUB_CLOCAL(FBZCOLORPATH)) \
{ \
r -= c_local.rgb.r; \
g -= c_local.rgb.g; \
b -= c_local.rgb.b; \
} \
\
/* subtract a_local */ \
if (FBZCP_CCA_SUB_CLOCAL(FBZCOLORPATH)) \
a -= c_local.rgb.a; \
\
/* blend RGB */ \
switch (FBZCP_CC_MSELECT(FBZCOLORPATH)) \
{ \
default: /* reserved */ \
case 0: /* 0 */ \
blendr = blendg = blendb = 0; \
break; \
\
case 1: /* c_local */ \
blendr = c_local.rgb.r; \
blendg = c_local.rgb.g; \
blendb = c_local.rgb.b; \
break; \
\
case 2: /* a_other */ \
blendr = blendg = blendb = c_other.rgb.a; \
break; \
\
case 3: /* a_local */ \
blendr = blendg = blendb = c_local.rgb.a; \
break; \
\
case 4: /* texture alpha */ \
blendr = blendg = blendb = TEXELARGB.rgb.a; \
break; \
\
case 5: /* texture RGB (Voodoo 2 only) */ \
blendr = TEXELARGB.rgb.r; \
blendg = TEXELARGB.rgb.g; \
blendb = TEXELARGB.rgb.b; \
break; \
} \
\
/* blend alpha */ \
switch (FBZCP_CCA_MSELECT(FBZCOLORPATH)) \
{ \
default: /* reserved */ \
case 0: /* 0 */ \
blenda = 0; \
break; \
\
case 1: /* a_local */ \
blenda = c_local.rgb.a; \
break; \
\
case 2: /* a_other */ \
blenda = c_other.rgb.a; \
break; \
\
case 3: /* a_local */ \
blenda = c_local.rgb.a; \
break; \
\
case 4: /* texture alpha */ \
blenda = TEXELARGB.rgb.a; \
break; \
} \
\
/* reverse the RGB blend */ \
if (!FBZCP_CC_REVERSE_BLEND(FBZCOLORPATH)) \
{ \
blendr ^= 0xff; \
blendg ^= 0xff; \
blendb ^= 0xff; \
} \
\
/* reverse the alpha blend */ \
if (!FBZCP_CCA_REVERSE_BLEND(FBZCOLORPATH)) \
blenda ^= 0xff; \
\
/* do the blend */ \
r = (r * (blendr + 1)) >> 8; \
g = (g * (blendg + 1)) >> 8; \
b = (b * (blendb + 1)) >> 8; \
a = (a * (blenda + 1)) >> 8; \
\
/* add clocal or alocal to RGB */ \
switch (FBZCP_CC_ADD_ACLOCAL(FBZCOLORPATH)) \
{ \
case 3: /* reserved */ \
case 0: /* nothing */ \
break; \
\
case 1: /* add c_local */ \
r += c_local.rgb.r; \
g += c_local.rgb.g; \
b += c_local.rgb.b; \
break; \
\
case 2: /* add_alocal */ \
r += c_local.rgb.a; \
g += c_local.rgb.a; \
b += c_local.rgb.a; \
break; \
} \
\
/* add clocal or alocal to alpha */ \
if (FBZCP_CCA_ADD_ACLOCAL(FBZCOLORPATH)) \
a += c_local.rgb.a; \
\
/* clamp */ \
CLAMP(r, 0x00, 0xff); \
CLAMP(g, 0x00, 0xff); \
CLAMP(b, 0x00, 0xff); \
CLAMP(a, 0x00, 0xff); \
\
/* invert */ \
if (FBZCP_CC_INVERT_OUTPUT(FBZCOLORPATH)) \
{ \
r ^= 0xff; \
g ^= 0xff; \
b ^= 0xff; \
} \
if (FBZCP_CCA_INVERT_OUTPUT(FBZCOLORPATH)) \
a ^= 0xff; \
} \
while (0)
/*************************************
*
* Rasterizer generator macro
*
*************************************/
#define RASTERIZER(name, TMUS, FBZCOLORPATH, FBZMODE, ALPHAMODE, FOGMODE, TEXMODE0, TEXMODE1) \
\
void raster_##name(void *destbase, Bit32s y, const poly_extent *extent, const void *extradata, int threadid) \
{ \
const poly_extra_data *extra = (const poly_extra_data *)extradata; \
voodoo_state *v = extra->state; \
stats_block *stats = &v->thread_stats[threadid]; \
DECLARE_DITHER_POINTERS; \
Bit32s startx = extent->startx; \
Bit32s stopx = extent->stopx; \
Bit32s iterr, iterg, iterb, itera; \
Bit32s iterz; \
Bit64s iterw, iterw0 = 0, iterw1 = 0; \
Bit64s iters0 = 0, iters1 = 0; \
Bit64s itert0 = 0, itert1 = 0; \
Bit16u *depth; \
Bit16u *dest; \
Bit32s dx, dy; \
Bit32s scry; \
Bit32s x; \
\
/* determine the screen Y */ \
scry = y; \
if (FBZMODE_Y_ORIGIN(FBZMODE)) \
scry = (v->fbi.yorigin - y) & 0x3ff; \
\
/* compute dithering */ \
COMPUTE_DITHER_POINTERS(FBZMODE, y); \
\
/* apply clipping */ \
if (FBZMODE_ENABLE_CLIPPING(FBZMODE)) \
{ \
Bit32s tempclip; \
\
/* Y clipping buys us the whole scanline */ \
if (scry < (Bit32s)((v->reg[clipLowYHighY].u >> 16) & 0x3ff) || \
scry >= (Bit32s)(v->reg[clipLowYHighY].u & 0x3ff)) \
{ \
stats->pixels_in += stopx - startx; \
stats->clip_fail += stopx - startx; \
return; \
} \
\
/* X clipping */ \
tempclip = (v->reg[clipLeftRight].u >> 16) & 0x3ff; \
if (startx < tempclip) \
{ \
stats->pixels_in += tempclip - startx; \
startx = tempclip; \
} \
tempclip = v->reg[clipLeftRight].u & 0x3ff; \
if (stopx >= tempclip) \
{ \
stats->pixels_in += stopx - tempclip; \
stopx = tempclip - 1; \
} \
} \
\
/* get pointers to the target buffer and depth buffer */ \
dest = (Bit16u *)destbase + scry * v->fbi.rowpixels; \
depth = (v->fbi.auxoffs != (Bit32u)~0) ? ((Bit16u *)(v->fbi.ram + v->fbi.auxoffs) + scry * v->fbi.rowpixels) : NULL; \
\
/* compute the starting parameters */ \
dx = startx - (extra->ax >> 4); \
dy = y - (extra->ay >> 4); \
iterr = extra->startr + dy * extra->drdy + dx * extra->drdx; \
iterg = extra->startg + dy * extra->dgdy + dx * extra->dgdx; \
iterb = extra->startb + dy * extra->dbdy + dx * extra->dbdx; \
itera = extra->starta + dy * extra->dady + dx * extra->dadx; \
iterz = extra->startz + dy * extra->dzdy + dx * extra->dzdx; \
iterw = extra->startw + dy * extra->dwdy + dx * extra->dwdx; \
if (TMUS >= 1) \
{ \
iterw0 = extra->startw0 + dy * extra->dw0dy + dx * extra->dw0dx; \
iters0 = extra->starts0 + dy * extra->ds0dy + dx * extra->ds0dx; \
itert0 = extra->startt0 + dy * extra->dt0dy + dx * extra->dt0dx; \
} \
if (TMUS >= 2) \
{ \
iterw1 = extra->startw1 + dy * extra->dw1dy + dx * extra->dw1dx; \
iters1 = extra->starts1 + dy * extra->ds1dy + dx * extra->ds1dx; \
itert1 = extra->startt1 + dy * extra->dt1dy + dx * extra->dt1dx; \
} \
\
/* loop in X */ \
for (x = startx; x < stopx; x++) \
{ \
rgb_union iterargb = { 0 }; \
rgb_union texel = { 0 }; \
\
/* pixel pipeline part 1 handles depth testing and stippling */ \
PIXEL_PIPELINE_BEGIN(v, stats, x, y, FBZCOLORPATH, FBZMODE, \
iterz, iterw); \
\
/* run the texture pipeline on TMU1 to produce a value in texel */ \
/* note that they set LOD min to 8 to "disable" a TMU */ \
if (TMUS >= 2 && v->tmu[1].lodmin < (8 << 8)) \
TEXTURE_PIPELINE(&v->tmu[1], x, dither4, TEXMODE1, texel, \
v->tmu[1].lookup, extra->lodbase1, \
iters1, itert1, iterw1, texel); \
\
/* run the texture pipeline on TMU0 to produce a final */ \
/* result in texel */ \
/* note that they set LOD min to 8 to "disable" a TMU */ \
if (TMUS >= 1 && v->tmu[0].lodmin < (8 << 8)) { \
if (v->send_config==0) \
TEXTURE_PIPELINE(&v->tmu[0], x, dither4, TEXMODE0, texel, \
v->tmu[0].lookup, extra->lodbase0, \
iters0, itert0, iterw0, texel); \
/* send config data to the frame buffer */ \
else texel.u=v->tmu_config; \
} \
/* colorpath pipeline selects source colors and does blending */ \
CLAMPED_ARGB(iterr, iterg, iterb, itera, FBZCOLORPATH, iterargb); \
COLORPATH_PIPELINE(v, stats, FBZCOLORPATH, FBZMODE, ALPHAMODE, texel, \
iterz, iterw, iterargb); \
\
/* pixel pipeline part 2 handles fog, alpha, and final output */ \
PIXEL_PIPELINE_END(v, stats, dither, dither4, dither_lookup, x, dest, depth, \
FBZMODE, FBZCOLORPATH, ALPHAMODE, FOGMODE, \
iterz, iterw, iterargb); \
\
/* update the iterated parameters */ \
iterr += extra->drdx; \
iterg += extra->dgdx; \
iterb += extra->dbdx; \
itera += extra->dadx; \
iterz += extra->dzdx; \
iterw += extra->dwdx; \
if (TMUS >= 1) \
{ \
iterw0 += extra->dw0dx; \
iters0 += extra->ds0dx; \
itert0 += extra->dt0dx; \
} \
if (TMUS >= 2) \
{ \
iterw1 += extra->dw1dx; \
iters1 += extra->ds1dx; \
itert1 += extra->dt1dx; \
} \
} \
}