summaryrefslogtreecommitdiff
path: root/driver/xf86-video-mga/src/mga_exa.c
diff options
context:
space:
mode:
Diffstat (limited to 'driver/xf86-video-mga/src/mga_exa.c')
-rw-r--r--driver/xf86-video-mga/src/mga_exa.c810
1 files changed, 810 insertions, 0 deletions
diff --git a/driver/xf86-video-mga/src/mga_exa.c b/driver/xf86-video-mga/src/mga_exa.c
new file mode 100644
index 000000000..3242ea884
--- /dev/null
+++ b/driver/xf86-video-mga/src/mga_exa.c
@@ -0,0 +1,810 @@
+/*
+ * Copyright 2006 Red Hat, Inc.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software")
+ * to deal in the software without restriction, including without limitation
+ * on the rights to use, copy, modify, merge, publish, distribute, sub
+ * license, and/or sell copies of the Software, and to permit persons to whom
+ * them Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTIBILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES, OR OTHER LIABILITY, WHETHER
+ * IN AN ACTION OF CONTRACT, TORT, OR OTHERWISE, ARISING FROM, OUT OF OR IN
+ * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+ *
+ * Authors:
+ * Adam Jackson <ajax@nwnk.net>
+ * Tilman Sauerbeck <tilman@code-monkey.de>
+ */
+
+/*
+ * Sources:
+ * - mga kdrive accel by Anders Carlsson
+ * - mga g400 Render accel by Damien Ciabrini
+ */
+
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif
+
+#include "xf86.h"
+
+#include "mga.h"
+#include "mga_reg.h"
+#include "mga_macros.h"
+
+#include "exa.h"
+#ifdef XF86DRI
+#include "mga_dri.h"
+#endif
+
+#include "xf86PciInfo.h"
+
+#if 0
+#define DEBUG_MSG(x) ErrorF x
+#else
+#define DEBUG_MSG(x)
+#endif
+
+#define PMGA(x) \
+ MGAPtr pMga = xf86Screens[x->drawable.pScreen->myNum]->driverPrivate;
+
+#define QUIESCE_DMA(x) \
+ CHECK_DMA_QUIESCENT(pMga, xf86Screens[x->drawable.pScreen->myNum]);
+
+/* stuff stolen from mga_storm.c */
+#define BLIT_LEFT 1
+#define BLIT_UP 4
+
+/* FIXME
+ * We could use MGADWG_BLK for GXcopy if HaveSDRAM is FALSE.
+ * That will only work in some situations though (see mga_storm.c
+ * for details).
+ */
+static const CARD32 mgaRop[16] = {
+ /* GXclear */ MGADWG_RPL | 0x00000000, /* 0 */
+ /* GXand */ MGADWG_RSTR | 0x00080000, /* src AND dst */
+ /* GXandReverse */ MGADWG_RSTR | 0x00040000, /* src AND NOT dst */
+ /* GXcopy */ MGADWG_RSTR | 0x000c0000, /* src */
+ /* GXandInverted */ MGADWG_RSTR | 0x00020000, /* NOT src AND dst */
+ /* GXnoop */ MGADWG_RSTR | 0x000a0000, /* dst */
+ /* GXxor */ MGADWG_RSTR | 0x00060000, /* src XOR dst */
+ /* GXor */ MGADWG_RSTR | 0x000e0000, /* src OR dst */
+ /* GXnor */ MGADWG_RSTR | 0x00010000, /* NOT src AND NOT dst */
+ /* GXequiv */ MGADWG_RSTR | 0x00090000, /* NOT src XOR dst */
+ /* GXinvert */ MGADWG_RSTR | 0x00050000, /* NOT dst */
+ /* GXorReverse */ MGADWG_RSTR | 0x000d0000, /* src OR NOT dst */
+ /* GXcopyInverted */ MGADWG_RPL | 0x00030000, /* NOT src */
+ /* GXorInverted */ MGADWG_RSTR | 0x000b0000, /* NOT src OR dst */
+ /* GXnand */ MGADWG_RSTR | 0x00070000, /* NOT src OR NOT dst */
+ /* GXset */ MGADWG_RPL | 0x000f0000 /* 1 */
+};
+
+static const struct {
+ Bool dst_alpha;
+ Bool src_alpha;
+ CARD32 blend_cntl;
+} mgaBlendOp[] = {
+ /* Clear */
+ {0, 0, MGA_SRC_ZERO | MGA_DST_ZERO},
+ /* Src */
+ {0, 0, MGA_SRC_ONE | MGA_DST_ZERO},
+ /* Dst */
+ {0, 0, MGA_SRC_ZERO | MGA_DST_ONE},
+ /* Over */
+ {0, 1, MGA_SRC_ONE | MGA_DST_ONE_MINUS_SRC_ALPHA},
+ /* OverReverse */
+ {1, 0, MGA_SRC_ONE_MINUS_DST_ALPHA | MGA_DST_ONE},
+ /* In */
+ {1, 0, MGA_SRC_DST_ALPHA | MGA_DST_ZERO},
+ /* InReverse */
+ {0, 1, MGA_SRC_ZERO | MGA_DST_SRC_ALPHA},
+ /* Out */
+ {1, 0, MGA_SRC_ONE_MINUS_DST_ALPHA | MGA_DST_ZERO},
+ /* OutReverse */
+ {0, 1, MGA_SRC_ZERO | MGA_DST_ONE_MINUS_SRC_ALPHA},
+ /* Atop */
+ {1, 1, MGA_SRC_DST_ALPHA | MGA_DST_ONE_MINUS_SRC_ALPHA},
+ /* AtopReverse */
+ {1, 1, MGA_SRC_ONE_MINUS_DST_ALPHA | MGA_DST_SRC_ALPHA},
+ /* Xor */
+ {1, 1, MGA_SRC_ONE_MINUS_DST_ALPHA | MGA_DST_ONE_MINUS_SRC_ALPHA},
+ /* Add */
+ {0, 0, MGA_SRC_ONE | MGA_DST_ONE},
+};
+
+static CARD32
+mgaGetPixmapPitch(PixmapPtr pPix)
+{
+ return exaGetPixmapPitch(pPix) / (pPix->drawable.bitsPerPixel >> 3);
+}
+
+static CARD32
+mgaGetMACCESS(PixmapPtr pixmap, PicturePtr pict)
+{
+ switch (pixmap->drawable.bitsPerPixel) {
+ case 8:
+ return MGAMAC_PW8 | MGAMAC_BYPASS332 | MGAMAC_NODITHER;
+ case 16:
+ if (pict &&
+ (pict->format == PICT_x1r5g5b5 || pict->format == PICT_a1r5g5b5))
+ return MGAMAC_PW16 | MGAMAC_DIT555;
+ else
+ return MGAMAC_PW16;
+ case 24:
+ return MGAMAC_PW24;
+ default:
+ return MGAMAC_PW32;
+ }
+}
+
+static Bool
+mgaSetup(MGAPtr pMga, PixmapPtr pixmap, PicturePtr pict, int wait)
+{
+ WAITFIFO(wait + 4);
+
+ /* Set the format of the destination pixmap */
+ OUTREG(MGAREG_MACCESS, mgaGetMACCESS(pixmap, pict));
+
+ OUTREG(MGAREG_CXBNDRY, 0xffff0000);
+ OUTREG(MGAREG_YTOP, 0x00000000);
+ OUTREG(MGAREG_YBOT, 0x007fffff);
+
+ return TRUE;
+}
+
+static void
+mgaNoopDone(PixmapPtr pPixmap)
+{
+}
+
+static Bool
+mgaPrepareSolid(PixmapPtr pPixmap, int alu, Pixel planemask, Pixel fg)
+{
+ PMGA(pPixmap);
+ int dwgctl;
+
+ /* FIXME
+ * Is this needed here? We don't use DMA stuff here...
+ */
+ QUIESCE_DMA(pPixmap);
+
+ /* We must pad planemask and fg depending on the format of the
+ * destination pixmap
+ */
+ switch (pPixmap->drawable.bitsPerPixel) {
+ case 8:
+ fg |= fg << 8;
+ planemask |= planemask << 8;
+ /* fall through */
+ case 16:
+ fg |= fg << 16;
+ planemask |= planemask << 16;
+ break;
+ }
+
+ dwgctl = MGADWG_TRAP | MGADWG_SOLID | MGADWG_ARZERO |
+ MGADWG_SGNZERO | MGADWG_SHIFTZERO | mgaRop[alu];
+
+ mgaSetup(pMga, pPixmap, NULL, 5);
+
+ OUTREG(MGAREG_PITCH, mgaGetPixmapPitch(pPixmap));
+ OUTREG(MGAREG_DSTORG, exaGetPixmapOffset(pPixmap));
+ OUTREG(MGAREG_FCOL, fg);
+ OUTREG(MGAREG_PLNWT, planemask);
+ OUTREG(MGAREG_DWGCTL, dwgctl);
+
+ return TRUE;
+}
+
+static void
+mgaSolid(PixmapPtr pPixmap, int x1, int y1, int x2, int y2)
+{
+ PMGA(pPixmap);
+
+ WAITFIFO(2);
+ OUTREG(MGAREG_FXBNDRY, (x2 << 16) | (x1 & 0xffff));
+ OUTREG(MGAREG_YDSTLEN | MGAREG_EXEC, (y1 << 16) | (y2 - y1));
+}
+
+static Bool
+mgaPrepareCopy(PixmapPtr pSrc, PixmapPtr pDst, int xdir, int ydir, int alu,
+ Pixel planemask)
+{
+ PMGA(pSrc);
+ int blit_direction = 0;
+ int dwgctl = 0;
+
+ /* FIXME
+ * Is this needed here? We don't use DMA stuff here...
+ */
+ QUIESCE_DMA(pSrc);
+
+ DEBUG_MSG(("s: %x@%x d: %x@%x xdir %d ydir %d alu %d pm %d\n",
+ exaGetPixmapOffset(pSrc), exaGetPixmapPitch(pSrc),
+ exaGetPixmapOffset(pDst), exaGetPixmapPitch(pDst),
+ xdir, ydir, alu, planemask));
+
+ if (xdir < 0)
+ blit_direction |= BLIT_LEFT;
+
+ if (ydir < 0)
+ blit_direction |= BLIT_UP;
+
+ pMga->BltScanDirection = blit_direction;
+
+ dwgctl = mgaRop[alu] | MGADWG_SHIFTZERO | MGADWG_BITBLT | MGADWG_BFCOL;
+ pMga->src_pitch = mgaGetPixmapPitch(pSrc);
+
+ mgaSetup(pMga, pDst, NULL, 7);
+ OUTREG(MGAREG_PITCH, mgaGetPixmapPitch(pDst));
+ OUTREG(MGAREG_SRCORG, exaGetPixmapOffset(pSrc));
+ OUTREG(MGAREG_DSTORG, exaGetPixmapOffset(pDst));
+ OUTREG(MGAREG_DWGCTL, dwgctl);
+ OUTREG(MGAREG_SGN, blit_direction);
+ OUTREG(MGAREG_PLNWT, planemask);
+ OUTREG(MGAREG_AR5, (ydir < 0 ? -1 : 1) * pMga->src_pitch);
+
+ return TRUE;
+}
+
+static void
+mgaCopy(PixmapPtr pDst, int srcx, int srcy, int dstx, int dsty, int w, int h)
+{
+ PMGA(pDst);
+ int start, end;
+
+ DEBUG_MSG((" %d,%d -> %d,%d %dx%d\n", srcx, srcy, dstx,dsty, w, h));
+
+ w--;
+
+ if (pMga->BltScanDirection & BLIT_UP) {
+ srcy += h - 1;
+ dsty += h - 1;
+ }
+
+ start = end = srcy * pMga->src_pitch + srcx;
+
+ if (pMga->BltScanDirection & BLIT_LEFT)
+ start += w;
+ else
+ end += w;
+
+ DEBUG_MSG((" end %d start %d dstx %d dsty %d w %d h %d\n",
+ end, start, dstx, dsty, w, h));
+
+ WAITFIFO(4);
+ OUTREG(MGAREG_AR0, end);
+ OUTREG(MGAREG_AR3, start);
+ OUTREG(MGAREG_FXBNDRY, ((dstx + w) << 16) | (dstx & 0xffff));
+ OUTREG(MGAREG_YDSTLEN | MGAREG_EXEC, (dsty << 16) | h);
+}
+
+static int
+MGA_LOG2(int val)
+{
+ int ret = 0;
+
+ if (val == 1)
+ return 0;
+
+ while (val >> ret)
+ ret++;
+
+ return ((1 << (ret - 1)) == val) ? (ret - 1) : ret;
+}
+
+static CARD32
+mgaGetTexFormat(PicturePtr pPict)
+{
+ static const struct {
+ int fmt;
+ CARD32 card_fmt;
+ } *ptr, texformats[] = {
+ { PICT_a8r8g8b8, MGA_TW32 },
+ { PICT_x8r8g8b8, MGA_TW32 },
+ { PICT_r5g6b5, MGA_TW16 },
+ { PICT_a1r5g5b5, MGA_TW15 },
+ { PICT_x1r5g5b5, MGA_TW15 },
+ { PICT_a4r4g4b4, MGA_TW12 },
+ { PICT_x4r4g4b4, MGA_TW12 },
+ { PICT_a8, MGA_TW8A },
+ { 0, 0}
+ };
+
+ for (ptr = texformats; ptr->fmt; ptr++)
+ if (ptr->fmt == pPict->format)
+ return ptr->card_fmt;
+
+ return 0;
+}
+
+static Bool
+mgaCheckSourceTexture(int tmu, PicturePtr pPict)
+{
+ int w = pPict->pDrawable->width;
+ int h = pPict->pDrawable->height;
+
+ if ((w > 2047) || (h > 2047)){
+ DEBUG_MSG(("Picture w/h too large (%dx%d)\n", w, h));
+ return FALSE;
+ }
+
+ if (!mgaGetTexFormat(pPict)) {
+ DEBUG_MSG(("Unsupported picture format 0x%x\n", pPict->format));
+ return FALSE;
+ }
+
+ if (pPict->repeat && ((w & (w - 1)) != 0 || (h & (h - 1)) != 0)) {
+ DEBUG_MSG(("NPOT repeat unsupported (%dx%d)\n", w, h));
+ return FALSE;
+ }
+
+ if (pPict->filter != PictFilterNearest &&
+ pPict->filter != PictFilterBilinear) {
+ DEBUG_MSG(("Unsupported filter 0x%x\n", pPict->filter));
+ return FALSE;
+ }
+
+ return TRUE;
+}
+
+static Bool
+mgaCheckComposite(int op, PicturePtr pSrcPict, PicturePtr pMaskPict,
+ PicturePtr pDstPict)
+{
+ if (op >= sizeof(mgaBlendOp) / sizeof(mgaBlendOp[0])) {
+ DEBUG_MSG(("unsupported op %x\n", op));
+ return FALSE;
+ }
+
+ if (!mgaCheckSourceTexture(0, pSrcPict))
+ return FALSE;
+
+ if (pMaskPict) {
+ if (!mgaCheckSourceTexture(1, pMaskPict))
+ return FALSE;
+
+ if (pMaskPict->componentAlpha) {
+ DEBUG_MSG(("Component alpha unsupported\n"));
+ return FALSE;
+ }
+ }
+
+ if (PICT_FORMAT_TYPE(pDstPict->format) == PICT_TYPE_ABGR) {
+ DEBUG_MSG(("render to (A)BGR unsupported\n"));
+ return FALSE;
+ }
+
+ /* FIXME
+ * Doing this operation in hardware is broken atm :/
+ */
+ if (op == PictOpAdd && pSrcPict->format == PICT_a8 &&
+ pDstPict->format == PICT_a8)
+ return FALSE;
+
+ return TRUE;
+}
+
+static void
+PrepareSourceTexture(int tmu, PicturePtr pSrcPicture, PixmapPtr pSrc)
+{
+ PMGA(pSrc);
+ int pitch = mgaGetPixmapPitch(pSrc);
+ int w = pSrc->drawable.width;
+ int h = pSrc->drawable.height;
+ int w_log2 = MGA_LOG2(w);
+ int h_log2 = MGA_LOG2(h);
+
+ int texctl = MGA_PITCHLIN | ((pitch & (2048 - 1)) << 9) |
+ MGA_NOPERSPECTIVE | MGA_TAKEY;
+ int texctl2 = MGA_G400_TC2_MAGIC | MGA_TC2_CKSTRANSDIS;
+ int texfilter = MGA_FILTERALPHA | (0x10 << 21);
+
+ texctl |= mgaGetTexFormat(pSrcPicture);
+
+ if (pSrcPicture->filter == PictFilterBilinear)
+ texfilter |= MGA_MAG_BILIN | MGA_MIN_BILIN;
+ else
+ texfilter |= MGA_MAG_NRST | MGA_MIN_NRST;
+
+ if (!pSrcPicture->repeat)
+ texctl |= MGA_CLAMPUV;
+
+ if (tmu == 1)
+ texctl2 |= MGA_TC2_DUALTEX | MGA_TC2_SELECT_TMU1;
+
+ WAITFIFO(6);
+ OUTREG(MGAREG_TEXCTL2, texctl2);
+ OUTREG(MGAREG_TEXCTL, texctl);
+
+ /* Source (texture) address + pitch */
+ OUTREG(MGAREG_TEXORG, exaGetPixmapOffset(pSrc));
+ OUTREG(MGAREG_TEXWIDTH, (w - 1) << 18 | ((8 - w_log2) & 63) << 9 | w_log2);
+ OUTREG(MGAREG_TEXHEIGHT, (h - 1) << 18 | ((8 - h_log2) & 63) << 9 | h_log2);
+
+ /* Set blit filtering flags */
+ OUTREG(MGAREG_TEXFILTER, texfilter);
+
+ if (tmu == 1) {
+ WAITFIFO(1);
+ OUTREG(MGAREG_TEXCTL2, texctl2 & ~MGA_TC2_SELECT_TMU1);
+ }
+}
+
+/*
+ * The formals params are the elements of the following matrix:
+ *
+ * Dest Transform Src
+ * coords coords
+ * / Xdst \ / X_incx X_incy X_init \ / Xsrc \
+ * | Ydst | = | Y_incx Y_incy Y_init | x | Ysrc |
+ * \ 1 / \ H_incx H_incy H_init / \ 1 /
+ *
+ * matrix elements are 32bits fixed points (16.16)
+ * mga_fx_* is the size of the fixed point for the TMU
+ */
+static void
+setTMIncrementsRegs(PixmapPtr pPix, int X_incx, int X_incy, int X_init,
+ int Y_incx, int Y_incy, int Y_init,
+ int H_incx, int H_incy, int H_init,
+ int mga_fx_width_size, int mga_fx_height_size)
+{
+ PMGA(pPix);
+
+ int decalw = mga_fx_width_size - 16;
+ int decalh = mga_fx_height_size - 16;
+
+ /* Convert 16 bits fixpoint -> MGA variable size fixpoint */
+ if (decalw >= 0) {
+ X_incx <<= decalw;
+ X_incy <<= decalw;
+ X_init <<= decalw;
+ } else {
+ decalw = -decalw;
+ X_incx >>= decalw;
+ X_incy >>= decalw;
+ X_init >>= decalw;
+ }
+
+ /* Convert 16 bits fixpoint -> MGA variable size fixpoint */
+ if (decalh >= 0) {
+ Y_incx <<= decalh;
+ Y_incy <<= decalh;
+ Y_init <<= decalh;
+ } else {
+ decalh = -decalh;
+ Y_incx >>= decalh;
+ Y_incy >>= decalh;
+ Y_init >>= decalh;
+ }
+
+ /* Set TM registers */
+ WAITFIFO(9);
+ OUTREG(MGAREG_TMR0, X_incx);
+ OUTREG(MGAREG_TMR1, Y_incx);
+ OUTREG(MGAREG_TMR2, X_incy);
+ OUTREG(MGAREG_TMR3, Y_incy);
+ OUTREG(MGAREG_TMR4, H_incx);
+ OUTREG(MGAREG_TMR5, H_incy);
+ OUTREG(MGAREG_TMR6, X_init);
+ OUTREG(MGAREG_TMR7, Y_init);
+ OUTREG(MGAREG_TMR8, H_init);
+}
+
+/* XXX these look like magic */
+#define C_ARG1_CUR 0x0
+#define C_ARG1_ALPHA MGA_TDS_COLOR_ARG1_REPLICATEALPHA
+#define C_ARG2_DIFFUSE MGA_TDS_COLOR_ARG2_DIFFUSE
+#define C_ARG2_FCOL MGA_TDS_COLOR_ARG2_FCOL
+#define C_ARG2_PREV MGA_TDS_COLOR_ARG2_PREVSTAGE
+#define C_ARG1_INV MGA_TDS_COLOR_ARG1_INV
+#define C_ARG2_INV MGA_TDS_COLOR_ARG2_INV
+#define COLOR_MUL MGA_TDS_COLOR_SEL_MUL
+#define COLOR_ARG1 MGA_TDS_COLOR_SEL_ARG1
+#define COLOR_ARG2 MGA_TDS_COLOR_SEL_ARG2
+#define A_ARG1_CUR 0x0
+#define A_ARG2_IGN A_ARG2_DIFFUSE
+#define A_ARG2_FCOL MGA_TDS_ALPHA_ARG2_FCOL
+#define A_ARG2_DIFFUSE MGA_TDS_ALPHA_ARG2_DIFFUSE
+#define A_ARG2_PREV MGA_TDS_ALPHA_ARG2_PREVSTAGE
+#define ALPHA_MUL MGA_TDS_ALPHA_SEL_MUL
+#define ALPHA_ARG1 MGA_TDS_ALPHA_SEL_ARG1
+#define ALPHA_ARG2 MGA_TDS_ALPHA_SEL_ARG2
+
+static Bool
+mgaPrepareComposite(int op, PicturePtr pSrcPict, PicturePtr pMaskPict,
+ PicturePtr pDstPict, PixmapPtr pSrc, PixmapPtr pMask,
+ PixmapPtr pDst)
+{
+ PMGA(pDst);
+ CARD32 fcol = 0xff000000, ds0 = 0, ds1 = 0, cmd, blendcntl;
+
+ mgaSetup(pMga, pDst, pDstPict, 2);
+ OUTREG(MGAREG_DSTORG, exaGetPixmapOffset(pDst));
+ OUTREG(MGAREG_PITCH, mgaGetPixmapPitch(pDst));
+
+ PrepareSourceTexture(0, pSrcPict, pSrc);
+
+ if (pMask)
+ PrepareSourceTexture(1, pMaskPict, pMask);
+ else
+ PrepareSourceTexture(1, pSrcPict, pSrc);
+
+ /* For A8 writes, the desired alpha value needs to be replicated
+ * to the color channels - if the source texture doesn't have an
+ * alpha channel, set it to 0xff instead.
+ * Otherwise, use the color channels if available, or set them
+ * to black.
+ */
+ if (pDstPict->format == PICT_a8 && !PICT_FORMAT_A(pSrcPict->format)) {
+ fcol = 0xffffffff;
+ ds0 |= C_ARG2_FCOL | COLOR_ARG2; /* C = 0xff */
+ } else if (pDstPict->format == PICT_a8)
+ ds0 |= C_ARG1_ALPHA | COLOR_ARG1; /* C = As */
+ else if (pSrcPict->format == PICT_a8)
+ ds0 |= C_ARG2_FCOL | COLOR_ARG2; /* C = 0 */
+ else
+ ds0 |= C_ARG1_CUR | COLOR_ARG1; /* C = Cs */
+
+ /* If the source texture has an alpha channel, use it.
+ * Otherwise, set the alpha channel to 0xff (see FCOL setting above).
+ */
+ if (PICT_FORMAT_A(pSrcPict->format))
+ ds0 |= A_ARG1_CUR | ALPHA_ARG1; /* A = As */
+ else
+ ds0 |= A_ARG2_FCOL | ALPHA_ARG2; /* A = 0xff */
+
+ if (!pMask)
+ ds1 = ds0;
+ else {
+ /* As or Am might be NULL. in this case we don't multiply because,
+ * the alpha component holds garbage.
+ */
+ if (!PICT_FORMAT_A(pMaskPict->format))
+ ds1 |= C_ARG2_PREV | COLOR_ARG2; /* C = Cs */
+ else
+ ds1 |= C_ARG1_ALPHA | C_ARG2_PREV | COLOR_MUL; /* C = Am * Cs */
+
+ if (!PICT_FORMAT_A(pMaskPict->format))
+ ds1 |= A_ARG2_PREV | ALPHA_ARG2; /* A = As */
+ else if (!PICT_FORMAT_A(pSrcPict->format))
+ ds1 |= A_ARG1_CUR | ALPHA_ARG1; /* A = Am */
+ else
+ ds1 |= A_ARG1_CUR | A_ARG2_PREV | ALPHA_MUL; /* A = Am * As */
+ }
+
+ cmd = MGADWG_TEXTURE_TRAP | MGADWG_I | 0x000c0000 |
+ MGADWG_SHIFTZERO | MGADWG_SGNZERO | MGADWG_ARZERO;
+ blendcntl = mgaBlendOp[op].blend_cntl;
+
+ if (!PICT_FORMAT_A(pDstPict->format) && mgaBlendOp[op].dst_alpha) {
+ int sblend = blendcntl & MGA_SRC_BLEND_MASK;
+
+ if (sblend == MGA_SRC_DST_ALPHA)
+ blendcntl = (blendcntl & ~MGA_SRC_BLEND_MASK) | MGA_SRC_ONE;
+ else if (sblend == MGA_SRC_ONE_MINUS_DST_ALPHA)
+ blendcntl = (blendcntl & ~MGA_SRC_BLEND_MASK) | MGA_SRC_ZERO;
+ }
+
+ if (!PICT_FORMAT_A(pSrcPict->format) && mgaBlendOp[op].src_alpha) {
+ int dblend = blendcntl & MGA_DST_BLEND_MASK;
+
+ if (dblend == MGA_DST_SRC_ALPHA)
+ blendcntl = (blendcntl & ~MGA_DST_BLEND_MASK) | MGA_DST_ONE;
+ else if (dblend == MGA_DST_ONE_MINUS_SRC_ALPHA)
+ blendcntl = (blendcntl & ~MGA_DST_BLEND_MASK) | MGA_DST_ZERO;
+ }
+
+ WAITFIFO(5);
+ OUTREG(MGAREG_FCOL, fcol);
+ OUTREG(MGAREG_TDUALSTAGE0, ds0);
+ OUTREG(MGAREG_TDUALSTAGE1, ds1);
+ OUTREG(MGAREG_DWGCTL, cmd);
+ OUTREG(MGAREG_ALPHACTRL, MGA_ALPHACHANNEL | blendcntl);
+
+ pMga->currentSrcPicture = pSrcPict;
+ pMga->currentMaskPicture = pMaskPict;
+ pMga->currentSrc = pSrc;
+ pMga->currentMask = pMask;
+
+ pMga->src_w2 = MGA_LOG2 (pSrc->drawable.width);
+ pMga->src_h2 = MGA_LOG2 (pSrc->drawable.height);
+
+ if (pMask) {
+ pMga->mask_w2 = MGA_LOG2 (pMask->drawable.width);
+ pMga->mask_h2 = MGA_LOG2 (pMask->drawable.height);
+ }
+
+ return TRUE;
+}
+
+static void
+mgaComposite(PixmapPtr pDst, int srcx, int srcy, int maskx, int masky,
+ int dstx, int dsty, int w, int h)
+{
+ PMGA(pDst);
+ PictTransformPtr t;
+ int texctl2;
+
+ srcx %= pMga->currentSrc->drawable.width;
+ srcy %= pMga->currentSrc->drawable.height;
+
+ if (pMga->currentMask) {
+ maskx %= pMga->currentMask->drawable.width;
+ masky %= pMga->currentMask->drawable.height;
+ }
+
+ t = pMga->currentSrcPicture->transform;
+
+ if (t)
+ setTMIncrementsRegs(pMga->currentSrc,
+ t->matrix[0][0],
+ t->matrix[0][1],
+ t->matrix[0][2] + (srcx << 16),
+ t->matrix[1][0],
+ t->matrix[1][1],
+ t->matrix[1][2] + (srcy << 16),
+ t->matrix[2][0],
+ t->matrix[2][1],
+ t->matrix[2][2],
+ 20 - pMga->src_w2,
+ 20 - pMga->src_h2);
+ else
+ setTMIncrementsRegs(pMga->currentSrc,
+ 1 << 16, 0, srcx << 16,
+ 0, 1 << 16, srcy << 16,
+ 0, 0, 1 << 16,
+ 20 - pMga->src_w2,
+ 20 - pMga->src_h2);
+
+ if (pMga->currentMask) {
+ texctl2 = MGA_G400_TC2_MAGIC | MGA_TC2_CKSTRANSDIS | MGA_TC2_DUALTEX;
+
+ WAITFIFO(1);
+ OUTREG(MGAREG_TEXCTL2, texctl2 | MGA_TC2_SELECT_TMU1);
+
+ t = pMga->currentMaskPicture->transform;
+
+ if (t)
+ setTMIncrementsRegs(pMga->currentMask,
+ t->matrix[0][0],
+ t->matrix[0][1],
+ t->matrix[0][2] + (maskx << 16),
+ t->matrix[1][0],
+ t->matrix[1][1],
+ t->matrix[1][2] + (masky << 16),
+ t->matrix[2][0],
+ t->matrix[2][1],
+ t->matrix[2][2],
+ 20 - pMga->mask_w2,
+ 20 - pMga->mask_h2);
+ else
+ setTMIncrementsRegs(pMga->currentMask,
+ 1 << 16, 0, maskx << 16,
+ 0, 1 << 16, masky << 16,
+ 0, 0, 1 << 16,
+ 20 - pMga->mask_w2,
+ 20 - pMga->mask_h2);
+
+ WAITFIFO(1);
+ OUTREG(MGAREG_TEXCTL2, texctl2 & ~MGA_TC2_SELECT_TMU1);
+ }
+
+ WAITFIFO(2);
+ OUTREG(MGAREG_FXBNDRY, ((dstx + w) << 16) | (dstx & 0xffff));
+ OUTREG(MGAREG_YDSTLEN | MGAREG_EXEC, (dsty << 16) | (h & 0xffff));
+}
+
+static Bool
+mgaUploadToScreen(PixmapPtr pDst, int x, int y, int w, int h,
+ char *src, int src_pitch)
+{
+ PMGA(pDst);
+ int bytes_padded = ((pDst->drawable.bitsPerPixel * w + 31) / 32) * 4;
+
+ QUIESCE_DMA(pDst);
+
+ mgaSetup(pMga, pDst, NULL, 10);
+
+ OUTREG(MGAREG_OPMODE, MGAOPM_DMA_BLIT);
+ OUTREG(MGAREG_DSTORG, exaGetPixmapOffset(pDst));
+ OUTREG(MGAREG_PITCH, mgaGetPixmapPitch(pDst));
+ OUTREG(MGAREG_PLNWT, 0xffffffff);
+ OUTREG(MGAREG_DWGCTL, MGADWG_ILOAD | MGADWG_BFCOL |
+ MGADWG_SGNZERO | MGADWG_SHIFTZERO |
+ MGADWG_RSTR | 0x000c0000);
+ OUTREG(MGAREG_AR0, w - 1);
+ OUTREG(MGAREG_AR3, 0);
+ OUTREG(MGAREG_AR5, 0);
+ OUTREG(MGAREG_FXBNDRY, ((x + w - 1) << 16) | (x & 0xffff));
+ OUTREG(MGAREG_YDSTLEN | MGAREG_EXEC, (y << 16) | (h & 0xffff));
+
+ while (h--) {
+ memcpy (pMga->ILOADBase, src, bytes_padded);
+ src += src_pitch;
+ }
+
+ return TRUE;
+}
+
+static void
+mgaWaitMarker(ScreenPtr pScreen, int marker)
+{
+ ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum];
+ MGAPtr pMga = pScrn->driverPrivate;
+
+ WAITFIFO(1);
+
+ OUTREG(MGAREG_CACHEFLUSH, 0);
+
+ /* wait until the "drawing engine busy" bit is unset */
+ while (INREG (MGAREG_Status) & 0x10000);
+}
+
+Bool
+mgaExaInit(ScreenPtr pScreen)
+{
+ ExaDriverPtr pExa;
+ ScrnInfoPtr pScrn = xf86Screens[pScreen->myNum];
+ MGAPtr pMga = pScrn->driverPrivate;
+
+ pExa = exaDriverAlloc();
+ if (!pExa) {
+ pMga->NoAccel = TRUE;
+ return FALSE;
+ }
+
+ pMga->ExaDriver = pExa;
+
+ pExa->exa_major = EXA_VERSION_MAJOR;
+ pExa->exa_minor = EXA_VERSION_MINOR;
+
+ pExa->flags = EXA_OFFSCREEN_PIXMAPS | EXA_OFFSCREEN_ALIGN_POT;
+ pExa->memoryBase = pMga->FbStart;
+ pExa->memorySize = pMga->FbUsableSize - 4096;
+ pExa->offScreenBase = (pScrn->virtualX * pScrn->virtualY *
+ pScrn->bitsPerPixel / 8) + 4096;
+
+ xf86DrvMsg(pScrn->scrnIndex, X_INFO, "X %d Y %d bpp %d\n",
+ pScrn->virtualX, pScrn->virtualY, pScrn->bitsPerPixel);
+ xf86DrvMsg(pScrn->scrnIndex, X_INFO, "Start at %p, size %x, osb %x\n",
+ pExa->memoryBase, pExa->memorySize, pExa->offScreenBase);
+
+ /* In PW24 mode, we need to align to "3 64-bytes" */
+ pExa->pixmapOffsetAlign = 192;
+
+ /* Pitch alignment is in sets of 32 pixels, and we need to cover
+ * 32bpp, so it's 128 bytes.
+ */
+ pExa->pixmapPitchAlign = 128;
+
+ pExa->maxX = 2048;
+ pExa->maxY = 2048;
+
+ pExa->WaitMarker = mgaWaitMarker;
+ pExa->PrepareSolid = mgaPrepareSolid;
+ pExa->Solid = mgaSolid;
+ pExa->DoneSolid = mgaNoopDone;
+ pExa->PrepareCopy = mgaPrepareCopy;
+ pExa->Copy = mgaCopy;
+ pExa->DoneCopy = mgaNoopDone;
+
+ if (pMga->Chipset == PCI_CHIP_MGAG400) {
+ pExa->CheckComposite = mgaCheckComposite;
+ pExa->PrepareComposite = mgaPrepareComposite;
+ pExa->Composite = mgaComposite;
+ pExa->DoneComposite = mgaNoopDone;
+ }
+
+ pExa->UploadToScreen = mgaUploadToScreen;
+
+ return exaDriverInit(pScreen, pExa);
+}