diff options
author | Chris Wilson <chris@chris-wilson.co.uk> | 2010-05-21 09:55:55 +0100 |
---|---|---|
committer | Chris Wilson <chris@chris-wilson.co.uk> | 2010-05-24 18:31:16 +0100 |
commit | 80a9e64f50aeda6004e3aba1fbfdda50bb1f1c82 (patch) | |
tree | a9e39dec68ff4fd3b4d61a5c26cd7fc18b88a3b0 /src/i830_uxa.c | |
parent | 91f560034fc2695680d1208a78fc56d814b0da79 (diff) |
uxa: Use temporary dest when target is too large for compositor
If the destination cannot fit into the 3D pipeline when we need to
composite, we fallback to doing the operation on the CPU. This is very
slow, and quite easy to trigger on i915 by plugging in an external
display.
An alternative is to extract the extents of the operation from the
destination using the blitter which can usually handle much larger
operations. This gives us a temporary target that can fit into the 3D
pipeline and thus be accelerated, before copying back into the larger
real destination.
For x11perf this boosts glyph rendering on PineView, from 38kglyphs/s to
480kglyphs/s. Just a little shy of the native performance of 601kglyphs/s
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Diffstat (limited to 'src/i830_uxa.c')
-rw-r--r-- | src/i830_uxa.c | 22 |
1 files changed, 12 insertions, 10 deletions
diff --git a/src/i830_uxa.c b/src/i830_uxa.c index a79dde17..0a6b6f80 100644 --- a/src/i830_uxa.c +++ b/src/i830_uxa.c @@ -323,10 +323,10 @@ static void i830_uxa_done_solid(PixmapPtr pixmap) * - support planemask using FULL_BLT_CMD? */ static Bool -i830_uxa_check_copy(DrawablePtr source, DrawablePtr dest, +i830_uxa_check_copy(PixmapPtr source, PixmapPtr dest, int alu, Pixel planemask) { - ScrnInfoPtr scrn = xf86Screens[dest->pScreen->myNum]; + ScrnInfoPtr scrn = xf86Screens[dest->drawable.pScreen->myNum]; intel_screen_private *intel = intel_get_screen_private(scrn); if (IS_GEN6(intel)) { @@ -335,16 +335,16 @@ i830_uxa_check_copy(DrawablePtr source, DrawablePtr dest, return FALSE; } - if (!UXA_PM_IS_SOLID(source, planemask)) { + if (!UXA_PM_IS_SOLID(&source->drawable, planemask)) { intel_debug_fallback(scrn, "planemask is not solid"); return FALSE; } - if (source->bitsPerPixel != dest->bitsPerPixel) { + if (source->drawable.bitsPerPixel != dest->drawable.bitsPerPixel) { intel_debug_fallback(scrn, "mixed bpp copies unsupported\n"); return FALSE; } - switch (source->bitsPerPixel) { + switch (source->drawable.bitsPerPixel) { case 8: case 16: case 32: @@ -353,6 +353,11 @@ i830_uxa_check_copy(DrawablePtr source, DrawablePtr dest, return FALSE; } + if (!intel_check_pitch_2d(source)) + return FALSE; + if (!intel_check_pitch_2d(dest)) + return FALSE; + return TRUE; } @@ -368,11 +373,6 @@ i830_uxa_prepare_copy(PixmapPtr source, PixmapPtr dest, int xdir, i830_get_pixmap_bo(dest), }; - if (!intel_check_pitch_2d(source)) - return FALSE; - if (!intel_check_pitch_2d(dest)) - return FALSE; - if (!i830_get_aperture_space(scrn, bo_table, ARRAY_SIZE(bo_table))) return FALSE; @@ -1076,6 +1076,7 @@ Bool i830_uxa_init(ScreenPtr screen) /* Composite */ if (!IS_I9XX(intel)) { intel->uxa_driver->check_composite = i830_check_composite; + intel->uxa_driver->check_composite_target = i830_check_composite_target; intel->uxa_driver->check_composite_texture = i830_check_composite_texture; intel->uxa_driver->prepare_composite = i830_prepare_composite; intel->uxa_driver->composite = i830_composite; @@ -1083,6 +1084,7 @@ Bool i830_uxa_init(ScreenPtr screen) } else if (IS_I915G(intel) || IS_I915GM(intel) || IS_I945G(intel) || IS_I945GM(intel) || IS_G33CLASS(intel)) { intel->uxa_driver->check_composite = i915_check_composite; + intel->uxa_driver->check_composite_target = i915_check_composite_target; intel->uxa_driver->check_composite_texture = i915_check_composite_texture; intel->uxa_driver->prepare_composite = i915_prepare_composite; intel->uxa_driver->composite = i915_composite; |