summaryrefslogtreecommitdiff
path: root/sys
diff options
context:
space:
mode:
authorMark Kettenis <kettenis@openbsd.org>2013-02-25 22:02:54 +0100
committerMark Kettenis <kettenis@openbsd.org>2013-02-25 22:02:54 +0100
commitd405facafba886d45e9b62d6cd52215743811bb7 (patch)
treeef579954c3770c858a1f667585eb6dc6c30d6955 /sys
parent00320b104ba962ed9541697895aa343e5b282d42 (diff)
Bring domain handling code close to Linux 3.4.33.
Diffstat (limited to 'sys')
-rw-r--r--sys/dev/pci/drm/i915_drv.c32
-rw-r--r--sys/dev/pci/drm/i915_drv.h5
-rw-r--r--sys/dev/pci/drm/i915_gem.c204
-rw-r--r--sys/dev/pci/drm/i915_gem_evict.c2
-rw-r--r--sys/dev/pci/drm/i915_gem_execbuffer.c2
5 files changed, 129 insertions, 116 deletions
diff --git a/sys/dev/pci/drm/i915_drv.c b/sys/dev/pci/drm/i915_drv.c
index 8ec81de2b9e..2a0df603749 100644
--- a/sys/dev/pci/drm/i915_drv.c
+++ b/sys/dev/pci/drm/i915_drv.c
@@ -1492,38 +1492,6 @@ i915_gem_retire_work_handler(void *arg1, void *unused)
timeout_add_sec(&dev_priv->mm.retire_timer, 1);
}
-/*
- * flush and invalidate the provided domains
- * if we have successfully queued a gpu flush, then we return a seqno from
- * the request. else (failed or just cpu flushed) we return 0.
- */
-u_int32_t
-i915_gem_flush(struct intel_ring_buffer *ring, uint32_t invalidate_domains,
- uint32_t flush_domains)
-{
- drm_i915_private_t *dev_priv = ring->dev->dev_private;
- int err = 0;
- u32 seqno;
-
- if (flush_domains & I915_GEM_DOMAIN_CPU)
- inteldrm_chipset_flush(dev_priv);
- if (((invalidate_domains | flush_domains) & I915_GEM_GPU_DOMAINS) == 0)
- return (0);
-
- ring->flush(ring, invalidate_domains, flush_domains);
-
- /* if this is a gpu flush, process the results */
- if (flush_domains & I915_GEM_GPU_DOMAINS) {
- i915_gem_process_flushing_list(ring, flush_domains);
- err = i915_add_request(ring, NULL, &seqno);
- }
-
- if (err)
- return (0);
- else
- return (seqno);
-}
-
struct drm_obj *
i915_gem_find_inactive_object(struct inteldrm_softc *dev_priv,
size_t min_size)
diff --git a/sys/dev/pci/drm/i915_drv.h b/sys/dev/pci/drm/i915_drv.h
index 19d84c153fd..56396ebba0d 100644
--- a/sys/dev/pci/drm/i915_drv.h
+++ b/sys/dev/pci/drm/i915_drv.h
@@ -1060,7 +1060,7 @@ int i915_gem_object_pin_and_relocate(struct drm_obj *,
struct drm_i915_gem_relocation_entry *);
int i915_gem_object_bind_to_gtt(struct drm_i915_gem_object *,
bus_size_t);
-u_int32_t i915_gem_flush(struct intel_ring_buffer *, uint32_t, uint32_t);
+int i915_gem_flush_ring(struct intel_ring_buffer *, uint32_t, uint32_t);
struct drm_obj *i915_gem_find_inactive_object(struct inteldrm_softc *,
size_t);
@@ -1073,8 +1073,7 @@ int i915_gem_object_pin_to_display_plane(struct drm_i915_gem_object *,
u32, struct intel_ring_buffer *);
int i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *,
int);
-int i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *,
- int, int);
+int i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *);
int i915_gem_object_wait_rendering(struct drm_i915_gem_object *, bool);
bus_size_t i915_gem_get_gtt_alignment(struct drm_obj *);
diff --git a/sys/dev/pci/drm/i915_gem.c b/sys/dev/pci/drm/i915_gem.c
index 5fbea7f36d2..d355ffc8483 100644
--- a/sys/dev/pci/drm/i915_gem.c
+++ b/sys/dev/pci/drm/i915_gem.c
@@ -1278,6 +1278,28 @@ i915_gem_object_unbind(struct drm_i915_gem_object *obj)
}
int
+i915_gem_flush_ring(struct intel_ring_buffer *ring,
+ uint32_t invalidate_domains,
+ uint32_t flush_domains)
+{
+ int ret;
+
+ if (((invalidate_domains | flush_domains) & I915_GEM_GPU_DOMAINS) == 0)
+ return 0;
+
+// trace_i915_gem_ring_flush(ring, invalidate_domains, flush_domains);
+
+ ret = ring->flush(ring, invalidate_domains, flush_domains);
+ if (ret)
+ return ret;
+
+ if (flush_domains & I915_GEM_GPU_DOMAINS)
+ i915_gem_process_flushing_list(ring, flush_domains);
+
+ return 0;
+}
+
+int
i915_gpu_idle(struct drm_device *dev)
{
drm_i915_private_t *dev_priv = dev->dev_private;
@@ -1696,39 +1718,16 @@ error:
// i915_gem_clflush_object
// i915_gem_object_flush_gtt_write_domain
-/*
- * Flush the GPU write domain for the object if dirty, then wait for the
- * rendering to complete. When this returns it is safe to unbind from the
- * GTT or access from the CPU.
- */
+
+/** Flushes any GPU write domain for the object if it's dirty. */
int
-i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *obj,
- int pipelined, int write)
+i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *obj)
{
- u_int32_t seqno;
- int ret = 0;
-
- DRM_ASSERT_HELD(&obj->base);
- if ((obj->base.write_domain & I915_GEM_GPU_DOMAINS) != 0) {
- /*
- * Queue the GPU write cache flushing we need.
- * This call will move stuff form the flushing list to the
- * active list so all we need to is wait for it.
- */
- (void)i915_gem_flush(obj->ring, 0, obj->base.write_domain);
- KASSERT(obj->base.write_domain == 0);
- }
+ if ((obj->base.write_domain & I915_GEM_GPU_DOMAINS) == 0)
+ return 0;
- /* wait for queued rendering so we know it's flushed and bo is idle */
- if (pipelined == 0 && obj->active) {
- if (write) {
- seqno = obj->last_read_seqno;
- } else {
- seqno = obj->last_write_seqno;
- }
- ret = i915_wait_seqno(obj->ring, seqno);
- }
- return (ret);
+ /* Queue the GPU write cache flushing we need. */
+ return i915_gem_flush_ring(obj->ring, 0, obj->base.write_domain);
}
void
@@ -1747,17 +1746,27 @@ int
i915_gem_object_set_to_gtt_domain(struct drm_i915_gem_object *obj, int write)
{
drm_i915_private_t *dev_priv = obj->base.dev->dev_private;
+// uint32_t old_write_domain, old_read_domains;
int ret;
DRM_ASSERT_HELD(&obj->base);
+
/* Not valid to be called on unbound objects. */
if (obj->dmamap == NULL)
return (EINVAL);
- /* Wait on any GPU rendering and flushing to occur. */
- if ((ret = i915_gem_object_flush_gpu_write_domain(obj, 0,
- write)) != 0)
- return (ret);
+ if (obj->base.write_domain == I915_GEM_DOMAIN_GTT)
+ return 0;
+
+ ret = i915_gem_object_flush_gpu_write_domain(obj);
+ if (ret)
+ return ret;
+
+ if (obj->pending_gpu_write || write) {
+ ret = i915_gem_object_wait_rendering(obj, false);
+ if (ret)
+ return ret;
+ }
if (obj->base.write_domain == I915_GEM_DOMAIN_CPU) {
/* clflush the pages, and flush chipset cache */
@@ -1778,21 +1787,25 @@ i915_gem_object_set_to_gtt_domain(struct drm_i915_gem_object *obj, int write)
if (obj->tiling_mode != I915_TILING_NONE)
ret = i915_gem_object_get_fence(obj);
- /*
- * If we're writing through the GTT domain then the CPU and GPU caches
- * will need to be invalidated at next use.
- * It should now be out of any other write domains and we can update
- * to the correct ones
+// old_write_domain = obj->base.write_domain;
+// old_read_domains = obj->base.read_domains;
+
+ /* It should now be out of any other write domains, and we can update
+ * the domain values for our changes.
*/
- KASSERT((obj->base.write_domain & ~I915_GEM_DOMAIN_GTT) == 0);
+ BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
+ obj->base.read_domains |= I915_GEM_DOMAIN_GTT;
if (write) {
- obj->base.read_domains = obj->base.write_domain = I915_GEM_DOMAIN_GTT;
+ obj->base.read_domains = I915_GEM_DOMAIN_GTT;
+ obj->base.write_domain = I915_GEM_DOMAIN_GTT;
obj->dirty = 1;
- } else {
- obj->base.read_domains |= I915_GEM_DOMAIN_GTT;
}
- return (ret);
+// trace_i915_gem_object_change_domain(obj,
+// old_read_domains,
+// old_write_domain);
+
+ return 0;
}
int
@@ -1808,15 +1821,15 @@ i915_gem_object_set_cache_level(struct drm_i915_gem_object *obj,
int
i915_gem_object_pin_to_display_plane(struct drm_i915_gem_object *obj,
- u32 alignment, struct intel_ring_buffer *pipelined)
+ u32 alignment,
+ struct intel_ring_buffer *pipelined)
{
// u32 old_read_domains, old_write_domain;
int ret;
- ret = i915_gem_object_flush_gpu_write_domain(obj, pipelined != NULL,
- 0);
- if (ret != 0)
- return (ret);
+ ret = i915_gem_object_flush_gpu_write_domain(obj);
+ if (ret)
+ return ret;
if (pipelined != obj->ring) {
ret = i915_gem_object_wait_rendering(obj, false);
@@ -1824,31 +1837,47 @@ i915_gem_object_pin_to_display_plane(struct drm_i915_gem_object *obj,
return (ret);
}
+ /* The display engine is not coherent with the LLC cache on gen6. As
+ * a result, we make sure that the pinning that is about to occur is
+ * done with uncached PTEs. This is lowest common denominator for all
+ * chipsets.
+ *
+ * However for gen6+, we could do better by using the GFDT bit instead
+ * of uncaching, which would allow us to flush all the LLC-cached data
+ * with that bit in the PTE to main memory with just one PIPE_CONTROL.
+ */
ret = i915_gem_object_set_cache_level(obj, I915_CACHE_NONE);
- if (ret != 0)
- return (ret);
+ if (ret)
+ return ret;
+ /* As the user may map the buffer once pinned in the display plane
+ * (e.g. libkms for the bootup splash), we have to ensure that we
+ * always use map_and_fenceable for all scanout buffers.
+ */
ret = i915_gem_object_pin(obj, alignment, true);
- if (ret != 0)
- return (ret);
+ if (ret)
+ return ret;
#ifdef notyet
i915_gem_object_flush_cpu_write_domain(obj);
- old_write_domain = obj->write_domain;
- old_read_domains = obj->read_domains;
+// old_write_domain = obj->write_domain;
+// old_read_domains = obj->read_domains;
- KASSERT((obj->write_domain & ~I915_GEM_DOMAIN_GTT) == 0);
- obj->read_domains |= I915_GEM_DOMAIN_GTT;
+ /* It should now be out of any other write domains, and we can update
+ * the domain values for our changes.
+ */
+ BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
+ obj->base.read_domains |= I915_GEM_DOMAIN_GTT;
#else
printf("%s skipping write domain flush\n", __func__);
#endif
-#ifdef notyet
- CTR3(KTR_DRM, "object_change_domain pin_to_display_plan %p %x %x",
- obj, old_read_domains, obj->write_domain);
-#endif
- return (0);
+// trace_i915_gem_object_change_domain(obj,
+// old_read_domains,
+// old_write_domain);
+
+ return 0;
}
int
@@ -1879,13 +1908,21 @@ i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj, int write)
{
struct drm_device *dev = obj->base.dev;
struct inteldrm_softc *dev_priv = dev->dev_private;
- int ret;
+// uint32_t old_write_domain, old_read_domains;
+ int ret;
DRM_ASSERT_HELD(obj);
- /* Wait on any GPU rendering and flushing to occur. */
- if ((ret = i915_gem_object_flush_gpu_write_domain(obj, 0,
- write)) != 0)
- return (ret);
+
+ if (obj->base.write_domain == I915_GEM_DOMAIN_CPU)
+ return 0;
+
+ ret = i915_gem_object_flush_gpu_write_domain(obj);
+ if (ret)
+ return ret;
+
+ ret = i915_gem_object_wait_rendering(obj, false);
+ if (ret)
+ return ret;
if (obj->base.write_domain == I915_GEM_DOMAIN_GTT ||
(write && obj->base.read_domains & I915_GEM_DOMAIN_GTT)) {
@@ -1904,6 +1941,9 @@ i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj, int write)
if ((ret = i915_gem_object_put_fence(obj)) != 0)
return (ret);
+// old_write_domain = obj->base.write_domain;
+// old_read_domains = obj->base.read_domains;
+
/* Flush the CPU cache if it's still invalid. */
if ((obj->base.read_domains & I915_GEM_DOMAIN_CPU) == 0) {
bus_dmamap_sync(dev_priv->agpdmat, obj->dmamap, 0,
@@ -1912,20 +1952,24 @@ i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj, int write)
obj->base.read_domains |= I915_GEM_DOMAIN_CPU;
}
- /*
- * It should now be out of any other write domain, and we can update
- * the domain value for our changes.
+ /* It should now be out of any other write domains, and we can update
+ * the domain values for our changes.
*/
- KASSERT((obj->base.write_domain & ~I915_GEM_DOMAIN_CPU) == 0);
+ BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_CPU) != 0);
- /*
- * If we're writing through the CPU, then the GPU read domains will
+ /* If we're writing through the CPU, then the GPU read domains will
* need to be invalidated at next use.
*/
- if (write)
- obj->base.read_domains = obj->base.write_domain = I915_GEM_DOMAIN_CPU;
+ if (write) {
+ obj->base.read_domains = I915_GEM_DOMAIN_CPU;
+ obj->base.write_domain = I915_GEM_DOMAIN_CPU;
+ }
- return (0);
+// trace_i915_gem_object_change_domain(obj,
+// old_read_domains,
+// old_write_domain);
+
+ return 0;
}
/* Throttle our rendering by waiting until the ring has completed our requests
@@ -2136,9 +2180,11 @@ i915_gem_busy_ioctl(struct drm_device *dev, void *data,
* it wants to use this buffer sooner rather than later, so
* flushing now shoul reduce latency.
*/
- if (obj->base.write_domain)
- (void)i915_gem_flush(obj->ring, obj->base.write_domain,
- obj->base.write_domain);
+ if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
+ ret = i915_gem_flush_ring(obj->ring,
+ 0, obj->base.write_domain);
+ }
+
/*
* Update the active list after the flush otherwise this is
* only updated on a delayed timer. Updating now reduces
diff --git a/sys/dev/pci/drm/i915_gem_evict.c b/sys/dev/pci/drm/i915_gem_evict.c
index 592c7dda3a2..9ac0c28efdd 100644
--- a/sys/dev/pci/drm/i915_gem_evict.c
+++ b/sys/dev/pci/drm/i915_gem_evict.c
@@ -127,7 +127,7 @@ i915_gem_evict_something(struct inteldrm_softc *dev_priv, size_t min_size)
}
if (write_domain) {
- if (i915_gem_flush(obj_priv->ring, write_domain,
+ if (i915_gem_flush_ring(obj_priv->ring, write_domain,
write_domain) == 0)
return (ENOMEM);
continue;
diff --git a/sys/dev/pci/drm/i915_gem_execbuffer.c b/sys/dev/pci/drm/i915_gem_execbuffer.c
index ad42c36c5e3..a72354a049e 100644
--- a/sys/dev/pci/drm/i915_gem_execbuffer.c
+++ b/sys/dev/pci/drm/i915_gem_execbuffer.c
@@ -472,7 +472,7 @@ i915_gem_execbuffer2(struct drm_device *dev, void *data,
inteldrm_verify_inactive(dev_priv, __FILE__, __LINE__);
/* flush and invalidate any domains that need them. */
- (void)i915_gem_flush(ring, dev->invalidate_domains,
+ (void)i915_gem_flush_ring(ring, dev->invalidate_domains,
dev->flush_domains);
/*