src - OpenBSD base system

diff options


context:
space:
mode:

author	Jonathan Gray <jsg@cvs.openbsd.org>	2023-08-13 10:22:21 +0000
committer	Jonathan Gray <jsg@cvs.openbsd.org>	2023-08-13 10:22:21 +0000
commit	02dc4ce0066e76ea4ece72b01b9296566661f2e5 (patch)
tree	abe1469229f1ee8e824ccfdf02a1276aace9a046
parent	ddcc438439fe756ba7855187ca7ff8746a7b4025 (diff)

drm/i915: Fix premature release of request's reusable memory

From Janusz Krzysztofik 4db8b39418a685179263b7ad895a3182d72be358 in linux-6.1.y/6.1.45 a337b64f0d5717248a0c894e2618e658e6a9de9f in mainline linux

Diffstat

-rw-r--r--

sys/dev/pci/drm/i915/i915_active.c

-rw-r--r--

sys/dev/pci/drm/i915/i915_request.c

2 files changed, 81 insertions, 29 deletions

diff --git a/sys/dev/pci/drm/i915/i915_active.c b/sys/dev/pci/drm/i915/i915_active.c
index de21524f9d1..96e3e84d376 100644
--- a/sys/dev/pci/drm/i915/i915_active.c
+++ b/sys/dev/pci/drm/i915/i915_active.c

@@ -461,8 +461,11 @@ int i915_active_add_request(struct i915_active *ref, struct i915_request *rq)

}

} while (unlikely(is_barrier(active)));

- if (!__i915_active_fence_set(active, fence))

+ fence = __i915_active_fence_set(active, fence);

+ if (!fence)

__i915_active_acquire(ref);

+ else

+ dma_fence_put(fence);

out:

i915_active_release(ref);

@@ -481,13 +484,9 @@ __i915_active_set_fence(struct i915_active *ref,

return NULL;

}

- rcu_read_lock();

prev = __i915_active_fence_set(active, fence);

- if (prev)

- prev = dma_fence_get_rcu(prev);

- else

+ if (!prev)

__i915_active_acquire(ref);

- rcu_read_unlock();

return prev;

}

@@ -1043,10 +1042,11 @@ void i915_request_add_active_barriers(struct i915_request *rq)

* Records the new @fence as the last active fence along its timeline in

* this active tracker, moving the tracking callbacks from the previous

- * fence onto this one. Returns the previous fence (if not already completed),

- * which the caller must ensure is executed before the new fence. To ensure

- * that the order of fences within the timeline of the i915_active_fence is

- * understood, it should be locked by the caller.

+ * fence onto this one. Gets and returns a reference to the previous fence

+ * (if not already completed), which the caller must put after making sure

+ * that it is executed before the new fence. To ensure that the order of

+ * fences within the timeline of the i915_active_fence is understood, it

+ * should be locked by the caller.

struct dma_fence *

__i915_active_fence_set(struct i915_active_fence *active,

@@ -1055,7 +1055,23 @@ __i915_active_fence_set(struct i915_active_fence *active,

struct dma_fence *prev;

unsigned long flags;

- if (fence == rcu_access_pointer(active->fence))

+ /*

+ * In case of fences embedded in i915_requests, their memory is

+ * SLAB_FAILSAFE_BY_RCU, then it can be reused right after release

+ * by new requests. Then, there is a risk of passing back a pointer

+ * to a new, completely unrelated fence that reuses the same memory

+ * while tracked under a different active tracker. Combined with i915

+ * perf open/close operations that build await dependencies between

+ * engine kernel context requests and user requests from different

+ * timelines, this can lead to dependency loops and infinite waits.

+ *

+ * As a countermeasure, we try to get a reference to the active->fence

+ * first, so if we succeed and pass it back to our user then it is not

+ * released and potentially reused by an unrelated request before the

+ * user has a chance to set up an await dependency on it.

+ */

+ prev = i915_active_fence_get(active);

+ if (fence == prev)

return fence;

GEM_BUG_ON(test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &fence->flags));

@@ -1064,27 +1080,56 @@ __i915_active_fence_set(struct i915_active_fence *active,

* Consider that we have two threads arriving (A and B), with

* C already resident as the active->fence.

- * A does the xchg first, and so it sees C or NULL depending

- * on the timing of the interrupt handler. If it is NULL, the

- * previous fence must have been signaled and we know that

- * we are first on the timeline. If it is still present,

- * we acquire the lock on that fence and serialise with the interrupt

- * handler, in the process removing it from any future interrupt

- * callback. A will then wait on C before executing (if present).

- *

- * As B is second, it sees A as the previous fence and so waits for

- * it to complete its transition and takes over the occupancy for

- * itself -- remembering that it needs to wait on A before executing.

+ * Both A and B have got a reference to C or NULL, depending on the

+ * timing of the interrupt handler. Let's assume that if A has got C

+ * then it has locked C first (before B).

* Note the strong ordering of the timeline also provides consistent

* nesting rules for the fence->lock; the inner lock is always the

* older lock.

spin_lock_irqsave(fence->lock, flags);

- prev = xchg(__active_fence_slot(active), fence);

- if (prev) {

- GEM_BUG_ON(prev == fence);

+ if (prev)

spin_lock_nested(prev->lock, SINGLE_DEPTH_NESTING);

+ /*

+ * A does the cmpxchg first, and so it sees C or NULL, as before, or

+ * something else, depending on the timing of other threads and/or

+ * interrupt handler. If not the same as before then A unlocks C if

+ * applicable and retries, starting from an attempt to get a new

+ * active->fence. Meanwhile, B follows the same path as A.

+ * Once A succeeds with cmpxch, B fails again, retires, gets A from

+ * active->fence, locks it as soon as A completes, and possibly

+ * succeeds with cmpxchg.

+ */

+ while (cmpxchg(__active_fence_slot(active), prev, fence) != prev) {

+ if (prev) {

+ spin_unlock(prev->lock);

+ dma_fence_put(prev);

+ }

+ spin_unlock_irqrestore(fence->lock, flags);

+ prev = i915_active_fence_get(active);

+ GEM_BUG_ON(prev == fence);

+ spin_lock_irqsave(fence->lock, flags);

+ if (prev)

+ spin_lock_nested(prev->lock, SINGLE_DEPTH_NESTING);

+ }

+ /*

+ * If prev is NULL then the previous fence must have been signaled

+ * and we know that we are first on the timeline. If it is still

+ * present then, having the lock on that fence already acquired, we

+ * serialise with the interrupt handler, in the process of removing it

+ * from any future interrupt callback. A will then wait on C before

+ * executing (if present).

+ *

+ * As B is second, it sees A as the previous fence and so waits for

+ * it to complete its transition and takes over the occupancy for

+ * itself -- remembering that it needs to wait on A before executing.

+ */

+ if (prev) {

__list_del_entry(&active->cb.node);

spin_unlock(prev->lock); /* serialise with prev->cb_list */

}

@@ -1101,11 +1146,7 @@ int i915_active_fence_set(struct i915_active_fence *active,

int err = 0;

/* Must maintain timeline ordering wrt previous active requests */

- rcu_read_lock();

fence = __i915_active_fence_set(active, &rq->fence);

- if (fence) /* but the previous fence may not belong to that timeline! */

- fence = dma_fence_get_rcu(fence);

- rcu_read_unlock();

if (fence) {

err = i915_request_await_dma_fence(rq, fence);

dma_fence_put(fence);

diff --git a/sys/dev/pci/drm/i915/i915_request.c b/sys/dev/pci/drm/i915/i915_request.c
index d0728df7261..1e37187e84e 100644
--- a/sys/dev/pci/drm/i915/i915_request.c
+++ b/sys/dev/pci/drm/i915/i915_request.c

@@ -1728,6 +1728,11 @@ __i915_request_ensure_parallel_ordering(struct i915_request *rq,

request_to_parent(rq)->parallel.last_rq = i915_request_get(rq);

+ /*

+ * Users have to put a reference potentially got by

+ * __i915_active_fence_set() to the returned request

+ * when no longer needed

+ */

return to_request(__i915_active_fence_set(&timeline->last_request,

&rq->fence));

}

@@ -1774,6 +1779,10 @@ __i915_request_ensure_ordering(struct i915_request *rq,

0);

}

+ /*

+ * Users have to put the reference to prev potentially got

+ * by __i915_active_fence_set() when no longer needed

+ */

return prev;

}

@@ -1817,6 +1826,8 @@ __i915_request_add_to_timeline(struct i915_request *rq)

prev = __i915_request_ensure_ordering(rq, timeline);

else

prev = __i915_request_ensure_parallel_ordering(rq, timeline);

+ if (prev)

+ i915_request_put(prev);

* Make sure that no request gazumped us - if it was allocated after