mirror of
https://github.com/edk2-porting/linux-next.git
synced 2024-12-21 19:53:59 +08:00
drm/i915: Seal races between async GPU cancellation, retirement and signaling
Currently there is an underlying assumption that i915_request_unsubmit() is synchronous wrt the GPU -- that is, the request is no longer in flight as we remove it. In the near future that may change, and this may upset our signaling as we can process an interrupt for that request while it is no longer in flight.

CPU0                                    CPU1
intel_engine_breadcrumbs_irq
(queue request completion)
                                        i915_request_cancel_signaling
...                                     ...
                                        i915_request_enable_signaling
dma_fence_signal

Hence in the time it took us to drop the lock to signal the request, a preemption event may have occurred and re-queued the request. In the process, that request would have seen I915_FENCE_FLAG_SIGNAL clear and so reused the rq->signal_link that was in use on CPU0, leading to bad pointer chasing in intel_engine_breadcrumbs_irq.

A related issue was that if someone started listening for a signal on a completed but no longer in-flight request, we missed the opportunity to immediately signal that request.

Furthermore, as intel_contexts may be immediately released during request retirement, in order to be entirely sure that intel_engine_breadcrumbs_irq may no longer dereference the intel_context (ce->signals and ce->signal_link), we must wait for the irq spinlock.

In order to prevent the race, we use a bit in the fence.flags to signal the transfer onto the signal list inside intel_engine_breadcrumbs_irq. For simplicity, we use the DMA_FENCE_FLAG_SIGNALED_BIT as it then quickly signals to any outside observer that the fence is indeed signaled.

v2: Sketch out potential dma-fence API for manual signaling
v3: And the test_and_set_bit()

Fixes: 52c0fdb25c ("drm/i915: Replace global breadcrumbs with per-context interrupt tracking")
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Reviewed-by: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20190508112452.18942-1-chris@chris-wilson.co.uk
(cherry picked from commit 0152b3b3f4)
Signed-off-by: Joonas Lahtinen <joonas.lahtinen@linux.intel.com>
This commit is contained in:
parent
da47125070
commit
c36beba6b2
drivers
@ -29,6 +29,7 @@
|
|||||||
|
|
||||||
EXPORT_TRACEPOINT_SYMBOL(dma_fence_emit);
|
EXPORT_TRACEPOINT_SYMBOL(dma_fence_emit);
|
||||||
EXPORT_TRACEPOINT_SYMBOL(dma_fence_enable_signal);
|
EXPORT_TRACEPOINT_SYMBOL(dma_fence_enable_signal);
|
||||||
|
EXPORT_TRACEPOINT_SYMBOL(dma_fence_signaled);
|
||||||
|
|
||||||
static DEFINE_SPINLOCK(dma_fence_stub_lock);
|
static DEFINE_SPINLOCK(dma_fence_stub_lock);
|
||||||
static struct dma_fence dma_fence_stub;
|
static struct dma_fence dma_fence_stub;
|
||||||
|
@ -452,6 +452,7 @@ void __i915_request_submit(struct i915_request *request)
|
|||||||
set_bit(I915_FENCE_FLAG_ACTIVE, &request->fence.flags);
|
set_bit(I915_FENCE_FLAG_ACTIVE, &request->fence.flags);
|
||||||
|
|
||||||
if (test_bit(DMA_FENCE_FLAG_ENABLE_SIGNAL_BIT, &request->fence.flags) &&
|
if (test_bit(DMA_FENCE_FLAG_ENABLE_SIGNAL_BIT, &request->fence.flags) &&
|
||||||
|
!test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &request->fence.flags) &&
|
||||||
!i915_request_enable_breadcrumb(request))
|
!i915_request_enable_breadcrumb(request))
|
||||||
intel_engine_queue_breadcrumbs(engine);
|
intel_engine_queue_breadcrumbs(engine);
|
||||||
|
|
||||||
|
@ -23,6 +23,7 @@
|
|||||||
*/
|
*/
|
||||||
|
|
||||||
#include <linux/kthread.h>
|
#include <linux/kthread.h>
|
||||||
|
#include <trace/events/dma_fence.h>
|
||||||
#include <uapi/linux/sched/types.h>
|
#include <uapi/linux/sched/types.h>
|
||||||
|
|
||||||
#include "i915_drv.h"
|
#include "i915_drv.h"
|
||||||
@ -80,9 +81,39 @@ static inline bool __request_completed(const struct i915_request *rq)
|
|||||||
return i915_seqno_passed(__hwsp_seqno(rq), rq->fence.seqno);
|
return i915_seqno_passed(__hwsp_seqno(rq), rq->fence.seqno);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static bool
|
||||||
|
__dma_fence_signal(struct dma_fence *fence)
|
||||||
|
{
|
||||||
|
return !test_and_set_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &fence->flags);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void
|
||||||
|
__dma_fence_signal__timestamp(struct dma_fence *fence, ktime_t timestamp)
|
||||||
|
{
|
||||||
|
fence->timestamp = timestamp;
|
||||||
|
set_bit(DMA_FENCE_FLAG_TIMESTAMP_BIT, &fence->flags);
|
||||||
|
trace_dma_fence_signaled(fence);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void
|
||||||
|
__dma_fence_signal__notify(struct dma_fence *fence)
|
||||||
|
{
|
||||||
|
struct dma_fence_cb *cur, *tmp;
|
||||||
|
|
||||||
|
lockdep_assert_held(fence->lock);
|
||||||
|
lockdep_assert_irqs_disabled();
|
||||||
|
|
||||||
|
list_for_each_entry_safe(cur, tmp, &fence->cb_list, node) {
|
||||||
|
INIT_LIST_HEAD(&cur->node);
|
||||||
|
cur->func(fence, cur);
|
||||||
|
}
|
||||||
|
INIT_LIST_HEAD(&fence->cb_list);
|
||||||
|
}
|
||||||
|
|
||||||
void intel_engine_breadcrumbs_irq(struct intel_engine_cs *engine)
|
void intel_engine_breadcrumbs_irq(struct intel_engine_cs *engine)
|
||||||
{
|
{
|
||||||
struct intel_breadcrumbs *b = &engine->breadcrumbs;
|
struct intel_breadcrumbs *b = &engine->breadcrumbs;
|
||||||
|
const ktime_t timestamp = ktime_get();
|
||||||
struct intel_context *ce, *cn;
|
struct intel_context *ce, *cn;
|
||||||
struct list_head *pos, *next;
|
struct list_head *pos, *next;
|
||||||
LIST_HEAD(signal);
|
LIST_HEAD(signal);
|
||||||
@ -104,6 +135,10 @@ void intel_engine_breadcrumbs_irq(struct intel_engine_cs *engine)
|
|||||||
|
|
||||||
GEM_BUG_ON(!test_bit(I915_FENCE_FLAG_SIGNAL,
|
GEM_BUG_ON(!test_bit(I915_FENCE_FLAG_SIGNAL,
|
||||||
&rq->fence.flags));
|
&rq->fence.flags));
|
||||||
|
clear_bit(I915_FENCE_FLAG_SIGNAL, &rq->fence.flags);
|
||||||
|
|
||||||
|
if (!__dma_fence_signal(&rq->fence))
|
||||||
|
continue;
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Queue for execution after dropping the signaling
|
* Queue for execution after dropping the signaling
|
||||||
@ -111,14 +146,6 @@ void intel_engine_breadcrumbs_irq(struct intel_engine_cs *engine)
|
|||||||
* more signalers to the same context or engine.
|
* more signalers to the same context or engine.
|
||||||
*/
|
*/
|
||||||
i915_request_get(rq);
|
i915_request_get(rq);
|
||||||
|
|
||||||
/*
|
|
||||||
* We may race with direct invocation of
|
|
||||||
* dma_fence_signal(), e.g. i915_request_retire(),
|
|
||||||
* so we need to acquire our reference to the request
|
|
||||||
* before we cancel the breadcrumb.
|
|
||||||
*/
|
|
||||||
clear_bit(I915_FENCE_FLAG_SIGNAL, &rq->fence.flags);
|
|
||||||
list_add_tail(&rq->signal_link, &signal);
|
list_add_tail(&rq->signal_link, &signal);
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -141,7 +168,12 @@ void intel_engine_breadcrumbs_irq(struct intel_engine_cs *engine)
|
|||||||
struct i915_request *rq =
|
struct i915_request *rq =
|
||||||
list_entry(pos, typeof(*rq), signal_link);
|
list_entry(pos, typeof(*rq), signal_link);
|
||||||
|
|
||||||
dma_fence_signal(&rq->fence);
|
__dma_fence_signal__timestamp(&rq->fence, timestamp);
|
||||||
|
|
||||||
|
spin_lock(&rq->lock);
|
||||||
|
__dma_fence_signal__notify(&rq->fence);
|
||||||
|
spin_unlock(&rq->lock);
|
||||||
|
|
||||||
i915_request_put(rq);
|
i915_request_put(rq);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -243,19 +275,17 @@ void intel_engine_fini_breadcrumbs(struct intel_engine_cs *engine)
|
|||||||
|
|
||||||
bool i915_request_enable_breadcrumb(struct i915_request *rq)
|
bool i915_request_enable_breadcrumb(struct i915_request *rq)
|
||||||
{
|
{
|
||||||
struct intel_breadcrumbs *b = &rq->engine->breadcrumbs;
|
lockdep_assert_held(&rq->lock);
|
||||||
|
lockdep_assert_irqs_disabled();
|
||||||
|
|
||||||
GEM_BUG_ON(test_bit(I915_FENCE_FLAG_SIGNAL, &rq->fence.flags));
|
if (test_bit(I915_FENCE_FLAG_ACTIVE, &rq->fence.flags)) {
|
||||||
|
struct intel_breadcrumbs *b = &rq->engine->breadcrumbs;
|
||||||
if (!test_bit(I915_FENCE_FLAG_ACTIVE, &rq->fence.flags))
|
|
||||||
return true;
|
|
||||||
|
|
||||||
spin_lock(&b->irq_lock);
|
|
||||||
if (test_bit(I915_FENCE_FLAG_ACTIVE, &rq->fence.flags) &&
|
|
||||||
!__request_completed(rq)) {
|
|
||||||
struct intel_context *ce = rq->hw_context;
|
struct intel_context *ce = rq->hw_context;
|
||||||
struct list_head *pos;
|
struct list_head *pos;
|
||||||
|
|
||||||
|
spin_lock(&b->irq_lock);
|
||||||
|
GEM_BUG_ON(test_bit(I915_FENCE_FLAG_SIGNAL, &rq->fence.flags));
|
||||||
|
|
||||||
__intel_breadcrumbs_arm_irq(b);
|
__intel_breadcrumbs_arm_irq(b);
|
||||||
|
|
||||||
/*
|
/*
|
||||||
@ -284,8 +314,8 @@ bool i915_request_enable_breadcrumb(struct i915_request *rq)
|
|||||||
list_move_tail(&ce->signal_link, &b->signalers);
|
list_move_tail(&ce->signal_link, &b->signalers);
|
||||||
|
|
||||||
set_bit(I915_FENCE_FLAG_SIGNAL, &rq->fence.flags);
|
set_bit(I915_FENCE_FLAG_SIGNAL, &rq->fence.flags);
|
||||||
|
spin_unlock(&b->irq_lock);
|
||||||
}
|
}
|
||||||
spin_unlock(&b->irq_lock);
|
|
||||||
|
|
||||||
return !__request_completed(rq);
|
return !__request_completed(rq);
|
||||||
}
|
}
|
||||||
@ -294,9 +324,15 @@ void i915_request_cancel_breadcrumb(struct i915_request *rq)
|
|||||||
{
|
{
|
||||||
struct intel_breadcrumbs *b = &rq->engine->breadcrumbs;
|
struct intel_breadcrumbs *b = &rq->engine->breadcrumbs;
|
||||||
|
|
||||||
if (!test_bit(I915_FENCE_FLAG_SIGNAL, &rq->fence.flags))
|
lockdep_assert_held(&rq->lock);
|
||||||
return;
|
lockdep_assert_irqs_disabled();
|
||||||
|
|
||||||
|
/*
|
||||||
|
* We must wait for b->irq_lock so that we know the interrupt handler
|
||||||
|
* has released its reference to the intel_context and has completed
|
||||||
|
* the DMA_FENCE_FLAG_SIGNALED_BIT/I915_FENCE_FLAG_SIGNAL dance (if
|
||||||
|
* required).
|
||||||
|
*/
|
||||||
spin_lock(&b->irq_lock);
|
spin_lock(&b->irq_lock);
|
||||||
if (test_bit(I915_FENCE_FLAG_SIGNAL, &rq->fence.flags)) {
|
if (test_bit(I915_FENCE_FLAG_SIGNAL, &rq->fence.flags)) {
|
||||||
struct intel_context *ce = rq->hw_context;
|
struct intel_context *ce = rq->hw_context;
|
||||||
|
@ -23,7 +23,6 @@
|
|||||||
*/
|
*/
|
||||||
|
|
||||||
#include <linux/circ_buf.h>
|
#include <linux/circ_buf.h>
|
||||||
#include <trace/events/dma_fence.h>
|
|
||||||
|
|
||||||
#include "intel_guc_submission.h"
|
#include "intel_guc_submission.h"
|
||||||
#include "intel_lrc_reg.h"
|
#include "intel_lrc_reg.h"
|
||||||
|
Loading…
Reference in New Issue
Block a user