drm/i915/ringbuffer: Fix use of stale HEAD position whilst polling for space
During suspend, Linus found that his machine would hang for 3 seconds, and identified intel_wait_ring_buffer() as the culprit:

"Because from looking at the code, I get the notion that 'intel_read_status_page()' may not be exact. But what happens if that inexact value matches our cached ring->actual_head, so we never even try to read the exact case? Does it _stay_ inexact for arbitrarily long times? If so, we might wait for the ring to empty forever (well, until the timeout - the behavior I see), even though the ring really _is_ empty."

As the reported HEAD position is only updated every time it crosses a 64k boundary, whilst draining the ring it is indeed likely to remain at one value. If that value matches the last known HEAD position, we never read the true value from the register and so trigger a timeout.

Reported-by: Linus Torvalds <torvalds@linux-foundation.org>
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
This commit is contained in:
parent
475553de2f
commit
c7dca47bd6
|
@ -34,6 +34,14 @@
|
||||||
#include "i915_trace.h"
|
#include "i915_trace.h"
|
||||||
#include "intel_drv.h"
|
#include "intel_drv.h"
|
||||||
|
|
||||||
|
static inline int ring_space(struct intel_ring_buffer *ring)
|
||||||
|
{
|
||||||
|
int space = (ring->head & HEAD_ADDR) - (ring->tail + 8);
|
||||||
|
if (space < 0)
|
||||||
|
space += ring->size;
|
||||||
|
return space;
|
||||||
|
}
|
||||||
|
|
||||||
static u32 i915_gem_get_seqno(struct drm_device *dev)
|
static u32 i915_gem_get_seqno(struct drm_device *dev)
|
||||||
{
|
{
|
||||||
drm_i915_private_t *dev_priv = dev->dev_private;
|
drm_i915_private_t *dev_priv = dev->dev_private;
|
||||||
|
@ -204,11 +212,9 @@ static int init_ring_common(struct intel_ring_buffer *ring)
|
||||||
if (!drm_core_check_feature(ring->dev, DRIVER_MODESET))
|
if (!drm_core_check_feature(ring->dev, DRIVER_MODESET))
|
||||||
i915_kernel_lost_context(ring->dev);
|
i915_kernel_lost_context(ring->dev);
|
||||||
else {
|
else {
|
||||||
ring->head = I915_READ_HEAD(ring) & HEAD_ADDR;
|
ring->head = I915_READ_HEAD(ring);
|
||||||
ring->tail = I915_READ_TAIL(ring) & TAIL_ADDR;
|
ring->tail = I915_READ_TAIL(ring) & TAIL_ADDR;
|
||||||
ring->space = ring->head - (ring->tail + 8);
|
ring->space = ring_space(ring);
|
||||||
if (ring->space < 0)
|
|
||||||
ring->space += ring->size;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
return 0;
|
return 0;
|
||||||
|
@ -921,7 +927,7 @@ static int intel_wrap_ring_buffer(struct intel_ring_buffer *ring)
|
||||||
}
|
}
|
||||||
|
|
||||||
ring->tail = 0;
|
ring->tail = 0;
|
||||||
ring->space = ring->head - 8;
|
ring->space = ring_space(ring);
|
||||||
|
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
@ -933,20 +939,22 @@ int intel_wait_ring_buffer(struct intel_ring_buffer *ring, int n)
|
||||||
unsigned long end;
|
unsigned long end;
|
||||||
u32 head;
|
u32 head;
|
||||||
|
|
||||||
|
/* If the reported head position has wrapped or hasn't advanced,
|
||||||
|
* fallback to the slow and accurate path.
|
||||||
|
*/
|
||||||
|
head = intel_read_status_page(ring, 4);
|
||||||
|
if (head > ring->head) {
|
||||||
|
ring->head = head;
|
||||||
|
ring->space = ring_space(ring);
|
||||||
|
if (ring->space >= n)
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
trace_i915_ring_wait_begin (dev);
|
trace_i915_ring_wait_begin (dev);
|
||||||
end = jiffies + 3 * HZ;
|
end = jiffies + 3 * HZ;
|
||||||
do {
|
do {
|
||||||
/* If the reported head position has wrapped or hasn't advanced,
|
ring->head = I915_READ_HEAD(ring);
|
||||||
* fallback to the slow and accurate path.
|
ring->space = ring_space(ring);
|
||||||
*/
|
|
||||||
head = intel_read_status_page(ring, 4);
|
|
||||||
if (head < ring->actual_head)
|
|
||||||
head = I915_READ_HEAD(ring);
|
|
||||||
ring->actual_head = head;
|
|
||||||
ring->head = head & HEAD_ADDR;
|
|
||||||
ring->space = ring->head - (ring->tail + 8);
|
|
||||||
if (ring->space < 0)
|
|
||||||
ring->space += ring->size;
|
|
||||||
if (ring->space >= n) {
|
if (ring->space >= n) {
|
||||||
trace_i915_ring_wait_end(dev);
|
trace_i915_ring_wait_end(dev);
|
||||||
return 0;
|
return 0;
|
||||||
|
|
|
@ -47,7 +47,6 @@ struct intel_ring_buffer {
|
||||||
struct drm_device *dev;
|
struct drm_device *dev;
|
||||||
struct drm_i915_gem_object *obj;
|
struct drm_i915_gem_object *obj;
|
||||||
|
|
||||||
u32 actual_head;
|
|
||||||
u32 head;
|
u32 head;
|
||||||
u32 tail;
|
u32 tail;
|
||||||
int space;
|
int space;
|
||||||
|
|
Loading…
Reference in New Issue