2013-07-12 21:50:57 +08:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2008 Intel Corporation
|
|
|
|
*
|
|
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
|
|
* to deal in the Software without restriction, including without limitation
|
|
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
|
|
*
|
|
|
|
* The above copyright notice and this permission notice (including the next
|
|
|
|
* paragraph) shall be included in all copies or substantial portions of the
|
|
|
|
* Software.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
|
|
|
|
* IN THE SOFTWARE.
|
|
|
|
*
|
|
|
|
* Authors:
|
|
|
|
* Eric Anholt <eric@anholt.net>
|
|
|
|
* Keith Packard <keithp@keithp.com>
|
|
|
|
* Mika Kuoppala <mika.kuoppala@intel.com>
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
#include <linux/ascii85.h>
|
|
|
|
#include <linux/nmi.h>
|
2019-07-23 06:28:47 +08:00
|
|
|
#include <linux/pagevec.h>
|
2018-11-23 21:23:25 +08:00
|
|
|
#include <linux/scatterlist.h>
|
|
|
|
#include <linux/utsname.h>
|
2016-10-12 17:05:22 +08:00
|
|
|
#include <linux/zlib.h>
|
2018-11-23 21:23:25 +08:00
|
|
|
|
2017-10-27 01:36:55 +08:00
|
|
|
#include <drm/drm_print.h>
|
|
|
|
|
2021-05-19 05:34:44 +08:00
|
|
|
#include "display/intel_dmc.h"
|
2019-06-13 16:44:16 +08:00
|
|
|
#include "display/intel_overlay.h"
|
|
|
|
|
2019-05-28 17:29:49 +08:00
|
|
|
#include "gem/i915_gem_context.h"
|
2019-10-29 17:58:53 +08:00
|
|
|
#include "gem/i915_gem_lmem.h"
|
2020-07-08 08:39:47 +08:00
|
|
|
#include "gt/intel_gt.h"
|
2020-01-10 20:30:56 +08:00
|
|
|
#include "gt/intel_gt_pm.h"
|
2019-05-28 17:29:49 +08:00
|
|
|
|
2013-07-12 21:50:57 +08:00
|
|
|
#include "i915_drv.h"
|
2019-04-29 20:29:31 +08:00
|
|
|
#include "i915_gpu_error.h"
|
2019-08-08 21:42:47 +08:00
|
|
|
#include "i915_memcpy.h"
|
2019-05-28 17:29:50 +08:00
|
|
|
#include "i915_scatterlist.h"
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2019-07-23 06:28:47 +08:00
|
|
|
/* GFP_KERNEL allocation that may retry, may fail, and never warns. */
#define ALLOW_FAIL	(__GFP_NOWARN | __GFP_RETRY_MAYFAIL | GFP_KERNEL)
/* GFP_ATOMIC allocation with the failure warning suppressed. */
#define ATOMIC_MAYFAIL	(__GFP_NOWARN | GFP_ATOMIC)
|
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
/*
 * Fill in one scatterlist entry so that it describes @len bytes at the
 * kernel address @addr. The stream position @it is stored in the
 * entry's dma_address field.
 */
static void __sg_set_buf(struct scatterlist *sg,
			 void *addr, unsigned int len, loff_t it)
{
	struct page *page = virt_to_page(addr);

	sg->dma_address = it;
	sg->length = len;
	sg->offset = offset_in_page(addr);
	sg->page_link = (unsigned long)page;
}
|
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
/*
 * Make sure the output buffer can take @len more bytes plus one spare byte.
 *
 * If the current chunk is too small, its contents are handed over to the
 * next scatterlist entry (a new scatterlist page is chained in when the
 * current one is exhausted) and a fresh chunk is allocated.
 *
 * Returns true if @len bytes may now be written at e->buf + e->bytes.
 * Returns false if @len is zero or an allocation failed; on allocation
 * failure e->err is set to -ENOMEM.
 */
static bool __i915_error_grow(struct drm_i915_error_state_buf *e, size_t len)
{
	if (len == 0)
		return false;

	/* Fast path: the current chunk still has room. */
	if (e->size >= e->bytes + len + 1)
		return true;

	/* Retire the partially filled chunk into the scatterlist. */
	if (e->bytes != 0) {
		__sg_set_buf(e->cur, e->buf, e->bytes, e->iter);
		e->cur++;
		e->iter += e->bytes;
		e->bytes = 0;
		e->buf = NULL;
	}

	/* Out of scatterlist entries: allocate another page of them. */
	if (e->cur == e->end) {
		struct scatterlist *table;

		table = (struct scatterlist *)__get_free_page(ALLOW_FAIL);
		if (!table) {
			e->err = -ENOMEM;
			return false;
		}

		if (!e->cur) {
			/* Very first table: remember the head of the list. */
			e->sgl = table;
		} else {
			/* Turn the final entry into a chain link. */
			e->cur->page_link = (unsigned long)table | SG_CHAIN;
			e->cur->length = 0;
			e->cur->offset = 0;
		}

		e->end = table + SG_MAX_SINGLE_ALLOC - 1;
		e->cur = table;
	}

	/* Prefer a 64K-aligned chunk, fall back to a page-aligned one. */
	e->size = ALIGN(len + 1, SZ_64K);
	e->buf = kmalloc(e->size, ALLOW_FAIL);
	if (!e->buf) {
		e->size = PAGE_ALIGN(len + 1);
		e->buf = kmalloc(e->size, GFP_KERNEL);
		if (!e->buf) {
			e->err = -ENOMEM;
			return false;
		}
	}

	return true;
}
|
|
|
|
|
2017-01-14 18:51:12 +08:00
|
|
|
/*
 * Append formatted text to the error state buffer.
 *
 * The format is first evaluated against a copy of @args to learn how many
 * bytes are needed, the buffer is grown accordingly, and only then is the
 * text written. Nothing is done once e->err is set; a non-positive length
 * from either formatting pass is recorded in e->err.
 */
__printf(2, 0)
static void i915_error_vprintf(struct drm_i915_error_state_buf *e,
			       const char *fmt, va_list args)
{
	va_list probe;
	int need;
	int written;

	if (e->err)
		return;

	/* Dry run on a copy so that @args stays usable for the real write. */
	va_copy(probe, args);
	need = vsnprintf(NULL, 0, fmt, probe);
	va_end(probe);
	if (need <= 0) {
		e->err = need;
		return;
	}

	if (!__i915_error_grow(e, need))
		return;

	GEM_BUG_ON(e->bytes >= e->size);
	written = vscnprintf(e->buf + e->bytes, e->size - e->bytes, fmt, args);
	if (written < 0) {
		e->err = written;
		return;
	}

	e->bytes += written;
}
|
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
static void i915_error_puts(struct drm_i915_error_state_buf *e, const char *str)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
|
|
|
unsigned len;
|
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
if (e->err || !str)
|
2013-07-12 21:50:57 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
len = strlen(str);
|
2018-11-23 21:23:25 +08:00
|
|
|
if (!__i915_error_grow(e, len))
|
|
|
|
return;
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
GEM_BUG_ON(e->bytes + len > e->size);
|
2013-07-12 21:50:57 +08:00
|
|
|
memcpy(e->buf + e->bytes, str, len);
|
2018-11-23 21:23:25 +08:00
|
|
|
e->bytes += len;
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Short-hand wrappers used by the printers in this file. */
#define err_printf(buf, ...)	i915_error_printf(buf, __VA_ARGS__)
#define err_puts(buf, str)	i915_error_puts(buf, str)
|
|
|
|
|
2017-10-27 01:36:55 +08:00
|
|
|
static void __i915_printfn_error(struct drm_printer *p, struct va_format *vaf)
|
|
|
|
{
|
|
|
|
i915_error_vprintf(p->arg, vaf->fmt, *vaf->va);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline struct drm_printer
|
|
|
|
i915_error_printer(struct drm_i915_error_state_buf *e)
|
|
|
|
{
|
|
|
|
struct drm_printer p = {
|
|
|
|
.printfn = __i915_printfn_error,
|
|
|
|
.arg = e,
|
|
|
|
};
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
2019-07-23 06:28:47 +08:00
|
|
|
/* single threaded page allocator with a reserved stash for emergencies */
|
|
|
|
/* Release every page still held in the stash @pv. */
static void pool_fini(struct pagevec *pv)
{
	pagevec_release(pv);
}
|
|
|
|
|
|
|
|
/*
 * Top up the stash @pv with freshly allocated pages until it has no space
 * left. Returns 0 once full, or -ENOMEM as soon as a page allocation fails
 * (pages added so far stay in the stash).
 */
static int pool_refill(struct pagevec *pv, gfp_t gfp)
{
	for (;;) {
		struct page *page;

		if (!pagevec_space(pv))
			return 0;

		page = alloc_page(gfp);
		if (!page)
			return -ENOMEM;

		pagevec_add(pv, page);
	}
}
|
|
|
|
|
|
|
|
/*
 * Initialise the stash @pv and fill it with pages. On failure the stash is
 * emptied again and the error from pool_refill() is returned.
 */
static int pool_init(struct pagevec *pv, gfp_t gfp)
{
	int ret;

	pagevec_init(pv);

	ret = pool_refill(pv, gfp);
	if (ret == 0)
		return 0;

	pool_fini(pv);
	return ret;
}
|
|
|
|
|
|
|
|
/*
 * Allocate one page, preferring the page allocator and dipping into the
 * stash @pv only when that fails. Returns the page's kernel address, or
 * NULL if no page could be obtained.
 */
static void *pool_alloc(struct pagevec *pv, gfp_t gfp)
{
	struct page *page = alloc_page(gfp);

	if (!page) {
		if (!pagevec_count(pv))
			return NULL;

		/* Take the most recently stashed page. */
		pv->nr--;
		page = pv->pages[pv->nr];
		if (!page)
			return NULL;
	}

	return page_address(page);
}
|
|
|
|
|
|
|
|
/*
 * Give back the page at kernel address @addr: it is kept in the stash @pv
 * if there is room, otherwise it is freed.
 */
static void pool_free(struct pagevec *pv, void *addr)
{
	struct page *page = virt_to_page(addr);

	if (!pagevec_space(pv)) {
		__free_page(page);
		return;
	}

	pagevec_add(pv, page);
}
|
|
|
|
|
2016-10-12 17:05:22 +08:00
|
|
|
#ifdef CONFIG_DRM_I915_COMPRESS_ERROR
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_vma_compress {
|
2019-07-23 06:28:47 +08:00
|
|
|
struct pagevec pool;
|
2016-12-06 20:40:51 +08:00
|
|
|
struct z_stream_s zstream;
|
|
|
|
void *tmp;
|
|
|
|
};
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static bool compress_init(struct i915_vma_compress *c)
|
2016-10-12 17:05:22 +08:00
|
|
|
{
|
2019-07-23 06:28:47 +08:00
|
|
|
struct z_stream_s *zstream = &c->zstream;
|
2016-10-12 17:05:22 +08:00
|
|
|
|
2019-07-23 06:28:47 +08:00
|
|
|
if (pool_init(&c->pool, ALLOW_FAIL))
|
2016-10-12 17:05:22 +08:00
|
|
|
return false;
|
|
|
|
|
2019-07-23 06:28:47 +08:00
|
|
|
zstream->workspace =
|
|
|
|
kmalloc(zlib_deflate_workspacesize(MAX_WBITS, MAX_MEM_LEVEL),
|
|
|
|
ALLOW_FAIL);
|
|
|
|
if (!zstream->workspace) {
|
|
|
|
pool_fini(&c->pool);
|
2016-10-12 17:05:22 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-12-06 20:40:51 +08:00
|
|
|
c->tmp = NULL;
|
2017-01-06 23:20:09 +08:00
|
|
|
if (i915_has_memcpy_from_wc())
|
2019-07-23 06:28:47 +08:00
|
|
|
c->tmp = pool_alloc(&c->pool, ALLOW_FAIL);
|
2016-12-06 20:40:51 +08:00
|
|
|
|
2016-10-12 17:05:22 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static bool compress_start(struct i915_vma_compress *c)
|
2018-10-03 16:24:22 +08:00
|
|
|
{
|
2019-07-23 06:28:47 +08:00
|
|
|
struct z_stream_s *zstream = &c->zstream;
|
|
|
|
void *workspace = zstream->workspace;
|
|
|
|
|
|
|
|
memset(zstream, 0, sizeof(*zstream));
|
|
|
|
zstream->workspace = workspace;
|
|
|
|
|
|
|
|
return zlib_deflateInit(zstream, Z_DEFAULT_COMPRESSION) == Z_OK;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void *compress_next_page(struct i915_vma_compress *c,
|
|
|
|
struct i915_vma_coredump *dst)
|
2019-07-23 06:28:47 +08:00
|
|
|
{
|
|
|
|
void *page;
|
2018-10-03 16:24:22 +08:00
|
|
|
|
|
|
|
if (dst->page_count >= dst->num_pages)
|
|
|
|
return ERR_PTR(-ENOSPC);
|
|
|
|
|
2019-07-26 06:38:43 +08:00
|
|
|
page = pool_alloc(&c->pool, ALLOW_FAIL);
|
2018-10-03 16:24:22 +08:00
|
|
|
if (!page)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
|
2019-07-23 06:28:47 +08:00
|
|
|
return dst->pages[dst->page_count++] = page;
|
2018-10-03 16:24:22 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static int compress_page(struct i915_vma_compress *c,
|
2016-10-12 17:05:22 +08:00
|
|
|
void *src,
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_vma_coredump *dst,
|
|
|
|
bool wc)
|
2016-10-12 17:05:22 +08:00
|
|
|
{
|
2016-12-06 20:40:51 +08:00
|
|
|
struct z_stream_s *zstream = &c->zstream;
|
|
|
|
|
2016-10-12 17:05:22 +08:00
|
|
|
zstream->next_in = src;
|
2020-01-10 20:30:56 +08:00
|
|
|
if (wc && c->tmp && i915_memcpy_from_wc(c->tmp, src, PAGE_SIZE))
|
2016-12-06 20:40:51 +08:00
|
|
|
zstream->next_in = c->tmp;
|
2016-10-12 17:05:22 +08:00
|
|
|
zstream->avail_in = PAGE_SIZE;
|
|
|
|
|
|
|
|
do {
|
|
|
|
if (zstream->avail_out == 0) {
|
2019-07-23 06:28:47 +08:00
|
|
|
zstream->next_out = compress_next_page(c, dst);
|
2018-10-03 16:24:22 +08:00
|
|
|
if (IS_ERR(zstream->next_out))
|
|
|
|
return PTR_ERR(zstream->next_out);
|
2016-10-12 17:05:22 +08:00
|
|
|
|
|
|
|
zstream->avail_out = PAGE_SIZE;
|
|
|
|
}
|
|
|
|
|
2018-10-03 16:24:22 +08:00
|
|
|
if (zlib_deflate(zstream, Z_NO_FLUSH) != Z_OK)
|
2016-10-12 17:05:22 +08:00
|
|
|
return -EIO;
|
2020-09-16 17:00:58 +08:00
|
|
|
|
|
|
|
cond_resched();
|
2016-10-12 17:05:22 +08:00
|
|
|
} while (zstream->avail_in);
|
|
|
|
|
|
|
|
/* Fallback to uncompressed if we increase size? */
|
|
|
|
if (0 && zstream->total_out > zstream->total_in)
|
|
|
|
return -E2BIG;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static int compress_flush(struct i915_vma_compress *c,
|
|
|
|
struct i915_vma_coredump *dst)
|
2016-10-12 17:05:22 +08:00
|
|
|
{
|
2016-12-06 20:40:51 +08:00
|
|
|
struct z_stream_s *zstream = &c->zstream;
|
|
|
|
|
2018-10-03 16:24:22 +08:00
|
|
|
do {
|
|
|
|
switch (zlib_deflate(zstream, Z_FINISH)) {
|
|
|
|
case Z_OK: /* more space requested */
|
2019-07-23 06:28:47 +08:00
|
|
|
zstream->next_out = compress_next_page(c, dst);
|
2018-10-03 16:24:22 +08:00
|
|
|
if (IS_ERR(zstream->next_out))
|
|
|
|
return PTR_ERR(zstream->next_out);
|
|
|
|
|
|
|
|
zstream->avail_out = PAGE_SIZE;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case Z_STREAM_END:
|
|
|
|
goto end;
|
|
|
|
|
|
|
|
default: /* any error */
|
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
} while (1);
|
|
|
|
|
|
|
|
end:
|
|
|
|
memset(zstream->next_out, 0, zstream->avail_out);
|
|
|
|
dst->unused = zstream->avail_out;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void compress_finish(struct i915_vma_compress *c)
|
2018-10-03 16:24:22 +08:00
|
|
|
{
|
2019-07-23 06:28:47 +08:00
|
|
|
zlib_deflateEnd(&c->zstream);
|
|
|
|
}
|
2016-10-12 17:05:22 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void compress_fini(struct i915_vma_compress *c)
|
2019-07-23 06:28:47 +08:00
|
|
|
{
|
|
|
|
kfree(c->zstream.workspace);
|
2016-12-06 20:40:51 +08:00
|
|
|
if (c->tmp)
|
2019-07-23 06:28:47 +08:00
|
|
|
pool_free(&c->pool, c->tmp);
|
|
|
|
pool_fini(&c->pool);
|
2016-10-12 17:05:22 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Emit the marker that precedes object data in the compressed build: ":" */
static void err_compression_marker(struct drm_i915_error_state_buf *m)
{
	i915_error_puts(m, ":");
}
|
|
|
|
|
|
|
|
#else
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_vma_compress {
|
2019-07-23 06:28:47 +08:00
|
|
|
struct pagevec pool;
|
2016-12-06 20:40:51 +08:00
|
|
|
};
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static bool compress_init(struct i915_vma_compress *c)
|
2019-07-23 06:28:47 +08:00
|
|
|
{
|
|
|
|
return pool_init(&c->pool, ALLOW_FAIL) == 0;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static bool compress_start(struct i915_vma_compress *c)
|
2016-10-12 17:05:22 +08:00
|
|
|
{
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static int compress_page(struct i915_vma_compress *c,
|
2016-10-12 17:05:22 +08:00
|
|
|
void *src,
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_vma_coredump *dst,
|
|
|
|
bool wc)
|
2016-10-12 17:05:22 +08:00
|
|
|
{
|
2016-12-06 20:40:51 +08:00
|
|
|
void *ptr;
|
2016-10-12 17:05:22 +08:00
|
|
|
|
2019-07-26 06:38:43 +08:00
|
|
|
ptr = pool_alloc(&c->pool, ALLOW_FAIL);
|
2019-07-23 06:28:47 +08:00
|
|
|
if (!ptr)
|
2016-10-12 17:05:22 +08:00
|
|
|
return -ENOMEM;
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (!(wc && i915_memcpy_from_wc(ptr, src, PAGE_SIZE)))
|
2016-12-06 20:40:51 +08:00
|
|
|
memcpy(ptr, src, PAGE_SIZE);
|
|
|
|
dst->pages[dst->page_count++] = ptr;
|
2020-09-16 17:00:58 +08:00
|
|
|
cond_resched();
|
2016-10-12 17:05:22 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/* No buffered output to flush in the uncompressed build; always returns 0. */
static int compress_flush(struct i915_vma_compress *c,
			  struct i915_vma_coredump *dst)
{
	return 0;
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/* No per-object state to tear down in the uncompressed build. */
static void compress_finish(struct i915_vma_compress *c)
{
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void compress_fini(struct i915_vma_compress *c)
|
2019-07-23 06:28:47 +08:00
|
|
|
{
|
|
|
|
pool_fini(&c->pool);
|
|
|
|
}
|
|
|
|
|
2016-10-12 17:05:22 +08:00
|
|
|
/* Emit the marker that precedes object data in the uncompressed build: "~" */
static void err_compression_marker(struct drm_i915_error_state_buf *m)
{
	i915_error_puts(m, "~");
}
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
2016-09-20 21:54:32 +08:00
|
|
|
static void error_print_instdone(struct drm_i915_error_state_buf *m,
|
2020-01-10 20:30:56 +08:00
|
|
|
const struct intel_engine_coredump *ee)
|
2016-09-20 21:54:32 +08:00
|
|
|
{
|
2020-07-08 08:39:50 +08:00
|
|
|
const struct sseu_dev_info *sseu = &ee->engine->gt->info.sseu;
|
2016-09-20 21:54:33 +08:00
|
|
|
int slice;
|
|
|
|
int subslice;
|
|
|
|
|
2016-09-20 21:54:32 +08:00
|
|
|
err_printf(m, " INSTDONE: 0x%08x\n",
|
|
|
|
ee->instdone.instdone);
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (ee->engine->class != RENDER_CLASS || GRAPHICS_VER(m->i915) <= 3)
|
2016-09-20 21:54:32 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
err_printf(m, " SC_INSTDONE: 0x%08x\n",
|
|
|
|
ee->instdone.slice_common);
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(m->i915) <= 6)
|
2016-09-20 21:54:32 +08:00
|
|
|
return;
|
|
|
|
|
2019-08-24 00:03:05 +08:00
|
|
|
for_each_instdone_slice_subslice(m->i915, sseu, slice, subslice)
|
2016-09-20 21:54:33 +08:00
|
|
|
err_printf(m, " SAMPLER_INSTDONE[%d][%d]: 0x%08x\n",
|
|
|
|
slice, subslice,
|
|
|
|
ee->instdone.sampler[slice][subslice]);
|
|
|
|
|
2019-08-24 00:03:05 +08:00
|
|
|
for_each_instdone_slice_subslice(m->i915, sseu, slice, subslice)
|
2016-09-20 21:54:33 +08:00
|
|
|
err_printf(m, " ROW_INSTDONE[%d][%d]: 0x%08x\n",
|
|
|
|
slice, subslice,
|
|
|
|
ee->instdone.row[slice][subslice]);
|
2020-01-30 02:16:38 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(m->i915) < 12)
|
2020-01-30 02:16:38 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
err_printf(m, " SC_INSTDONE_EXTRA: 0x%08x\n",
|
|
|
|
ee->instdone.slice_common_extra[0]);
|
|
|
|
err_printf(m, " SC_INSTDONE_EXTRA2: 0x%08x\n",
|
|
|
|
ee->instdone.slice_common_extra[1]);
|
2016-09-20 21:54:32 +08:00
|
|
|
}
|
|
|
|
|
2016-10-13 18:18:14 +08:00
|
|
|
static void error_print_request(struct drm_i915_error_state_buf *m,
|
|
|
|
const char *prefix,
|
2020-01-10 20:30:56 +08:00
|
|
|
const struct i915_request_coredump *erq)
|
2016-10-13 18:18:14 +08:00
|
|
|
{
|
|
|
|
if (!erq->seqno)
|
|
|
|
return;
|
|
|
|
|
2020-04-25 03:14:10 +08:00
|
|
|
err_printf(m, "%s pid %d, seqno %8x:%08x%s%s, prio %d, head %08x, tail %08x\n",
|
drm/i915: Use time based guilty context banning
Currently, we accumulate each time a context hangs the GPU, offset
against the number of requests it submits, and if that score exceeds a
certain threshold, we ban that context from submitting any more requests
(cancelling any work in flight). In contrast, we use a simple timer on
the file, that if we see more than a 9 hangs faster than 60s apart in
total across all of its contexts, we will ban the client from creating
any more contexts. This leads to a confusing situation where the file
may be banned before the context, so lets use a simple timer scheme for
each.
If the context submits 3 hanging requests within a 120s period, declare
it forbidden to ever send more requests.
This has the advantage of not being easy to repair by simply sending
empty requests, but has the disadvantage that if the context is idle
then it is forgiven. However, if the context is idle, it is not
disrupting the system, but a hog can evade the request counting and
cause much more severe disruption to the system.
Updating ban_score from request retirement is dubious as the retirement
is purposely not in sync with request submission (i.e. we try and batch
retirement to reduce overhead and avoid latency on submission), which
leads to surprising situations where we can forgive a hang immediately
due to a backlog of requests from before the hang being retired
afterwards.
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Mika Kuoppala <mika.kuoppala@intel.com>
Reviewed-by: Mika Kuoppala <mika.kuoppala@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20190219122215.8941-2-chris@chris-wilson.co.uk
2019-02-19 20:21:52 +08:00
|
|
|
prefix, erq->pid, erq->context, erq->seqno,
|
drm/i915: Replace global breadcrumbs with per-context interrupt tracking
A few years ago, see commit 688e6c725816 ("drm/i915: Slaughter the
thundering i915_wait_request herd"), the issue of handling multiple
clients waiting in parallel was brought to our attention. The
requirement was that every client should be woken immediately upon its
request being signaled, without incurring any cpu overhead.
To handle certain fragility of our hw meant that we could not do a
simple check inside the irq handler (some generations required almost
unbounded delays before we could be sure of seqno coherency) and so
request completion checking required delegation.
Before commit 688e6c725816, the solution was simple. Every client
waiting on a request would be woken on every interrupt and each would do
a heavyweight check to see if their request was complete. Commit
688e6c725816 introduced an rbtree so that only the earliest waiter on
the global timeline would woken, and would wake the next and so on.
(Along with various complications to handle requests being reordered
along the global timeline, and also a requirement for kthread to provide
a delegate for fence signaling that had no process context.)
The global rbtree depends on knowing the execution timeline (and global
seqno). Without knowing that order, we must instead check all contexts
queued to the HW to see which may have advanced. We trim that list by
only checking queued contexts that are being waited on, but still we
keep a list of all active contexts and their active signalers that we
inspect from inside the irq handler. By moving the waiters onto the fence
signal list, we can combine the client wakeup with the dma_fence
signaling (a dramatic reduction in complexity, but does require the HW
being coherent, the seqno must be visible from the cpu before the
interrupt is raised - we keep a timer backup just in case).
Having previously fixed all the issues with irq-seqno serialisation (by
inserting delays onto the GPU after each request instead of random delays
on the CPU after each interrupt), we can rely on the seqno state to
perfom direct wakeups from the interrupt handler. This allows us to
preserve our single context switch behaviour of the current routine,
with the only downside that we lose the RT priority sorting of wakeups.
In general, direct wakeup latency of multiple clients is about the same
(about 10% better in most cases) with a reduction in total CPU time spent
in the waiter (about 20-50% depending on gen). Average herd behaviour is
improved, but at the cost of not delegating wakeups on task_prio.
v2: Capture fence signaling state for error state and add comments to
warm even the most cold of hearts.
v3: Check if the request is still active before busywaiting
v4: Reduce the amount of pointer misdirection with list_for_each_safe
and using a local i915_request variable inside the loops
v5: Add a missing pluralisation to a purely informative selftest message.
References: 688e6c725816 ("drm/i915: Slaughter the thundering i915_wait_request herd")
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Reviewed-by: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20190129205230.19056-2-chris@chris-wilson.co.uk
2019-01-30 04:52:29 +08:00
|
|
|
test_bit(DMA_FENCE_FLAG_SIGNALED_BIT,
|
|
|
|
&erq->flags) ? "!" : "",
|
|
|
|
test_bit(DMA_FENCE_FLAG_ENABLE_SIGNAL_BIT,
|
|
|
|
&erq->flags) ? "+" : "",
|
|
|
|
erq->sched_attr.priority,
|
2020-04-25 03:14:10 +08:00
|
|
|
erq->head, erq->tail);
|
2016-10-13 18:18:14 +08:00
|
|
|
}
|
|
|
|
|
2017-01-29 17:24:33 +08:00
|
|
|
static void error_print_context(struct drm_i915_error_state_buf *m,
|
|
|
|
const char *header,
|
2020-01-10 20:30:56 +08:00
|
|
|
const struct i915_gem_context_coredump *ctx)
|
2017-01-29 17:24:33 +08:00
|
|
|
{
|
2020-12-23 20:23:59 +08:00
|
|
|
const u32 period = m->i915->gt.clock_period_ns;
|
2020-02-16 21:36:20 +08:00
|
|
|
|
|
|
|
err_printf(m, "%s%s[%d] prio %d, guilty %d active %d, runtime total %lluns, avg %lluns\n",
|
2019-10-04 21:40:08 +08:00
|
|
|
header, ctx->comm, ctx->pid, ctx->sched_attr.priority,
|
2020-02-16 21:36:20 +08:00
|
|
|
ctx->guilty, ctx->active,
|
|
|
|
ctx->total_runtime * period,
|
|
|
|
mul_u32_u32(ctx->avg_runtime, period));
|
2017-01-29 17:24:33 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static struct i915_vma_coredump *
|
|
|
|
__find_vma(struct i915_vma_coredump *vma, const char *name)
|
|
|
|
{
|
|
|
|
while (vma) {
|
|
|
|
if (strcmp(vma->name, name) == 0)
|
|
|
|
return vma;
|
|
|
|
vma = vma->next;
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct i915_vma_coredump *
|
|
|
|
find_batch(const struct intel_engine_coredump *ee)
|
|
|
|
{
|
|
|
|
return __find_vma(ee->vma, "batch");
|
|
|
|
}
|
|
|
|
|
2016-07-27 16:07:28 +08:00
|
|
|
static void error_print_engine(struct drm_i915_error_state_buf *m,
|
2020-01-10 20:30:56 +08:00
|
|
|
const struct intel_engine_coredump *ee)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_vma_coredump *batch;
|
2017-09-22 20:43:07 +08:00
|
|
|
int n;
|
|
|
|
|
2019-08-08 22:45:11 +08:00
|
|
|
err_printf(m, "%s command stream:\n", ee->engine->name);
|
2020-01-10 20:30:56 +08:00
|
|
|
err_printf(m, " CCID: 0x%08x\n", ee->ccid);
|
2016-07-27 16:07:28 +08:00
|
|
|
err_printf(m, " START: 0x%08x\n", ee->start);
|
2016-10-13 18:18:15 +08:00
|
|
|
err_printf(m, " HEAD: 0x%08x [0x%08x]\n", ee->head, ee->rq_head);
|
2016-10-05 04:11:30 +08:00
|
|
|
err_printf(m, " TAIL: 0x%08x [0x%08x, 0x%08x]\n",
|
|
|
|
ee->tail, ee->rq_post, ee->rq_tail);
|
2016-07-27 16:07:28 +08:00
|
|
|
err_printf(m, " CTL: 0x%08x\n", ee->ctl);
|
2016-08-15 17:49:11 +08:00
|
|
|
err_printf(m, " MODE: 0x%08x\n", ee->mode);
|
2016-07-27 16:07:28 +08:00
|
|
|
err_printf(m, " HWS: 0x%08x\n", ee->hws);
|
|
|
|
err_printf(m, " ACTHD: 0x%08x %08x\n",
|
|
|
|
(u32)(ee->acthd>>32), (u32)ee->acthd);
|
|
|
|
err_printf(m, " IPEIR: 0x%08x\n", ee->ipeir);
|
|
|
|
err_printf(m, " IPEHR: 0x%08x\n", ee->ipehr);
|
2020-01-29 04:43:15 +08:00
|
|
|
err_printf(m, " ESR: 0x%08x\n", ee->esr);
|
2016-09-20 21:54:32 +08:00
|
|
|
|
|
|
|
error_print_instdone(m, ee);
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
batch = find_batch(ee);
|
|
|
|
if (batch) {
|
|
|
|
u64 start = batch->gtt_offset;
|
|
|
|
u64 end = start + batch->gtt_size;
|
2016-08-15 17:49:09 +08:00
|
|
|
|
|
|
|
err_printf(m, " batch: [0x%08x_%08x, 0x%08x_%08x]\n",
|
|
|
|
upper_32_bits(start), lower_32_bits(start),
|
|
|
|
upper_32_bits(end), lower_32_bits(end));
|
|
|
|
}
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(m->i915) >= 4) {
|
2016-08-15 17:49:09 +08:00
|
|
|
err_printf(m, " BBADDR: 0x%08x_%08x\n",
|
2016-07-27 16:07:28 +08:00
|
|
|
(u32)(ee->bbaddr>>32), (u32)ee->bbaddr);
|
|
|
|
err_printf(m, " BB_STATE: 0x%08x\n", ee->bbstate);
|
|
|
|
err_printf(m, " INSTPS: 0x%08x\n", ee->instps);
|
2013-12-11 03:44:43 +08:00
|
|
|
}
|
2016-07-27 16:07:28 +08:00
|
|
|
err_printf(m, " INSTPM: 0x%08x\n", ee->instpm);
|
|
|
|
err_printf(m, " FADDR: 0x%08x %08x\n", upper_32_bits(ee->faddr),
|
|
|
|
lower_32_bits(ee->faddr));
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(m->i915) >= 6) {
|
2016-07-27 16:07:28 +08:00
|
|
|
err_printf(m, " RC PSMI: 0x%08x\n", ee->rc_psmi);
|
|
|
|
err_printf(m, " FAULT_REG: 0x%08x\n", ee->fault_reg);
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
2018-09-27 04:12:22 +08:00
|
|
|
if (HAS_PPGTT(m->i915)) {
|
2016-07-27 16:07:28 +08:00
|
|
|
err_printf(m, " GFX_MODE: 0x%08x\n", ee->vm_info.gfx_mode);
|
2014-01-30 16:19:40 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(m->i915) >= 8) {
|
2014-01-30 16:19:40 +08:00
|
|
|
int i;
|
|
|
|
for (i = 0; i < 4; i++)
|
|
|
|
err_printf(m, " PDP%d: 0x%016llx\n",
|
2016-07-27 16:07:28 +08:00
|
|
|
i, ee->vm_info.pdp[i]);
|
2014-01-30 16:19:40 +08:00
|
|
|
} else {
|
|
|
|
err_printf(m, " PP_DIR_BASE: 0x%08x\n",
|
2016-07-27 16:07:28 +08:00
|
|
|
ee->vm_info.pp_dir_base);
|
2014-01-30 16:19:40 +08:00
|
|
|
}
|
|
|
|
}
|
2020-11-04 21:47:42 +08:00
|
|
|
err_printf(m, " hung: %u\n", ee->hung);
|
2017-06-20 17:57:48 +08:00
|
|
|
err_printf(m, " engine reset count: %u\n", ee->reset_count);
|
2016-11-18 21:09:04 +08:00
|
|
|
|
2017-09-22 20:43:07 +08:00
|
|
|
for (n = 0; n < ee->num_ports; n++) {
|
|
|
|
err_printf(m, " ELSP[%d]:", n);
|
2020-01-10 20:30:56 +08:00
|
|
|
error_print_request(m, " ", &ee->execlist[n]);
|
2017-09-22 20:43:07 +08:00
|
|
|
}
|
|
|
|
|
2017-01-29 17:24:33 +08:00
|
|
|
error_print_context(m, " Active context: ", &ee->context);
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void i915_error_printf(struct drm_i915_error_state_buf *e, const char *f, ...)
|
|
|
|
{
|
|
|
|
va_list args;
|
|
|
|
|
|
|
|
va_start(args, f);
|
|
|
|
i915_error_vprintf(e, f, args);
|
|
|
|
va_end(args);
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void print_error_vma(struct drm_i915_error_state_buf *m,
|
2019-08-08 22:45:11 +08:00
|
|
|
const struct intel_engine_cs *engine,
|
2020-01-10 20:30:56 +08:00
|
|
|
const struct i915_vma_coredump *vma)
|
2014-02-25 23:11:24 +08:00
|
|
|
{
|
2018-07-25 00:33:19 +08:00
|
|
|
char out[ASCII85_BUFSZ];
|
2016-10-12 17:05:22 +08:00
|
|
|
int page;
|
2014-02-25 23:11:24 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (!vma)
|
2016-10-12 17:05:21 +08:00
|
|
|
return;
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
err_printf(m, "%s --- %s = 0x%08x %08x\n",
|
|
|
|
engine ? engine->name : "global", vma->name,
|
|
|
|
upper_32_bits(vma->gtt_offset),
|
|
|
|
lower_32_bits(vma->gtt_offset));
|
2016-10-12 17:05:21 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (vma->gtt_page_sizes > I915_GTT_PAGE_SIZE_4K)
|
|
|
|
err_printf(m, "gtt_page_sizes = 0x%08x\n", vma->gtt_page_sizes);
|
2019-09-10 01:16:46 +08:00
|
|
|
|
2016-10-12 17:05:22 +08:00
|
|
|
err_compression_marker(m);
|
2020-01-10 20:30:56 +08:00
|
|
|
for (page = 0; page < vma->page_count; page++) {
|
2016-10-12 17:05:22 +08:00
|
|
|
int i, len;
|
|
|
|
|
|
|
|
len = PAGE_SIZE;
|
2020-01-10 20:30:56 +08:00
|
|
|
if (page == vma->page_count - 1)
|
|
|
|
len -= vma->unused;
|
2016-10-12 17:05:22 +08:00
|
|
|
len = ascii85_encode_len(len);
|
|
|
|
|
2018-07-25 00:33:19 +08:00
|
|
|
for (i = 0; i < len; i++)
|
2020-01-10 20:30:56 +08:00
|
|
|
err_puts(m, ascii85_encode(vma->pages[page][i], out));
|
2014-02-25 23:11:24 +08:00
|
|
|
}
|
2016-10-12 17:05:22 +08:00
|
|
|
err_puts(m, "\n");
|
2014-02-25 23:11:24 +08:00
|
|
|
}
|
|
|
|
|
2016-08-15 17:48:45 +08:00
|
|
|
static void err_print_capabilities(struct drm_i915_error_state_buf *m,
|
2020-07-08 08:39:47 +08:00
|
|
|
struct i915_gpu_coredump *error)
|
2016-08-15 17:48:45 +08:00
|
|
|
{
|
2017-12-19 19:43:44 +08:00
|
|
|
struct drm_printer p = i915_error_printer(m);
|
|
|
|
|
2020-07-08 08:39:47 +08:00
|
|
|
intel_device_info_print_static(&error->device_info, &p);
|
|
|
|
intel_device_info_print_runtime(&error->runtime_info, &p);
|
|
|
|
intel_driver_caps_print(&error->driver_caps, &p);
|
2016-08-15 17:48:45 +08:00
|
|
|
}
|
|
|
|
|
2017-02-07 05:36:07 +08:00
|
|
|
static void err_print_params(struct drm_i915_error_state_buf *m,
|
2017-12-19 19:43:46 +08:00
|
|
|
const struct i915_params *params)
|
2017-02-07 05:36:07 +08:00
|
|
|
{
|
2017-12-19 19:43:46 +08:00
|
|
|
struct drm_printer p = i915_error_printer(m);
|
|
|
|
|
|
|
|
i915_params_dump(params, &p);
|
2017-02-07 05:36:07 +08:00
|
|
|
}
|
|
|
|
|
2017-02-15 00:46:11 +08:00
|
|
|
static void err_print_pciid(struct drm_i915_error_state_buf *m,
|
|
|
|
struct drm_i915_private *i915)
|
|
|
|
{
|
2021-01-28 21:31:23 +08:00
|
|
|
struct pci_dev *pdev = to_pci_dev(i915->drm.dev);
|
2017-02-15 00:46:11 +08:00
|
|
|
|
|
|
|
err_printf(m, "PCI ID: 0x%04x\n", pdev->device);
|
|
|
|
err_printf(m, "PCI Revision: 0x%02x\n", pdev->revision);
|
|
|
|
err_printf(m, "PCI Subsystem: %04x:%04x\n",
|
|
|
|
pdev->subsystem_vendor,
|
|
|
|
pdev->subsystem_device);
|
|
|
|
}
|
|
|
|
|
2017-10-27 01:36:55 +08:00
|
|
|
static void err_print_uc(struct drm_i915_error_state_buf *m,
|
2020-01-10 20:30:56 +08:00
|
|
|
const struct intel_uc_coredump *error_uc)
|
2017-10-27 01:36:55 +08:00
|
|
|
{
|
|
|
|
struct drm_printer p = i915_error_printer(m);
|
|
|
|
|
|
|
|
intel_uc_fw_dump(&error_uc->guc_fw, &p);
|
|
|
|
intel_uc_fw_dump(&error_uc->huc_fw, &p);
|
2020-01-10 20:30:56 +08:00
|
|
|
print_error_vma(m, NULL, error_uc->guc_log);
|
2017-10-27 01:36:55 +08:00
|
|
|
}
|
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
static void err_free_sgl(struct scatterlist *sgl)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2018-11-23 21:23:25 +08:00
|
|
|
while (sgl) {
|
|
|
|
struct scatterlist *sg;
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
for (sg = sgl; !sg_is_chain(sg); sg++) {
|
|
|
|
kfree(sg_virt(sg));
|
|
|
|
if (sg_is_last(sg))
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
sg = sg_is_last(sg) ? NULL : sg_chain_ptr(sg);
|
|
|
|
free_page((unsigned long)sgl);
|
|
|
|
sgl = sg;
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
2018-11-23 21:23:25 +08:00
|
|
|
}
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2020-07-11 03:32:39 +08:00
|
|
|
static void err_print_gt_info(struct drm_i915_error_state_buf *m,
|
|
|
|
struct intel_gt_coredump *gt)
|
|
|
|
{
|
|
|
|
struct drm_printer p = i915_error_printer(m);
|
|
|
|
|
|
|
|
intel_gt_info_print(>->info, &p);
|
|
|
|
intel_sseu_print_topology(>->info.sseu, &p);
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void err_print_gt(struct drm_i915_error_state_buf *m,
|
|
|
|
struct intel_gt_coredump *gt)
|
|
|
|
{
|
|
|
|
const struct intel_engine_coredump *ee;
|
2020-01-10 20:30:59 +08:00
|
|
|
int i;
|
2020-01-10 20:30:56 +08:00
|
|
|
|
|
|
|
err_printf(m, "GT awake: %s\n", yesno(gt->awake));
|
|
|
|
err_printf(m, "EIR: 0x%08x\n", gt->eir);
|
|
|
|
err_printf(m, "IER: 0x%08x\n", gt->ier);
|
|
|
|
for (i = 0; i < gt->ngtier; i++)
|
|
|
|
err_printf(m, "GTIER[%d]: 0x%08x\n", i, gt->gtier[i]);
|
|
|
|
err_printf(m, "PGTBL_ER: 0x%08x\n", gt->pgtbl_er);
|
|
|
|
err_printf(m, "FORCEWAKE: 0x%08x\n", gt->forcewake);
|
|
|
|
err_printf(m, "DERRMR: 0x%08x\n", gt->derrmr);
|
|
|
|
|
|
|
|
for (i = 0; i < gt->nfence; i++)
|
|
|
|
err_printf(m, " fence[%d] = %08llx\n", i, gt->fence[i]);
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (IS_GRAPHICS_VER(m->i915, 6, 11)) {
|
2020-01-10 20:30:56 +08:00
|
|
|
err_printf(m, "ERROR: 0x%08x\n", gt->error);
|
|
|
|
err_printf(m, "DONE_REG: 0x%08x\n", gt->done_reg);
|
|
|
|
}
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(m->i915) >= 8)
|
2020-01-10 20:30:56 +08:00
|
|
|
err_printf(m, "FAULT_TLB_DATA: 0x%08x 0x%08x\n",
|
|
|
|
gt->fault_data1, gt->fault_data0);
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(m->i915) == 7)
|
2020-01-10 20:30:56 +08:00
|
|
|
err_printf(m, "ERR_INT: 0x%08x\n", gt->err_int);
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (IS_GRAPHICS_VER(m->i915, 8, 11))
|
2020-01-10 20:30:56 +08:00
|
|
|
err_printf(m, "GTT_CACHE_EN: 0x%08x\n", gt->gtt_cache);
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(m->i915) == 12)
|
2020-01-10 20:30:56 +08:00
|
|
|
err_printf(m, "AUX_ERR_DBG: 0x%08x\n", gt->aux_err);
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(m->i915) >= 12) {
|
2020-01-10 20:30:56 +08:00
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < GEN12_SFC_DONE_MAX; i++)
|
|
|
|
err_printf(m, " SFC_DONE[%d]: 0x%08x\n", i,
|
|
|
|
gt->sfc_done[i]);
|
|
|
|
|
|
|
|
err_printf(m, " GAM_DONE: 0x%08x\n", gt->gam_done);
|
|
|
|
}
|
|
|
|
|
|
|
|
for (ee = gt->engine; ee; ee = ee->next) {
|
|
|
|
const struct i915_vma_coredump *vma;
|
|
|
|
|
|
|
|
error_print_engine(m, ee);
|
|
|
|
for (vma = ee->vma; vma; vma = vma->next)
|
|
|
|
print_error_vma(m, ee->engine, vma);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (gt->uc)
|
|
|
|
err_print_uc(m, gt->uc);
|
2020-07-11 03:32:39 +08:00
|
|
|
|
|
|
|
err_print_gt_info(m, gt);
|
2020-01-10 20:30:56 +08:00
|
|
|
}
|
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
static void __err_print_to_sgl(struct drm_i915_error_state_buf *m,
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_gpu_coredump *error)
|
2018-11-23 21:23:25 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
const struct intel_engine_coredump *ee;
|
2018-11-23 21:23:25 +08:00
|
|
|
struct timespec64 ts;
|
2018-11-03 00:12:12 +08:00
|
|
|
|
2017-02-15 00:46:11 +08:00
|
|
|
if (*error->error_msg)
|
|
|
|
err_printf(m, "%s\n", error->error_msg);
|
2019-01-03 18:12:45 +08:00
|
|
|
err_printf(m, "Kernel: %s %s\n",
|
|
|
|
init_utsname()->release,
|
|
|
|
init_utsname()->machine);
|
2019-08-07 19:38:27 +08:00
|
|
|
err_printf(m, "Driver: %s\n", DRIVER_DATE);
|
2018-01-17 23:48:53 +08:00
|
|
|
ts = ktime_to_timespec64(error->time);
|
|
|
|
err_printf(m, "Time: %lld s %ld us\n",
|
|
|
|
(s64)ts.tv_sec, ts.tv_nsec / NSEC_PER_USEC);
|
|
|
|
ts = ktime_to_timespec64(error->boottime);
|
|
|
|
err_printf(m, "Boottime: %lld s %ld us\n",
|
|
|
|
(s64)ts.tv_sec, ts.tv_nsec / NSEC_PER_USEC);
|
|
|
|
ts = ktime_to_timespec64(error->uptime);
|
|
|
|
err_printf(m, "Uptime: %lld s %ld us\n",
|
|
|
|
(s64)ts.tv_sec, ts.tv_nsec / NSEC_PER_USEC);
|
2019-10-23 21:31:08 +08:00
|
|
|
err_printf(m, "Capture: %lu jiffies; %d ms ago\n",
|
|
|
|
error->capture, jiffies_to_msecs(jiffies - error->capture));
|
2016-11-18 21:09:04 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
for (ee = error->gt ? error->gt->engine : NULL; ee; ee = ee->next)
|
drm/i915: Use time based guilty context banning
Currently, we accumulate each time a context hangs the GPU, offset
against the number of requests it submits, and if that score exceeds a
certain threshold, we ban that context from submitting any more requests
(cancelling any work in flight). In contrast, we use a simple timer on
the file, that if we see more than a 9 hangs faster than 60s apart in
total across all of its contexts, we will ban the client from creating
any more contexts. This leads to a confusing situation where the file
may be banned before the context, so lets use a simple timer scheme for
each.
If the context submits 3 hanging requests within a 120s period, declare
it forbidden to ever send more requests.
This has the advantage of not being easy to repair by simply sending
empty requests, but has the disadvantage that if the context is idle
then it is forgiven. However, if the context is idle, it is not
disrupting the system, but a hog can evade the request counting and
cause much more severe disruption to the system.
Updating ban_score from request retirement is dubious as the retirement
is purposely not in sync with request submission (i.e. we try and batch
retirement to reduce overhead and avoid latency on submission), which
leads to surprising situations where we can forgive a hang immediately
due to a backlog of requests from before the hang being retired
afterwards.
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Mika Kuoppala <mika.kuoppala@intel.com>
Reviewed-by: Mika Kuoppala <mika.kuoppala@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20190219122215.8941-2-chris@chris-wilson.co.uk
2019-02-19 20:21:52 +08:00
|
|
|
err_printf(m, "Active process (on ring %s): %s [%d]\n",
|
2019-08-08 22:45:11 +08:00
|
|
|
ee->engine->name,
|
|
|
|
ee->context.comm,
|
|
|
|
ee->context.pid);
|
|
|
|
|
2014-02-25 23:11:27 +08:00
|
|
|
err_printf(m, "Reset count: %u\n", error->reset_count);
|
2014-02-25 23:11:28 +08:00
|
|
|
err_printf(m, "Suspend count: %u\n", error->suspend_count);
|
2016-12-01 20:49:55 +08:00
|
|
|
err_printf(m, "Platform: %s\n", intel_platform_name(error->device_info.platform));
|
2019-03-27 22:23:28 +08:00
|
|
|
err_printf(m, "Subplatform: 0x%x\n",
|
|
|
|
intel_subplatform(&error->runtime_info,
|
|
|
|
error->device_info.platform));
|
2018-11-23 21:23:25 +08:00
|
|
|
err_print_pciid(m, m->i915);
|
2017-02-07 05:36:07 +08:00
|
|
|
|
2015-08-08 03:24:15 +08:00
|
|
|
err_printf(m, "IOMMU enabled?: %d\n", error->iommu);
|
2015-10-29 21:21:19 +08:00
|
|
|
|
2021-05-19 05:34:41 +08:00
|
|
|
if (HAS_DMC(m->i915)) {
|
2021-05-19 05:34:40 +08:00
|
|
|
struct intel_dmc *dmc = &m->i915->dmc;
|
2015-10-29 21:21:19 +08:00
|
|
|
|
|
|
|
err_printf(m, "DMC loaded: %s\n",
|
2021-05-27 06:02:55 +08:00
|
|
|
yesno(intel_dmc_has_payload(m->i915) != 0));
|
2015-10-29 21:21:19 +08:00
|
|
|
err_printf(m, "DMC fw version: %d.%d\n",
|
2021-05-19 05:34:42 +08:00
|
|
|
DMC_VERSION_MAJOR(dmc->version),
|
|
|
|
DMC_VERSION_MINOR(dmc->version));
|
2015-10-29 21:21:19 +08:00
|
|
|
}
|
|
|
|
|
2017-03-02 23:15:44 +08:00
|
|
|
err_printf(m, "RPM wakelock: %s\n", yesno(error->wakelock));
|
|
|
|
err_printf(m, "PM suspended: %s\n", yesno(error->suspended));
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (error->gt)
|
|
|
|
err_print_gt(m, error->gt);
|
2013-07-12 21:50:57 +08:00
|
|
|
|
|
|
|
if (error->overlay)
|
|
|
|
intel_overlay_print_error_state(m, error->overlay);
|
|
|
|
|
2020-07-08 08:39:47 +08:00
|
|
|
err_print_capabilities(m, error);
|
2017-02-07 05:36:07 +08:00
|
|
|
err_print_params(m, &error->params);
|
2018-11-23 21:23:25 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static int err_print_to_sgl(struct i915_gpu_coredump *error)
|
2018-11-23 21:23:25 +08:00
|
|
|
{
|
|
|
|
struct drm_i915_error_state_buf m;
|
|
|
|
|
|
|
|
if (IS_ERR(error))
|
|
|
|
return PTR_ERR(error);
|
|
|
|
|
|
|
|
if (READ_ONCE(error->sgl))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
memset(&m, 0, sizeof(m));
|
|
|
|
m.i915 = error->i915;
|
|
|
|
|
|
|
|
__err_print_to_sgl(&m, error);
|
|
|
|
|
|
|
|
if (m.buf) {
|
|
|
|
__sg_set_buf(m.cur++, m.buf, m.bytes, m.iter);
|
|
|
|
m.bytes = 0;
|
|
|
|
m.buf = NULL;
|
|
|
|
}
|
|
|
|
if (m.cur) {
|
|
|
|
GEM_BUG_ON(m.end < m.cur);
|
|
|
|
sg_mark_end(m.cur - 1);
|
|
|
|
}
|
|
|
|
GEM_BUG_ON(m.sgl && !m.cur);
|
|
|
|
|
|
|
|
if (m.err) {
|
|
|
|
err_free_sgl(m.sgl);
|
|
|
|
return m.err;
|
|
|
|
}
|
2017-02-07 05:36:07 +08:00
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
if (cmpxchg(&error->sgl, NULL, m.sgl))
|
|
|
|
err_free_sgl(m.sgl);
|
2013-07-12 21:50:57 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/*
 * Copy up to @rem bytes of the textual coredump, starting at byte offset
 * @off, into @buf.
 *
 * The text is rendered on first use via err_print_to_sgl(). Returns the
 * number of bytes copied, 0 when there is no coredump, nothing requested or
 * nothing rendered, or the error returned by err_print_to_sgl().
 *
 * error->fit remembers the scatterlist entry at which a previous call ran
 * out of room; it is used as the starting point when @off is not before that
 * entry's dma_address. NOTE(review): dma_address appears to be used here as
 * the entry's starting offset within the text - confirm against the code
 * that builds the list.
 */
ssize_t i915_gpu_coredump_copy_to_buffer(struct i915_gpu_coredump *error,
					 char *buf, loff_t off, size_t rem)
{
	struct scatterlist *sg;
	size_t copied = 0;
	loff_t pos;
	int ret;

	if (!error || !rem)
		return 0;

	ret = err_print_to_sgl(error);
	if (ret)
		return ret;

	sg = READ_ONCE(error->fit);
	if (!sg || off < sg->dma_address)
		sg = error->sgl;
	if (!sg)
		return 0;

	pos = sg->dma_address;
	do {
		size_t chunk, src_off;

		/* Follow a chain entry through to the next table. */
		if (sg_is_chain(sg)) {
			sg = sg_chain_ptr(sg);
			GEM_BUG_ON(sg_is_chain(sg));
		}

		chunk = sg->length;
		if (pos + chunk <= off) {
			/* Entirely before the requested offset: skip it. */
			pos += chunk;
			continue;
		}

		src_off = sg->offset;
		if (pos < off) {
			/* The request starts part-way into this entry. */
			GEM_BUG_ON(off - pos > chunk);
			chunk -= off - pos;
			src_off += off - pos;
			pos = off;
		}

		chunk = min(chunk, rem);
		GEM_BUG_ON(!chunk || chunk > sg->length);

		memcpy(buf, page_address(sg_page(sg)) + src_off, chunk);

		copied += chunk;
		pos += chunk;

		buf += chunk;
		rem -= chunk;
		if (!rem) {
			/* Remember where we stopped for the next call. */
			WRITE_ONCE(error->fit, sg);
			break;
		}
	} while (!sg_is_last(sg++));

	return copied;
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void i915_vma_coredump_free(struct i915_vma_coredump *vma)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
while (vma) {
|
|
|
|
struct i915_vma_coredump *next = vma->next;
|
|
|
|
int page;
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
for (page = 0; page < vma->page_count; page++)
|
|
|
|
free_page((unsigned long)vma->pages[page]);
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
kfree(vma);
|
|
|
|
vma = next;
|
|
|
|
}
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void cleanup_params(struct i915_gpu_coredump *error)
|
2017-10-27 01:36:57 +08:00
|
|
|
{
|
2018-12-27 22:33:38 +08:00
|
|
|
i915_params_free(&error->params);
|
2017-10-27 01:36:57 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void cleanup_uc(struct intel_uc_coredump *uc)
|
2017-10-27 01:36:55 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
kfree(uc->guc_fw.path);
|
|
|
|
kfree(uc->huc_fw.path);
|
|
|
|
i915_vma_coredump_free(uc->guc_log);
|
2017-10-27 01:36:55 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
kfree(uc);
|
2017-10-27 01:36:55 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void cleanup_gt(struct intel_gt_coredump *gt)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
while (gt->engine) {
|
|
|
|
struct intel_engine_coredump *ee = gt->engine;
|
|
|
|
|
|
|
|
gt->engine = ee->next;
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
i915_vma_coredump_free(ee->vma);
|
|
|
|
kfree(ee);
|
|
|
|
}
|
2016-07-27 16:07:28 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (gt->uc)
|
|
|
|
cleanup_uc(gt->uc);
|
2019-08-08 22:45:11 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
kfree(gt);
|
|
|
|
}
|
2017-04-15 17:39:02 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
void __i915_gpu_coredump_free(struct kref *error_ref)
|
|
|
|
{
|
|
|
|
struct i915_gpu_coredump *error =
|
|
|
|
container_of(error_ref, typeof(*error), ref);
|
2016-07-27 16:07:28 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
while (error->gt) {
|
|
|
|
struct intel_gt_coredump *gt = error->gt;
|
|
|
|
|
|
|
|
error->gt = gt->next;
|
|
|
|
cleanup_gt(gt);
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
kfree(error->overlay);
|
2017-02-22 00:26:19 +08:00
|
|
|
|
2017-10-27 01:36:57 +08:00
|
|
|
cleanup_params(error);
|
2017-10-27 01:36:55 +08:00
|
|
|
|
2018-11-23 21:23:25 +08:00
|
|
|
err_free_sgl(error->sgl);
|
2013-07-12 21:50:57 +08:00
|
|
|
kfree(error);
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static struct i915_vma_coredump *
|
|
|
|
i915_vma_coredump_create(const struct intel_gt *gt,
|
|
|
|
const struct i915_vma *vma,
|
|
|
|
const char *name,
|
|
|
|
struct i915_vma_compress *compress)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_ggtt *ggtt = gt->ggtt;
|
2016-10-12 17:05:20 +08:00
|
|
|
const u64 slot = ggtt->error_capture.start;
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_vma_coredump *dst;
|
2016-10-12 17:05:20 +08:00
|
|
|
unsigned long num_pages;
|
|
|
|
struct sgt_iter iter;
|
2018-10-03 16:24:22 +08:00
|
|
|
int ret;
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2019-07-26 06:38:43 +08:00
|
|
|
might_sleep();
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (!vma || !vma->pages || !compress)
|
2016-08-15 17:49:06 +08:00
|
|
|
return NULL;
|
|
|
|
|
2016-10-12 17:05:20 +08:00
|
|
|
num_pages = min_t(u64, vma->size, vma->obj->base.size) >> PAGE_SHIFT;
|
2016-10-12 17:05:22 +08:00
|
|
|
num_pages = DIV_ROUND_UP(10 * num_pages, 8); /* worstcase zlib growth */
|
2019-07-26 06:38:43 +08:00
|
|
|
dst = kmalloc(sizeof(*dst) + num_pages * sizeof(u32 *), ALLOW_FAIL);
|
2016-08-15 17:49:06 +08:00
|
|
|
if (!dst)
|
2013-07-12 21:50:57 +08:00
|
|
|
return NULL;
|
|
|
|
|
2019-07-23 06:28:47 +08:00
|
|
|
if (!compress_start(compress)) {
|
|
|
|
kfree(dst);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
strcpy(dst->name, name);
|
|
|
|
dst->next = NULL;
|
|
|
|
|
2016-08-15 17:49:09 +08:00
|
|
|
dst->gtt_offset = vma->node.start;
|
|
|
|
dst->gtt_size = vma->node.size;
|
2019-09-10 01:16:46 +08:00
|
|
|
dst->gtt_page_sizes = vma->page_sizes.gtt;
|
2018-10-03 16:24:22 +08:00
|
|
|
dst->num_pages = num_pages;
|
2016-10-12 17:05:20 +08:00
|
|
|
dst->page_count = 0;
|
2016-10-12 17:05:22 +08:00
|
|
|
dst->unused = 0;
|
|
|
|
|
2018-10-03 16:24:22 +08:00
|
|
|
ret = -EINVAL;
|
2019-10-29 17:58:53 +08:00
|
|
|
if (drm_mm_node_allocated(&ggtt->error_capture)) {
|
2016-10-12 17:05:20 +08:00
|
|
|
void __iomem *s;
|
2019-10-29 17:58:53 +08:00
|
|
|
dma_addr_t dma;
|
2014-08-13 03:05:48 +08:00
|
|
|
|
2019-10-29 17:58:53 +08:00
|
|
|
for_each_sgt_daddr(dma, iter, vma->pages) {
|
2020-09-16 17:00:59 +08:00
|
|
|
mutex_lock(&ggtt->error_mutex);
|
2019-10-29 17:58:53 +08:00
|
|
|
ggtt->vm.insert_page(&ggtt->vm, dma, slot,
|
|
|
|
I915_CACHE_NONE, 0);
|
2020-01-10 20:30:56 +08:00
|
|
|
mb();
|
2014-08-13 03:05:48 +08:00
|
|
|
|
2019-10-29 17:58:53 +08:00
|
|
|
s = io_mapping_map_wc(&ggtt->iomap, slot, PAGE_SIZE);
|
2020-01-10 20:30:56 +08:00
|
|
|
ret = compress_page(compress,
|
|
|
|
(void __force *)s, dst,
|
|
|
|
true);
|
2019-10-29 17:58:53 +08:00
|
|
|
io_mapping_unmap(s);
|
2020-09-16 17:00:59 +08:00
|
|
|
|
|
|
|
mb();
|
|
|
|
ggtt->vm.clear_range(&ggtt->vm, slot, PAGE_SIZE);
|
|
|
|
mutex_unlock(&ggtt->error_mutex);
|
2019-10-29 17:58:53 +08:00
|
|
|
if (ret)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} else if (i915_gem_object_is_lmem(vma->obj)) {
|
|
|
|
struct intel_memory_region *mem = vma->obj->mm.region;
|
|
|
|
dma_addr_t dma;
|
|
|
|
|
|
|
|
for_each_sgt_daddr(dma, iter, vma->pages) {
|
|
|
|
void __iomem *s;
|
|
|
|
|
2021-01-19 21:31:04 +08:00
|
|
|
s = io_mapping_map_wc(&mem->iomap,
|
|
|
|
dma - mem->region.start,
|
|
|
|
PAGE_SIZE);
|
2020-01-10 20:30:56 +08:00
|
|
|
ret = compress_page(compress,
|
|
|
|
(void __force *)s, dst,
|
|
|
|
true);
|
2019-11-14 07:11:04 +08:00
|
|
|
io_mapping_unmap(s);
|
2019-10-29 17:58:53 +08:00
|
|
|
if (ret)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
struct page *page;
|
|
|
|
|
|
|
|
for_each_sgt_page(page, iter, vma->pages) {
|
|
|
|
void *s;
|
|
|
|
|
|
|
|
drm_clflush_pages(&page, 1);
|
|
|
|
|
2019-11-14 07:11:04 +08:00
|
|
|
s = kmap(page);
|
2020-01-10 20:30:56 +08:00
|
|
|
ret = compress_page(compress, s, dst, false);
|
2019-11-25 17:14:09 +08:00
|
|
|
kunmap(page);
|
2019-10-29 17:58:53 +08:00
|
|
|
|
|
|
|
drm_clflush_pages(&page, 1);
|
|
|
|
|
|
|
|
if (ret)
|
|
|
|
break;
|
|
|
|
}
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
2019-07-23 06:28:47 +08:00
|
|
|
if (ret || compress_flush(compress, dst)) {
|
2018-10-03 16:24:22 +08:00
|
|
|
while (dst->page_count--)
|
2019-07-23 06:28:47 +08:00
|
|
|
pool_free(&compress->pool, dst->pages[dst->page_count]);
|
2018-10-03 16:24:22 +08:00
|
|
|
kfree(dst);
|
|
|
|
dst = NULL;
|
|
|
|
}
|
2019-07-23 06:28:47 +08:00
|
|
|
compress_finish(compress);
|
2016-10-12 17:05:20 +08:00
|
|
|
|
|
|
|
return dst;
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void gt_record_fences(struct intel_gt_coredump *gt)
|
2014-02-04 20:18:55 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_ggtt *ggtt = gt->_gt->ggtt;
|
|
|
|
struct intel_uncore *uncore = gt->_gt->uncore;
|
2013-07-12 21:50:57 +08:00
|
|
|
int i;
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(uncore->i915) >= 6) {
|
2020-01-10 20:30:56 +08:00
|
|
|
for (i = 0; i < ggtt->num_fences; i++)
|
|
|
|
gt->fence[i] =
|
2019-06-10 20:06:06 +08:00
|
|
|
intel_uncore_read64(uncore,
|
|
|
|
FENCE_REG_GEN6_LO(i));
|
2021-06-06 12:50:49 +08:00
|
|
|
} else if (GRAPHICS_VER(uncore->i915) >= 4) {
|
2020-01-10 20:30:56 +08:00
|
|
|
for (i = 0; i < ggtt->num_fences; i++)
|
|
|
|
gt->fence[i] =
|
2019-06-10 20:06:06 +08:00
|
|
|
intel_uncore_read64(uncore,
|
|
|
|
FENCE_REG_965_LO(i));
|
2017-02-15 00:46:11 +08:00
|
|
|
} else {
|
2020-01-10 20:30:56 +08:00
|
|
|
for (i = 0; i < ggtt->num_fences; i++)
|
|
|
|
gt->fence[i] =
|
2019-06-10 20:06:06 +08:00
|
|
|
intel_uncore_read(uncore, FENCE_REG(i));
|
2015-09-21 23:05:14 +08:00
|
|
|
}
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->nfence = i;
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void engine_record_registers(struct intel_engine_coredump *ee)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
const struct intel_engine_cs *engine = ee->engine;
|
|
|
|
struct drm_i915_private *i915 = engine->i915;
|
2016-07-27 16:07:28 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) >= 6) {
|
2019-03-26 05:49:40 +08:00
|
|
|
ee->rc_psmi = ENGINE_READ(engine, RING_PSMI_CTL);
|
2019-07-31 02:04:03 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) >= 12)
|
2020-01-10 20:30:56 +08:00
|
|
|
ee->fault_reg = intel_uncore_read(engine->uncore,
|
|
|
|
GEN12_RING_FAULT_REG);
|
2021-06-06 12:50:49 +08:00
|
|
|
else if (GRAPHICS_VER(i915) >= 8)
|
2020-01-10 20:30:56 +08:00
|
|
|
ee->fault_reg = intel_uncore_read(engine->uncore,
|
|
|
|
GEN8_RING_FAULT_REG);
|
2019-03-05 23:09:14 +08:00
|
|
|
else
|
2019-06-07 18:15:35 +08:00
|
|
|
ee->fault_reg = GEN6_RING_FAULT_REG_READ(engine);
|
2013-08-13 07:53:04 +08:00
|
|
|
}
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) >= 4) {
|
2020-01-29 04:43:15 +08:00
|
|
|
ee->esr = ENGINE_READ(engine, RING_ESR);
|
2019-03-26 05:49:40 +08:00
|
|
|
ee->faddr = ENGINE_READ(engine, RING_DMA_FADD);
|
|
|
|
ee->ipeir = ENGINE_READ(engine, RING_IPEIR);
|
|
|
|
ee->ipehr = ENGINE_READ(engine, RING_IPEHR);
|
|
|
|
ee->instps = ENGINE_READ(engine, RING_INSTPS);
|
|
|
|
ee->bbaddr = ENGINE_READ(engine, RING_BBADDR);
|
2020-01-10 20:30:56 +08:00
|
|
|
ee->ccid = ENGINE_READ(engine, CCID);
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) >= 8) {
|
2019-03-26 05:49:40 +08:00
|
|
|
ee->faddr |= (u64)ENGINE_READ(engine, RING_DMA_FADD_UDW) << 32;
|
|
|
|
ee->bbaddr |= (u64)ENGINE_READ(engine, RING_BBADDR_UDW) << 32;
|
2014-04-02 07:31:07 +08:00
|
|
|
}
|
2019-03-26 05:49:40 +08:00
|
|
|
ee->bbstate = ENGINE_READ(engine, RING_BBSTATE);
|
2013-07-12 21:50:57 +08:00
|
|
|
} else {
|
2019-03-26 05:49:40 +08:00
|
|
|
ee->faddr = ENGINE_READ(engine, DMA_FADD_I8XX);
|
|
|
|
ee->ipeir = ENGINE_READ(engine, IPEIR);
|
|
|
|
ee->ipehr = ENGINE_READ(engine, IPEHR);
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
2016-10-12 17:05:17 +08:00
|
|
|
intel_engine_get_instdone(engine, &ee->instdone);
|
2016-09-20 21:54:32 +08:00
|
|
|
|
2019-03-26 05:49:40 +08:00
|
|
|
ee->instpm = ENGINE_READ(engine, RING_INSTPM);
|
2016-08-03 05:50:21 +08:00
|
|
|
ee->acthd = intel_engine_get_active_head(engine);
|
2019-03-26 05:49:40 +08:00
|
|
|
ee->start = ENGINE_READ(engine, RING_START);
|
|
|
|
ee->head = ENGINE_READ(engine, RING_HEAD);
|
|
|
|
ee->tail = ENGINE_READ(engine, RING_TAIL);
|
|
|
|
ee->ctl = ENGINE_READ(engine, RING_CTL);
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) > 2)
|
2019-03-26 05:49:40 +08:00
|
|
|
ee->mode = ENGINE_READ(engine, RING_MI_MODE);
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (!HWS_NEEDS_PHYSICAL(i915)) {
|
drm/i915: Type safe register read/write
Make I915_READ and I915_WRITE more type safe by wrapping the register
offset in a struct. This should eliminate most of the fumbles we've had
with misplaced parens.
This only takes care of normal mmio registers. We could extend the idea
to other register types and define each with its own struct. That way
you wouldn't be able to accidentally pass the wrong thing to a specific
register access function.
The gpio_reg setup is probably the ugliest thing left. But I figure I'd
just leave it for now, and wait for some divine inspiration to strike
before making it nice.
As for the generated code, it's actually a bit better sometimes. Eg.
looking at i915_irq_handler(), we can see the following change:
lea 0x70024(%rdx,%rax,1),%r9d
mov $0x1,%edx
- movslq %r9d,%r9
- mov %r9,%rsi
- mov %r9,-0x58(%rbp)
- callq *0xd8(%rbx)
+ mov %r9d,%esi
+ mov %r9d,-0x48(%rbp)
callq *0xd8(%rbx)
So previously gcc thought the register offset might be signed and
decided to sign extend it, just in case. The rest appears to be
mostly just minor shuffling of instructions.
v2: i915_mmio_reg_{offset,equal,valid}() helpers added
s/_REG/_MMIO/ in the register defines
mo more switch statements left to worry about
ring_emit stuff got sorted in a prep patch
cmd parser, lrc context and w/a batch buildup also in prep patch
vgpu stuff cleaned up and moved to a prep patch
all other unrelated changes split out
v3: Rebased due to BXT DSI/BLC, MOCS, etc.
v4: Rebased due to churn, s/i915_mmio_reg_t/i915_reg_t/
Signed-off-by: Ville Syrjälä <ville.syrjala@linux.intel.com>
Reviewed-by: Chris Wilson <chris@chris-wilson.co.uk>
Link: http://patchwork.freedesktop.org/patch/msgid/1447853606-2751-1-git-send-email-ville.syrjala@linux.intel.com
2015-11-18 21:33:26 +08:00
|
|
|
i915_reg_t mmio;
|
2014-01-24 06:40:36 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) == 7) {
|
2016-03-16 19:00:37 +08:00
|
|
|
switch (engine->id) {
|
2014-01-24 06:40:36 +08:00
|
|
|
default:
|
2019-03-06 02:03:30 +08:00
|
|
|
MISSING_CASE(engine->id);
|
2020-08-24 06:36:59 +08:00
|
|
|
fallthrough;
|
2019-03-06 02:03:30 +08:00
|
|
|
case RCS0:
|
2014-01-24 06:40:36 +08:00
|
|
|
mmio = RENDER_HWS_PGA_GEN7;
|
|
|
|
break;
|
2019-03-06 02:03:30 +08:00
|
|
|
case BCS0:
|
2014-01-24 06:40:36 +08:00
|
|
|
mmio = BLT_HWS_PGA_GEN7;
|
|
|
|
break;
|
2019-03-06 02:03:30 +08:00
|
|
|
case VCS0:
|
2014-01-24 06:40:36 +08:00
|
|
|
mmio = BSD_HWS_PGA_GEN7;
|
|
|
|
break;
|
2019-03-06 02:03:30 +08:00
|
|
|
case VECS0:
|
2014-01-24 06:40:36 +08:00
|
|
|
mmio = VEBOX_HWS_PGA_GEN7;
|
|
|
|
break;
|
|
|
|
}
|
2021-06-06 12:50:49 +08:00
|
|
|
} else if (GRAPHICS_VER(engine->i915) == 6) {
|
2016-03-16 19:00:37 +08:00
|
|
|
mmio = RING_HWS_PGA_GEN6(engine->mmio_base);
|
2014-01-24 06:40:36 +08:00
|
|
|
} else {
|
|
|
|
/* XXX: gen8 returns to sanity */
|
2016-03-16 19:00:37 +08:00
|
|
|
mmio = RING_HWS_PGA(engine->mmio_base);
|
2014-01-24 06:40:36 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
ee->hws = intel_uncore_read(engine->uncore, mmio);
|
2014-01-24 06:40:36 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
ee->reset_count = i915_reset_engine_count(&i915->gpu_error, engine);
|
2014-01-30 16:19:40 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (HAS_PPGTT(i915)) {
|
2014-01-30 16:19:40 +08:00
|
|
|
int i;
|
|
|
|
|
2019-06-07 16:45:20 +08:00
|
|
|
ee->vm_info.gfx_mode = ENGINE_READ(engine, RING_MODE_GEN7);
|
2014-01-30 16:19:40 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) == 6) {
|
2016-07-27 16:07:28 +08:00
|
|
|
ee->vm_info.pp_dir_base =
|
2019-03-26 05:49:40 +08:00
|
|
|
ENGINE_READ(engine, RING_PP_DIR_BASE_READ);
|
2021-06-06 12:50:49 +08:00
|
|
|
} else if (GRAPHICS_VER(i915) == 7) {
|
2016-07-27 16:07:28 +08:00
|
|
|
ee->vm_info.pp_dir_base =
|
2019-04-05 20:38:31 +08:00
|
|
|
ENGINE_READ(engine, RING_PP_DIR_BASE);
|
2021-06-06 12:50:49 +08:00
|
|
|
} else if (GRAPHICS_VER(i915) >= 8) {
|
2019-04-05 20:38:31 +08:00
|
|
|
u32 base = engine->mmio_base;
|
|
|
|
|
2014-01-30 16:19:40 +08:00
|
|
|
for (i = 0; i < 4; i++) {
|
2016-07-27 16:07:28 +08:00
|
|
|
ee->vm_info.pdp[i] =
|
2020-01-10 20:30:56 +08:00
|
|
|
intel_uncore_read(engine->uncore,
|
|
|
|
GEN8_RING_PDP_UDW(base, i));
|
2016-07-27 16:07:28 +08:00
|
|
|
ee->vm_info.pdp[i] <<= 32;
|
|
|
|
ee->vm_info.pdp[i] |=
|
2020-01-10 20:30:56 +08:00
|
|
|
intel_uncore_read(engine->uncore,
|
|
|
|
GEN8_RING_PDP_LDW(base, i));
|
2014-01-30 16:19:40 +08:00
|
|
|
}
|
2019-04-05 20:38:31 +08:00
|
|
|
}
|
2014-01-30 16:19:40 +08:00
|
|
|
}
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
drm/i915/execlists: Preempt-to-busy
When using a global seqno, we required a precise stop-the-world event to
handle preemption and unwind the global seqno counter. To accomplish
this, we would preempt to a special out-of-band context and wait for the
machine to report that it was idle. Given an idle machine, we could very
precisely see which requests had completed and which we needed to feed
back into the run queue.
However, now that we have scrapped the global seqno, we no longer need
to precisely unwind the global counter and only track requests by their
per-context seqno. This allows us to loosely unwind inflight requests
while scheduling a preemption, with the enormous caveat that the
requests we put back on the run queue are still _inflight_ (until the
preemption request is complete). This makes request tracking much more
messy, as at any point then we can see a completed request that we
believe is not currently scheduled for execution. We also have to be
careful not to rewind RING_TAIL past RING_HEAD on preempting to the
running context, and for this we use a semaphore to prevent completion
of the request before continuing.
To accomplish this feat, we change how we track requests scheduled to
the HW. Instead of appending our requests onto a single list as we
submit, we track each submission to ELSP as its own block. Then upon
receiving the CS preemption event, we promote the pending block to the
inflight block (discarding what was previously being tracked). As normal
CS completion events arrive, we then remove stale entries from the
inflight tracker.
v2: Be a tinge paranoid and ensure we flush the write into the HWS page
for the GPU semaphore to pick in a timely fashion.
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Reviewed-by: Mika Kuoppala <mika.kuoppala@linux.intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20190620142052.19311-1-chris@chris-wilson.co.uk
2019-06-20 22:20:51 +08:00
|
|
|
static void record_request(const struct i915_request *request,
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_request_coredump *erq)
|
2016-10-13 18:18:14 +08:00
|
|
|
{
|
drm/i915: Replace global breadcrumbs with per-context interrupt tracking
A few years ago, see commit 688e6c725816 ("drm/i915: Slaughter the
thundering i915_wait_request herd"), the issue of handling multiple
clients waiting in parallel was brought to our attention. The
requirement was that every client should be woken immediately upon its
request being signaled, without incurring any cpu overhead.
To handle certain fragility of our hw meant that we could not do a
simple check inside the irq handler (some generations required almost
unbounded delays before we could be sure of seqno coherency) and so
request completion checking required delegation.
Before commit 688e6c725816, the solution was simple. Every client
waiting on a request would be woken on every interrupt and each would do
a heavyweight check to see if their request was complete. Commit
688e6c725816 introduced an rbtree so that only the earliest waiter on
the global timeline would woken, and would wake the next and so on.
(Along with various complications to handle requests being reordered
along the global timeline, and also a requirement for kthread to provide
a delegate for fence signaling that had no process context.)
The global rbtree depends on knowing the execution timeline (and global
seqno). Without knowing that order, we must instead check all contexts
queued to the HW to see which may have advanced. We trim that list by
only checking queued contexts that are being waited on, but still we
keep a list of all active contexts and their active signalers that we
inspect from inside the irq handler. By moving the waiters onto the fence
signal list, we can combine the client wakeup with the dma_fence
signaling (a dramatic reduction in complexity, but does require the HW
being coherent, the seqno must be visible from the cpu before the
interrupt is raised - we keep a timer backup just in case).
Having previously fixed all the issues with irq-seqno serialisation (by
inserting delays onto the GPU after each request instead of random delays
on the CPU after each interrupt), we can rely on the seqno state to
perfom direct wakeups from the interrupt handler. This allows us to
preserve our single context switch behaviour of the current routine,
with the only downside that we lose the RT priority sorting of wakeups.
In general, direct wakeup latency of multiple clients is about the same
(about 10% better in most cases) with a reduction in total CPU time spent
in the waiter (about 20-50% depending on gen). Average herd behaviour is
improved, but at the cost of not delegating wakeups on task_prio.
v2: Capture fence signaling state for error state and add comments to
warm even the most cold of hearts.
v3: Check if the request is still active before busywaiting
v4: Reduce the amount of pointer misdirection with list_for_each_safe
and using a local i915_request variable inside the loops
v5: Add a missing pluralisation to a purely informative selftest message.
References: 688e6c725816 ("drm/i915: Slaughter the thundering i915_wait_request herd")
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Reviewed-by: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20190129205230.19056-2-chris@chris-wilson.co.uk
2019-01-30 04:52:29 +08:00
|
|
|
erq->flags = request->fence.flags;
|
2019-02-26 17:49:21 +08:00
|
|
|
erq->context = request->fence.context;
|
|
|
|
erq->seqno = request->fence.seqno;
|
2018-04-19 02:40:52 +08:00
|
|
|
erq->sched_attr = request->sched.attr;
|
2016-10-13 18:18:14 +08:00
|
|
|
erq->head = request->head;
|
|
|
|
erq->tail = request->tail;
|
2019-12-23 07:35:58 +08:00
|
|
|
|
|
|
|
erq->pid = 0;
|
|
|
|
rcu_read_lock();
|
2020-04-28 17:02:55 +08:00
|
|
|
if (!intel_context_is_closed(request->context)) {
|
|
|
|
const struct i915_gem_context *ctx;
|
|
|
|
|
|
|
|
ctx = rcu_dereference(request->context->gem_context);
|
|
|
|
if (ctx)
|
|
|
|
erq->pid = pid_nr(ctx->pid);
|
|
|
|
}
|
2019-12-23 07:35:58 +08:00
|
|
|
rcu_read_unlock();
|
2016-10-13 18:18:14 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void engine_record_execlists(struct intel_engine_coredump *ee)
|
2016-10-13 18:18:14 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
const struct intel_engine_execlists * const el = &ee->engine->execlists;
|
|
|
|
struct i915_request * const *port = el->active;
|
drm/i915/execlists: Preempt-to-busy
When using a global seqno, we required a precise stop-the-workd event to
handle preemption and unwind the global seqno counter. To accomplish
this, we would preempt to a special out-of-band context and wait for the
machine to report that it was idle. Given an idle machine, we could very
precisely see which requests had completed and which we needed to feed
back into the run queue.
However, now that we have scrapped the global seqno, we no longer need
to precisely unwind the global counter and only track requests by their
per-context seqno. This allows us to loosely unwind inflight requests
while scheduling a preemption, with the enormous caveat that the
requests we put back on the run queue are still _inflight_ (until the
preemption request is complete). This makes request tracking much more
messy, as at any point then we can see a completed request that we
believe is not currently scheduled for execution. We also have to be
careful not to rewind RING_TAIL past RING_HEAD on preempting to the
running context, and for this we use a semaphore to prevent completion
of the request before continuing.
To accomplish this feat, we change how we track requests scheduled to
the HW. Instead of appending our requests onto a single list as we
submit, we track each submission to ELSP as its own block. Then upon
receiving the CS preemption event, we promote the pending block to the
inflight block (discarding what was previously being tracked). As normal
CS completion events arrive, we then remove stale entries from the
inflight tracker.
v2: Be a tinge paranoid and ensure we flush the write into the HWS page
for the GPU semaphore to pick in a timely fashion.
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Reviewed-by: Mika Kuoppala <mika.kuoppala@linux.intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20190620142052.19311-1-chris@chris-wilson.co.uk
2019-06-20 22:20:51 +08:00
|
|
|
unsigned int n = 0;
|
2016-10-13 18:18:14 +08:00
|
|
|
|
drm/i915/execlists: Preempt-to-busy
When using a global seqno, we required a precise stop-the-workd event to
handle preemption and unwind the global seqno counter. To accomplish
this, we would preempt to a special out-of-band context and wait for the
machine to report that it was idle. Given an idle machine, we could very
precisely see which requests had completed and which we needed to feed
back into the run queue.
However, now that we have scrapped the global seqno, we no longer need
to precisely unwind the global counter and only track requests by their
per-context seqno. This allows us to loosely unwind inflight requests
while scheduling a preemption, with the enormous caveat that the
requests we put back on the run queue are still _inflight_ (until the
preemption request is complete). This makes request tracking much more
messy, as at any point then we can see a completed request that we
believe is not currently scheduled for execution. We also have to be
careful not to rewind RING_TAIL past RING_HEAD on preempting to the
running context, and for this we use a semaphore to prevent completion
of the request before continuing.
To accomplish this feat, we change how we track requests scheduled to
the HW. Instead of appending our requests onto a single list as we
submit, we track each submission to ELSP as its own block. Then upon
receiving the CS preemption event, we promote the pending block to the
inflight block (discarding what was previously being tracked). As normal
CS completion events arrive, we then remove stale entries from the
inflight tracker.
v2: Be a tinge paranoid and ensure we flush the write into the HWS page
for the GPU semaphore to pick in a timely fashion.
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Reviewed-by: Mika Kuoppala <mika.kuoppala@linux.intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20190620142052.19311-1-chris@chris-wilson.co.uk
2019-06-20 22:20:51 +08:00
|
|
|
while (*port)
|
|
|
|
record_request(*port++, &ee->execlist[n++]);
|
2017-09-22 20:43:07 +08:00
|
|
|
|
|
|
|
ee->num_ports = n;
|
2016-10-13 18:18:14 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static bool record_context(struct i915_gem_context_coredump *e,
|
2019-08-08 22:45:11 +08:00
|
|
|
const struct i915_request *rq)
|
2017-01-29 17:24:33 +08:00
|
|
|
{
|
2019-12-23 07:35:58 +08:00
|
|
|
struct i915_gem_context *ctx;
|
|
|
|
struct task_struct *task;
|
2020-01-28 19:34:26 +08:00
|
|
|
bool simulated;
|
2019-12-23 07:35:58 +08:00
|
|
|
|
|
|
|
rcu_read_lock();
|
|
|
|
ctx = rcu_dereference(rq->context->gem_context);
|
|
|
|
if (ctx && !kref_get_unless_zero(&ctx->ref))
|
|
|
|
ctx = NULL;
|
|
|
|
rcu_read_unlock();
|
2019-12-20 18:12:29 +08:00
|
|
|
if (!ctx)
|
2020-01-28 19:34:26 +08:00
|
|
|
return true;
|
2019-08-08 22:45:11 +08:00
|
|
|
|
2019-12-23 07:35:58 +08:00
|
|
|
rcu_read_lock();
|
|
|
|
task = pid_task(ctx->pid, PIDTYPE_PID);
|
|
|
|
if (task) {
|
|
|
|
strcpy(e->comm, task->comm);
|
|
|
|
e->pid = task->pid;
|
2017-01-29 17:24:33 +08:00
|
|
|
}
|
2019-12-23 07:35:58 +08:00
|
|
|
rcu_read_unlock();
|
2017-01-29 17:24:33 +08:00
|
|
|
|
2018-04-19 02:40:52 +08:00
|
|
|
e->sched_attr = ctx->sched;
|
2017-07-21 20:32:30 +08:00
|
|
|
e->guilty = atomic_read(&ctx->guilty_count);
|
|
|
|
e->active = atomic_read(&ctx->active_count);
|
2019-08-08 22:45:11 +08:00
|
|
|
|
2020-02-16 21:36:20 +08:00
|
|
|
e->total_runtime = rq->context->runtime.total;
|
|
|
|
e->avg_runtime = ewma_runtime_read(&rq->context->runtime.avg);
|
|
|
|
|
2020-01-28 19:34:26 +08:00
|
|
|
simulated = i915_gem_context_no_error_capture(ctx);
|
2019-12-23 07:35:58 +08:00
|
|
|
|
|
|
|
i915_gem_context_put(ctx);
|
2020-01-28 19:34:26 +08:00
|
|
|
return simulated;
|
2017-01-29 17:24:33 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/* One node of the singly linked list of vmas queued for capture. */
struct intel_engine_capture_vma {
	struct intel_engine_capture_vma *next;	/* next node, NULL at the tail */
	struct i915_vma *vma;			/* vma to be captured */
	char name[16];				/* NUL-terminated label for the vma */
};
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static struct intel_engine_capture_vma *
|
|
|
|
capture_vma(struct intel_engine_capture_vma *next,
|
2019-07-26 06:38:43 +08:00
|
|
|
struct i915_vma *vma,
|
2020-01-10 20:30:56 +08:00
|
|
|
const char *name,
|
|
|
|
gfp_t gfp)
|
2019-07-26 06:38:43 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct intel_engine_capture_vma *c;
|
2019-07-26 06:38:43 +08:00
|
|
|
|
|
|
|
if (!vma)
|
|
|
|
return next;
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
c = kmalloc(sizeof(*c), gfp);
|
2019-07-26 06:38:43 +08:00
|
|
|
if (!c)
|
|
|
|
return next;
|
|
|
|
|
2019-10-04 21:40:00 +08:00
|
|
|
if (!i915_active_acquire_if_busy(&vma->active)) {
|
2019-07-26 06:38:43 +08:00
|
|
|
kfree(c);
|
|
|
|
return next;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
strcpy(c->name, name);
|
2020-10-16 17:25:27 +08:00
|
|
|
c->vma = vma; /* reference held while active */
|
2019-07-26 06:38:43 +08:00
|
|
|
|
|
|
|
c->next = next;
|
|
|
|
return c;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static struct intel_engine_capture_vma *
|
|
|
|
capture_user(struct intel_engine_capture_vma *capture,
|
|
|
|
const struct i915_request *rq,
|
|
|
|
gfp_t gfp)
|
2017-04-15 17:39:02 +08:00
|
|
|
{
|
2018-02-21 17:56:36 +08:00
|
|
|
struct i915_capture_list *c;
|
2017-04-15 17:39:02 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
for (c = rq->capture_list; c; c = c->next)
|
|
|
|
capture = capture_vma(capture, c->vma, "user", gfp);
|
2019-07-26 06:38:43 +08:00
|
|
|
|
|
|
|
return capture;
|
2017-04-15 17:39:02 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void add_vma(struct intel_engine_coredump *ee,
|
|
|
|
struct i915_vma_coredump *vma)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
if (vma) {
|
|
|
|
vma->next = ee->vma;
|
|
|
|
ee->vma = vma;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
struct intel_engine_coredump *
|
|
|
|
intel_engine_coredump_alloc(struct intel_engine_cs *engine, gfp_t gfp)
|
|
|
|
{
|
|
|
|
struct intel_engine_coredump *ee;
|
2019-08-08 22:45:11 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
ee = kzalloc(sizeof(*ee), gfp);
|
2019-08-08 22:45:11 +08:00
|
|
|
if (!ee)
|
2020-01-10 20:30:56 +08:00
|
|
|
return NULL;
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
ee->engine = engine;
|
2014-01-27 21:52:34 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
engine_record_registers(ee);
|
|
|
|
engine_record_execlists(ee);
|
2019-07-23 06:28:47 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
return ee;
|
|
|
|
}
|
2014-02-25 23:11:24 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
struct intel_engine_capture_vma *
|
|
|
|
intel_engine_coredump_add_request(struct intel_engine_coredump *ee,
|
|
|
|
struct i915_request *rq,
|
|
|
|
gfp_t gfp)
|
|
|
|
{
|
|
|
|
struct intel_engine_capture_vma *vma = NULL;
|
2019-07-26 06:38:43 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
ee->simulated |= record_context(&ee->context, rq);
|
|
|
|
if (ee->simulated)
|
|
|
|
return NULL;
|
2014-02-25 23:11:24 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/*
|
|
|
|
* We need to copy these to an anonymous buffer
|
|
|
|
* as the simplest method to avoid being overwritten
|
|
|
|
* by userspace.
|
|
|
|
*/
|
|
|
|
vma = capture_vma(vma, rq->batch, "batch", gfp);
|
|
|
|
vma = capture_user(vma, rq, gfp);
|
|
|
|
vma = capture_vma(vma, rq->ring->vma, "ring", gfp);
|
|
|
|
vma = capture_vma(vma, rq->context->state, "HW context", gfp);
|
2019-07-26 06:38:43 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
ee->rq_head = rq->head;
|
|
|
|
ee->rq_post = rq->postfix;
|
|
|
|
ee->rq_tail = rq->tail;
|
2016-07-04 15:08:39 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
return vma;
|
|
|
|
}
|
2016-10-05 04:11:30 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
void
|
|
|
|
intel_engine_coredump_add_vma(struct intel_engine_coredump *ee,
|
|
|
|
struct intel_engine_capture_vma *capture,
|
|
|
|
struct i915_vma_compress *compress)
|
|
|
|
{
|
|
|
|
const struct intel_engine_cs *engine = ee->engine;
|
2016-08-15 17:49:10 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
while (capture) {
|
|
|
|
struct intel_engine_capture_vma *this = capture;
|
|
|
|
struct i915_vma *vma = this->vma;
|
2019-08-08 22:45:11 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
add_vma(ee,
|
|
|
|
i915_vma_coredump_create(engine->gt,
|
|
|
|
vma, this->name,
|
|
|
|
compress));
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
i915_active_release(&vma->active);
|
2019-08-08 22:45:11 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
capture = this->next;
|
|
|
|
kfree(this);
|
|
|
|
}
|
2019-07-26 06:38:43 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
add_vma(ee,
|
|
|
|
i915_vma_coredump_create(engine->gt,
|
|
|
|
engine->status_page.vma,
|
|
|
|
"HW Status",
|
|
|
|
compress));
|
2019-07-26 06:38:43 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
add_vma(ee,
|
|
|
|
i915_vma_coredump_create(engine->gt,
|
|
|
|
engine->wa_ctx.vma,
|
|
|
|
"WA context",
|
|
|
|
compress));
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct intel_engine_coredump *
|
|
|
|
capture_engine(struct intel_engine_cs *engine,
|
|
|
|
struct i915_vma_compress *compress)
|
|
|
|
{
|
2020-01-10 20:30:59 +08:00
|
|
|
struct intel_engine_capture_vma *capture = NULL;
|
2020-01-10 20:30:56 +08:00
|
|
|
struct intel_engine_coredump *ee;
|
|
|
|
struct i915_request *rq;
|
|
|
|
unsigned long flags;
|
2019-07-26 06:38:43 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
ee = intel_engine_coredump_alloc(engine, GFP_KERNEL);
|
|
|
|
if (!ee)
|
|
|
|
return NULL;
|
2016-08-15 17:48:41 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
spin_lock_irqsave(&engine->active.lock, flags);
|
|
|
|
rq = intel_engine_find_active_request(engine);
|
2020-01-10 20:30:59 +08:00
|
|
|
if (rq)
|
|
|
|
capture = intel_engine_coredump_add_request(ee, rq,
|
|
|
|
ATOMIC_MAYFAIL);
|
|
|
|
spin_unlock_irqrestore(&engine->active.lock, flags);
|
|
|
|
if (!capture) {
|
2020-01-10 20:30:56 +08:00
|
|
|
kfree(ee);
|
|
|
|
return NULL;
|
|
|
|
}
|
2019-08-08 22:45:11 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
intel_engine_coredump_add_vma(ee, capture, compress);
|
2019-08-08 22:45:11 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
return ee;
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
2019-07-23 06:28:47 +08:00
|
|
|
static void
|
2020-01-10 20:30:56 +08:00
|
|
|
gt_record_engines(struct intel_gt_coredump *gt,
|
2020-11-04 21:47:42 +08:00
|
|
|
intel_engine_mask_t engine_mask,
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_vma_compress *compress)
|
2017-10-27 01:36:55 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct intel_engine_cs *engine;
|
|
|
|
enum intel_engine_id id;
|
2017-10-27 01:36:55 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
for_each_engine(engine, gt->_gt, id) {
|
|
|
|
struct intel_engine_coredump *ee;
|
|
|
|
|
|
|
|
/* Refill our page pool before entering atomic section */
|
|
|
|
pool_refill(&compress->pool, ALLOW_FAIL);
|
|
|
|
|
|
|
|
ee = capture_engine(engine, compress);
|
|
|
|
if (!ee)
|
|
|
|
continue;
|
|
|
|
|
2020-11-04 21:47:42 +08:00
|
|
|
ee->hung = engine->mask & engine_mask;
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->simulated |= ee->simulated;
|
|
|
|
if (ee->simulated) {
|
|
|
|
kfree(ee);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
ee->next = gt->engine;
|
|
|
|
gt->engine = ee;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct intel_uc_coredump *
|
|
|
|
gt_record_uc(struct intel_gt_coredump *gt,
|
|
|
|
struct i915_vma_compress *compress)
|
|
|
|
{
|
|
|
|
const struct intel_uc *uc = >->_gt->uc;
|
|
|
|
struct intel_uc_coredump *error_uc;
|
|
|
|
|
|
|
|
error_uc = kzalloc(sizeof(*error_uc), ALLOW_FAIL);
|
|
|
|
if (!error_uc)
|
|
|
|
return NULL;
|
2017-10-27 01:36:55 +08:00
|
|
|
|
2019-08-13 16:15:59 +08:00
|
|
|
memcpy(&error_uc->guc_fw, &uc->guc.fw, sizeof(uc->guc.fw));
|
|
|
|
memcpy(&error_uc->huc_fw, &uc->huc.fw, sizeof(uc->huc.fw));
|
2017-10-27 01:36:55 +08:00
|
|
|
|
|
|
|
/* Non-default firmware paths will be specified by the modparam.
|
|
|
|
* As modparams are generally accesible from the userspace make
|
|
|
|
* explicit copies of the firmware paths.
|
|
|
|
*/
|
2019-07-23 06:28:47 +08:00
|
|
|
error_uc->guc_fw.path = kstrdup(uc->guc.fw.path, ALLOW_FAIL);
|
|
|
|
error_uc->huc_fw.path = kstrdup(uc->huc.fw.path, ALLOW_FAIL);
|
2020-01-10 20:30:56 +08:00
|
|
|
error_uc->guc_log =
|
|
|
|
i915_vma_coredump_create(gt->_gt,
|
|
|
|
uc->guc.log.vma, "GuC log buffer",
|
|
|
|
compress);
|
|
|
|
|
|
|
|
return error_uc;
|
|
|
|
}
|
|
|
|
|
2014-01-30 16:19:35 +08:00
|
|
|
/* Capture all registers which don't fit into another category. */
|
2020-01-10 20:30:56 +08:00
|
|
|
static void gt_record_regs(struct intel_gt_coredump *gt)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct intel_uncore *uncore = gt->_gt->uncore;
|
|
|
|
struct drm_i915_private *i915 = uncore->i915;
|
2014-08-06 01:07:13 +08:00
|
|
|
int i;
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/*
|
|
|
|
* General organization
|
2014-01-30 16:19:36 +08:00
|
|
|
* 1. Registers specific to a single generation
|
|
|
|
* 2. Registers which belong to multiple generations
|
|
|
|
* 3. Feature specific registers.
|
|
|
|
* 4. Everything else
|
|
|
|
* Please try to follow the order.
|
|
|
|
*/
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2014-01-30 16:19:36 +08:00
|
|
|
/* 1: Registers specific to a single generation */
|
2019-06-11 18:45:48 +08:00
|
|
|
if (IS_VALLEYVIEW(i915)) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gtier[0] = intel_uncore_read(uncore, GTIER);
|
|
|
|
gt->ier = intel_uncore_read(uncore, VLV_IER);
|
|
|
|
gt->forcewake = intel_uncore_read_fw(uncore, FORCEWAKE_VLV);
|
2014-01-30 16:19:36 +08:00
|
|
|
}
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) == 7)
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->err_int = intel_uncore_read(uncore, GEN7_ERR_INT);
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) >= 12) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->fault_data0 = intel_uncore_read(uncore,
|
|
|
|
GEN12_FAULT_TLB_DATA0);
|
|
|
|
gt->fault_data1 = intel_uncore_read(uncore,
|
|
|
|
GEN12_FAULT_TLB_DATA1);
|
2021-06-06 12:50:49 +08:00
|
|
|
} else if (GRAPHICS_VER(i915) >= 8) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->fault_data0 = intel_uncore_read(uncore,
|
|
|
|
GEN8_FAULT_TLB_DATA0);
|
|
|
|
gt->fault_data1 = intel_uncore_read(uncore,
|
|
|
|
GEN8_FAULT_TLB_DATA1);
|
2015-03-24 20:54:19 +08:00
|
|
|
}
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) == 6) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->forcewake = intel_uncore_read_fw(uncore, FORCEWAKE);
|
|
|
|
gt->gab_ctl = intel_uncore_read(uncore, GAB_CTL);
|
|
|
|
gt->gfx_mode = intel_uncore_read(uncore, GFX_MODE);
|
2014-01-30 16:19:39 +08:00
|
|
|
}
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2014-01-30 16:19:36 +08:00
|
|
|
/* 2: Registers which belong to multiple generations */
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) >= 7)
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->forcewake = intel_uncore_read_fw(uncore, FORCEWAKE_MT);
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) >= 6) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->derrmr = intel_uncore_read(uncore, DERRMR);
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) < 12) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->error = intel_uncore_read(uncore, ERROR_GEN6);
|
|
|
|
gt->done_reg = intel_uncore_read(uncore, DONE_REG);
|
2019-07-31 02:04:04 +08:00
|
|
|
}
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
2014-01-30 16:19:36 +08:00
|
|
|
/* 3: Feature specific registers */
|
2021-06-06 12:50:49 +08:00
|
|
|
if (IS_GRAPHICS_VER(i915, 6, 7)) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gam_ecochk = intel_uncore_read(uncore, GAM_ECOCHK);
|
|
|
|
gt->gac_eco = intel_uncore_read(uncore, GAC_ECO_BITS);
|
2014-01-30 16:19:39 +08:00
|
|
|
}
|
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (IS_GRAPHICS_VER(i915, 8, 11))
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gtt_cache = intel_uncore_read(uncore, HSW_GTT_CACHE_EN);
|
2019-09-10 01:16:46 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) == 12)
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->aux_err = intel_uncore_read(uncore, GEN12_AUX_ERR_DBG);
|
2019-10-25 20:17:18 +08:00
|
|
|
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) >= 12) {
|
2019-10-30 00:38:40 +08:00
|
|
|
for (i = 0; i < GEN12_SFC_DONE_MAX; i++) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->sfc_done[i] =
|
2019-10-30 00:38:40 +08:00
|
|
|
intel_uncore_read(uncore, GEN12_SFC_DONE(i));
|
|
|
|
}
|
2019-10-30 00:38:41 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gam_done = intel_uncore_read(uncore, GEN12_GAM_DONE);
|
2019-10-30 00:38:40 +08:00
|
|
|
}
|
|
|
|
|
2014-01-30 16:19:39 +08:00
|
|
|
/* 4: Everything else */
|
2021-06-06 12:50:49 +08:00
|
|
|
if (GRAPHICS_VER(i915) >= 11) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->ier = intel_uncore_read(uncore, GEN8_DE_MISC_IER);
|
|
|
|
gt->gtier[0] =
|
2019-06-11 18:45:48 +08:00
|
|
|
intel_uncore_read(uncore,
|
|
|
|
GEN11_RENDER_COPY_INTR_ENABLE);
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gtier[1] =
|
2019-06-11 18:45:48 +08:00
|
|
|
intel_uncore_read(uncore, GEN11_VCS_VECS_INTR_ENABLE);
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gtier[2] =
|
2019-06-11 18:45:48 +08:00
|
|
|
intel_uncore_read(uncore, GEN11_GUC_SG_INTR_ENABLE);
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gtier[3] =
|
2019-06-11 18:45:48 +08:00
|
|
|
intel_uncore_read(uncore,
|
|
|
|
GEN11_GPM_WGBOXPERF_INTR_ENABLE);
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gtier[4] =
|
2019-06-11 18:45:48 +08:00
|
|
|
intel_uncore_read(uncore,
|
|
|
|
GEN11_CRYPTO_RSVD_INTR_ENABLE);
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gtier[5] =
|
2019-06-11 18:45:48 +08:00
|
|
|
intel_uncore_read(uncore,
|
|
|
|
GEN11_GUNIT_CSME_INTR_ENABLE);
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->ngtier = 6;
|
2021-06-06 12:50:49 +08:00
|
|
|
} else if (GRAPHICS_VER(i915) >= 8) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->ier = intel_uncore_read(uncore, GEN8_DE_MISC_IER);
|
2014-08-06 01:07:13 +08:00
|
|
|
for (i = 0; i < 4; i++)
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->gtier[i] =
|
|
|
|
intel_uncore_read(uncore, GEN8_GT_IER(i));
|
|
|
|
gt->ngtier = 4;
|
2019-06-11 18:45:48 +08:00
|
|
|
} else if (HAS_PCH_SPLIT(i915)) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->ier = intel_uncore_read(uncore, DEIER);
|
|
|
|
gt->gtier[0] = intel_uncore_read(uncore, GTIER);
|
|
|
|
gt->ngtier = 1;
|
2021-06-06 12:50:49 +08:00
|
|
|
} else if (GRAPHICS_VER(i915) == 2) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->ier = intel_uncore_read16(uncore, GEN2_IER);
|
2019-06-11 18:45:48 +08:00
|
|
|
} else if (!IS_VALLEYVIEW(i915)) {
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->ier = intel_uncore_read(uncore, GEN2_IER);
|
2014-01-30 16:19:36 +08:00
|
|
|
}
|
2020-01-10 20:30:56 +08:00
|
|
|
gt->eir = intel_uncore_read(uncore, EIR);
|
|
|
|
gt->pgtbl_er = intel_uncore_read(uncore, PGTBL_ER);
|
|
|
|
}
|
|
|
|
|
2020-07-08 08:39:47 +08:00
|
|
|
static void gt_record_info(struct intel_gt_coredump *gt)
|
|
|
|
{
|
|
|
|
memcpy(>->info, >->_gt->info, sizeof(struct intel_gt_info));
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/*
|
|
|
|
* Generate a semi-unique error code. The code is not meant to have meaning, The
|
|
|
|
* code's only purpose is to try to prevent false duplicated bug reports by
|
|
|
|
* grossly estimating a GPU error state.
|
|
|
|
*
|
|
|
|
* TODO Ideally, hashing the batchbuffer would be a very nice way to determine
|
|
|
|
* the hang if we could strip the GTT offset information from it.
|
|
|
|
*
|
|
|
|
* It's only a small step better than a random number in its current form.
|
|
|
|
*/
|
|
|
|
static u32 generate_ecode(const struct intel_engine_coredump *ee)
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* IPEHR would be an ideal way to detect errors, as it's the gross
|
|
|
|
* measure of "the command that hung." However, has some very common
|
|
|
|
* synchronization commands which almost always appear in the case
|
|
|
|
* strictly a client bug. Use instdone to differentiate those some.
|
|
|
|
*/
|
|
|
|
return ee ? ee->ipehr ^ ee->instdone.instdone : 0;
|
2014-01-30 16:19:35 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static const char *error_msg(struct i915_gpu_coredump *error)
|
2014-02-25 23:11:25 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct intel_engine_coredump *first = NULL;
|
2020-11-05 19:38:42 +08:00
|
|
|
unsigned int hung_classes = 0;
|
2020-01-10 20:30:56 +08:00
|
|
|
struct intel_gt_coredump *gt;
|
2019-01-25 21:22:28 +08:00
|
|
|
int len;
|
2014-02-25 23:11:25 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
for (gt = error->gt; gt; gt = gt->next) {
|
|
|
|
struct intel_engine_coredump *cs;
|
|
|
|
|
2020-11-04 21:47:42 +08:00
|
|
|
for (cs = gt->engine; cs; cs = cs->next) {
|
|
|
|
if (cs->hung) {
|
2020-11-05 19:38:42 +08:00
|
|
|
hung_classes |= BIT(cs->engine->uabi_class);
|
2020-11-04 21:47:42 +08:00
|
|
|
if (!first)
|
|
|
|
first = cs;
|
|
|
|
}
|
|
|
|
}
|
2020-01-10 20:30:56 +08:00
|
|
|
}
|
|
|
|
|
2014-02-25 23:11:26 +08:00
|
|
|
len = scnprintf(error->error_msg, sizeof(error->error_msg),
|
2020-01-10 20:30:56 +08:00
|
|
|
"GPU HANG: ecode %d:%x:%08x",
|
2021-06-06 12:50:49 +08:00
|
|
|
GRAPHICS_VER(error->i915), hung_classes,
|
2020-01-10 20:30:56 +08:00
|
|
|
generate_ecode(first));
|
2020-01-21 21:21:07 +08:00
|
|
|
if (first && first->context.pid) {
|
2019-01-25 21:22:28 +08:00
|
|
|
/* Just show the first executing process, more is confusing */
|
2014-02-25 23:11:26 +08:00
|
|
|
len += scnprintf(error->error_msg + len,
|
|
|
|
sizeof(error->error_msg) - len,
|
|
|
|
", in %s [%d]",
|
2020-01-10 20:30:56 +08:00
|
|
|
first->context.comm, first->context.pid);
|
2019-01-25 21:22:28 +08:00
|
|
|
}
|
2014-02-25 23:11:26 +08:00
|
|
|
|
2019-01-25 21:22:28 +08:00
|
|
|
return error->error_msg;
|
2014-02-25 23:11:25 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
static void capture_gen(struct i915_gpu_coredump *error)
|
2014-02-25 23:11:27 +08:00
|
|
|
{
|
2018-03-06 06:21:21 +08:00
|
|
|
struct drm_i915_private *i915 = error->i915;
|
|
|
|
|
|
|
|
error->wakelock = atomic_read(&i915->runtime_pm.wakeref_count);
|
|
|
|
error->suspended = i915->runtime_pm.suspended;
|
2017-03-02 23:03:56 +08:00
|
|
|
|
2015-08-08 03:24:15 +08:00
|
|
|
error->iommu = -1;
|
|
|
|
#ifdef CONFIG_INTEL_IOMMU
|
|
|
|
error->iommu = intel_iommu_gfx_mapped;
|
|
|
|
#endif
|
2018-03-06 06:21:21 +08:00
|
|
|
error->reset_count = i915_reset_count(&i915->gpu_error);
|
|
|
|
error->suspend_count = i915->suspend_count;
|
2016-08-15 17:48:45 +08:00
|
|
|
|
2020-06-18 23:04:02 +08:00
|
|
|
i915_params_copy(&error->params, &i915->params);
|
2016-08-15 17:48:45 +08:00
|
|
|
memcpy(&error->device_info,
|
2018-03-06 06:21:21 +08:00
|
|
|
INTEL_INFO(i915),
|
2016-08-15 17:48:45 +08:00
|
|
|
sizeof(error->device_info));
|
2018-12-31 22:56:41 +08:00
|
|
|
memcpy(&error->runtime_info,
|
|
|
|
RUNTIME_INFO(i915),
|
|
|
|
sizeof(error->runtime_info));
|
2018-03-06 06:21:21 +08:00
|
|
|
error->driver_caps = i915->caps;
|
2014-02-25 23:11:27 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_gpu_coredump *
|
|
|
|
i915_gpu_coredump_alloc(struct drm_i915_private *i915, gfp_t gfp)
|
2017-10-27 01:36:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_gpu_coredump *error;
|
|
|
|
|
2020-06-18 23:04:02 +08:00
|
|
|
if (!i915->params.error_capture)
|
2020-01-10 20:30:56 +08:00
|
|
|
return NULL;
|
|
|
|
|
|
|
|
error = kzalloc(sizeof(*error), gfp);
|
|
|
|
if (!error)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
kref_init(&error->ref);
|
|
|
|
error->i915 = i915;
|
|
|
|
|
|
|
|
error->time = ktime_get_real();
|
|
|
|
error->boottime = ktime_get_boottime();
|
|
|
|
error->uptime = ktime_sub(ktime_get(), i915->gt.last_init_time);
|
|
|
|
error->capture = jiffies;
|
|
|
|
|
|
|
|
capture_gen(error);
|
|
|
|
|
|
|
|
return error;
|
2017-10-27 01:36:57 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/* Convert a number of days @x into seconds. */
#define DAY_AS_SECONDS(x) ((x) * (24 * 60 * 60))
|
|
|
|
|
|
|
|
struct intel_gt_coredump *
|
|
|
|
intel_gt_coredump_alloc(struct intel_gt *gt, gfp_t gfp)
|
2018-10-02 03:44:46 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct intel_gt_coredump *gc;
|
2018-10-02 03:44:46 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
gc = kzalloc(sizeof(*gc), gfp);
|
|
|
|
if (!gc)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
gc->_gt = gt;
|
|
|
|
gc->awake = intel_gt_pm_is_awake(gt);
|
|
|
|
|
|
|
|
gt_record_regs(gc);
|
|
|
|
gt_record_fences(gc);
|
|
|
|
|
|
|
|
return gc;
|
|
|
|
}
|
2019-10-29 17:58:53 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_vma_compress *
|
|
|
|
i915_vma_capture_prepare(struct intel_gt_coredump *gt)
|
|
|
|
{
|
|
|
|
struct i915_vma_compress *compress;
|
|
|
|
|
|
|
|
compress = kmalloc(sizeof(*compress), ALLOW_FAIL);
|
|
|
|
if (!compress)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
if (!compress_init(compress)) {
|
|
|
|
kfree(compress);
|
|
|
|
return NULL;
|
2019-10-29 17:58:53 +08:00
|
|
|
}
|
2020-01-10 20:30:56 +08:00
|
|
|
|
|
|
|
return compress;
|
2018-10-02 03:44:46 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/*
 * Tear down and free the compression state returned by
 * i915_vma_capture_prepare(). A NULL @compress is a no-op.
 *
 * @gt is not used by this function.
 */
void i915_vma_capture_finish(struct intel_gt_coredump *gt,
			     struct i915_vma_compress *compress)
{
	if (!compress)
		return;

	compress_fini(compress);
	kfree(compress);
}
|
|
|
|
|
2020-11-04 21:47:42 +08:00
|
|
|
struct i915_gpu_coredump *
|
|
|
|
i915_gpu_coredump(struct intel_gt *gt, intel_engine_mask_t engine_mask)
|
2017-02-15 00:46:11 +08:00
|
|
|
{
|
2020-11-04 21:47:42 +08:00
|
|
|
struct drm_i915_private *i915 = gt->i915;
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_gpu_coredump *error;
|
2017-02-15 00:46:11 +08:00
|
|
|
|
2018-12-07 19:05:54 +08:00
|
|
|
/* Check if GPU capture has been disabled */
|
|
|
|
error = READ_ONCE(i915->gpu_error.first_error);
|
|
|
|
if (IS_ERR(error))
|
|
|
|
return error;
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
error = i915_gpu_coredump_alloc(i915, ALLOW_FAIL);
|
|
|
|
if (!error)
|
2018-12-07 19:05:54 +08:00
|
|
|
return ERR_PTR(-ENOMEM);
|
2017-02-15 00:46:11 +08:00
|
|
|
|
2020-11-04 21:47:42 +08:00
|
|
|
error->gt = intel_gt_coredump_alloc(gt, ALLOW_FAIL);
|
2020-01-10 20:30:56 +08:00
|
|
|
if (error->gt) {
|
|
|
|
struct i915_vma_compress *compress;
|
2019-07-23 06:28:47 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
compress = i915_vma_capture_prepare(error->gt);
|
|
|
|
if (!compress) {
|
|
|
|
kfree(error->gt);
|
|
|
|
kfree(error);
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
}
|
2017-02-15 00:46:11 +08:00
|
|
|
|
2020-07-08 08:39:47 +08:00
|
|
|
gt_record_info(error->gt);
|
2020-11-04 21:47:42 +08:00
|
|
|
gt_record_engines(error->gt, engine_mask, compress);
|
2020-01-10 20:30:56 +08:00
|
|
|
|
|
|
|
if (INTEL_INFO(i915)->has_gt_uc)
|
|
|
|
error->gt->uc = gt_record_uc(error->gt, compress);
|
2019-07-23 06:28:47 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
i915_vma_capture_finish(error->gt, compress);
|
|
|
|
|
|
|
|
error->simulated |= error->gt->simulated;
|
|
|
|
}
|
2019-07-23 06:28:47 +08:00
|
|
|
|
|
|
|
error->overlay = intel_overlay_capture_error_state(i915);
|
|
|
|
|
2017-02-15 00:46:11 +08:00
|
|
|
return error;
|
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
void i915_error_state_store(struct i915_gpu_coredump *error)
|
2014-01-30 16:19:35 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct drm_i915_private *i915;
|
2014-01-30 22:38:15 +08:00
|
|
|
static bool warned;
|
2014-01-30 16:19:35 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (IS_ERR_OR_NULL(error))
|
2016-10-12 17:05:18 +08:00
|
|
|
return;
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
i915 = error->i915;
|
2020-04-02 19:48:13 +08:00
|
|
|
drm_info(&i915->drm, "%s\n", error_msg(error));
|
2016-07-04 15:48:33 +08:00
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
if (error->simulated ||
|
|
|
|
cmpxchg(&i915->gpu_error.first_error, NULL, error))
|
2014-01-30 16:19:35 +08:00
|
|
|
return;
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
i915_gpu_coredump_get(error);
|
2014-02-25 23:11:25 +08:00
|
|
|
|
2019-08-19 15:58:21 +08:00
|
|
|
if (!xchg(&warned, true) &&
|
2016-10-14 21:44:28 +08:00
|
|
|
ktime_get_real_seconds() - DRIVER_TIMESTAMP < DAY_AS_SECONDS(180)) {
|
2019-08-15 17:36:04 +08:00
|
|
|
pr_info("GPU hangs can indicate a bug anywhere in the entire gfx stack, including userspace.\n");
|
2020-02-13 00:04:34 +08:00
|
|
|
pr_info("Please file a _new_ bug report at https://gitlab.freedesktop.org/drm/intel/issues/new.\n");
|
|
|
|
pr_info("Please see https://gitlab.freedesktop.org/drm/intel/-/wikis/How-to-file-i915-bugs for details.\n");
|
2019-08-15 17:36:04 +08:00
|
|
|
pr_info("drm/i915 developers can then reassign to the right component if it's not a kernel issue.\n");
|
|
|
|
pr_info("The GPU crash dump is required to analyze GPU hangs, so please always attach it.\n");
|
|
|
|
pr_info("GPU crash dump saved to /sys/class/drm/card%d/error\n",
|
|
|
|
i915->drm.primary->index);
|
2014-02-25 23:11:25 +08:00
|
|
|
}
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
2020-01-10 20:30:56 +08:00
|
|
|
/**
|
|
|
|
* i915_capture_error_state - capture an error record for later analysis
|
2020-11-04 21:47:42 +08:00
|
|
|
* @gt: intel_gt which originated the hang
|
|
|
|
* @engine_mask: hung engines
|
|
|
|
*
|
2020-01-10 20:30:56 +08:00
|
|
|
*
|
|
|
|
* Should be called when an error is detected (either a hang or an error
|
|
|
|
* interrupt) to capture error state from the time of the error. Fills
|
|
|
|
* out a structure which becomes available in debugfs for user level tools
|
|
|
|
* to pick up.
|
|
|
|
*/
|
2020-11-04 21:47:42 +08:00
|
|
|
void i915_capture_error_state(struct intel_gt *gt,
|
|
|
|
intel_engine_mask_t engine_mask)
|
2020-01-10 20:30:56 +08:00
|
|
|
{
|
|
|
|
struct i915_gpu_coredump *error;
|
|
|
|
|
2020-11-04 21:47:42 +08:00
|
|
|
error = i915_gpu_coredump(gt, engine_mask);
|
2020-01-10 20:30:56 +08:00
|
|
|
if (IS_ERR(error)) {
|
2020-11-04 21:47:42 +08:00
|
|
|
cmpxchg(>->i915->gpu_error.first_error, NULL, error);
|
2020-01-10 20:30:56 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
i915_error_state_store(error);
|
|
|
|
i915_gpu_coredump_put(error);
|
|
|
|
}
|
|
|
|
|
|
|
|
struct i915_gpu_coredump *
|
2017-02-15 00:46:11 +08:00
|
|
|
i915_first_error_state(struct drm_i915_private *i915)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_gpu_coredump *error;
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2017-02-15 00:46:11 +08:00
|
|
|
spin_lock_irq(&i915->gpu_error.lock);
|
|
|
|
error = i915->gpu_error.first_error;
|
2018-12-07 19:05:54 +08:00
|
|
|
if (!IS_ERR_OR_NULL(error))
|
2020-01-10 20:30:56 +08:00
|
|
|
i915_gpu_coredump_get(error);
|
2017-02-15 00:46:11 +08:00
|
|
|
spin_unlock_irq(&i915->gpu_error.lock);
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2017-02-15 00:46:11 +08:00
|
|
|
return error;
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|
|
|
|
|
2017-02-15 00:46:11 +08:00
|
|
|
void i915_reset_error_state(struct drm_i915_private *i915)
|
2013-07-12 21:50:57 +08:00
|
|
|
{
|
2020-01-10 20:30:56 +08:00
|
|
|
struct i915_gpu_coredump *error;
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2017-02-15 00:46:11 +08:00
|
|
|
spin_lock_irq(&i915->gpu_error.lock);
|
|
|
|
error = i915->gpu_error.first_error;
|
2018-12-07 19:05:54 +08:00
|
|
|
if (error != ERR_PTR(-ENODEV)) /* if disabled, always disabled */
|
|
|
|
i915->gpu_error.first_error = NULL;
|
2017-02-15 00:46:11 +08:00
|
|
|
spin_unlock_irq(&i915->gpu_error.lock);
|
2013-07-12 21:50:57 +08:00
|
|
|
|
2018-12-07 19:05:54 +08:00
|
|
|
if (!IS_ERR_OR_NULL(error))
|
2020-01-10 20:30:56 +08:00
|
|
|
i915_gpu_coredump_put(error);
|
2018-11-03 00:12:12 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void i915_disable_error_state(struct drm_i915_private *i915, int err)
|
|
|
|
{
|
|
|
|
spin_lock_irq(&i915->gpu_error.lock);
|
|
|
|
if (!i915->gpu_error.first_error)
|
|
|
|
i915->gpu_error.first_error = ERR_PTR(err);
|
|
|
|
spin_unlock_irq(&i915->gpu_error.lock);
|
2013-07-12 21:50:57 +08:00
|
|
|
}
|