mirror of
git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
synced 2025-08-05 16:54:27 +00:00

Many selftests call igt_flush_test() on cleanup. With default preemption timeout of compute engines raised to 7.5 seconds, hardcoded flush timeout of 3 seconds is too short. That results in GPU forcibly wedged and kernel taineted, then IGT abort triggered. CI BAT runs loose a part of their expected coverage. Calculate the flush timeout based on the longest preemption timeout currently configured for any engine. That way, selftest can still report detected issues as non-critical, and the GPU gets a chance to recover from preemptible hangs and prepare for fluent execution of next test cases. Link: https://gitlab.freedesktop.org/drm/i915/kernel/-/issues/12061 Signed-off-by: Janusz Krzysztofik <janusz.krzysztofik@linux.intel.com> Reviewed-by: Andi Shyti <andi.shyti@linux.intel.com> Signed-off-by: Andi Shyti <andi.shyti@kernel.org> Link: https://patchwork.freedesktop.org/patch/msgid/20241213190122.513709-2-janusz.krzysztofik@linux.intel.com
51 lines
1 KiB
C
51 lines
1 KiB
C
/*
|
|
* SPDX-License-Identifier: MIT
|
|
*
|
|
* Copyright © 2018 Intel Corporation
|
|
*/
|
|
|
|
#include "gt/intel_gt.h"
|
|
#include "gt/intel_gt_requests.h"
|
|
|
|
#include "i915_drv.h"
|
|
#include "i915_selftest.h"
|
|
|
|
#include "igt_flush_test.h"
|
|
|
|
int igt_flush_test(struct drm_i915_private *i915)
|
|
{
|
|
struct intel_gt *gt;
|
|
unsigned int i;
|
|
int ret = 0;
|
|
|
|
for_each_gt(gt, i915, i) {
|
|
struct intel_engine_cs *engine;
|
|
unsigned long timeout_ms = 0;
|
|
unsigned int id;
|
|
|
|
if (intel_gt_is_wedged(gt))
|
|
ret = -EIO;
|
|
|
|
for_each_engine(engine, gt, id) {
|
|
if (engine->props.preempt_timeout_ms > timeout_ms)
|
|
timeout_ms = engine->props.preempt_timeout_ms;
|
|
}
|
|
|
|
cond_resched();
|
|
|
|
/* 2x longest preempt timeout, experimentally determined */
|
|
if (intel_gt_wait_for_idle(gt, HZ * timeout_ms / 500) == -ETIME) {
|
|
pr_err("%pS timed out, cancelling all further testing.\n",
|
|
__builtin_return_address(0));
|
|
|
|
GEM_TRACE("%pS timed out.\n",
|
|
__builtin_return_address(0));
|
|
GEM_TRACE_DUMP();
|
|
|
|
intel_gt_set_wedged(gt);
|
|
ret = -EIO;
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|