From patchwork Tue Feb 12 20:57:39 2019 Content-Type: text/plain; charset="utf-8" MIME-Version: 1.0 Content-Transfer-Encoding: 7bit X-Patchwork-Submitter: Chris Wilson X-Patchwork-Id: 10808671 Return-Path: Received: from mail.wl.linuxfoundation.org (pdx-wl-mail.web.codeaurora.org [172.30.200.125]) by pdx-korg-patchwork-2.web.codeaurora.org (Postfix) with ESMTP id 0766713A4 for ; Tue, 12 Feb 2019 20:57:58 +0000 (UTC) Received: from mail.wl.linuxfoundation.org (localhost [127.0.0.1]) by mail.wl.linuxfoundation.org (Postfix) with ESMTP id EB60E2981D for ; Tue, 12 Feb 2019 20:57:57 +0000 (UTC) Received: by mail.wl.linuxfoundation.org (Postfix, from userid 486) id DF4222ABF6; Tue, 12 Feb 2019 20:57:57 +0000 (UTC) X-Spam-Checker-Version: SpamAssassin 3.3.1 (2010-03-16) on pdx-wl-mail.web.codeaurora.org X-Spam-Level: X-Spam-Status: No, score=-5.2 required=2.0 tests=BAYES_00,MAILING_LIST_MULTI, RCVD_IN_DNSWL_MED autolearn=ham version=3.3.1 Received: from gabe.freedesktop.org (gabe.freedesktop.org [131.252.210.177]) (using TLSv1.2 with cipher DHE-RSA-AES256-GCM-SHA384 (256/256 bits)) (No client certificate requested) by mail.wl.linuxfoundation.org (Postfix) with ESMTPS id 7A1A92981D for ; Tue, 12 Feb 2019 20:57:57 +0000 (UTC) Received: from gabe.freedesktop.org (localhost [127.0.0.1]) by gabe.freedesktop.org (Postfix) with ESMTP id A95756E702; Tue, 12 Feb 2019 20:57:54 +0000 (UTC) X-Original-To: intel-gfx@lists.freedesktop.org Delivered-To: intel-gfx@lists.freedesktop.org Received: from fireflyinternet.com (mail.fireflyinternet.com [109.228.58.192]) by gabe.freedesktop.org (Postfix) with ESMTPS id 9ACF66E6F6; Tue, 12 Feb 2019 20:57:52 +0000 (UTC) X-Default-Received-SPF: pass (skip=forwardok (res=PASS)) x-ip-name=78.156.65.138; Received: from haswell.alporthouse.com (unverified [78.156.65.138]) by fireflyinternet.com (Firefly Internet (M1)) with ESMTP id 15556275-1500050 for multiple; Tue, 12 Feb 2019 20:57:47 +0000 From: Chris Wilson To: intel-gfx@lists.freedesktop.org Date: Tue, 12 Feb 2019 20:57:39 +0000 Message-Id: <20190212205740.20368-1-chris@chris-wilson.co.uk> X-Mailer: git-send-email 2.20.1 MIME-Version: 1.0 Subject: [Intel-gfx] [PATCH i-g-t 1/2] i915/gem_eio: Check average reset times X-BeenThere: intel-gfx@lists.freedesktop.org X-Mailman-Version: 2.1.23 Precedence: list List-Id: Intel graphics driver community testing & development List-Unsubscribe: , List-Archive: List-Post: List-Help: List-Subscribe: , Cc: igt-dev@lists.freedesktop.org Errors-To: intel-gfx-bounces@lists.freedesktop.org Sender: "Intel-gfx" X-Virus-Scanned: ClamAV using ClamSMTP As we have moved to rcu/srcu to serialise the resets, individual resets are subject to small variations in system grace periods. Allow for this by only expecting the median reset time to be within our target, thereby excluding noisy outliers from perturbing our results (but keep the maximum capped to prevent horrid failures!) Signed-off-by: Chris Wilson Reviewed-by: Mika Kuoppala --- tests/i915/gem_eio.c | 53 ++++++++++++++++++++++++++++++++++---------- 1 file changed, 41 insertions(+), 12 deletions(-) diff --git a/tests/i915/gem_eio.c b/tests/i915/gem_eio.c index 61054a07e..bd5266104 100644 --- a/tests/i915/gem_eio.c +++ b/tests/i915/gem_eio.c @@ -42,6 +42,7 @@ #include "igt.h" #include "igt_device.h" +#include "igt_stats.h" #include "igt_sysfs.h" #include "sw_sync.h" #include "i915/gem_ring.h" @@ -239,10 +240,9 @@ static void hang_after(int fd, unsigned int us, struct timespec *ts) igt_assert_eq(timer_settime(ctx->timer, 0, &its, NULL), 0); } -static void check_wait(int fd, uint32_t bo, unsigned int wait) +static void check_wait(int fd, uint32_t bo, unsigned int wait, igt_stats_t *st) { struct timespec ts = {}; - uint64_t elapsed; if (wait) { hang_after(fd, wait, &ts); @@ -253,10 +253,34 @@ static void check_wait(int fd, uint32_t bo, unsigned int wait) gem_sync(fd, bo); - elapsed = igt_nsec_elapsed(&ts); - igt_assert_f(elapsed < 250e6, - "Wake up following reset+wedge took %.3fms\n", - elapsed*1e-6); + if (st) + igt_stats_push(st, igt_nsec_elapsed(&ts)); +} + +static void check_wait_elapsed(int fd, igt_stats_t *st) +{ + double med, max; + + igt_info("Completed %d resets, wakeups took %.3f+-%.3fms (min:%.3fms, median:%.3fms, max:%.3fms)\n", + st->n_values, + igt_stats_get_mean(st)*1e-6, + igt_stats_get_std_deviation(st)*1e-6, + igt_stats_get_min(st)*1e-6, + igt_stats_get_median(st)*1e-6, + igt_stats_get_max(st)*1e-6); + + if (st->n_values < 9) + return; /* too few for stable median */ + + med = igt_stats_get_median(st); + max = igt_stats_get_max(st); + igt_assert_f(med < 250e6 && max < 1250e6, + "Wake up following reset+wedge took %.3f+-%.3fms (min:%.3fms, median:%.3fms, max:%.3fms)\n", + igt_stats_get_mean(st)*1e-6, + igt_stats_get_std_deviation(st)*1e-6, + igt_stats_get_min(st)*1e-6, + igt_stats_get_median(st)*1e-6, + igt_stats_get_max(st)*1e-6); } static void __test_banned(int fd) @@ -326,7 +350,7 @@ static void test_wait(int fd, unsigned int flags, unsigned int wait) hang = spin_sync(fd, 0, I915_EXEC_DEFAULT); - check_wait(fd, hang->handle, wait); + check_wait(fd, hang->handle, wait, NULL); igt_spin_batch_free(fd, hang); @@ -401,7 +425,7 @@ static void test_inflight(int fd, unsigned int wait) igt_assert(fence[n] != -1); } - check_wait(fd, obj[1].handle, wait); + check_wait(fd, obj[1].handle, wait, NULL); for (unsigned int n = 0; n < max; n++) { igt_assert_eq(sync_fence_status(fence[n]), -EIO); @@ -457,7 +481,7 @@ static void test_inflight_suspend(int fd) igt_set_autoresume_delay(30); igt_system_suspend_autoresume(SUSPEND_STATE_MEM, SUSPEND_TEST_NONE); - check_wait(fd, obj[1].handle, 10); + check_wait(fd, obj[1].handle, 10, NULL); for (unsigned int n = 0; n < max; n++) { igt_assert_eq(sync_fence_status(fence[n]), -EIO); @@ -535,7 +559,7 @@ static void test_inflight_contexts(int fd, unsigned int wait) igt_assert(fence[n] != -1); } - check_wait(fd, obj[1].handle, wait); + check_wait(fd, obj[1].handle, wait, NULL); for (unsigned int n = 0; n < ARRAY_SIZE(fence); n++) { igt_assert_eq(sync_fence_status(fence[n]), -EIO); @@ -644,7 +668,7 @@ static void test_inflight_internal(int fd, unsigned int wait) nfence++; } - check_wait(fd, obj[1].handle, wait); + check_wait(fd, obj[1].handle, wait, NULL); while (nfence--) { igt_assert_eq(sync_fence_status(fences[nfence]), -EIO); @@ -670,8 +694,11 @@ static void reset_stress(int fd, .buffer_count = 1, .flags = engine, }; + igt_stats_t stats; + gem_write(fd, obj.handle, 0, &bbe, sizeof(bbe)); + igt_stats_init(&stats); igt_until_timeout(5) { uint32_t ctx = context_create_safe(fd); igt_spin_t *hang; @@ -697,7 +724,7 @@ static void reset_stress(int fd, gem_execbuf(fd, &execbuf); /* Wedge after a small delay. */ - check_wait(fd, obj.handle, 100e3); + check_wait(fd, obj.handle, 100e3, &stats); /* Unwedge by forcing a reset. */ igt_assert(i915_reset_control(true)); @@ -721,6 +748,8 @@ static void reset_stress(int fd, igt_spin_batch_free(fd, hang); gem_context_destroy(fd, ctx); } + check_wait_elapsed(fd, &stats); + igt_stats_fini(&stats); gem_close(fd, obj.handle); }