From: Tvrtko Ursulin <tvrtko.ursulin@xxxxxxxxx> A bunch of tests for the new i915 PMU feature. Parts of the code were initialy sketched by Dmitry Rogozhkin. v2: (Most suggestions by Chris Wilson) * Add new class/instance based engine list. * Add gem_has_engine/gem_require_engine to work with class/instance. * Use the above two throughout the test. * Shorten tests to 100ms busy batches, seems enough. * Add queued counter sanity checks. * Use igt_nsec_elapsed. * Skip on perf -ENODEV in some tests instead of embedding knowledge locally. * Fix multi ordering for busy accounting. * Use new guranteed_usleep when sleep time is asserted on. * Check for no queued when idle/busy. * Add queued counter init test. * Add queued tests. * Consolidate and increase multiple busy engines tests to most-busy and all-busy tests. * Guarantte interrupts by using fences. * Test RC6 via forcewake. Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin@xxxxxxxxx> Cc: Chris Wilson <chris@xxxxxxxxxxxxxxxxxx> Cc: Dmitry Rogozhkin <dmitry.v.rogozhkin@xxxxxxxxx> --- lib/igt_gt.c | 50 +++ lib/igt_gt.h | 38 +++ lib/igt_perf.h | 9 +- tests/Makefile.sources | 1 + tests/perf_pmu.c | 840 +++++++++++++++++++++++++++++++++++++++++++++++++ 5 files changed, 930 insertions(+), 8 deletions(-) create mode 100644 tests/perf_pmu.c diff --git a/lib/igt_gt.c b/lib/igt_gt.c index b3f3b3809eee..4c75811fb1b3 100644 --- a/lib/igt_gt.c +++ b/lib/igt_gt.c @@ -568,3 +568,53 @@ bool gem_can_store_dword(int fd, unsigned int engine) return true; } + +const struct intel_execution_engine2 intel_execution_engines2[] = { + { "rcs0", I915_ENGINE_CLASS_RENDER, 0 }, + { "bcs0", I915_ENGINE_CLASS_COPY, 0 }, + { "vcs0", I915_ENGINE_CLASS_VIDEO, 0 }, + { "vcs1", I915_ENGINE_CLASS_VIDEO, 1 }, + { "vecs0", I915_ENGINE_CLASS_VIDEO_ENHANCE, 0 }, +}; + +unsigned int +gem_class_instance_to_eb_flags(int gem_fd, + enum drm_i915_gem_engine_class class, + unsigned int instance) +{ + if (class != I915_ENGINE_CLASS_VIDEO) + igt_assert(instance == 0); + else + igt_assert(instance >= 0 && instance <= 1); + + switch (class) { + case I915_ENGINE_CLASS_RENDER: + return I915_EXEC_RENDER; + case I915_ENGINE_CLASS_COPY: + return I915_EXEC_BLT; + case I915_ENGINE_CLASS_VIDEO: + if (instance == 0) { + if (gem_has_bsd2(gem_fd)) + return I915_EXEC_BSD | I915_EXEC_BSD_RING1; + else + return I915_EXEC_BSD; + + } else { + return I915_EXEC_BSD | I915_EXEC_BSD_RING2; + } + case I915_ENGINE_CLASS_VIDEO_ENHANCE: + return I915_EXEC_VEBOX; + case I915_ENGINE_CLASS_OTHER: + default: + igt_assert(0); + }; +} + +bool gem_has_engine(int gem_fd, + enum drm_i915_gem_engine_class class, + unsigned int instance) +{ + return gem_has_ring(gem_fd, + gem_class_instance_to_eb_flags(gem_fd, class, + instance)); +} diff --git a/lib/igt_gt.h b/lib/igt_gt.h index 2579cbd37be7..fb67ae1a7d1f 100644 --- a/lib/igt_gt.h +++ b/lib/igt_gt.h @@ -25,6 +25,7 @@ #define IGT_GT_H #include "igt_debugfs.h" +#include "igt_core.h" void igt_require_hang_ring(int fd, int ring); @@ -80,4 +81,41 @@ extern const struct intel_execution_engine { bool gem_can_store_dword(int fd, unsigned int engine); +extern const struct intel_execution_engine2 { + const char *name; + int class; + int instance; +} intel_execution_engines2[]; + +#define for_each_engine_class_instance(fd__, e__) \ + for ((e__) = intel_execution_engines2;\ + (e__)->name; \ + (e__)++) + +enum drm_i915_gem_engine_class { + I915_ENGINE_CLASS_OTHER = 0, + I915_ENGINE_CLASS_RENDER = 1, + I915_ENGINE_CLASS_COPY = 2, + I915_ENGINE_CLASS_VIDEO = 3, + I915_ENGINE_CLASS_VIDEO_ENHANCE = 4, + I915_ENGINE_CLASS_MAX /* non-ABI */ +}; + +unsigned int +gem_class_instance_to_eb_flags(int gem_fd, + enum drm_i915_gem_engine_class class, + unsigned int instance); + +bool gem_has_engine(int gem_fd, + enum drm_i915_gem_engine_class class, + unsigned int instance); + +static inline +void gem_require_engine(int gem_fd, + enum drm_i915_gem_engine_class class, + unsigned int instance) +{ + igt_require(gem_has_engine(gem_fd, class, instance)); +} + #endif /* IGT_GT_H */ diff --git a/lib/igt_perf.h b/lib/igt_perf.h index e29216f0500a..d64e0bd7a06a 100644 --- a/lib/igt_perf.h +++ b/lib/igt_perf.h @@ -29,14 +29,7 @@ #include <linux/perf_event.h> -enum drm_i915_gem_engine_class { - I915_ENGINE_CLASS_OTHER = 0, - I915_ENGINE_CLASS_RENDER = 1, - I915_ENGINE_CLASS_COPY = 2, - I915_ENGINE_CLASS_VIDEO = 3, - I915_ENGINE_CLASS_VIDEO_ENHANCE = 4, - I915_ENGINE_CLASS_MAX /* non-ABI */ -}; +#include "igt_gt.h" enum drm_i915_pmu_engine_sample { I915_SAMPLE_QUEUED = 0, diff --git a/tests/Makefile.sources b/tests/Makefile.sources index cf542df181a8..4bab6247151c 100644 --- a/tests/Makefile.sources +++ b/tests/Makefile.sources @@ -217,6 +217,7 @@ TESTS_progs = \ kms_vblank \ meta_test \ perf \ + perf_pmu \ pm_backlight \ pm_lpsp \ pm_rc6_residency \ diff --git a/tests/perf_pmu.c b/tests/perf_pmu.c new file mode 100644 index 000000000000..42d92b36a384 --- /dev/null +++ b/tests/perf_pmu.c @@ -0,0 +1,840 @@ +/* + * Copyright © 2017 Intel Corporation + * + * Permission is hereby granted, free of charge, to any person obtaining a + * copy of this software and associated documentation files (the "Software"), + * to deal in the Software without restriction, including without limitation + * the rights to use, copy, modify, merge, publish, distribute, sublicense, + * and/or sell copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice (including the next + * paragraph) shall be included in all copies or substantial portions of the + * Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS + * IN THE SOFTWARE. + * + */ + +#include <stdlib.h> +#include <stdio.h> +#include <string.h> +#include <fcntl.h> +#include <inttypes.h> +#include <errno.h> +#include <sys/stat.h> +#include <sys/time.h> +#include <sys/times.h> +#include <sys/types.h> +#include <dirent.h> +#include <time.h> +#include <poll.h> + +#include "igt.h" +#include "igt_core.h" +#include "igt_perf.h" + +IGT_TEST_DESCRIPTION("Test the i915 pmu perf interface"); + +const double tolerance = 0.02f; +const unsigned long batch_duration_ns = 100 * 1000 * 1000; + +static int open_pmu(uint64_t config) +{ + int fd; + + fd = perf_i915_open(config); + igt_require(fd >= 0 || (fd < 0 && errno != ENODEV)); + igt_assert(fd >= 0); + + return fd; +} + +static int open_group(uint64_t config, int group) +{ + int fd; + + fd = perf_i915_open_group(config, group); + igt_require(fd >= 0 || (fd < 0 && errno != ENODEV)); + igt_assert(fd >= 0); + + return fd; +} + +static void +init(int gem_fd, const struct intel_execution_engine2 *e, uint8_t sample) +{ + int fd; + + fd = open_pmu(__I915_PMU_ENGINE(e->class, e->instance, sample)); + + close(fd); +} + +static uint64_t pmu_read_single(int fd) +{ + uint64_t data[2]; + ssize_t len; + + len = read(fd, data, sizeof(data)); + igt_assert_eq(len, sizeof(data)); + + return data[0]; +} + +static void pmu_read_multi(int fd, unsigned int num, uint64_t *val) +{ + uint64_t buf[2 + num]; + unsigned int i; + ssize_t len; + + len = read(fd, buf, sizeof(buf)); + igt_assert_eq(len, sizeof(buf)); + for (i = 0; i < num; i++) + val[i] = buf[2 + i]; +} + +#define assert_within_epsilon(x, ref, tolerance) \ + igt_assert_f((double)(x) <= (1.0 + tolerance) * (double)ref && \ + (double)(x) >= (1.0 - tolerance) * (double)ref, \ + "'%s' != '%s' (%f not within %f%% tolerance of %f)\n",\ + #x, #ref, (double)x, tolerance * 100.0, (double)ref) + +static void guaranteed_usleep(unsigned int usec) +{ + uint64_t slept = 0, to_sleep = usec; + + while (usec > 0) { + struct timespec start = { }; + uint64_t this_sleep; + + igt_nsec_elapsed(&start); + usleep(usec); + this_sleep = igt_nsec_elapsed(&start) / 1000; + slept += this_sleep; + if (this_sleep > usec) + break; + usec -= this_sleep; + } + + assert_within_epsilon(slept, to_sleep, tolerance); +} + +static unsigned int e2ring(int gem_fd, const struct intel_execution_engine2 *e) +{ + return gem_class_instance_to_eb_flags(gem_fd, e->class, e->instance); +} + +static void +single(int gem_fd, const struct intel_execution_engine2 *e, uint8_t sample, + bool busy) +{ + double ref = busy && sample == I915_SAMPLE_BUSY ? + batch_duration_ns : 0.0f; + igt_spin_t *spin; + uint64_t val; + int fd; + + fd = open_pmu(__I915_PMU_ENGINE(e->class, e->instance, sample)); + + if (busy) { + spin = igt_spin_batch_new(gem_fd, 0, e2ring(gem_fd, e), 0); + igt_spin_batch_set_timeout(spin, batch_duration_ns); + } else { + guaranteed_usleep(batch_duration_ns / 1000); + } + + if (busy) + gem_sync(gem_fd, spin->handle); + + val = pmu_read_single(fd); + + assert_within_epsilon(val, ref, tolerance); + + if (busy) + igt_spin_batch_free(gem_fd, spin); + close(fd); +} + +static void +queued(int gem_fd, const struct intel_execution_engine2 *e) +{ + igt_spin_t *spin[2]; + uint64_t val; + int fd; + + fd = open_pmu(I915_PMU_ENGINE_QUEUED(e->class, e->instance)); + + spin[0] = igt_spin_batch_new(gem_fd, 0, e2ring(gem_fd, e), 0); + igt_spin_batch_set_timeout(spin[0], batch_duration_ns); + + spin[1] = igt_spin_batch_new(gem_fd, 0, e2ring(gem_fd, e), 0); + igt_spin_batch_set_timeout(spin[1], batch_duration_ns); + + gem_sync(gem_fd, spin[0]->handle); + + val = pmu_read_single(fd); + assert_within_epsilon(val, batch_duration_ns, tolerance); + + gem_sync(gem_fd, spin[1]->handle); + + igt_spin_batch_free(gem_fd, spin[0]); + igt_spin_batch_free(gem_fd, spin[1]); + close(fd); +} + +static void +busy_check_all(int gem_fd, const struct intel_execution_engine2 *e, + const unsigned int num_engines) +{ + const struct intel_execution_engine2 *e_; + uint64_t val[num_engines]; + int fd[num_engines]; + igt_spin_t *spin; + unsigned int busy_idx, i; + + i = 0; + fd[0] = -1; + for_each_engine_class_instance(fd, e_) { + if (!gem_has_engine(gem_fd, e_->class, e_->instance)) + continue; + else if (e == e_) + busy_idx = i; + + fd[i++] = open_group(I915_PMU_ENGINE_BUSY(e_->class, + e_->instance), + fd[0]); + } + + spin = igt_spin_batch_new(gem_fd, 0, e2ring(gem_fd, e), 0); + igt_spin_batch_set_timeout(spin, batch_duration_ns); + + gem_sync(gem_fd, spin->handle); + + pmu_read_multi(fd[0], num_engines, val); + + assert_within_epsilon(val[busy_idx], batch_duration_ns, tolerance); + for (i = 0; i < num_engines; i++) { + if (i == busy_idx) + continue; + assert_within_epsilon(val[i], 0.0f, tolerance); + } + + igt_spin_batch_free(gem_fd, spin); + close(fd[0]); +} + +static void +most_busy_check_all(int gem_fd, const struct intel_execution_engine2 *e, + const unsigned int num_engines) +{ + const struct intel_execution_engine2 *e_; + uint64_t val[num_engines]; + int fd[num_engines]; + igt_spin_t *spin[num_engines]; + unsigned int idle_idx, i; + + gem_require_engine(gem_fd, e->class, e->instance); + + i = 0; + fd[0] = -1; + for_each_engine_class_instance(fd, e_) { + if (!gem_has_engine(gem_fd, e_->class, e_->instance)) + continue; + + fd[i] = open_group(I915_PMU_ENGINE_BUSY(e_->class, + e_->instance), + fd[0]); + + if (e == e_) { + idle_idx = i; + } else { + spin[i] = igt_spin_batch_new(gem_fd, 0, + e2ring(gem_fd, e_), 0); + igt_spin_batch_set_timeout(spin[i], batch_duration_ns); + } + + i++; + } + + for (i = 0; i < num_engines; i++) { + if (i != idle_idx) + gem_sync(gem_fd, spin[i]->handle); + } + + pmu_read_multi(fd[0], num_engines, val); + + for (i = 0; i < num_engines; i++) { + if (i == idle_idx) + assert_within_epsilon(val[i], 0.0f, tolerance); + else + assert_within_epsilon(val[i], batch_duration_ns, + tolerance); + } + + for (i = 0; i < num_engines; i++) { + if (i != idle_idx) + igt_spin_batch_free(gem_fd, spin[i]); + } + close(fd[0]); +} + +static void +all_busy_check_all(int gem_fd, const unsigned int num_engines) +{ + const struct intel_execution_engine2 *e; + uint64_t val[num_engines]; + int fd[num_engines]; + igt_spin_t *spin[num_engines]; + unsigned int i; + + i = 0; + fd[0] = -1; + for_each_engine_class_instance(fd, e) { + if (!gem_has_engine(gem_fd, e->class, e->instance)) + continue; + + fd[i] = open_group(I915_PMU_ENGINE_BUSY(e->class, e->instance), + fd[0]); + + spin[i] = igt_spin_batch_new(gem_fd, 0, e2ring(gem_fd, e), 0); + igt_spin_batch_set_timeout(spin[i], batch_duration_ns); + + i++; + } + + for (i = 0; i < num_engines; i++) + gem_sync(gem_fd, spin[i]->handle); + + pmu_read_multi(fd[0], num_engines, val); + + for (i = 0; i < num_engines; i++) + assert_within_epsilon(val[i], batch_duration_ns, tolerance); + + for (i = 0; i < num_engines; i++) + igt_spin_batch_free(gem_fd, spin[i]); + close(fd[0]); +} + +static void +no_sema(int gem_fd, const struct intel_execution_engine2 *e, bool busy) +{ + igt_spin_t *spin; + uint64_t val[2]; + int fd; + + fd = open_group(I915_PMU_ENGINE_SEMA(e->class, e->instance), -1); + open_group(I915_PMU_ENGINE_WAIT(e->class, e->instance), fd); + + if (busy) { + spin = igt_spin_batch_new(gem_fd, 0, e2ring(gem_fd, e), 0); + igt_spin_batch_set_timeout(spin, batch_duration_ns); + } else { + usleep(batch_duration_ns / 1000); + } + + pmu_read_multi(fd, 2, val); + + assert_within_epsilon(val[0], 0.0f, tolerance); + assert_within_epsilon(val[1], 0.0f, tolerance); + + if (busy) + igt_spin_batch_free(gem_fd, spin); + close(fd); +} + +static void +multi_client(int gem_fd, const struct intel_execution_engine2 *e) +{ + uint64_t config = I915_PMU_ENGINE_BUSY(e->class, e->instance); + igt_spin_t *spin; + uint64_t val[2]; + int fd[2]; + + fd[0] = open_pmu(config); + + spin = igt_spin_batch_new(gem_fd, 0, e2ring(gem_fd, e), 0); + igt_spin_batch_set_timeout(spin, batch_duration_ns); + + guaranteed_usleep(batch_duration_ns / 2000); + + fd[1] = perf_i915_open(config); + igt_assert(fd[1] >= 0); + + gem_sync(gem_fd, spin->handle); + + val[0] = pmu_read_single(fd[0]); + val[1] = pmu_read_single(fd[1]); + close(fd[1]); + + assert_within_epsilon(val[0], batch_duration_ns, tolerance); + assert_within_epsilon(val[1], batch_duration_ns / 2, tolerance); + + igt_spin_batch_free(gem_fd, spin); + close(fd[0]); +} + +/** + * Tests that i915 PMU corectly errors out in invalid initialization. + * i915 PMU is uncore PMU, thus: + * - sampling period is not supported + * - pid > 0 is not supported since we can't count per-process (we count + * per whole system) + * - cpu != 0 is not supported since i915 PMU exposes cpumask for CPU0 + */ +static void invalid_init(void) +{ + struct perf_event_attr attr; + int pid, cpu; + +#define ATTR_INIT() \ +do { \ + memset(&attr, 0, sizeof (attr)); \ + attr.config = I915_PMU_ENGINE_BUSY(I915_ENGINE_CLASS_RENDER, 0); \ + attr.type = i915_type_id(); \ + igt_assert(attr.type != 0); \ +} while(0) + + ATTR_INIT(); + attr.sample_period = 100; + pid = -1; + cpu = 0; + igt_assert_eq(perf_event_open(&attr, pid, cpu, -1, 0), -1); + igt_assert_eq(errno, EINVAL); + + ATTR_INIT(); + pid = 0; + cpu = 0; + igt_assert_eq(perf_event_open(&attr, pid, cpu, -1, 0), -1); + igt_assert_eq(errno, EINVAL); + + ATTR_INIT(); + pid = -1; + cpu = 1; + igt_assert_eq(perf_event_open(&attr, pid, cpu, -1, 0), -1); + igt_assert_eq(errno, ENODEV); +} + +static void init_other(unsigned int i, bool valid) +{ + int fd; + + fd = perf_i915_open(__I915_PMU_OTHER(i)); + igt_require(!(fd < 0 && errno == ENODEV)); + if (valid) { + igt_assert(fd >= 0); + } else { + igt_assert(fd < 0); + return; + } + + close(fd); +} + +static void read_other(unsigned int i, bool valid) +{ + int fd; + + fd = perf_i915_open(__I915_PMU_OTHER(i)); + igt_require(!(fd < 0 && errno == ENODEV)); + if (valid) { + igt_assert(fd >= 0); + } else { + igt_assert(fd < 0); + return; + } + + (void)pmu_read_single(fd); + + close(fd); +} + +static bool cpu0_hotplug_support(void) +{ + int fd = open("/sys/devices/system/cpu/cpu0/online", O_WRONLY); + + close(fd); + + return fd > 0; +} + +static void cpu_hotplug(int gem_fd) +{ + struct timespec start = { }; + igt_spin_t *spin; + uint64_t val, ref; + int fd; + + igt_require(cpu0_hotplug_support()); + + spin = igt_spin_batch_new(gem_fd, 0, I915_EXEC_RENDER, 0); + fd = perf_i915_open(I915_PMU_ENGINE_BUSY(I915_ENGINE_CLASS_RENDER, 0)); + igt_assert(fd >= 0); + + igt_nsec_elapsed(&start); + + igt_fork(child, 1) { + int cpu = 0; + + for (;;) { + char name[128]; + int cpufd; + + sprintf(name, "/sys/devices/system/cpu/cpu%d/online", + cpu); + cpufd = open(name, O_WRONLY); + if (cpufd == -1) { + igt_assert(cpu > 0); + break; + } + igt_assert_eq(write(cpufd, "0", 2), 2); + + usleep(1000 * 1000); + + igt_assert_eq(write(cpufd, "1", 2), 2); + + close(cpufd); + cpu++; + } + } + + igt_waitchildren(); + + igt_spin_batch_end(spin); + gem_sync(gem_fd, spin->handle); + + ref = igt_nsec_elapsed(&start); + val = pmu_read_single(fd); + + assert_within_epsilon(val, ref, tolerance); + + igt_spin_batch_free(gem_fd, spin); + close(fd); +} + +static int chain_nop(int gem_fd, int in_fence, bool sync) +{ + struct drm_i915_gem_exec_object2 obj = {}; + struct drm_i915_gem_execbuffer2 eb = + { .buffer_count = 1, .buffers_ptr = (uintptr_t)&obj}; + const uint32_t bbe = 0xa << 23; + + obj.handle = gem_create(gem_fd, sizeof(bbe)); + gem_write(gem_fd, obj.handle, 0, &bbe, sizeof(bbe)); + + eb.flags = I915_EXEC_RENDER | I915_EXEC_FENCE_OUT; + + if (in_fence >= 0) { + eb.flags |= I915_EXEC_FENCE_IN; + eb.rsvd2 = in_fence; + } + + gem_execbuf_wr(gem_fd, &eb); + + if (sync) + gem_sync(gem_fd, obj.handle); + + gem_close(gem_fd, obj.handle); + if (in_fence >= 0) + close(in_fence); + + return eb.rsvd2 >> 32; +} + +static void +test_interrupts(int gem_fd) +{ + uint64_t idle, busy, prev; + int fd, fence = -1; + const unsigned int count = 1000; + unsigned int i; + + fd = open_pmu(I915_PMU_INTERRUPTS); + + gem_quiescent_gpu(gem_fd); + + /* Wait for idle state. */ + prev = pmu_read_single(fd); + idle = prev + 1; + while (idle != prev) { + usleep(batch_duration_ns / 1000); + prev = idle; + idle = pmu_read_single(fd); + } + + igt_assert_eq(idle - prev, 0); + + /* Send some no-op batches with chained fences to ensure interrupts. */ + for (i = 1; i <= count; i++) + fence = chain_nop(gem_fd, fence, i < count ? false : true); + close(fence); + + /* Check at least as many interrupts has been generated. */ + busy = pmu_read_single(fd); + igt_assert(busy > count - 1); + + close(fd); +} + +static void +test_frequency(int gem_fd) +{ + igt_spin_t *spin; + uint64_t idle[2], busy[2]; + int fd; + + fd = open_group(I915_PMU_REQUESTED_FREQUENCY, -1); + open_group(I915_PMU_ACTUAL_FREQUENCY, fd); + + gem_quiescent_gpu(gem_fd); + usleep(batch_duration_ns / 1000); + + pmu_read_multi(fd, 2, idle); + + spin = igt_spin_batch_new(gem_fd, 0, I915_EXEC_RENDER, 0); + igt_spin_batch_set_timeout(spin, batch_duration_ns); + gem_sync(gem_fd, spin->handle); + + pmu_read_multi(fd, 2, busy); + + igt_assert(busy[0] > idle[0]); + igt_assert(busy[1] > idle[1]); + + igt_spin_batch_free(gem_fd, spin); + close(fd); +} + +static void +test_rc6(int gem_fd) +{ + int64_t duration_ns = 2 * 1000 * 1000 * 1000; + uint64_t idle, busy, prev; + int fd, fw; + + fd = open_pmu(I915_PMU_RC6_RESIDENCY); + + gem_quiescent_gpu(gem_fd); + + /* Go idle and check full RC6. */ + prev = pmu_read_single(fd); + guaranteed_usleep(duration_ns / 1000); + idle = pmu_read_single(fd); + + assert_within_epsilon(idle - prev, duration_ns, tolerance); + + /* Wake up device and check no RC6. */ + fw = igt_open_forcewake_handle(gem_fd); + igt_assert(fw >= 0); + + prev = pmu_read_single(fd); + guaranteed_usleep(duration_ns / 1000); + busy = pmu_read_single(fd); + + assert_within_epsilon(busy - prev, 0.0, tolerance); + + close(fw); + close(fd); +} + +static void +test_rc6p(int gem_fd) +{ + int64_t duration_ns = 2 * 1000 * 1000 * 1000; + unsigned int num_pmu = 1; + uint64_t idle[3], busy[3], prev[3]; + unsigned int i; + int fd, ret, fw; + + fd = open_group(I915_PMU_RC6_RESIDENCY, -1); + ret = perf_i915_open_group(I915_PMU_RC6p_RESIDENCY, fd); + if (ret > 0) { + num_pmu++; + ret = perf_i915_open_group(I915_PMU_RC6pp_RESIDENCY, fd); + if (ret > 0) + num_pmu++; + } + + igt_require(num_pmu == 3); + + gem_quiescent_gpu(gem_fd); + + /* Go idle and check full RC6. */ + pmu_read_multi(fd, num_pmu, prev); + guaranteed_usleep(duration_ns / 1000); + pmu_read_multi(fd, num_pmu, idle); + + for (i = 0; i < num_pmu; i++) + assert_within_epsilon(idle[i] - prev[i], duration_ns, + tolerance); + + /* Wake up device and check no RC6. */ + fw = igt_open_forcewake_handle(gem_fd); + igt_assert(fw >= 0); + + pmu_read_multi(fd, num_pmu, prev); + guaranteed_usleep(duration_ns / 1000); + pmu_read_multi(fd, num_pmu, busy); + + for (i = 0; i < num_pmu; i++) + assert_within_epsilon(busy[i] - prev[i], 0.0, tolerance); + + close(fw); + close(fd); +} + +igt_main +{ + const unsigned int num_other_metrics = + I915_PMU_LAST - __I915_PMU_OTHER(0) + 1; + unsigned int num_engines = 0; + int fd = -1; + const struct intel_execution_engine2 *e; + unsigned int i; + + igt_fixture { + fd = drm_open_driver_master(DRIVER_INTEL); + + igt_require_gem(fd); + igt_require(i915_type_id() > 0); + + for_each_engine_class_instance(fd, e) { + if (gem_has_engine(fd, e->class, e->instance)) + num_engines++; + } + } + + /** + * Test invalid access via perf API is rejected. + */ + igt_subtest("invalid-init") + invalid_init(); + + for_each_engine_class_instance(fd, e) { + /** + * Test that a single engine metric can be initialized. + */ + igt_subtest_f("init-queued-%s", e->name) + init(fd, e, I915_SAMPLE_QUEUED); + + igt_subtest_f("init-busy-%s", e->name) + init(fd, e, I915_SAMPLE_BUSY); + + igt_subtest_f("init-wait-%s", e->name) + init(fd, e, I915_SAMPLE_WAIT); + + igt_subtest_f("init-sema-%s", e->name) + init(fd, e, I915_SAMPLE_SEMA); + + /** + * Test that queued metric works. + */ + igt_subtest_f("queued-%s", e->name) + queued(fd, e); + + /** + * Test that engines show nothing queued when idle or busy. + */ + igt_subtest_f("idle-no-queued-%s", e->name) + single(fd, e, I915_SAMPLE_QUEUED, false); + + igt_subtest_f("busy-no-queued-%s", e->name) + single(fd, e, I915_SAMPLE_QUEUED, true); + + /** + * Test that engines show no load when idle. + */ + igt_subtest_f("idle-%s", e->name) + single(fd, e, I915_SAMPLE_BUSY, false); + + /** + * Test that a single engine reports load correctly. + */ + igt_subtest_f("busy-%s", e->name) + single(fd, e, I915_SAMPLE_BUSY, true); + + /** + * Test that when one engine is loaded other report no load. + */ + igt_subtest_f("busy-check-all-%s", e->name) + busy_check_all(fd, e, num_engines); + + /** + * Test that when all except one engine are loaded all loads + * are correctly reported. + */ + igt_subtest_f("most-busy-check-all-%s", e->name) + most_busy_check_all(fd, e, num_engines); + + /** + * Test that semphore counters report no activity on idle + * or busy engines. + */ + igt_subtest_f("idle-no-semaphores-%s", e->name) + no_sema(fd, e, false); + + igt_subtest_f("busy-no-semaphores-%s", e->name) + no_sema(fd, e, true); + + /** + * Check that two perf clients do not influence each others + * observations. + */ + igt_subtest_f("multi-client-%s", e->name) + multi_client(fd, e); + } + + /** + * Test that when all engines are loaded all loads are + * correctly reported. + */ + igt_subtest("all-busy-check-all") + all_busy_check_all(fd, num_engines); + + /** + * Test that non-engine counters can be initialized and read. Apart + * from the invalid metric which should fail. + */ + for (i = 0; i < num_other_metrics + 1; i++) { + igt_subtest_f("other-init-%u", i) + init_other(i, i < num_other_metrics); + + igt_subtest_f("other-read-%u", i) + read_other(i, i < num_other_metrics); + } + + /** + * Test counters are not affected by CPU offline/online events. + */ + igt_subtest("cpu-hotplug") + cpu_hotplug(fd); + + /** + * Test GPU frequency. + */ + igt_subtest("frequency") + test_frequency(fd); + + /** + * Test interrupt count reporting. + */ + igt_subtest("interrupts") + test_interrupts(fd); + + /** + * Test RC6 residency reporting. + */ + igt_subtest("rc6") + test_rc6(fd); + + /** + * Test RC6p residency reporting. + */ + igt_subtest("rc6p") + test_rc6p(fd); +} -- 2.9.5 _______________________________________________ Intel-gfx mailing list Intel-gfx@xxxxxxxxxxxxxxxxxxxxx https://lists.freedesktop.org/mailman/listinfo/intel-gfx