summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorChris Wilson <chris@chris-wilson.co.uk>2016-08-28 16:45:22 +0100
committerChris Wilson <chris@chris-wilson.co.uk>2016-08-28 18:25:07 +0100
commit93b8ad80f2691ae15dea78401db2b32d8cef7354 (patch)
treee9d106cd8767ff7b0d46d3196c0b65f6a6f9da8b
parent9d5e393da3f58c4d7bbdb61c96b01416e043836f (diff)
benchmarks/gem_busy: Exercise the busy ioctl
And include poll(dmabuf) for comparison. Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
-rw-r--r--benchmarks/Makefile.sources1
-rw-r--r--benchmarks/ezbench.d/gem_busy.test29
-rw-r--r--benchmarks/gem_busy.c274
3 files changed, 304 insertions, 0 deletions
diff --git a/benchmarks/Makefile.sources b/benchmarks/Makefile.sources
index 00d84ae8..f69d4f10 100644
--- a/benchmarks/Makefile.sources
+++ b/benchmarks/Makefile.sources
@@ -2,6 +2,7 @@ benchmarksdir=$(libexecdir)/intel-gpu-tools/benchmarks
benchmarks_prog_list = \
gem_blt \
+ gem_busy \
gem_create \
gem_exec_ctx \
gem_exec_fault \
diff --git a/benchmarks/ezbench.d/gem_busy.test b/benchmarks/ezbench.d/gem_busy.test
new file mode 100644
index 00000000..ae66b977
--- /dev/null
+++ b/benchmarks/ezbench.d/gem_busy.test
@@ -0,0 +1,29 @@
+[ -e $IGT_BENCHMARKS/gem_busy ] || return 1
+sudo -n true || return 1
+
+for ring in rcs bcs vcs vecs all; do
+while read label mode; do
+ name="gem:busy:$label:$ring"
+ test_name="$test_name $name"
+ eval "${name}_run() { sudo $IGT_BENCHMARKS/gem_busy $mode -e $ring -r \$1 ; }"
+
+ name="gem:busy:$label:$ring:forked"
+ test_name="$test_name $name"
+ eval "${name}_run() { sudo $IGT_BENCHMARKS/gem_busy $mode -f -e $ring -r \$1 ; }"
+
+ name="gem:busy:$label:$ring:dmabuf"
+ test_name="$test_name $name"
+ eval "${name}_run() { sudo $IGT_BENCHMARKS/gem_busy $mode -d -e $ring -r \$1 ; }"
+
+ name="gem:busy:$label:$ring:dmabuf:forked"
+ test_name="$test_name $name"
+ eval "${name}_run() { sudo $IGT_BENCHMARKS/gem_busy $mode -d -f -e $ring -r \$1 ; }"
+done<<MODES
+read
+write -W
+idle -I
+MODES
+done
+
+test_exec_time=3
+test_invert=1
diff --git a/benchmarks/gem_busy.c b/benchmarks/gem_busy.c
new file mode 100644
index 00000000..a6ff2361
--- /dev/null
+++ b/benchmarks/gem_busy.c
@@ -0,0 +1,274 @@
+/*
+ * Copyright © 2011 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
+ * IN THE SOFTWARE.
+ *
+ * Authors:
+ * Chris Wilson <chris@chris-wilson.co.uk>
+ *
+ */
+
+#include <unistd.h>
+#include <stdlib.h>
+#include <stdint.h>
+#include <stdio.h>
+#include <string.h>
+#include <fcntl.h>
+#include <inttypes.h>
+#include <errno.h>
+#include <sys/stat.h>
+#include <sys/poll.h>
+#include <sys/ioctl.h>
+#include <sys/time.h>
+#include <time.h>
+
+#include "drm.h"
+#include "ioctl_wrappers.h"
+#include "drmtest.h"
+#include "intel_chipset.h"
+#include "igt_stats.h"
+
+#define LOCAL_I915_EXEC_NO_RELOC (1<<11)
+#define LOCAL_I915_EXEC_HANDLE_LUT (1<<12)
+
+#define LOCAL_I915_EXEC_BSD_SHIFT (13)
+#define LOCAL_I915_EXEC_BSD_MASK (3 << LOCAL_I915_EXEC_BSD_SHIFT)
+
+#define ENGINE_FLAGS (I915_EXEC_RING_MASK | LOCAL_I915_EXEC_BSD_MASK)
+
+#define WRITE 0x1
+#define IDLE 0x2
+#define DMABUF 0x2
+
+static bool gem_busy(int fd, uint32_t handle)
+{
+ struct drm_i915_gem_busy busy;
+
+ memset(&busy, 0, sizeof(busy));
+ busy.handle = handle;
+
+ do_ioctl(fd, DRM_IOCTL_I915_GEM_BUSY, &busy);
+
+ return busy.busy != 0;
+}
+
+static double elapsed(const struct timespec *start,
+ const struct timespec *end)
+{
+ return 1e9*(end->tv_sec - start->tv_sec) +
+ (end->tv_nsec - start->tv_nsec);
+}
+
+static int loop(unsigned ring, int reps, int ncpus, unsigned flags)
+{
+ struct drm_i915_gem_execbuffer2 execbuf;
+ struct drm_i915_gem_exec_object2 obj[2];
+ struct drm_i915_gem_relocation_entry reloc[2];
+ unsigned engines[16];
+ unsigned nengine;
+ uint32_t *batch;
+ double *shared;
+ int fd, i, gen;
+ int dmabuf;
+
+ shared = mmap(0, 4096, PROT_WRITE, MAP_SHARED | MAP_ANON, -1, 0);
+
+ fd = drm_open_driver(DRIVER_INTEL);
+ gen = intel_gen(intel_get_drm_devid(fd));
+
+ memset(obj, 0, sizeof(obj));
+ obj[0].handle = gem_create(fd, 4096);
+ if (flags & WRITE)
+ obj[0].flags = EXEC_OBJECT_WRITE;
+ obj[1].handle = gem_create(fd, 4096);
+ if (gem_mmap__has_wc(fd))
+ batch = gem_mmap__wc(fd, obj[1].handle, 0, 4096, PROT_WRITE);
+ else
+ batch = gem_mmap__gtt(fd, obj[1].handle, 4096, PROT_WRITE);
+ gem_set_domain(fd, obj[1].handle,
+ I915_GEM_DOMAIN_GTT, I915_GEM_DOMAIN_GTT);
+ batch[0] = MI_BATCH_BUFFER_END;
+
+ memset(&execbuf, 0, sizeof(execbuf));
+ execbuf.buffers_ptr = (uintptr_t)obj;
+ execbuf.buffer_count = 2;
+ execbuf.flags |= LOCAL_I915_EXEC_HANDLE_LUT;
+ execbuf.flags |= LOCAL_I915_EXEC_NO_RELOC;
+ if (__gem_execbuf(fd, &execbuf)) {
+ execbuf.flags = 0;
+ if (__gem_execbuf(fd, &execbuf))
+ return 77;
+ }
+
+ if (ring == -1) {
+ nengine = 0;
+ for (ring = 1; ring < 16; ring++) {
+ execbuf.flags &= ~ENGINE_FLAGS;
+ execbuf.flags |= ring;
+ if (__gem_execbuf(fd, &execbuf) == 0)
+ engines[nengine++] = ring;
+ }
+ } else {
+ nengine = 1;
+ engines[0] = ring;
+ }
+
+ obj[1].relocs_ptr = (uintptr_t)reloc;
+ obj[1].relocation_count = 2;
+
+ if (flags & DMABUF)
+ dmabuf = prime_handle_to_fd(fd, obj[0].handle);
+
+ gem_set_domain(fd, obj[1].handle,
+ I915_GEM_DOMAIN_GTT, I915_GEM_DOMAIN_GTT);
+
+ reloc[0].target_handle = obj[1].handle; /* recurse */
+ reloc[0].presumed_offset = obj[1].offset;
+ reloc[0].offset = sizeof(uint32_t);
+ reloc[0].delta = 0;
+ if (gen < 4)
+ reloc[0].delta = 1;
+ reloc[0].read_domains = I915_GEM_DOMAIN_COMMAND;
+ reloc[0].write_domain = 0;
+
+ reloc[1].target_handle = obj[0].handle;
+ reloc[1].presumed_offset = obj[0].offset;
+ reloc[1].offset = 1024;
+ reloc[1].delta = 0;
+ reloc[1].read_domains = I915_GEM_DOMAIN_RENDER;
+ reloc[1].write_domain = 0;
+ if (flags & WRITE)
+ reloc[1].write_domain = I915_GEM_DOMAIN_RENDER;
+
+ while (reps--) {
+ memset(shared, 0, 4096);
+
+ gem_set_domain(fd, obj[1].handle,
+ I915_GEM_DOMAIN_GTT, I915_GEM_DOMAIN_GTT);
+ sleep(1); /* wait for the hw to go back to sleep */
+ batch[i = 0] = MI_BATCH_BUFFER_START;
+ if (gen >= 8) {
+ batch[i] |= 1 << 8 | 1;
+ batch[++i] = obj[1].offset;
+ batch[++i] = obj[1].offset >> 32;
+ } else if (gen >= 6) {
+ batch[i] |= 1 << 8;
+ batch[++i] = obj[1].offset;
+ } else {
+ batch[i] |= 2 << 6;
+ batch[++i] = obj[1].offset;
+ if (gen < 4)
+ batch[i] |= 1;
+ }
+
+ if ((flags & IDLE) == 0) {
+ for (int n = 0; n < nengine; n++) {
+ execbuf.flags &= ~ENGINE_FLAGS;
+ execbuf.flags |= engines[n];
+ gem_execbuf(fd, &execbuf);
+ }
+ }
+
+ igt_fork(child, ncpus) {
+ struct timespec start, end;
+ unsigned count = 0;
+
+ clock_gettime(CLOCK_MONOTONIC, &start);
+ do {
+ if (flags & DMABUF) {
+ struct pollfd pfd = { .fd = dmabuf, .events = POLLOUT };
+ for (int inner = 0; inner < 1024; inner++)
+ poll(&pfd, 1, 0);
+ } else {
+ for (int inner = 0; inner < 1024; inner++)
+ gem_busy(fd, obj[0].handle);
+ }
+
+ clock_gettime(CLOCK_MONOTONIC, &end);
+ count += 1024;
+ } while (elapsed(&start, &end) < 2e9);
+
+ clock_gettime(CLOCK_MONOTONIC, &end);
+ shared[child] = elapsed(&start, &end) / count;
+ }
+ igt_waitchildren();
+
+ batch[0] = MI_BATCH_BUFFER_END;
+
+ for (int child = 0; child < ncpus; child++)
+ shared[ncpus] += shared[child];
+ printf("%7.3f\n", shared[ncpus] / ncpus);
+ }
+ return 0;
+}
+
+int main(int argc, char **argv)
+{
+ unsigned ring = I915_EXEC_RENDER;
+ unsigned flags = 0;
+ int reps = 1;
+ int ncpus = 1;
+ int c;
+
+ while ((c = getopt (argc, argv, "e:r:dfWI")) != -1) {
+ switch (c) {
+ case 'e':
+ if (strcmp(optarg, "rcs") == 0)
+ ring = I915_EXEC_RENDER;
+ else if (strcmp(optarg, "vcs") == 0)
+ ring = I915_EXEC_BSD;
+ else if (strcmp(optarg, "bcs") == 0)
+ ring = I915_EXEC_BLT;
+ else if (strcmp(optarg, "vecs") == 0)
+ ring = I915_EXEC_VEBOX;
+ else if (strcmp(optarg, "all") == 0)
+ ring = -1;
+ else
+ ring = atoi(optarg);
+ break;
+
+ case 'r':
+ reps = atoi(optarg);
+ if (reps < 1)
+ reps = 1;
+ break;
+
+ case 'f':
+ ncpus = sysconf(_SC_NPROCESSORS_ONLN);
+ break;
+
+ case 'd':
+ flags |= DMABUF;
+ break;
+
+ case 'W':
+ flags |= WRITE;
+ break;
+
+ case 'I':
+ flags |= IDLE;
+ break;
+ default:
+ break;
+ }
+ }
+
+ return loop(ring, reps, ncpus, flags);
+}