Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright © 2011 Intel Corporation |
| 3 | * |
| 4 | * Permission is hereby granted, free of charge, to any person obtaining a |
| 5 | * copy of this software and associated documentation files (the "Software"), |
| 6 | * to deal in the Software without restriction, including without limitation |
| 7 | * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
| 8 | * and/or sell copies of the Software, and to permit persons to whom the |
| 9 | * Software is furnished to do so, subject to the following conditions: |
| 10 | * |
| 11 | * The above copyright notice and this permission notice (including the next |
| 12 | * paragraph) shall be included in all copies or substantial portions of the |
| 13 | * Software. |
| 14 | * |
| 15 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| 16 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| 17 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
| 18 | * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
| 19 | * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING |
| 20 | * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS |
| 21 | * IN THE SOFTWARE. |
| 22 | * |
| 23 | * Authors: |
| 24 | * Chris Wilson <chris@chris-wilson.co.uk> |
| 25 | * |
| 26 | */ |
| 27 | |
Thomas Wood | 804e11f | 2015-08-17 17:57:43 +0100 | [diff] [blame] | 28 | #include "igt.h" |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 29 | #include <unistd.h> |
| 30 | #include <stdlib.h> |
| 31 | #include <stdint.h> |
| 32 | #include <stdio.h> |
| 33 | #include <string.h> |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 34 | #include <fcntl.h> |
| 35 | #include <inttypes.h> |
| 36 | #include <errno.h> |
| 37 | #include <sys/stat.h> |
| 38 | #include <sys/ioctl.h> |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 39 | #include <sys/time.h> |
Chris Wilson | b430709 | 2015-07-01 13:53:07 +0100 | [diff] [blame] | 40 | #include <time.h> |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 41 | #include "drm.h" |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 42 | |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 43 | #define LOCAL_I915_EXEC_NO_RELOC (1<<11) |
| 44 | #define LOCAL_I915_EXEC_HANDLE_LUT (1<<12) |
| 45 | |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 46 | #define LOCAL_I915_EXEC_BSD_SHIFT (13) |
| 47 | #define LOCAL_I915_EXEC_BSD_MASK (3 << LOCAL_I915_EXEC_BSD_SHIFT) |
Daniel Vetter | 51f0830 | 2012-12-05 19:29:11 +0100 | [diff] [blame] | 48 | |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 49 | #define ENGINE_FLAGS (I915_EXEC_RING_MASK | LOCAL_I915_EXEC_BSD_MASK) |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 50 | |
/*
 * Return the interval between two timestamps, in seconds.
 *
 * The whole-second difference and the nanosecond difference are computed
 * separately; the nanosecond part is scaled by 1e-9 and added on, so the
 * result is a fractional number of seconds (negative if @end precedes
 * @start).
 */
static double elapsed(const struct timespec *start, const struct timespec *end)
{
	double whole = end->tv_sec - start->tv_sec;
	double frac = (end->tv_nsec - start->tv_nsec)*1e-9;

	return whole + frac;
}
| 56 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 57 | static double nop_on_ring(int fd, uint32_t handle, unsigned ring_id, |
| 58 | int timeout, unsigned long *out) |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 59 | { |
| 60 | struct drm_i915_gem_execbuffer2 execbuf; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 61 | struct drm_i915_gem_exec_object2 obj; |
| 62 | struct timespec start, now; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 63 | unsigned long count; |
Daniel Vetter | 8f5387e | 2013-08-13 13:20:58 +0200 | [diff] [blame] | 64 | |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 65 | memset(&obj, 0, sizeof(obj)); |
| 66 | obj.handle = handle; |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 67 | |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 68 | memset(&execbuf, 0, sizeof(execbuf)); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 69 | execbuf.buffers_ptr = (uintptr_t)&obj; |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 70 | execbuf.buffer_count = 1; |
| 71 | execbuf.flags = ring_id; |
| 72 | execbuf.flags |= LOCAL_I915_EXEC_HANDLE_LUT; |
| 73 | execbuf.flags |= LOCAL_I915_EXEC_NO_RELOC; |
Chris Wilson | 3e2443f | 2016-03-10 11:50:53 +0000 | [diff] [blame] | 74 | if (__gem_execbuf(fd, &execbuf)) { |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 75 | execbuf.flags = ring_id; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 76 | gem_execbuf(fd, &execbuf); |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 77 | } |
| 78 | gem_sync(fd, handle); |
| 79 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 80 | count = 0; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 81 | clock_gettime(CLOCK_MONOTONIC, &start); |
| 82 | do { |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 83 | for (int loop = 0; loop < 1024; loop++) |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 84 | gem_execbuf(fd, &execbuf); |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 85 | |
| 86 | count += 1024; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 87 | clock_gettime(CLOCK_MONOTONIC, &now); |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 88 | } while (elapsed(&start, &now) < timeout); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 89 | gem_sync(fd, handle); |
| 90 | clock_gettime(CLOCK_MONOTONIC, &now); |
| 91 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 92 | *out = count; |
| 93 | return elapsed(&start, &now); |
| 94 | } |
| 95 | |
/*
 * Subtest body for one ring: require that @ring_id is usable on @fd, run
 * nop_on_ring() on it with a 20 second timeout, and log the cycle count
 * together with the mean time per cycle in microseconds under @ring_name.
 */
static void single(int fd, uint32_t handle,
		   unsigned ring_id, const char *ring_name)
{
	unsigned long cycles;
	double seconds;

	gem_require_ring(fd, ring_id);

	seconds = nop_on_ring(fd, handle, ring_id, 20, &cycles);
	igt_info("%s: %'lu cycles: %.3fus\n",
		 ring_name, cycles, seconds*1e6 / cycles);
}
| 108 | |
Chris Wilson | 0aacdac | 2016-03-09 21:06:16 +0000 | [diff] [blame] | 109 | static bool ignore_engine(int fd, unsigned engine) |
| 110 | { |
| 111 | if (engine == 0) |
| 112 | return true; |
| 113 | |
| 114 | if (gem_has_bsd2(fd) && engine == I915_EXEC_BSD) |
| 115 | return true; |
| 116 | |
| 117 | return false; |
| 118 | } |
| 119 | |
Chris Wilson | 772393e | 2016-03-14 14:31:36 +0000 | [diff] [blame] | 120 | static void all(int fd, uint32_t handle, int timeout) |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 121 | { |
| 122 | struct drm_i915_gem_execbuffer2 execbuf; |
| 123 | struct drm_i915_gem_exec_object2 obj; |
| 124 | struct timespec start, now; |
| 125 | unsigned engines[16]; |
| 126 | unsigned nengine; |
| 127 | unsigned engine; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 128 | unsigned long count; |
Chris Wilson | 41a26b5 | 2016-03-28 16:26:01 +0100 | [diff] [blame^] | 129 | double time, max = 0, min = HUGE_VAL, sum = 0; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 130 | const char *name; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 131 | |
| 132 | nengine = 0; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 133 | for_each_engine(fd, engine) { |
| 134 | if (ignore_engine(fd, engine)) |
| 135 | continue; |
| 136 | |
| 137 | time = nop_on_ring(fd, handle, engine, 1, &count) / count; |
| 138 | if (time > max) { |
| 139 | name = e__->name; |
| 140 | max = time; |
| 141 | } |
Chris Wilson | 41a26b5 | 2016-03-28 16:26:01 +0100 | [diff] [blame^] | 142 | if (time < min) |
| 143 | min = time; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 144 | sum += time; |
| 145 | engines[nengine++] = engine; |
| 146 | } |
Chris Wilson | 0aacdac | 2016-03-09 21:06:16 +0000 | [diff] [blame] | 147 | igt_require(nengine); |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 148 | igt_info("Maximum execution latency on %s, %.3fus, total %.3fus per cycle\n", |
| 149 | name, max*1e6, sum*1e6); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 150 | |
| 151 | memset(&obj, 0, sizeof(obj)); |
| 152 | obj.handle = handle; |
| 153 | |
| 154 | memset(&execbuf, 0, sizeof(execbuf)); |
| 155 | execbuf.buffers_ptr = (uintptr_t)&obj; |
| 156 | execbuf.buffer_count = 1; |
| 157 | execbuf.flags |= LOCAL_I915_EXEC_HANDLE_LUT; |
| 158 | execbuf.flags |= LOCAL_I915_EXEC_NO_RELOC; |
Chris Wilson | 3e2443f | 2016-03-10 11:50:53 +0000 | [diff] [blame] | 159 | if (__gem_execbuf(fd, &execbuf)) { |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 160 | execbuf.flags = 0; |
| 161 | gem_execbuf(fd, &execbuf); |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 162 | } |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 163 | gem_sync(fd, handle); |
| 164 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 165 | count = 0; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 166 | clock_gettime(CLOCK_MONOTONIC, &start); |
| 167 | do { |
| 168 | for (int loop = 0; loop < 1024; loop++) { |
| 169 | for (int n = 0; n < nengine; n++) { |
| 170 | execbuf.flags &= ~ENGINE_FLAGS; |
| 171 | execbuf.flags |= engines[n]; |
| 172 | gem_execbuf(fd, &execbuf); |
| 173 | } |
| 174 | } |
| 175 | count += nengine * 1024; |
| 176 | clock_gettime(CLOCK_MONOTONIC, &now); |
Chris Wilson | 772393e | 2016-03-14 14:31:36 +0000 | [diff] [blame] | 177 | } while (elapsed(&start, &now) < timeout); /* Hang detection ~120s */ |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 178 | gem_sync(fd, handle); |
| 179 | clock_gettime(CLOCK_MONOTONIC, &now); |
| 180 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 181 | time = elapsed(&start, &now) / count; |
| 182 | igt_info("All (%d engines): %'lu cycles, average %.3fus per cycle\n", |
| 183 | nengine, count, 1e6*time); |
Chris Wilson | 41a26b5 | 2016-03-28 16:26:01 +0100 | [diff] [blame^] | 184 | |
| 185 | /* The rate limiting step is how fast the slowest engine can |
| 186 | * its queue of requests, if we wait upon a full ring all dispatch |
| 187 | * is frozen. So in general we cannot go faster than the slowest |
| 188 | * engine, but we should equally not go any slower. |
| 189 | */ |
| 190 | igt_assert(time < max + min); /* ensure parallel execution */ |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 191 | } |
Daniel Vetter | 8f5387e | 2013-08-13 13:20:58 +0200 | [diff] [blame] | 192 | |
Daniel Vetter | 071e9ca | 2013-10-31 16:23:26 +0100 | [diff] [blame] | 193 | igt_main |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 194 | { |
Chris Wilson | 7e0853c | 2016-01-27 14:17:53 +0000 | [diff] [blame] | 195 | const struct intel_execution_engine *e; |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 196 | uint32_t handle = 0; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 197 | int device = -1; |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 198 | |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 199 | igt_fixture { |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 200 | const uint32_t bbe = MI_BATCH_BUFFER_END; |
| 201 | |
Micah Fedke | c81d293 | 2015-07-22 21:54:02 +0000 | [diff] [blame] | 202 | device = drm_open_driver(DRIVER_INTEL); |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 203 | handle = gem_create(device, 4096); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 204 | gem_write(device, handle, 0, &bbe, sizeof(bbe)); |
Daniel Vetter | b3880d3 | 2013-08-14 18:02:46 +0200 | [diff] [blame] | 205 | } |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 206 | |
Chris Wilson | 9d61a68 | 2016-03-25 18:22:54 +0000 | [diff] [blame] | 207 | igt_fork_hang_detector(device); |
| 208 | |
Chris Wilson | 772393e | 2016-03-14 14:31:36 +0000 | [diff] [blame] | 209 | igt_subtest("basic") |
| 210 | all(device, handle, 10); |
| 211 | |
Chris Wilson | 7e0853c | 2016-01-27 14:17:53 +0000 | [diff] [blame] | 212 | for (e = intel_execution_engines; e->name; e++) |
| 213 | igt_subtest_f("%s", e->name) |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 214 | single(device, handle, e->exec_id | e->flags, e->name); |
| 215 | |
Chris Wilson | 772393e | 2016-03-14 14:31:36 +0000 | [diff] [blame] | 216 | igt_subtest("all") |
| 217 | all(device, handle, 150); |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 218 | |
Chris Wilson | 9d61a68 | 2016-03-25 18:22:54 +0000 | [diff] [blame] | 219 | igt_stop_hang_detector(); |
| 220 | |
Daniel Vetter | b3880d3 | 2013-08-14 18:02:46 +0200 | [diff] [blame] | 221 | igt_fixture { |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 222 | gem_close(device, handle); |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 223 | close(device); |
Daniel Vetter | b3880d3 | 2013-08-14 18:02:46 +0200 | [diff] [blame] | 224 | } |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 225 | } |