Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright © 2011 Intel Corporation |
| 3 | * |
| 4 | * Permission is hereby granted, free of charge, to any person obtaining a |
| 5 | * copy of this software and associated documentation files (the "Software"), |
| 6 | * to deal in the Software without restriction, including without limitation |
| 7 | * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
| 8 | * and/or sell copies of the Software, and to permit persons to whom the |
| 9 | * Software is furnished to do so, subject to the following conditions: |
| 10 | * |
| 11 | * The above copyright notice and this permission notice (including the next |
| 12 | * paragraph) shall be included in all copies or substantial portions of the |
| 13 | * Software. |
| 14 | * |
| 15 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| 16 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| 17 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
| 18 | * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
| 19 | * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING |
| 20 | * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS |
| 21 | * IN THE SOFTWARE. |
| 22 | * |
| 23 | * Authors: |
| 24 | * Chris Wilson <chris@chris-wilson.co.uk> |
| 25 | * |
| 26 | */ |
| 27 | |
Thomas Wood | 804e11f | 2015-08-17 17:57:43 +0100 | [diff] [blame] | 28 | #include "igt.h" |
Chris Wilson | c6e26e4 | 2016-07-22 12:58:54 +0100 | [diff] [blame] | 29 | #include "igt_sysfs.h" |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 30 | #include <unistd.h> |
| 31 | #include <stdlib.h> |
| 32 | #include <stdint.h> |
| 33 | #include <stdio.h> |
| 34 | #include <string.h> |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 35 | #include <fcntl.h> |
| 36 | #include <inttypes.h> |
| 37 | #include <errno.h> |
| 38 | #include <sys/stat.h> |
| 39 | #include <sys/ioctl.h> |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 40 | #include <sys/time.h> |
Chris Wilson | b430709 | 2015-07-01 13:53:07 +0100 | [diff] [blame] | 41 | #include <time.h> |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 42 | #include "drm.h" |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 43 | |
/* Local definitions of two execbuffer flag bits (bits 11 and 12). */
#define LOCAL_I915_EXEC_NO_RELOC	(1 << 11)
#define LOCAL_I915_EXEC_HANDLE_LUT	(1 << 12)

/* Two-bit field starting at bit 13 of the execbuffer flags. */
#define LOCAL_I915_EXEC_BSD_SHIFT	(13)
#define LOCAL_I915_EXEC_BSD_MASK	(3 << LOCAL_I915_EXEC_BSD_SHIFT)

/*
 * Bits cleared from execbuf.flags before a new engine selector is OR-ed in
 * (see the submission loop in all()).
 */
#define ENGINE_FLAGS	(I915_EXEC_RING_MASK | LOCAL_I915_EXEC_BSD_MASK)
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 51 | |
/*
 * Return the interval from @start to @end in seconds.
 *
 * The whole-second and nanosecond fields are differenced separately; the
 * nanosecond difference is scaled by 1e-9 and added to the seconds. The
 * result is negative when @end precedes @start.
 */
static double elapsed(const struct timespec *start, const struct timespec *end)
{
	const double secs = end->tv_sec - start->tv_sec;
	const double nsecs = end->tv_nsec - start->tv_nsec;

	return secs + nsecs * 1e-9;
}
| 57 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 58 | static double nop_on_ring(int fd, uint32_t handle, unsigned ring_id, |
| 59 | int timeout, unsigned long *out) |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 60 | { |
| 61 | struct drm_i915_gem_execbuffer2 execbuf; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 62 | struct drm_i915_gem_exec_object2 obj; |
| 63 | struct timespec start, now; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 64 | unsigned long count; |
Daniel Vetter | 8f5387e | 2013-08-13 13:20:58 +0200 | [diff] [blame] | 65 | |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 66 | memset(&obj, 0, sizeof(obj)); |
| 67 | obj.handle = handle; |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 68 | |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 69 | memset(&execbuf, 0, sizeof(execbuf)); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 70 | execbuf.buffers_ptr = (uintptr_t)&obj; |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 71 | execbuf.buffer_count = 1; |
| 72 | execbuf.flags = ring_id; |
| 73 | execbuf.flags |= LOCAL_I915_EXEC_HANDLE_LUT; |
| 74 | execbuf.flags |= LOCAL_I915_EXEC_NO_RELOC; |
Chris Wilson | 3e2443f | 2016-03-10 11:50:53 +0000 | [diff] [blame] | 75 | if (__gem_execbuf(fd, &execbuf)) { |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 76 | execbuf.flags = ring_id; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 77 | gem_execbuf(fd, &execbuf); |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 78 | } |
| 79 | gem_sync(fd, handle); |
Chris Wilson | 71f4153 | 2016-04-22 16:55:29 +0100 | [diff] [blame] | 80 | intel_detect_and_clear_missed_interrupts(fd); |
Chris Wilson | cd8d380 | 2015-03-24 09:15:12 +0000 | [diff] [blame] | 81 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 82 | count = 0; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 83 | clock_gettime(CLOCK_MONOTONIC, &start); |
| 84 | do { |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 85 | for (int loop = 0; loop < 1024; loop++) |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 86 | gem_execbuf(fd, &execbuf); |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 87 | |
| 88 | count += 1024; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 89 | clock_gettime(CLOCK_MONOTONIC, &now); |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 90 | } while (elapsed(&start, &now) < timeout); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 91 | gem_sync(fd, handle); |
| 92 | clock_gettime(CLOCK_MONOTONIC, &now); |
Chris Wilson | 71f4153 | 2016-04-22 16:55:29 +0100 | [diff] [blame] | 93 | igt_assert_eq(intel_detect_and_clear_missed_interrupts(fd), 0); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 94 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 95 | *out = count; |
| 96 | return elapsed(&start, &now); |
| 97 | } |
| 98 | |
/*
 * Subtest body: time no-op submission on one ring for 20 seconds and log
 * the cycle count and the average time per cycle in microseconds.
 *
 * @fd:        DRM device file descriptor
 * @handle:    GEM handle of the batch buffer to execute
 * @ring_id:   execbuffer flags selecting the ring
 * @ring_name: label used in the log line
 */
static void single(int fd, uint32_t handle,
		   unsigned ring_id, const char *ring_name)
{
	unsigned long cycles;
	double seconds;

	gem_require_ring(fd, ring_id);

	seconds = nop_on_ring(fd, handle, ring_id, 20, &cycles);
	igt_info("%s: %'lu cycles: %.3fus\n",
		 ring_name, cycles, seconds * 1e6 / cycles);
}
| 111 | |
Chris Wilson | 0aacdac | 2016-03-09 21:06:16 +0000 | [diff] [blame] | 112 | static bool ignore_engine(int fd, unsigned engine) |
| 113 | { |
| 114 | if (engine == 0) |
| 115 | return true; |
| 116 | |
| 117 | if (gem_has_bsd2(fd) && engine == I915_EXEC_BSD) |
| 118 | return true; |
| 119 | |
| 120 | return false; |
| 121 | } |
| 122 | |
Chris Wilson | 772393e | 2016-03-14 14:31:36 +0000 | [diff] [blame] | 123 | static void all(int fd, uint32_t handle, int timeout) |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 124 | { |
| 125 | struct drm_i915_gem_execbuffer2 execbuf; |
| 126 | struct drm_i915_gem_exec_object2 obj; |
| 127 | struct timespec start, now; |
| 128 | unsigned engines[16]; |
| 129 | unsigned nengine; |
| 130 | unsigned engine; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 131 | unsigned long count; |
Chris Wilson | 41a26b5 | 2016-03-28 16:26:01 +0100 | [diff] [blame] | 132 | double time, max = 0, min = HUGE_VAL, sum = 0; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 133 | const char *name; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 134 | |
| 135 | nengine = 0; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 136 | for_each_engine(fd, engine) { |
| 137 | if (ignore_engine(fd, engine)) |
| 138 | continue; |
| 139 | |
| 140 | time = nop_on_ring(fd, handle, engine, 1, &count) / count; |
| 141 | if (time > max) { |
| 142 | name = e__->name; |
| 143 | max = time; |
| 144 | } |
Chris Wilson | 41a26b5 | 2016-03-28 16:26:01 +0100 | [diff] [blame] | 145 | if (time < min) |
| 146 | min = time; |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 147 | sum += time; |
| 148 | engines[nengine++] = engine; |
| 149 | } |
Chris Wilson | 0aacdac | 2016-03-09 21:06:16 +0000 | [diff] [blame] | 150 | igt_require(nengine); |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 151 | igt_info("Maximum execution latency on %s, %.3fus, total %.3fus per cycle\n", |
| 152 | name, max*1e6, sum*1e6); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 153 | |
| 154 | memset(&obj, 0, sizeof(obj)); |
| 155 | obj.handle = handle; |
| 156 | |
| 157 | memset(&execbuf, 0, sizeof(execbuf)); |
| 158 | execbuf.buffers_ptr = (uintptr_t)&obj; |
| 159 | execbuf.buffer_count = 1; |
| 160 | execbuf.flags |= LOCAL_I915_EXEC_HANDLE_LUT; |
| 161 | execbuf.flags |= LOCAL_I915_EXEC_NO_RELOC; |
Chris Wilson | 3e2443f | 2016-03-10 11:50:53 +0000 | [diff] [blame] | 162 | if (__gem_execbuf(fd, &execbuf)) { |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 163 | execbuf.flags = 0; |
| 164 | gem_execbuf(fd, &execbuf); |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 165 | } |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 166 | gem_sync(fd, handle); |
Chris Wilson | 71f4153 | 2016-04-22 16:55:29 +0100 | [diff] [blame] | 167 | intel_detect_and_clear_missed_interrupts(fd); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 168 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 169 | count = 0; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 170 | clock_gettime(CLOCK_MONOTONIC, &start); |
| 171 | do { |
| 172 | for (int loop = 0; loop < 1024; loop++) { |
| 173 | for (int n = 0; n < nengine; n++) { |
| 174 | execbuf.flags &= ~ENGINE_FLAGS; |
| 175 | execbuf.flags |= engines[n]; |
| 176 | gem_execbuf(fd, &execbuf); |
| 177 | } |
| 178 | } |
| 179 | count += nengine * 1024; |
| 180 | clock_gettime(CLOCK_MONOTONIC, &now); |
Chris Wilson | 772393e | 2016-03-14 14:31:36 +0000 | [diff] [blame] | 181 | } while (elapsed(&start, &now) < timeout); /* Hang detection ~120s */ |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 182 | gem_sync(fd, handle); |
| 183 | clock_gettime(CLOCK_MONOTONIC, &now); |
Chris Wilson | 71f4153 | 2016-04-22 16:55:29 +0100 | [diff] [blame] | 184 | igt_assert_eq(intel_detect_and_clear_missed_interrupts(fd), 0); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 185 | |
Chris Wilson | 870c774 | 2016-03-28 15:29:46 +0100 | [diff] [blame] | 186 | time = elapsed(&start, &now) / count; |
Chris Wilson | a0eebbd | 2016-09-08 13:29:31 +0100 | [diff] [blame^] | 187 | igt_info("All (%d engines): %'lu cycles, average %.3fus per cycle [expected ideal %.3fus]\n", |
| 188 | nengine, count, 1e6*time, 1e6*max/nengine); |
Chris Wilson | 41a26b5 | 2016-03-28 16:26:01 +0100 | [diff] [blame] | 189 | |
Chris Wilson | a0eebbd | 2016-09-08 13:29:31 +0100 | [diff] [blame^] | 190 | /* The rate limiting step should be how fast the slowest engine can |
| 191 | * execute its queue of requests, as when we wait upon a full ring all |
| 192 | * dispatch is frozen. So in general we cannot go faster than the |
| 193 | * slowest engine (but as all engines are in lockstep, they should all |
| 194 | * be executing in parallel and so the average should be max/nengines), |
| 195 | * but we should equally not go any slower. |
| 196 | * |
| 197 | * However, that depends upon being able to submit fast enough, and |
| 198 | * that in turns depends upon debugging turned off and no bottlenecks |
| 199 | * within the driver. We cannot assert that we hit ideal conditions |
| 200 | * across all engines, so we only look for an outrageous error |
| 201 | * condition. |
Chris Wilson | 41a26b5 | 2016-03-28 16:26:01 +0100 | [diff] [blame] | 202 | */ |
Chris Wilson | a0eebbd | 2016-09-08 13:29:31 +0100 | [diff] [blame^] | 203 | igt_assert_f(time < 2*sum, |
| 204 | "Average time (%.3fus) exceeds expectation for parallel execution (min %.3fus, max %.3fus; limit set at %.3fus)\n", |
| 205 | 1e6*time, 1e6*min, 1e6*max, 1e6*sum*2); |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 206 | } |
Daniel Vetter | 8f5387e | 2013-08-13 13:20:58 +0200 | [diff] [blame] | 207 | |
/*
 * Log which submission mode the driver's module parameters report.
 *
 * The parameters are probed in order: "enable_guc_submission", then
 * "enable_execlists", and finally "semaphores" for the legacy path. The
 * first one that reads as true decides the message. Nothing is logged if
 * the parameters directory cannot be opened.
 */
static void print_welcome(int fd)
{
	bool active;
	int dir;

	dir = igt_sysfs_open_parameters(fd);
	if (dir < 0)
		return;

	active = igt_sysfs_get_boolean(dir, "enable_guc_submission");
	if (active) {
		igt_info("Using GuC submission\n");
		goto out;
	}

	active = igt_sysfs_get_boolean(dir, "enable_execlists");
	if (active) {
		igt_info("Using Execlists submission\n");
		goto out;
	}

	active = igt_sysfs_get_boolean(dir, "semaphores");
	/* No space before %s: the suffix starts with its own ", ". */
	igt_info("Using Legacy submission%s\n",
		 active ? ", with semaphores" : "");

out:
	close(dir);
}
| 236 | |
Daniel Vetter | 071e9ca | 2013-10-31 16:23:26 +0100 | [diff] [blame] | 237 | igt_main |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 238 | { |
Chris Wilson | 7e0853c | 2016-01-27 14:17:53 +0000 | [diff] [blame] | 239 | const struct intel_execution_engine *e; |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 240 | uint32_t handle = 0; |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 241 | int device = -1; |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 242 | |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 243 | igt_fixture { |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 244 | const uint32_t bbe = MI_BATCH_BUFFER_END; |
| 245 | |
Micah Fedke | c81d293 | 2015-07-22 21:54:02 +0000 | [diff] [blame] | 246 | device = drm_open_driver(DRIVER_INTEL); |
Chris Wilson | c6e26e4 | 2016-07-22 12:58:54 +0100 | [diff] [blame] | 247 | print_welcome(device); |
| 248 | |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 249 | handle = gem_create(device, 4096); |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 250 | gem_write(device, handle, 0, &bbe, sizeof(bbe)); |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 251 | |
Daniel Vetter | be21fc0 | 2016-06-17 16:04:09 +0200 | [diff] [blame] | 252 | igt_fork_hang_detector(device); |
| 253 | } |
Chris Wilson | 9d61a68 | 2016-03-25 18:22:54 +0000 | [diff] [blame] | 254 | |
Chris Wilson | 772393e | 2016-03-14 14:31:36 +0000 | [diff] [blame] | 255 | igt_subtest("basic") |
| 256 | all(device, handle, 10); |
| 257 | |
Chris Wilson | 7e0853c | 2016-01-27 14:17:53 +0000 | [diff] [blame] | 258 | for (e = intel_execution_engines; e->name; e++) |
| 259 | igt_subtest_f("%s", e->name) |
Chris Wilson | 3a7325e | 2016-03-08 11:43:31 +0000 | [diff] [blame] | 260 | single(device, handle, e->exec_id | e->flags, e->name); |
| 261 | |
Chris Wilson | 772393e | 2016-03-14 14:31:36 +0000 | [diff] [blame] | 262 | igt_subtest("all") |
| 263 | all(device, handle, 150); |
Daniel Vetter | d9d9578 | 2012-12-04 17:13:05 +0100 | [diff] [blame] | 264 | |
Daniel Vetter | b3880d3 | 2013-08-14 18:02:46 +0200 | [diff] [blame] | 265 | igt_fixture { |
Daniel Vetter | be21fc0 | 2016-06-17 16:04:09 +0200 | [diff] [blame] | 266 | igt_stop_hang_detector(); |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 267 | gem_close(device, handle); |
Chris Wilson | 2659cbb | 2015-03-26 12:09:57 +0000 | [diff] [blame] | 268 | close(device); |
Daniel Vetter | b3880d3 | 2013-08-14 18:02:46 +0200 | [diff] [blame] | 269 | } |
Chris Wilson | 07d59b3 | 2011-01-20 22:10:10 +0000 | [diff] [blame] | 270 | } |