blob: d1b99b5655008e67e14c691f2fb6625416ff61f2 [file] [log] [blame]
/*
 * Copyright © 2016 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 *
 */
24
25#include "../i915_selftest.h"
26#include "i915_random.h"
27
28#include "mock_engine.h"
29
30static int check_rbtree(struct intel_engine_cs *engine,
31 const unsigned long *bitmap,
32 const struct intel_wait *waiters,
33 const int count)
34{
35 struct intel_breadcrumbs *b = &engine->breadcrumbs;
36 struct rb_node *rb;
37 int n;
38
39 if (&b->first_wait->node != rb_first(&b->waiters)) {
40 pr_err("First waiter does not match first element of wait-tree\n");
41 return -EINVAL;
42 }
43
44 n = find_first_bit(bitmap, count);
45 for (rb = rb_first(&b->waiters); rb; rb = rb_next(rb)) {
46 struct intel_wait *w = container_of(rb, typeof(*w), node);
47 int idx = w - waiters;
48
49 if (!test_bit(idx, bitmap)) {
50 pr_err("waiter[%d, seqno=%d] removed but still in wait-tree\n",
51 idx, w->seqno);
52 return -EINVAL;
53 }
54
55 if (n != idx) {
56 pr_err("waiter[%d, seqno=%d] does not match expected next element in tree [%d]\n",
57 idx, w->seqno, n);
58 return -EINVAL;
59 }
60
61 n = find_next_bit(bitmap, count, n + 1);
62 }
63
64 return 0;
65}
66
Chris Wilsonae1f8092017-02-13 17:15:15 +000067static int check_completion(struct intel_engine_cs *engine,
68 const unsigned long *bitmap,
69 const struct intel_wait *waiters,
70 const int count)
71{
72 int n;
73
74 for (n = 0; n < count; n++) {
75 if (intel_wait_complete(&waiters[n]) != !!test_bit(n, bitmap))
76 continue;
77
78 pr_err("waiter[%d, seqno=%d] is %s, but expected %s\n",
79 n, waiters[n].seqno,
80 intel_wait_complete(&waiters[n]) ? "complete" : "active",
81 test_bit(n, bitmap) ? "active" : "complete");
82 return -EINVAL;
83 }
84
85 return 0;
86}
87
Chris Wilsonf97fbf92017-02-13 17:15:14 +000088static int check_rbtree_empty(struct intel_engine_cs *engine)
89{
90 struct intel_breadcrumbs *b = &engine->breadcrumbs;
91
92 if (b->first_wait) {
93 pr_err("Empty breadcrumbs still has a waiter\n");
94 return -EINVAL;
95 }
96
97 if (!RB_EMPTY_ROOT(&b->waiters)) {
98 pr_err("Empty breadcrumbs, but wait-tree not empty\n");
99 return -EINVAL;
100 }
101
102 return 0;
103}
104
105static int igt_random_insert_remove(void *arg)
106{
107 const u32 seqno_bias = 0x1000;
108 I915_RND_STATE(prng);
109 struct intel_engine_cs *engine = arg;
110 struct intel_wait *waiters;
111 const int count = 4096;
112 unsigned int *order;
113 unsigned long *bitmap;
114 int err = -ENOMEM;
115 int n;
116
117 mock_engine_reset(engine);
118
119 waiters = drm_malloc_gfp(count, sizeof(*waiters), GFP_TEMPORARY);
120 if (!waiters)
121 goto out_engines;
122
123 bitmap = kcalloc(DIV_ROUND_UP(count, BITS_PER_LONG), sizeof(*bitmap),
124 GFP_TEMPORARY);
125 if (!bitmap)
126 goto out_waiters;
127
128 order = i915_random_order(count, &prng);
129 if (!order)
130 goto out_bitmap;
131
132 for (n = 0; n < count; n++)
133 intel_wait_init(&waiters[n], seqno_bias + n);
134
135 err = check_rbtree(engine, bitmap, waiters, count);
136 if (err)
137 goto out_order;
138
139 /* Add and remove waiters into the rbtree in random order. At each
140 * step, we verify that the rbtree is correctly ordered.
141 */
142 for (n = 0; n < count; n++) {
143 int i = order[n];
144
145 intel_engine_add_wait(engine, &waiters[i]);
146 __set_bit(i, bitmap);
147
148 err = check_rbtree(engine, bitmap, waiters, count);
149 if (err)
150 goto out_order;
151 }
152
153 i915_random_reorder(order, count, &prng);
154 for (n = 0; n < count; n++) {
155 int i = order[n];
156
157 intel_engine_remove_wait(engine, &waiters[i]);
158 __clear_bit(i, bitmap);
159
160 err = check_rbtree(engine, bitmap, waiters, count);
161 if (err)
162 goto out_order;
163 }
164
165 err = check_rbtree_empty(engine);
166out_order:
167 kfree(order);
168out_bitmap:
169 kfree(bitmap);
170out_waiters:
171 drm_free_large(waiters);
172out_engines:
173 mock_engine_flush(engine);
174 return err;
175}
176
Chris Wilsonae1f8092017-02-13 17:15:15 +0000177static int igt_insert_complete(void *arg)
178{
179 const u32 seqno_bias = 0x1000;
180 struct intel_engine_cs *engine = arg;
181 struct intel_wait *waiters;
182 const int count = 4096;
183 unsigned long *bitmap;
184 int err = -ENOMEM;
185 int n, m;
186
187 mock_engine_reset(engine);
188
189 waiters = drm_malloc_gfp(count, sizeof(*waiters), GFP_TEMPORARY);
190 if (!waiters)
191 goto out_engines;
192
193 bitmap = kcalloc(DIV_ROUND_UP(count, BITS_PER_LONG), sizeof(*bitmap),
194 GFP_TEMPORARY);
195 if (!bitmap)
196 goto out_waiters;
197
198 for (n = 0; n < count; n++) {
199 intel_wait_init(&waiters[n], n + seqno_bias);
200 intel_engine_add_wait(engine, &waiters[n]);
201 __set_bit(n, bitmap);
202 }
203 err = check_rbtree(engine, bitmap, waiters, count);
204 if (err)
205 goto out_bitmap;
206
207 /* On each step, we advance the seqno so that several waiters are then
208 * complete (we increase the seqno by increasingly larger values to
209 * retire more and more waiters at once). All retired waiters should
210 * be woken and removed from the rbtree, and so that we check.
211 */
212 for (n = 0; n < count; n = m) {
213 int seqno = 2 * n;
214
215 GEM_BUG_ON(find_first_bit(bitmap, count) != n);
216
217 if (intel_wait_complete(&waiters[n])) {
218 pr_err("waiter[%d, seqno=%d] completed too early\n",
219 n, waiters[n].seqno);
220 err = -EINVAL;
221 goto out_bitmap;
222 }
223
224 /* complete the following waiters */
225 mock_seqno_advance(engine, seqno + seqno_bias);
226 for (m = n; m <= seqno; m++) {
227 if (m == count)
228 break;
229
230 GEM_BUG_ON(!test_bit(m, bitmap));
231 __clear_bit(m, bitmap);
232 }
233
234 intel_engine_remove_wait(engine, &waiters[n]);
235 RB_CLEAR_NODE(&waiters[n].node);
236
237 err = check_rbtree(engine, bitmap, waiters, count);
238 if (err) {
239 pr_err("rbtree corrupt after seqno advance to %d\n",
240 seqno + seqno_bias);
241 goto out_bitmap;
242 }
243
244 err = check_completion(engine, bitmap, waiters, count);
245 if (err) {
246 pr_err("completions after seqno advance to %d failed\n",
247 seqno + seqno_bias);
248 goto out_bitmap;
249 }
250 }
251
252 err = check_rbtree_empty(engine);
253out_bitmap:
254 kfree(bitmap);
255out_waiters:
256 drm_free_large(waiters);
257out_engines:
258 mock_engine_flush(engine);
259 return err;
260}
261
Chris Wilsone62e8ad2017-02-13 17:15:16 +0000262struct igt_wakeup {
263 struct task_struct *tsk;
264 atomic_t *ready, *set, *done;
265 struct intel_engine_cs *engine;
266 unsigned long flags;
267#define STOP 0
268#define IDLE 1
269 wait_queue_head_t *wq;
270 u32 seqno;
271};
272
273static int wait_atomic(atomic_t *p)
274{
275 schedule();
276 return 0;
277}
278
279static int wait_atomic_timeout(atomic_t *p)
280{
281 return schedule_timeout(10 * HZ) ? 0 : -ETIMEDOUT;
282}
283
284static bool wait_for_ready(struct igt_wakeup *w)
285{
286 DEFINE_WAIT(ready);
287
288 set_bit(IDLE, &w->flags);
289 if (atomic_dec_and_test(w->done))
290 wake_up_atomic_t(w->done);
291
292 if (test_bit(STOP, &w->flags))
293 goto out;
294
295 for (;;) {
296 prepare_to_wait(w->wq, &ready, TASK_INTERRUPTIBLE);
297 if (atomic_read(w->ready) == 0)
298 break;
299
300 schedule();
301 }
302 finish_wait(w->wq, &ready);
303
304out:
305 clear_bit(IDLE, &w->flags);
306 if (atomic_dec_and_test(w->set))
307 wake_up_atomic_t(w->set);
308
309 return !test_bit(STOP, &w->flags);
310}
311
312static int igt_wakeup_thread(void *arg)
313{
314 struct igt_wakeup *w = arg;
315 struct intel_wait wait;
316
317 while (wait_for_ready(w)) {
318 GEM_BUG_ON(kthread_should_stop());
319
320 intel_wait_init(&wait, w->seqno);
321 intel_engine_add_wait(w->engine, &wait);
322 for (;;) {
323 set_current_state(TASK_UNINTERRUPTIBLE);
324 if (i915_seqno_passed(intel_engine_get_seqno(w->engine),
325 w->seqno))
326 break;
327
328 if (test_bit(STOP, &w->flags)) /* emergency escape */
329 break;
330
331 schedule();
332 }
333 intel_engine_remove_wait(w->engine, &wait);
334 __set_current_state(TASK_RUNNING);
335 }
336
337 return 0;
338}
339
340static void igt_wake_all_sync(atomic_t *ready,
341 atomic_t *set,
342 atomic_t *done,
343 wait_queue_head_t *wq,
344 int count)
345{
346 atomic_set(set, count);
347 atomic_set(ready, 0);
348 wake_up_all(wq);
349
350 wait_on_atomic_t(set, wait_atomic, TASK_UNINTERRUPTIBLE);
351 atomic_set(ready, count);
352 atomic_set(done, count);
353}
354
355static int igt_wakeup(void *arg)
356{
357 I915_RND_STATE(prng);
358 const int state = TASK_UNINTERRUPTIBLE;
359 struct intel_engine_cs *engine = arg;
360 struct igt_wakeup *waiters;
361 DECLARE_WAIT_QUEUE_HEAD_ONSTACK(wq);
362 const int count = 4096;
363 const u32 max_seqno = count / 4;
364 atomic_t ready, set, done;
365 int err = -ENOMEM;
366 int n, step;
367
368 mock_engine_reset(engine);
369
370 waiters = drm_malloc_gfp(count, sizeof(*waiters), GFP_TEMPORARY);
371 if (!waiters)
372 goto out_engines;
373
374 /* Create a large number of threads, each waiting on a random seqno.
375 * Multiple waiters will be waiting for the same seqno.
376 */
377 atomic_set(&ready, count);
378 for (n = 0; n < count; n++) {
379 waiters[n].wq = &wq;
380 waiters[n].ready = &ready;
381 waiters[n].set = &set;
382 waiters[n].done = &done;
383 waiters[n].engine = engine;
384 waiters[n].flags = BIT(IDLE);
385
386 waiters[n].tsk = kthread_run(igt_wakeup_thread, &waiters[n],
387 "i915/igt:%d", n);
388 if (IS_ERR(waiters[n].tsk))
389 goto out_waiters;
390
391 get_task_struct(waiters[n].tsk);
392 }
393
394 for (step = 1; step <= max_seqno; step <<= 1) {
395 u32 seqno;
396
397 /* The waiter threads start paused as we assign them a random
398 * seqno and reset the engine. Once the engine is reset,
399 * we signal that the threads may begin their wait upon their
400 * seqno.
401 */
402 for (n = 0; n < count; n++) {
403 GEM_BUG_ON(!test_bit(IDLE, &waiters[n].flags));
404 waiters[n].seqno =
405 1 + prandom_u32_state(&prng) % max_seqno;
406 }
407 mock_seqno_advance(engine, 0);
408 igt_wake_all_sync(&ready, &set, &done, &wq, count);
409
410 /* Simulate the GPU doing chunks of work, with one or more
411 * seqno appearing to finish at the same time. A random number
412 * of threads will be waiting upon the update and hopefully be
413 * woken.
414 */
415 for (seqno = 1; seqno <= max_seqno + step; seqno += step) {
416 usleep_range(50, 500);
417 mock_seqno_advance(engine, seqno);
418 }
419 GEM_BUG_ON(intel_engine_get_seqno(engine) < 1 + max_seqno);
420
421 /* With the seqno now beyond any of the waiting threads, they
422 * should all be woken, see that they are complete and signal
423 * that they are ready for the next test. We wait until all
424 * threads are complete and waiting for us (i.e. not a seqno).
425 */
426 err = wait_on_atomic_t(&done, wait_atomic_timeout, state);
427 if (err) {
428 pr_err("Timed out waiting for %d remaining waiters\n",
429 atomic_read(&done));
430 break;
431 }
432
433 err = check_rbtree_empty(engine);
434 if (err)
435 break;
436 }
437
438out_waiters:
439 for (n = 0; n < count; n++) {
440 if (IS_ERR(waiters[n].tsk))
441 break;
442
443 set_bit(STOP, &waiters[n].flags);
444 }
445 mock_seqno_advance(engine, INT_MAX); /* wakeup any broken waiters */
446 igt_wake_all_sync(&ready, &set, &done, &wq, n);
447
448 for (n = 0; n < count; n++) {
449 if (IS_ERR(waiters[n].tsk))
450 break;
451
452 kthread_stop(waiters[n].tsk);
453 put_task_struct(waiters[n].tsk);
454 }
455
456 drm_free_large(waiters);
457out_engines:
458 mock_engine_flush(engine);
459 return err;
460}
461
Chris Wilsonf97fbf92017-02-13 17:15:14 +0000462int intel_breadcrumbs_mock_selftests(void)
463{
464 static const struct i915_subtest tests[] = {
465 SUBTEST(igt_random_insert_remove),
Chris Wilsonae1f8092017-02-13 17:15:15 +0000466 SUBTEST(igt_insert_complete),
Chris Wilsone62e8ad2017-02-13 17:15:16 +0000467 SUBTEST(igt_wakeup),
Chris Wilsonf97fbf92017-02-13 17:15:14 +0000468 };
469 struct intel_engine_cs *engine;
470 int err;
471
472 engine = mock_engine("mock");
473 if (!engine)
474 return -ENOMEM;
475
476 err = i915_subtests(tests, engine);
477 kfree(engine);
478
479 return err;
480}