intel_breadcrumbs.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481
  1. /*
  2. * Copyright © 2016 Intel Corporation
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice (including the next
  12. * paragraph) shall be included in all copies or substantial portions of the
  13. * Software.
  14. *
  15. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  18. * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  21. * IN THE SOFTWARE.
  22. *
  23. */
  24. #include "../i915_selftest.h"
  25. #include "i915_random.h"
  26. #include "mock_gem_device.h"
  27. #include "mock_engine.h"
  28. static int check_rbtree(struct intel_engine_cs *engine,
  29. const unsigned long *bitmap,
  30. const struct intel_wait *waiters,
  31. const int count)
  32. {
  33. struct intel_breadcrumbs *b = &engine->breadcrumbs;
  34. struct rb_node *rb;
  35. int n;
  36. if (&b->irq_wait->node != rb_first(&b->waiters)) {
  37. pr_err("First waiter does not match first element of wait-tree\n");
  38. return -EINVAL;
  39. }
  40. n = find_first_bit(bitmap, count);
  41. for (rb = rb_first(&b->waiters); rb; rb = rb_next(rb)) {
  42. struct intel_wait *w = container_of(rb, typeof(*w), node);
  43. int idx = w - waiters;
  44. if (!test_bit(idx, bitmap)) {
  45. pr_err("waiter[%d, seqno=%d] removed but still in wait-tree\n",
  46. idx, w->seqno);
  47. return -EINVAL;
  48. }
  49. if (n != idx) {
  50. pr_err("waiter[%d, seqno=%d] does not match expected next element in tree [%d]\n",
  51. idx, w->seqno, n);
  52. return -EINVAL;
  53. }
  54. n = find_next_bit(bitmap, count, n + 1);
  55. }
  56. return 0;
  57. }
  58. static int check_completion(struct intel_engine_cs *engine,
  59. const unsigned long *bitmap,
  60. const struct intel_wait *waiters,
  61. const int count)
  62. {
  63. int n;
  64. for (n = 0; n < count; n++) {
  65. if (intel_wait_complete(&waiters[n]) != !!test_bit(n, bitmap))
  66. continue;
  67. pr_err("waiter[%d, seqno=%d] is %s, but expected %s\n",
  68. n, waiters[n].seqno,
  69. intel_wait_complete(&waiters[n]) ? "complete" : "active",
  70. test_bit(n, bitmap) ? "active" : "complete");
  71. return -EINVAL;
  72. }
  73. return 0;
  74. }
  75. static int check_rbtree_empty(struct intel_engine_cs *engine)
  76. {
  77. struct intel_breadcrumbs *b = &engine->breadcrumbs;
  78. if (b->irq_wait) {
  79. pr_err("Empty breadcrumbs still has a waiter\n");
  80. return -EINVAL;
  81. }
  82. if (!RB_EMPTY_ROOT(&b->waiters)) {
  83. pr_err("Empty breadcrumbs, but wait-tree not empty\n");
  84. return -EINVAL;
  85. }
  86. return 0;
  87. }
  88. static int igt_random_insert_remove(void *arg)
  89. {
  90. const u32 seqno_bias = 0x1000;
  91. I915_RND_STATE(prng);
  92. struct intel_engine_cs *engine = arg;
  93. struct intel_wait *waiters;
  94. const int count = 4096;
  95. unsigned int *order;
  96. unsigned long *bitmap;
  97. int err = -ENOMEM;
  98. int n;
  99. mock_engine_reset(engine);
  100. waiters = drm_malloc_gfp(count, sizeof(*waiters), GFP_TEMPORARY);
  101. if (!waiters)
  102. goto out_engines;
  103. bitmap = kcalloc(DIV_ROUND_UP(count, BITS_PER_LONG), sizeof(*bitmap),
  104. GFP_TEMPORARY);
  105. if (!bitmap)
  106. goto out_waiters;
  107. order = i915_random_order(count, &prng);
  108. if (!order)
  109. goto out_bitmap;
  110. for (n = 0; n < count; n++)
  111. intel_wait_init_for_seqno(&waiters[n], seqno_bias + n);
  112. err = check_rbtree(engine, bitmap, waiters, count);
  113. if (err)
  114. goto out_order;
  115. /* Add and remove waiters into the rbtree in random order. At each
  116. * step, we verify that the rbtree is correctly ordered.
  117. */
  118. for (n = 0; n < count; n++) {
  119. int i = order[n];
  120. intel_engine_add_wait(engine, &waiters[i]);
  121. __set_bit(i, bitmap);
  122. err = check_rbtree(engine, bitmap, waiters, count);
  123. if (err)
  124. goto out_order;
  125. }
  126. i915_random_reorder(order, count, &prng);
  127. for (n = 0; n < count; n++) {
  128. int i = order[n];
  129. intel_engine_remove_wait(engine, &waiters[i]);
  130. __clear_bit(i, bitmap);
  131. err = check_rbtree(engine, bitmap, waiters, count);
  132. if (err)
  133. goto out_order;
  134. }
  135. err = check_rbtree_empty(engine);
  136. out_order:
  137. kfree(order);
  138. out_bitmap:
  139. kfree(bitmap);
  140. out_waiters:
  141. drm_free_large(waiters);
  142. out_engines:
  143. mock_engine_flush(engine);
  144. return err;
  145. }
  146. static int igt_insert_complete(void *arg)
  147. {
  148. const u32 seqno_bias = 0x1000;
  149. struct intel_engine_cs *engine = arg;
  150. struct intel_wait *waiters;
  151. const int count = 4096;
  152. unsigned long *bitmap;
  153. int err = -ENOMEM;
  154. int n, m;
  155. mock_engine_reset(engine);
  156. waiters = drm_malloc_gfp(count, sizeof(*waiters), GFP_TEMPORARY);
  157. if (!waiters)
  158. goto out_engines;
  159. bitmap = kcalloc(DIV_ROUND_UP(count, BITS_PER_LONG), sizeof(*bitmap),
  160. GFP_TEMPORARY);
  161. if (!bitmap)
  162. goto out_waiters;
  163. for (n = 0; n < count; n++) {
  164. intel_wait_init_for_seqno(&waiters[n], n + seqno_bias);
  165. intel_engine_add_wait(engine, &waiters[n]);
  166. __set_bit(n, bitmap);
  167. }
  168. err = check_rbtree(engine, bitmap, waiters, count);
  169. if (err)
  170. goto out_bitmap;
  171. /* On each step, we advance the seqno so that several waiters are then
  172. * complete (we increase the seqno by increasingly larger values to
  173. * retire more and more waiters at once). All retired waiters should
  174. * be woken and removed from the rbtree, and so that we check.
  175. */
  176. for (n = 0; n < count; n = m) {
  177. int seqno = 2 * n;
  178. GEM_BUG_ON(find_first_bit(bitmap, count) != n);
  179. if (intel_wait_complete(&waiters[n])) {
  180. pr_err("waiter[%d, seqno=%d] completed too early\n",
  181. n, waiters[n].seqno);
  182. err = -EINVAL;
  183. goto out_bitmap;
  184. }
  185. /* complete the following waiters */
  186. mock_seqno_advance(engine, seqno + seqno_bias);
  187. for (m = n; m <= seqno; m++) {
  188. if (m == count)
  189. break;
  190. GEM_BUG_ON(!test_bit(m, bitmap));
  191. __clear_bit(m, bitmap);
  192. }
  193. intel_engine_remove_wait(engine, &waiters[n]);
  194. RB_CLEAR_NODE(&waiters[n].node);
  195. err = check_rbtree(engine, bitmap, waiters, count);
  196. if (err) {
  197. pr_err("rbtree corrupt after seqno advance to %d\n",
  198. seqno + seqno_bias);
  199. goto out_bitmap;
  200. }
  201. err = check_completion(engine, bitmap, waiters, count);
  202. if (err) {
  203. pr_err("completions after seqno advance to %d failed\n",
  204. seqno + seqno_bias);
  205. goto out_bitmap;
  206. }
  207. }
  208. err = check_rbtree_empty(engine);
  209. out_bitmap:
  210. kfree(bitmap);
  211. out_waiters:
  212. drm_free_large(waiters);
  213. out_engines:
  214. mock_engine_flush(engine);
  215. return err;
  216. }
  217. struct igt_wakeup {
  218. struct task_struct *tsk;
  219. atomic_t *ready, *set, *done;
  220. struct intel_engine_cs *engine;
  221. unsigned long flags;
  222. #define STOP 0
  223. #define IDLE 1
  224. wait_queue_head_t *wq;
  225. u32 seqno;
  226. };
  227. static int wait_atomic(atomic_t *p)
  228. {
  229. schedule();
  230. return 0;
  231. }
  232. static int wait_atomic_timeout(atomic_t *p)
  233. {
  234. return schedule_timeout(10 * HZ) ? 0 : -ETIMEDOUT;
  235. }
  236. static bool wait_for_ready(struct igt_wakeup *w)
  237. {
  238. DEFINE_WAIT(ready);
  239. set_bit(IDLE, &w->flags);
  240. if (atomic_dec_and_test(w->done))
  241. wake_up_atomic_t(w->done);
  242. if (test_bit(STOP, &w->flags))
  243. goto out;
  244. for (;;) {
  245. prepare_to_wait(w->wq, &ready, TASK_INTERRUPTIBLE);
  246. if (atomic_read(w->ready) == 0)
  247. break;
  248. schedule();
  249. }
  250. finish_wait(w->wq, &ready);
  251. out:
  252. clear_bit(IDLE, &w->flags);
  253. if (atomic_dec_and_test(w->set))
  254. wake_up_atomic_t(w->set);
  255. return !test_bit(STOP, &w->flags);
  256. }
  257. static int igt_wakeup_thread(void *arg)
  258. {
  259. struct igt_wakeup *w = arg;
  260. struct intel_wait wait;
  261. while (wait_for_ready(w)) {
  262. GEM_BUG_ON(kthread_should_stop());
  263. intel_wait_init_for_seqno(&wait, w->seqno);
  264. intel_engine_add_wait(w->engine, &wait);
  265. for (;;) {
  266. set_current_state(TASK_UNINTERRUPTIBLE);
  267. if (i915_seqno_passed(intel_engine_get_seqno(w->engine),
  268. w->seqno))
  269. break;
  270. if (test_bit(STOP, &w->flags)) /* emergency escape */
  271. break;
  272. schedule();
  273. }
  274. intel_engine_remove_wait(w->engine, &wait);
  275. __set_current_state(TASK_RUNNING);
  276. }
  277. return 0;
  278. }
  279. static void igt_wake_all_sync(atomic_t *ready,
  280. atomic_t *set,
  281. atomic_t *done,
  282. wait_queue_head_t *wq,
  283. int count)
  284. {
  285. atomic_set(set, count);
  286. atomic_set(ready, 0);
  287. wake_up_all(wq);
  288. wait_on_atomic_t(set, wait_atomic, TASK_UNINTERRUPTIBLE);
  289. atomic_set(ready, count);
  290. atomic_set(done, count);
  291. }
  292. static int igt_wakeup(void *arg)
  293. {
  294. I915_RND_STATE(prng);
  295. const int state = TASK_UNINTERRUPTIBLE;
  296. struct intel_engine_cs *engine = arg;
  297. struct igt_wakeup *waiters;
  298. DECLARE_WAIT_QUEUE_HEAD_ONSTACK(wq);
  299. const int count = 4096;
  300. const u32 max_seqno = count / 4;
  301. atomic_t ready, set, done;
  302. int err = -ENOMEM;
  303. int n, step;
  304. mock_engine_reset(engine);
  305. waiters = drm_malloc_gfp(count, sizeof(*waiters), GFP_TEMPORARY);
  306. if (!waiters)
  307. goto out_engines;
  308. /* Create a large number of threads, each waiting on a random seqno.
  309. * Multiple waiters will be waiting for the same seqno.
  310. */
  311. atomic_set(&ready, count);
  312. for (n = 0; n < count; n++) {
  313. waiters[n].wq = &wq;
  314. waiters[n].ready = &ready;
  315. waiters[n].set = &set;
  316. waiters[n].done = &done;
  317. waiters[n].engine = engine;
  318. waiters[n].flags = BIT(IDLE);
  319. waiters[n].tsk = kthread_run(igt_wakeup_thread, &waiters[n],
  320. "i915/igt:%d", n);
  321. if (IS_ERR(waiters[n].tsk))
  322. goto out_waiters;
  323. get_task_struct(waiters[n].tsk);
  324. }
  325. for (step = 1; step <= max_seqno; step <<= 1) {
  326. u32 seqno;
  327. /* The waiter threads start paused as we assign them a random
  328. * seqno and reset the engine. Once the engine is reset,
  329. * we signal that the threads may begin their wait upon their
  330. * seqno.
  331. */
  332. for (n = 0; n < count; n++) {
  333. GEM_BUG_ON(!test_bit(IDLE, &waiters[n].flags));
  334. waiters[n].seqno =
  335. 1 + prandom_u32_state(&prng) % max_seqno;
  336. }
  337. mock_seqno_advance(engine, 0);
  338. igt_wake_all_sync(&ready, &set, &done, &wq, count);
  339. /* Simulate the GPU doing chunks of work, with one or more
  340. * seqno appearing to finish at the same time. A random number
  341. * of threads will be waiting upon the update and hopefully be
  342. * woken.
  343. */
  344. for (seqno = 1; seqno <= max_seqno + step; seqno += step) {
  345. usleep_range(50, 500);
  346. mock_seqno_advance(engine, seqno);
  347. }
  348. GEM_BUG_ON(intel_engine_get_seqno(engine) < 1 + max_seqno);
  349. /* With the seqno now beyond any of the waiting threads, they
  350. * should all be woken, see that they are complete and signal
  351. * that they are ready for the next test. We wait until all
  352. * threads are complete and waiting for us (i.e. not a seqno).
  353. */
  354. err = wait_on_atomic_t(&done, wait_atomic_timeout, state);
  355. if (err) {
  356. pr_err("Timed out waiting for %d remaining waiters\n",
  357. atomic_read(&done));
  358. break;
  359. }
  360. err = check_rbtree_empty(engine);
  361. if (err)
  362. break;
  363. }
  364. out_waiters:
  365. for (n = 0; n < count; n++) {
  366. if (IS_ERR(waiters[n].tsk))
  367. break;
  368. set_bit(STOP, &waiters[n].flags);
  369. }
  370. mock_seqno_advance(engine, INT_MAX); /* wakeup any broken waiters */
  371. igt_wake_all_sync(&ready, &set, &done, &wq, n);
  372. for (n = 0; n < count; n++) {
  373. if (IS_ERR(waiters[n].tsk))
  374. break;
  375. kthread_stop(waiters[n].tsk);
  376. put_task_struct(waiters[n].tsk);
  377. }
  378. drm_free_large(waiters);
  379. out_engines:
  380. mock_engine_flush(engine);
  381. return err;
  382. }
  383. int intel_breadcrumbs_mock_selftests(void)
  384. {
  385. static const struct i915_subtest tests[] = {
  386. SUBTEST(igt_random_insert_remove),
  387. SUBTEST(igt_insert_complete),
  388. SUBTEST(igt_wakeup),
  389. };
  390. struct drm_i915_private *i915;
  391. int err;
  392. i915 = mock_gem_device();
  393. if (!i915)
  394. return -ENOMEM;
  395. err = i915_subtests(tests, i915->engine[RCS]);
  396. drm_dev_unref(&i915->drm);
  397. return err;
  398. }