intel_breadcrumbs.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470
  1. /*
  2. * Copyright © 2016 Intel Corporation
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice (including the next
  12. * paragraph) shall be included in all copies or substantial portions of the
  13. * Software.
  14. *
  15. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  18. * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  21. * IN THE SOFTWARE.
  22. *
  23. */
  24. #include "../i915_selftest.h"
  25. #include "i915_random.h"
  26. #include "mock_gem_device.h"
  27. #include "mock_engine.h"
  28. static int check_rbtree(struct intel_engine_cs *engine,
  29. const unsigned long *bitmap,
  30. const struct intel_wait *waiters,
  31. const int count)
  32. {
  33. struct intel_breadcrumbs *b = &engine->breadcrumbs;
  34. struct rb_node *rb;
  35. int n;
  36. if (&b->irq_wait->node != rb_first(&b->waiters)) {
  37. pr_err("First waiter does not match first element of wait-tree\n");
  38. return -EINVAL;
  39. }
  40. n = find_first_bit(bitmap, count);
  41. for (rb = rb_first(&b->waiters); rb; rb = rb_next(rb)) {
  42. struct intel_wait *w = container_of(rb, typeof(*w), node);
  43. int idx = w - waiters;
  44. if (!test_bit(idx, bitmap)) {
  45. pr_err("waiter[%d, seqno=%d] removed but still in wait-tree\n",
  46. idx, w->seqno);
  47. return -EINVAL;
  48. }
  49. if (n != idx) {
  50. pr_err("waiter[%d, seqno=%d] does not match expected next element in tree [%d]\n",
  51. idx, w->seqno, n);
  52. return -EINVAL;
  53. }
  54. n = find_next_bit(bitmap, count, n + 1);
  55. }
  56. return 0;
  57. }
  58. static int check_completion(struct intel_engine_cs *engine,
  59. const unsigned long *bitmap,
  60. const struct intel_wait *waiters,
  61. const int count)
  62. {
  63. int n;
  64. for (n = 0; n < count; n++) {
  65. if (intel_wait_complete(&waiters[n]) != !!test_bit(n, bitmap))
  66. continue;
  67. pr_err("waiter[%d, seqno=%d] is %s, but expected %s\n",
  68. n, waiters[n].seqno,
  69. intel_wait_complete(&waiters[n]) ? "complete" : "active",
  70. test_bit(n, bitmap) ? "active" : "complete");
  71. return -EINVAL;
  72. }
  73. return 0;
  74. }
  75. static int check_rbtree_empty(struct intel_engine_cs *engine)
  76. {
  77. struct intel_breadcrumbs *b = &engine->breadcrumbs;
  78. if (b->irq_wait) {
  79. pr_err("Empty breadcrumbs still has a waiter\n");
  80. return -EINVAL;
  81. }
  82. if (!RB_EMPTY_ROOT(&b->waiters)) {
  83. pr_err("Empty breadcrumbs, but wait-tree not empty\n");
  84. return -EINVAL;
  85. }
  86. return 0;
  87. }
  88. static int igt_random_insert_remove(void *arg)
  89. {
  90. const u32 seqno_bias = 0x1000;
  91. I915_RND_STATE(prng);
  92. struct intel_engine_cs *engine = arg;
  93. struct intel_wait *waiters;
  94. const int count = 4096;
  95. unsigned int *order;
  96. unsigned long *bitmap;
  97. int err = -ENOMEM;
  98. int n;
  99. mock_engine_reset(engine);
  100. waiters = kvmalloc_array(count, sizeof(*waiters), GFP_KERNEL);
  101. if (!waiters)
  102. goto out_engines;
  103. bitmap = kcalloc(DIV_ROUND_UP(count, BITS_PER_LONG), sizeof(*bitmap),
  104. GFP_KERNEL);
  105. if (!bitmap)
  106. goto out_waiters;
  107. order = i915_random_order(count, &prng);
  108. if (!order)
  109. goto out_bitmap;
  110. for (n = 0; n < count; n++)
  111. intel_wait_init_for_seqno(&waiters[n], seqno_bias + n);
  112. err = check_rbtree(engine, bitmap, waiters, count);
  113. if (err)
  114. goto out_order;
  115. /* Add and remove waiters into the rbtree in random order. At each
  116. * step, we verify that the rbtree is correctly ordered.
  117. */
  118. for (n = 0; n < count; n++) {
  119. int i = order[n];
  120. intel_engine_add_wait(engine, &waiters[i]);
  121. __set_bit(i, bitmap);
  122. err = check_rbtree(engine, bitmap, waiters, count);
  123. if (err)
  124. goto out_order;
  125. }
  126. i915_random_reorder(order, count, &prng);
  127. for (n = 0; n < count; n++) {
  128. int i = order[n];
  129. intel_engine_remove_wait(engine, &waiters[i]);
  130. __clear_bit(i, bitmap);
  131. err = check_rbtree(engine, bitmap, waiters, count);
  132. if (err)
  133. goto out_order;
  134. }
  135. err = check_rbtree_empty(engine);
  136. out_order:
  137. kfree(order);
  138. out_bitmap:
  139. kfree(bitmap);
  140. out_waiters:
  141. kvfree(waiters);
  142. out_engines:
  143. mock_engine_flush(engine);
  144. return err;
  145. }
  146. static int igt_insert_complete(void *arg)
  147. {
  148. const u32 seqno_bias = 0x1000;
  149. struct intel_engine_cs *engine = arg;
  150. struct intel_wait *waiters;
  151. const int count = 4096;
  152. unsigned long *bitmap;
  153. int err = -ENOMEM;
  154. int n, m;
  155. mock_engine_reset(engine);
  156. waiters = kvmalloc_array(count, sizeof(*waiters), GFP_KERNEL);
  157. if (!waiters)
  158. goto out_engines;
  159. bitmap = kcalloc(DIV_ROUND_UP(count, BITS_PER_LONG), sizeof(*bitmap),
  160. GFP_KERNEL);
  161. if (!bitmap)
  162. goto out_waiters;
  163. for (n = 0; n < count; n++) {
  164. intel_wait_init_for_seqno(&waiters[n], n + seqno_bias);
  165. intel_engine_add_wait(engine, &waiters[n]);
  166. __set_bit(n, bitmap);
  167. }
  168. err = check_rbtree(engine, bitmap, waiters, count);
  169. if (err)
  170. goto out_bitmap;
  171. /* On each step, we advance the seqno so that several waiters are then
  172. * complete (we increase the seqno by increasingly larger values to
  173. * retire more and more waiters at once). All retired waiters should
  174. * be woken and removed from the rbtree, and so that we check.
  175. */
  176. for (n = 0; n < count; n = m) {
  177. int seqno = 2 * n;
  178. GEM_BUG_ON(find_first_bit(bitmap, count) != n);
  179. if (intel_wait_complete(&waiters[n])) {
  180. pr_err("waiter[%d, seqno=%d] completed too early\n",
  181. n, waiters[n].seqno);
  182. err = -EINVAL;
  183. goto out_bitmap;
  184. }
  185. /* complete the following waiters */
  186. mock_seqno_advance(engine, seqno + seqno_bias);
  187. for (m = n; m <= seqno; m++) {
  188. if (m == count)
  189. break;
  190. GEM_BUG_ON(!test_bit(m, bitmap));
  191. __clear_bit(m, bitmap);
  192. }
  193. intel_engine_remove_wait(engine, &waiters[n]);
  194. RB_CLEAR_NODE(&waiters[n].node);
  195. err = check_rbtree(engine, bitmap, waiters, count);
  196. if (err) {
  197. pr_err("rbtree corrupt after seqno advance to %d\n",
  198. seqno + seqno_bias);
  199. goto out_bitmap;
  200. }
  201. err = check_completion(engine, bitmap, waiters, count);
  202. if (err) {
  203. pr_err("completions after seqno advance to %d failed\n",
  204. seqno + seqno_bias);
  205. goto out_bitmap;
  206. }
  207. }
  208. err = check_rbtree_empty(engine);
  209. out_bitmap:
  210. kfree(bitmap);
  211. out_waiters:
  212. kvfree(waiters);
  213. out_engines:
  214. mock_engine_flush(engine);
  215. return err;
  216. }
  217. struct igt_wakeup {
  218. struct task_struct *tsk;
  219. atomic_t *ready, *set, *done;
  220. struct intel_engine_cs *engine;
  221. unsigned long flags;
  222. #define STOP 0
  223. #define IDLE 1
  224. wait_queue_head_t *wq;
  225. u32 seqno;
  226. };
  227. static bool wait_for_ready(struct igt_wakeup *w)
  228. {
  229. DEFINE_WAIT(ready);
  230. set_bit(IDLE, &w->flags);
  231. if (atomic_dec_and_test(w->done))
  232. wake_up_var(w->done);
  233. if (test_bit(STOP, &w->flags))
  234. goto out;
  235. for (;;) {
  236. prepare_to_wait(w->wq, &ready, TASK_INTERRUPTIBLE);
  237. if (atomic_read(w->ready) == 0)
  238. break;
  239. schedule();
  240. }
  241. finish_wait(w->wq, &ready);
  242. out:
  243. clear_bit(IDLE, &w->flags);
  244. if (atomic_dec_and_test(w->set))
  245. wake_up_var(w->set);
  246. return !test_bit(STOP, &w->flags);
  247. }
  248. static int igt_wakeup_thread(void *arg)
  249. {
  250. struct igt_wakeup *w = arg;
  251. struct intel_wait wait;
  252. while (wait_for_ready(w)) {
  253. GEM_BUG_ON(kthread_should_stop());
  254. intel_wait_init_for_seqno(&wait, w->seqno);
  255. intel_engine_add_wait(w->engine, &wait);
  256. for (;;) {
  257. set_current_state(TASK_UNINTERRUPTIBLE);
  258. if (i915_seqno_passed(intel_engine_get_seqno(w->engine),
  259. w->seqno))
  260. break;
  261. if (test_bit(STOP, &w->flags)) /* emergency escape */
  262. break;
  263. schedule();
  264. }
  265. intel_engine_remove_wait(w->engine, &wait);
  266. __set_current_state(TASK_RUNNING);
  267. }
  268. return 0;
  269. }
  270. static void igt_wake_all_sync(atomic_t *ready,
  271. atomic_t *set,
  272. atomic_t *done,
  273. wait_queue_head_t *wq,
  274. int count)
  275. {
  276. atomic_set(set, count);
  277. atomic_set(ready, 0);
  278. wake_up_all(wq);
  279. wait_var_event(set, !atomic_read(set));
  280. atomic_set(ready, count);
  281. atomic_set(done, count);
  282. }
  283. static int igt_wakeup(void *arg)
  284. {
  285. I915_RND_STATE(prng);
  286. struct intel_engine_cs *engine = arg;
  287. struct igt_wakeup *waiters;
  288. DECLARE_WAIT_QUEUE_HEAD_ONSTACK(wq);
  289. const int count = 4096;
  290. const u32 max_seqno = count / 4;
  291. atomic_t ready, set, done;
  292. int err = -ENOMEM;
  293. int n, step;
  294. mock_engine_reset(engine);
  295. waiters = kvmalloc_array(count, sizeof(*waiters), GFP_KERNEL);
  296. if (!waiters)
  297. goto out_engines;
  298. /* Create a large number of threads, each waiting on a random seqno.
  299. * Multiple waiters will be waiting for the same seqno.
  300. */
  301. atomic_set(&ready, count);
  302. for (n = 0; n < count; n++) {
  303. waiters[n].wq = &wq;
  304. waiters[n].ready = &ready;
  305. waiters[n].set = &set;
  306. waiters[n].done = &done;
  307. waiters[n].engine = engine;
  308. waiters[n].flags = BIT(IDLE);
  309. waiters[n].tsk = kthread_run(igt_wakeup_thread, &waiters[n],
  310. "i915/igt:%d", n);
  311. if (IS_ERR(waiters[n].tsk))
  312. goto out_waiters;
  313. get_task_struct(waiters[n].tsk);
  314. }
  315. for (step = 1; step <= max_seqno; step <<= 1) {
  316. u32 seqno;
  317. /* The waiter threads start paused as we assign them a random
  318. * seqno and reset the engine. Once the engine is reset,
  319. * we signal that the threads may begin their wait upon their
  320. * seqno.
  321. */
  322. for (n = 0; n < count; n++) {
  323. GEM_BUG_ON(!test_bit(IDLE, &waiters[n].flags));
  324. waiters[n].seqno =
  325. 1 + prandom_u32_state(&prng) % max_seqno;
  326. }
  327. mock_seqno_advance(engine, 0);
  328. igt_wake_all_sync(&ready, &set, &done, &wq, count);
  329. /* Simulate the GPU doing chunks of work, with one or more
  330. * seqno appearing to finish at the same time. A random number
  331. * of threads will be waiting upon the update and hopefully be
  332. * woken.
  333. */
  334. for (seqno = 1; seqno <= max_seqno + step; seqno += step) {
  335. usleep_range(50, 500);
  336. mock_seqno_advance(engine, seqno);
  337. }
  338. GEM_BUG_ON(intel_engine_get_seqno(engine) < 1 + max_seqno);
  339. /* With the seqno now beyond any of the waiting threads, they
  340. * should all be woken, see that they are complete and signal
  341. * that they are ready for the next test. We wait until all
  342. * threads are complete and waiting for us (i.e. not a seqno).
  343. */
  344. if (!wait_var_event_timeout(&done,
  345. !atomic_read(&done), 10 * HZ)) {
  346. pr_err("Timed out waiting for %d remaining waiters\n",
  347. atomic_read(&done));
  348. err = -ETIMEDOUT;
  349. break;
  350. }
  351. err = check_rbtree_empty(engine);
  352. if (err)
  353. break;
  354. }
  355. out_waiters:
  356. for (n = 0; n < count; n++) {
  357. if (IS_ERR(waiters[n].tsk))
  358. break;
  359. set_bit(STOP, &waiters[n].flags);
  360. }
  361. mock_seqno_advance(engine, INT_MAX); /* wakeup any broken waiters */
  362. igt_wake_all_sync(&ready, &set, &done, &wq, n);
  363. for (n = 0; n < count; n++) {
  364. if (IS_ERR(waiters[n].tsk))
  365. break;
  366. kthread_stop(waiters[n].tsk);
  367. put_task_struct(waiters[n].tsk);
  368. }
  369. kvfree(waiters);
  370. out_engines:
  371. mock_engine_flush(engine);
  372. return err;
  373. }
  374. int intel_breadcrumbs_mock_selftests(void)
  375. {
  376. static const struct i915_subtest tests[] = {
  377. SUBTEST(igt_random_insert_remove),
  378. SUBTEST(igt_insert_complete),
  379. SUBTEST(igt_wakeup),
  380. };
  381. struct drm_i915_private *i915;
  382. int err;
  383. i915 = mock_gem_device();
  384. if (!i915)
  385. return -ENOMEM;
  386. err = i915_subtests(tests, i915->engine[RCS]);
  387. drm_dev_unref(&i915->drm);
  388. return err;
  389. }