i915_gem_evict.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437
  1. /*
  2. * Copyright © 2008-2010 Intel Corporation
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice (including the next
  12. * paragraph) shall be included in all copies or substantial portions of the
  13. * Software.
  14. *
  15. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  18. * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  21. * IN THE SOFTWARE.
  22. *
  23. * Authors:
  24. * Eric Anholt <eric@anholt.net>
  25. * Chris Wilson <chris@chris-wilson.co.uk>
  26. *
  27. */
  28. #include <drm/drmP.h>
  29. #include <drm/i915_drm.h>
  30. #include "i915_drv.h"
  31. #include "intel_drv.h"
  32. #include "i915_trace.h"
  /*
   * Control knob for the eviction selftests, declared through
   * I915_SELFTEST_DECLARE (presumably so that it only exists in selftest
   * builds -- confirm against the macro definition).
   *
   * fail_if_busy: when set, i915_gem_evict_something() returns -EBUSY
   * instead of flushing the GGTT when it finds the GPU is not idle.
   */
  33. I915_SELFTEST_DECLARE(static struct igt_evict_ctl {
  34. bool fail_if_busy:1;
  35. } igt_evict_ctl;)
  36. static bool ggtt_is_idle(struct drm_i915_private *i915)
  37. {
  38. struct intel_engine_cs *engine;
  39. enum intel_engine_id id;
  40. if (i915->gt.active_requests)
  41. return false;
  42. for_each_engine(engine, i915, id) {
  43. if (!intel_engine_has_kernel_context(engine))
  44. return false;
  45. }
  46. return true;
  47. }
  48. static int ggtt_flush(struct drm_i915_private *i915)
  49. {
  50. int err;
  51. /* Not everything in the GGTT is tracked via vma (otherwise we
  52. * could evict as required with minimal stalling) so we are forced
  53. * to idle the GPU and explicitly retire outstanding requests in
  54. * the hopes that we can then remove contexts and the like only
  55. * bound by their active reference.
  56. */
  57. err = i915_gem_switch_to_kernel_context(i915);
  58. if (err)
  59. return err;
  60. err = i915_gem_wait_for_idle(i915,
  61. I915_WAIT_INTERRUPTIBLE |
  62. I915_WAIT_LOCKED);
  63. if (err)
  64. return err;
  65. GEM_BUG_ON(!ggtt_is_idle(i915));
  66. return 0;
  67. }
  68. static bool
  69. mark_free(struct drm_mm_scan *scan,
  70. struct i915_vma *vma,
  71. unsigned int flags,
  72. struct list_head *unwind)
  73. {
  74. if (i915_vma_is_pinned(vma))
  75. return false;
  76. if (flags & PIN_NONFAULT && i915_vma_has_userfault(vma))
  77. return false;
  78. list_add(&vma->evict_link, unwind);
  79. return drm_mm_scan_add_block(scan, &vma->node);
  80. }
  81. /**
  82. * i915_gem_evict_something - Evict vmas to make room for binding a new one
  83. * @vm: address space to evict from
  84. * @min_size: size of the desired free space
  85. * @alignment: alignment constraint of the desired free space
  86. * @cache_level: cache_level for the desired space
  87. * @start: start (inclusive) of the range from which to evict objects
  88. * @end: end (exclusive) of the range from which to evict objects
  89. * @flags: additional flags to control the eviction algorithm
  90. *
  91. * This function will try to evict vmas until a free space satisfying the
  92. * requirements is found. Callers must check first whether any such hole exists
  93. * already before calling this function.
  94. *
  95. * This function is used by the object/vma binding code.
  96. *
  97. * Since this function is only used to free up virtual address space it only
  98. * ignores pinned vmas, and not object where the backing storage itself is
  99. * pinned. Hence obj->pages_pin_count does not protect against eviction.
  100. *
  101. * To clarify: This is for freeing up virtual address space, not for freeing
  102. * memory in e.g. the shrinker.
  103. */
  104. int
  105. i915_gem_evict_something(struct i915_address_space *vm,
  106. u64 min_size, u64 alignment,
  107. unsigned cache_level,
  108. u64 start, u64 end,
  109. unsigned flags)
  110. {
  111. struct drm_i915_private *dev_priv = vm->i915;
  112. struct drm_mm_scan scan;
  113. struct list_head eviction_list;
  114. struct list_head *phases[] = {
  115. &vm->inactive_list,
  116. &vm->active_list,
  117. NULL,
  118. }, **phase;
  119. struct i915_vma *vma, *next;
  120. struct drm_mm_node *node;
  121. enum drm_mm_insert_mode mode;
  122. int ret;
  123. lockdep_assert_held(&vm->i915->drm.struct_mutex);
  124. trace_i915_gem_evict(vm, min_size, alignment, flags);
  125. /*
  126. * The goal is to evict objects and amalgamate space in LRU order.
  127. * The oldest idle objects reside on the inactive list, which is in
  128. * retirement order. The next objects to retire are those in flight,
  129. * on the active list, again in retirement order.
  130. *
  131. * The retirement sequence is thus:
  132. * 1. Inactive objects (already retired)
  133. * 2. Active objects (will stall on unbinding)
  134. *
  135. * On each list, the oldest objects lie at the HEAD with the freshest
  136. * object on the TAIL.
  137. */
  138. mode = DRM_MM_INSERT_BEST;
  139. if (flags & PIN_HIGH)
  140. mode = DRM_MM_INSERT_HIGH;
  141. if (flags & PIN_MAPPABLE)
  142. mode = DRM_MM_INSERT_LOW;
  143. drm_mm_scan_init_with_range(&scan, &vm->mm,
  144. min_size, alignment, cache_level,
  145. start, end, mode);
  146. /*
  147. * Retire before we search the active list. Although we have
  148. * reasonable accuracy in our retirement lists, we may have
  149. * a stray pin (preventing eviction) that can only be resolved by
  150. * retiring.
  151. */
  152. if (!(flags & PIN_NONBLOCK))
  153. i915_gem_retire_requests(dev_priv);
  154. else
  155. phases[1] = NULL;
  156. search_again:
  157. INIT_LIST_HEAD(&eviction_list);
  158. phase = phases;
  159. do {
  160. list_for_each_entry(vma, *phase, vm_link)
  161. if (mark_free(&scan, vma, flags, &eviction_list))
  162. goto found;
  163. } while (*++phase);
  164. /* Nothing found, clean up and bail out! */
  165. list_for_each_entry_safe(vma, next, &eviction_list, evict_link) {
  166. ret = drm_mm_scan_remove_block(&scan, &vma->node);
  167. BUG_ON(ret);
  168. }
  169. /*
  170. * Can we unpin some objects such as idle hw contents,
  171. * or pending flips? But since only the GGTT has global entries
  172. * such as scanouts, rinbuffers and contexts, we can skip the
  173. * purge when inspecting per-process local address spaces.
  174. */
  175. if (!i915_is_ggtt(vm) || flags & PIN_NONBLOCK)
  176. return -ENOSPC;
  177. /*
  178. * Not everything in the GGTT is tracked via VMA using
  179. * i915_vma_move_to_active(), otherwise we could evict as required
  180. * with minimal stalling. Instead we are forced to idle the GPU and
  181. * explicitly retire outstanding requests which will then remove
  182. * the pinning for active objects such as contexts and ring,
  183. * enabling us to evict them on the next iteration.
  184. *
  185. * To ensure that all user contexts are evictable, we perform
  186. * a switch to the perma-pinned kernel context. This all also gives
  187. * us a termination condition, when the last retired context is
  188. * the kernel's there is no more we can evict.
  189. */
  190. if (!ggtt_is_idle(dev_priv)) {
  191. if (I915_SELFTEST_ONLY(igt_evict_ctl.fail_if_busy))
  192. return -EBUSY;
  193. ret = ggtt_flush(dev_priv);
  194. if (ret)
  195. return ret;
  196. cond_resched();
  197. goto search_again;
  198. }
  199. /*
  200. * If we still have pending pageflip completions, drop
  201. * back to userspace to give our workqueues time to
  202. * acquire our locks and unpin the old scanouts.
  203. */
  204. return intel_has_pending_fb_unpin(dev_priv) ? -EAGAIN : -ENOSPC;
  205. found:
  206. /* drm_mm doesn't allow any other other operations while
  207. * scanning, therefore store to-be-evicted objects on a
  208. * temporary list and take a reference for all before
  209. * calling unbind (which may remove the active reference
  210. * of any of our objects, thus corrupting the list).
  211. */
  212. list_for_each_entry_safe(vma, next, &eviction_list, evict_link) {
  213. if (drm_mm_scan_remove_block(&scan, &vma->node))
  214. __i915_vma_pin(vma);
  215. else
  216. list_del(&vma->evict_link);
  217. }
  218. /* Unbinding will emit any required flushes */
  219. ret = 0;
  220. list_for_each_entry_safe(vma, next, &eviction_list, evict_link) {
  221. __i915_vma_unpin(vma);
  222. if (ret == 0)
  223. ret = i915_vma_unbind(vma);
  224. }
  225. while (ret == 0 && (node = drm_mm_scan_color_evict(&scan))) {
  226. vma = container_of(node, struct i915_vma, node);
  227. ret = i915_vma_unbind(vma);
  228. }
  229. return ret;
  230. }
  231. /**
  232. * i915_gem_evict_for_vma - Evict vmas to make room for binding a new one
  233. * @vm: address space to evict from
  234. * @target: range (and color) to evict for
  235. * @flags: additional flags to control the eviction algorithm
  236. *
  237. * This function will try to evict vmas that overlap the target node.
  238. *
  239. * To clarify: This is for freeing up virtual address space, not for freeing
  240. * memory in e.g. the shrinker.
  241. */
  242. int i915_gem_evict_for_node(struct i915_address_space *vm,
  243. struct drm_mm_node *target,
  244. unsigned int flags)
  245. {
  246. LIST_HEAD(eviction_list);
  247. struct drm_mm_node *node;
  248. u64 start = target->start;
  249. u64 end = start + target->size;
  250. struct i915_vma *vma, *next;
  251. bool check_color;
  252. int ret = 0;
  253. lockdep_assert_held(&vm->i915->drm.struct_mutex);
  254. GEM_BUG_ON(!IS_ALIGNED(start, I915_GTT_PAGE_SIZE));
  255. GEM_BUG_ON(!IS_ALIGNED(end, I915_GTT_PAGE_SIZE));
  256. trace_i915_gem_evict_node(vm, target, flags);
  257. /* Retire before we search the active list. Although we have
  258. * reasonable accuracy in our retirement lists, we may have
  259. * a stray pin (preventing eviction) that can only be resolved by
  260. * retiring.
  261. */
  262. if (!(flags & PIN_NONBLOCK))
  263. i915_gem_retire_requests(vm->i915);
  264. check_color = vm->mm.color_adjust;
  265. if (check_color) {
  266. /* Expand search to cover neighbouring guard pages (or lack!) */
  267. if (start)
  268. start -= I915_GTT_PAGE_SIZE;
  269. /* Always look at the page afterwards to avoid the end-of-GTT */
  270. end += I915_GTT_PAGE_SIZE;
  271. }
  272. GEM_BUG_ON(start >= end);
  273. drm_mm_for_each_node_in_range(node, &vm->mm, start, end) {
  274. /* If we find any non-objects (!vma), we cannot evict them */
  275. if (node->color == I915_COLOR_UNEVICTABLE) {
  276. ret = -ENOSPC;
  277. break;
  278. }
  279. GEM_BUG_ON(!node->allocated);
  280. vma = container_of(node, typeof(*vma), node);
  281. /* If we are using coloring to insert guard pages between
  282. * different cache domains within the address space, we have
  283. * to check whether the objects on either side of our range
  284. * abutt and conflict. If they are in conflict, then we evict
  285. * those as well to make room for our guard pages.
  286. */
  287. if (check_color) {
  288. if (node->start + node->size == target->start) {
  289. if (node->color == target->color)
  290. continue;
  291. }
  292. if (node->start == target->start + target->size) {
  293. if (node->color == target->color)
  294. continue;
  295. }
  296. }
  297. if (flags & PIN_NONBLOCK &&
  298. (i915_vma_is_pinned(vma) || i915_vma_is_active(vma))) {
  299. ret = -ENOSPC;
  300. break;
  301. }
  302. if (flags & PIN_NONFAULT && i915_vma_has_userfault(vma)) {
  303. ret = -ENOSPC;
  304. break;
  305. }
  306. /* Overlap of objects in the same batch? */
  307. if (i915_vma_is_pinned(vma)) {
  308. ret = -ENOSPC;
  309. if (vma->exec_flags &&
  310. *vma->exec_flags & EXEC_OBJECT_PINNED)
  311. ret = -EINVAL;
  312. break;
  313. }
  314. /* Never show fear in the face of dragons!
  315. *
  316. * We cannot directly remove this node from within this
  317. * iterator and as with i915_gem_evict_something() we employ
  318. * the vma pin_count in order to prevent the action of
  319. * unbinding one vma from freeing (by dropping its active
  320. * reference) another in our eviction list.
  321. */
  322. __i915_vma_pin(vma);
  323. list_add(&vma->evict_link, &eviction_list);
  324. }
  325. list_for_each_entry_safe(vma, next, &eviction_list, evict_link) {
  326. __i915_vma_unpin(vma);
  327. if (ret == 0)
  328. ret = i915_vma_unbind(vma);
  329. }
  330. return ret;
  331. }
  332. /**
  333. * i915_gem_evict_vm - Evict all idle vmas from a vm
  334. * @vm: Address space to cleanse
  335. *
  336. * This function evicts all vmas from a vm.
  337. *
  338. * This is used by the execbuf code as a last-ditch effort to defragment the
  339. * address space.
  340. *
  341. * To clarify: This is for freeing up virtual address space, not for freeing
  342. * memory in e.g. the shrinker.
  343. */
  344. int i915_gem_evict_vm(struct i915_address_space *vm)
  345. {
  346. struct list_head *phases[] = {
  347. &vm->inactive_list,
  348. &vm->active_list,
  349. NULL
  350. }, **phase;
  351. struct list_head eviction_list;
  352. struct i915_vma *vma, *next;
  353. int ret;
  354. lockdep_assert_held(&vm->i915->drm.struct_mutex);
  355. trace_i915_gem_evict_vm(vm);
  356. /* Switch back to the default context in order to unpin
  357. * the existing context objects. However, such objects only
  358. * pin themselves inside the global GTT and performing the
  359. * switch otherwise is ineffective.
  360. */
  361. if (i915_is_ggtt(vm)) {
  362. ret = ggtt_flush(vm->i915);
  363. if (ret)
  364. return ret;
  365. }
  366. INIT_LIST_HEAD(&eviction_list);
  367. phase = phases;
  368. do {
  369. list_for_each_entry(vma, *phase, vm_link) {
  370. if (i915_vma_is_pinned(vma))
  371. continue;
  372. __i915_vma_pin(vma);
  373. list_add(&vma->evict_link, &eviction_list);
  374. }
  375. } while (*++phase);
  376. ret = 0;
  377. list_for_each_entry_safe(vma, next, &eviction_list, evict_link) {
  378. __i915_vma_unpin(vma);
  379. if (ret == 0)
  380. ret = i915_vma_unbind(vma);
  381. }
  382. return ret;
  383. }
  384. #if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
  385. #include "selftests/i915_gem_evict.c"
  386. #endif