intel_workarounds.c

/*
 * SPDX-License-Identifier: MIT
 *
 * Copyright © 2018 Intel Corporation
 */

#include "../i915_selftest.h"

#include "mock_context.h"
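
/*
 * Submit a request on @engine that uses MI_STORE_REGISTER_MEM to copy each
 * RING_FORCE_TO_NONPRIV slot into a freshly allocated scratch buffer, and
 * return that buffer so the caller can inspect the values the hardware
 * currently holds in the whitelist registers.
 */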
static struct drm_i915_gem_object *
read_nonprivs(struct i915_gem_context *ctx, struct intel_engine_cs *engine)
{
	struct drm_i915_gem_object *result;
	struct i915_request *rq;
	struct i915_vma *vma;
	const u32 base = engine->mmio_base;
	u32 srm, *cs;
	int err;
	int i;

	result = i915_gem_object_create_internal(engine->i915, PAGE_SIZE);
	if (IS_ERR(result))
		return result;

	i915_gem_object_set_cache_level(result, I915_CACHE_LLC);

	cs = i915_gem_object_pin_map(result, I915_MAP_WB);
	if (IS_ERR(cs)) {
		err = PTR_ERR(cs);
		goto err_obj;
	}
	memset(cs, 0xc5, PAGE_SIZE);
	i915_gem_object_unpin_map(result);

	vma = i915_vma_instance(result, &engine->i915->ggtt.base, NULL);
	if (IS_ERR(vma)) {
		err = PTR_ERR(vma);
		goto err_obj;
	}

	err = i915_vma_pin(vma, 0, 0, PIN_GLOBAL);
	if (err)
		goto err_obj;

	rq = i915_request_alloc(engine, ctx);
	if (IS_ERR(rq)) {
		err = PTR_ERR(rq);
		goto err_pin;
	}

	srm = MI_STORE_REGISTER_MEM | MI_SRM_LRM_GLOBAL_GTT;
	if (INTEL_GEN(ctx->i915) >= 8)
		srm++;

	cs = intel_ring_begin(rq, 4 * RING_MAX_NONPRIV_SLOTS);
	if (IS_ERR(cs)) {
		err = PTR_ERR(cs);
		goto err_req;
	}

	for (i = 0; i < RING_MAX_NONPRIV_SLOTS; i++) {
		*cs++ = srm;
		*cs++ = i915_mmio_reg_offset(RING_FORCE_TO_NONPRIV(base, i));
		*cs++ = i915_ggtt_offset(vma) + sizeof(u32) * i;
		*cs++ = 0;
	}
	intel_ring_advance(rq, cs);

	i915_vma_move_to_active(vma, rq, EXEC_OBJECT_WRITE);
	reservation_object_lock(vma->resv, NULL);
	reservation_object_add_excl_fence(vma->resv, &rq->fence);
	reservation_object_unlock(vma->resv);

	i915_gem_object_get(result);
	i915_gem_object_set_active_reference(result);

	__i915_request_add(rq, true);
	i915_vma_unpin(vma);

	return result;

err_req:
	i915_request_add(rq);
err_pin:
	i915_vma_unpin(vma);
err_obj:
	i915_gem_object_put(result);
	return ERR_PTR(err);
}
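
/*
 * struct whitelist is supplied by the workarounds code (not defined in this
 * file); as used below it carries the whitelisted registers in reg[], the
 * number of valid entries in count, and in nopid the value an unused
 * RING_FORCE_TO_NONPRIV slot is expected to read back as.
 */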
static u32 get_whitelist_reg(const struct whitelist *w, unsigned int i)
{
	return i < w->count ? i915_mmio_reg_offset(w->reg[i]) : w->nopid;
}

static void print_results(const struct whitelist *w, const u32 *results)
{
	unsigned int i;

	for (i = 0; i < RING_MAX_NONPRIV_SLOTS; i++) {
		u32 expected = get_whitelist_reg(w, i);
		u32 actual = results[i];

		pr_info("RING_NONPRIV[%d]: expected 0x%08x, found 0x%08x\n",
			i, expected, actual);
	}
}
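
/*
 * Read the RING_FORCE_TO_NONPRIV slots back from the GPU in @ctx and check
 * that every slot still holds the register offset the whitelist expects
 * (or the nopid value for unused slots).
 */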
static int check_whitelist(const struct whitelist *w,
			   struct i915_gem_context *ctx,
			   struct intel_engine_cs *engine)
{
	struct drm_i915_gem_object *results;
	u32 *vaddr;
	int err;
	int i;

	results = read_nonprivs(ctx, engine);
	if (IS_ERR(results))
		return PTR_ERR(results);

	err = i915_gem_object_set_to_cpu_domain(results, false);
	if (err)
		goto out_put;

	vaddr = i915_gem_object_pin_map(results, I915_MAP_WB);
	if (IS_ERR(vaddr)) {
		err = PTR_ERR(vaddr);
		goto out_put;
	}

	for (i = 0; i < RING_MAX_NONPRIV_SLOTS; i++) {
		u32 expected = get_whitelist_reg(w, i);
		u32 actual = vaddr[i];

		if (expected != actual) {
			print_results(w, vaddr);
			pr_err("Invalid RING_NONPRIV[%d], expected 0x%08x, found 0x%08x\n",
			       i, expected, actual);

			err = -EINVAL;
			break;
		}
	}

	i915_gem_object_unpin_map(results);
out_put:
	i915_gem_object_put(results);
	return err;
}
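
/*
 * The two reset flavours under test: a full device (GPU) reset and a
 * single-engine reset.
 */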
static int do_device_reset(struct intel_engine_cs *engine)
{
	i915_reset(engine->i915, ENGINE_MASK(engine->id), NULL);
	return 0;
}

static int do_engine_reset(struct intel_engine_cs *engine)
{
	return i915_reset_engine(engine, NULL);
}
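
/*
 * Queue a request on a throwaway kernel context so that the engine is not
 * sitting in the context being checked when the reset is triggered.
 */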
static int switch_to_scratch_context(struct intel_engine_cs *engine)
{
	struct i915_gem_context *ctx;
	struct i915_request *rq;

	ctx = kernel_context(engine->i915);
	if (IS_ERR(ctx))
		return PTR_ERR(ctx);

	rq = i915_request_alloc(engine, ctx);

	kernel_context_close(ctx);

	if (IS_ERR(rq))
		return PTR_ERR(rq);

	i915_request_add(rq);

	return 0;
}
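
/*
 * Verify the whitelist before the reset, switch the engine to a scratch
 * context, perform the reset, then verify the whitelist again both in the
 * original context and in a freshly created one.
 */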
static int check_whitelist_across_reset(struct intel_engine_cs *engine,
					int (*reset)(struct intel_engine_cs *),
					const struct whitelist *w,
					const char *name)
{
	struct i915_gem_context *ctx;
	int err;

	ctx = kernel_context(engine->i915);
	if (IS_ERR(ctx))
		return PTR_ERR(ctx);

	err = check_whitelist(w, ctx, engine);
	if (err) {
		pr_err("Invalid whitelist *before* %s reset!\n", name);
		goto out;
	}

	err = switch_to_scratch_context(engine);
	if (err)
		goto out;

	err = reset(engine);
	if (err) {
		pr_err("%s reset failed\n", name);
		goto out;
	}

	err = check_whitelist(w, ctx, engine);
	if (err) {
		pr_err("Whitelist not preserved in context across %s reset!\n",
		       name);
		goto out;
	}

	kernel_context_close(ctx);

	ctx = kernel_context(engine->i915);
	if (IS_ERR(ctx))
		return PTR_ERR(ctx);

	err = check_whitelist(w, ctx, engine);
	if (err) {
		pr_err("Invalid whitelist *after* %s reset in fresh context!\n",
		       name);
		goto out;
	}

out:
	kernel_context_close(ctx);
	return err;
}

static int live_reset_whitelist(void *arg)
{
	struct drm_i915_private *i915 = arg;
	struct intel_engine_cs *engine = i915->engine[RCS];
	struct i915_gpu_error *error = &i915->gpu_error;
	struct whitelist w;
	int err = 0;

	/* If we reset the gpu, we should not lose the RING_NONPRIV */

	if (!engine)
		return 0;

	if (!whitelist_build(engine, &w))
		return 0;

	pr_info("Checking %d whitelisted registers (RING_NONPRIV)\n", w.count);

	set_bit(I915_RESET_BACKOFF, &error->flags);
	set_bit(I915_RESET_ENGINE + engine->id, &error->flags);

	if (intel_has_reset_engine(i915)) {
		err = check_whitelist_across_reset(engine,
						   do_engine_reset, &w,
						   "engine");
		if (err)
			goto out;
	}

	if (intel_has_gpu_reset(i915)) {
		err = check_whitelist_across_reset(engine,
						   do_device_reset, &w,
						   "device");
		if (err)
			goto out;
	}

out:
	clear_bit(I915_RESET_ENGINE + engine->id, &error->flags);
	clear_bit(I915_RESET_BACKOFF, &error->flags);

	return err;
}
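
/* Entry point: run the live subtests with struct_mutex held. */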
int intel_workarounds_live_selftests(struct drm_i915_private *i915)
{
	static const struct i915_subtest tests[] = {
		SUBTEST(live_reset_whitelist),
	};
	int err;

	mutex_lock(&i915->drm.struct_mutex);
	err = i915_subtests(tests, i915);
	mutex_unlock(&i915->drm.struct_mutex);

	return err;
}