amdgpu_virt.c

/*
 * Copyright 2016 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */

#include "amdgpu.h"

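/**
 * amdgpu_csa_vaddr() - get the virtual address reserved for the static CSA
 * @adev: amdgpu device.
 * The CSA sits at the top of the VM address space: max_pfn converted to a
 * byte address, minus AMDGPU_VA_RESERVED_SIZE, sign-extended across the GMC hole.
 */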
uint64_t amdgpu_csa_vaddr(struct amdgpu_device *adev)
{
	uint64_t addr = adev->vm_manager.max_pfn << AMDGPU_GPU_PAGE_SHIFT;

	addr -= AMDGPU_VA_RESERVED_SIZE;
	addr = amdgpu_gmc_sign_extend(addr);

	return addr;
}

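/**
 * amdgpu_virt_mmio_blocked() - check whether MMIO access is blocked by the hypervisor
 * @adev: amdgpu device.
 * Reads SCRATCH_REG0 bypassing the KIQ; an all-ones readback indicates that
 * MMIO access (other than the mailbox registers) is blocked.
 */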
bool amdgpu_virt_mmio_blocked(struct amdgpu_device *adev)
{
	/* By now all MMIO pages except mailbox are blocked */
	/* if blocking is enabled in hypervisor. Choose the */
	/* SCRATCH_REG0 to test. */
	return RREG32_NO_KIQ(0xc040) == 0xffffffff;
}

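/**
 * amdgpu_allocate_static_csa() - allocate and clear the static CSA buffer object
 * @adev: amdgpu device.
 * Creates an AMDGPU_CSA_SIZE kernel BO in VRAM, records its VMID0 GPU address
 * in adev->virt and zeroes its contents.
 */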
int amdgpu_allocate_static_csa(struct amdgpu_device *adev)
{
	int r;
	void *ptr;

	r = amdgpu_bo_create_kernel(adev, AMDGPU_CSA_SIZE, PAGE_SIZE,
				    AMDGPU_GEM_DOMAIN_VRAM, &adev->virt.csa_obj,
				    &adev->virt.csa_vmid0_addr, &ptr);
	if (r)
		return r;

	memset(ptr, 0, AMDGPU_CSA_SIZE);
	return 0;
}

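/**
 * amdgpu_free_static_csa() - free the static CSA buffer object
 * @adev: amdgpu device.
 */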
void amdgpu_free_static_csa(struct amdgpu_device *adev)
{
	amdgpu_bo_free_kernel(&adev->virt.csa_obj,
			      &adev->virt.csa_vmid0_addr,
			      NULL);
}

/*
 * amdgpu_map_static_csa() should be called during amdgpu_vm_init();
 * it maps the virtual address amdgpu_csa_vaddr() into this VM. Each GFX
 * command submission should use this virtual address within the META_DATA
 * init package to support SR-IOV GFX preemption.
 */
int amdgpu_map_static_csa(struct amdgpu_device *adev, struct amdgpu_vm *vm,
			  struct amdgpu_bo_va **bo_va)
{
	uint64_t csa_addr = amdgpu_csa_vaddr(adev) & AMDGPU_GMC_HOLE_MASK;
	struct ww_acquire_ctx ticket;
	struct list_head list;
	struct amdgpu_bo_list_entry pd;
	struct ttm_validate_buffer csa_tv;
	int r;

	INIT_LIST_HEAD(&list);
	INIT_LIST_HEAD(&csa_tv.head);
	csa_tv.bo = &adev->virt.csa_obj->tbo;
	csa_tv.shared = true;

	list_add(&csa_tv.head, &list);
	amdgpu_vm_get_pd_bo(vm, &list, &pd);

	r = ttm_eu_reserve_buffers(&ticket, &list, true, NULL);
	if (r) {
		DRM_ERROR("failed to reserve CSA,PD BOs: err=%d\n", r);
		return r;
	}

	*bo_va = amdgpu_vm_bo_add(adev, vm, adev->virt.csa_obj);
	if (!*bo_va) {
		ttm_eu_backoff_reservation(&ticket, &list);
		DRM_ERROR("failed to create bo_va for static CSA\n");
		return -ENOMEM;
	}

	r = amdgpu_vm_alloc_pts(adev, (*bo_va)->base.vm, csa_addr,
				AMDGPU_CSA_SIZE);
	if (r) {
		DRM_ERROR("failed to allocate pts for static CSA, err=%d\n", r);
		amdgpu_vm_bo_rmv(adev, *bo_va);
		ttm_eu_backoff_reservation(&ticket, &list);
		return r;
	}

	r = amdgpu_vm_bo_map(adev, *bo_va, csa_addr, 0, AMDGPU_CSA_SIZE,
			     AMDGPU_PTE_READABLE | AMDGPU_PTE_WRITEABLE |
			     AMDGPU_PTE_EXECUTABLE);
	if (r) {
		DRM_ERROR("failed to do bo_map on static CSA, err=%d\n", r);
		amdgpu_vm_bo_rmv(adev, *bo_va);
		ttm_eu_backoff_reservation(&ticket, &list);
		return r;
	}

	ttm_eu_backoff_reservation(&ticket, &list);
	return 0;
}

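/**
 * amdgpu_virt_init_setting() - apply SR-IOV guest defaults
 * @adev: amdgpu device.
 * Enables virtual display with a single CRTC and clears the clockgating and
 * powergating flags.
 */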
void amdgpu_virt_init_setting(struct amdgpu_device *adev)
{
	/* enable virtual display */
	adev->mode_info.num_crtc = 1;
	adev->enable_virtual_display = true;
	adev->cg_flags = 0;
	adev->pg_flags = 0;
}

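/**
 * amdgpu_virt_kiq_rreg() - read a register through the KIQ ring
 * @adev: amdgpu device.
 * @reg: register offset to read.
 * Emits a read-register packet on the KIQ ring and polls its fence; the
 * result is picked up from the writeback slot at adev->virt.reg_val_offs.
 * Return: the register value, or ~0 on failure.
 */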
uint32_t amdgpu_virt_kiq_rreg(struct amdgpu_device *adev, uint32_t reg)
{
	signed long r, cnt = 0;
	unsigned long flags;
	uint32_t seq;
	struct amdgpu_kiq *kiq = &adev->gfx.kiq;
	struct amdgpu_ring *ring = &kiq->ring;

	BUG_ON(!ring->funcs->emit_rreg);

	spin_lock_irqsave(&kiq->ring_lock, flags);
	amdgpu_ring_alloc(ring, 32);
	amdgpu_ring_emit_rreg(ring, reg);
	amdgpu_fence_emit_polling(ring, &seq);
	amdgpu_ring_commit(ring);
	spin_unlock_irqrestore(&kiq->ring_lock, flags);

	r = amdgpu_fence_wait_polling(ring, seq, MAX_KIQ_REG_WAIT);

	/* Don't wait any longer in the GPU reset case: this path may be
	 * triggered from TTM, and ttm_bo_lock_delayed_workqueue() would
	 * never return if we kept waiting here, hanging gpu_recover().
	 *
	 * Also don't wait any longer when called from IRQ context.
	 */
	if (r < 1 && (adev->in_gpu_reset || in_interrupt()))
		goto failed_kiq_read;

	might_sleep();
	while (r < 1 && cnt++ < MAX_KIQ_REG_TRY) {
		msleep(MAX_KIQ_REG_BAILOUT_INTERVAL);
		r = amdgpu_fence_wait_polling(ring, seq, MAX_KIQ_REG_WAIT);
	}

	if (cnt > MAX_KIQ_REG_TRY)
		goto failed_kiq_read;

	return adev->wb.wb[adev->virt.reg_val_offs];

failed_kiq_read:
	pr_err("failed to read reg:%x\n", reg);
	return ~0;
}

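/**
 * amdgpu_virt_kiq_wreg() - write a register through the KIQ ring
 * @adev: amdgpu device.
 * @reg: register offset to write.
 * @v: value to write.
 * Emits a write-register packet on the KIQ ring and polls its fence for
 * completion, with the same reset/IRQ bail-out rules as amdgpu_virt_kiq_rreg().
 */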
void amdgpu_virt_kiq_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v)
{
	signed long r, cnt = 0;
	unsigned long flags;
	uint32_t seq;
	struct amdgpu_kiq *kiq = &adev->gfx.kiq;
	struct amdgpu_ring *ring = &kiq->ring;

	BUG_ON(!ring->funcs->emit_wreg);

	spin_lock_irqsave(&kiq->ring_lock, flags);
	amdgpu_ring_alloc(ring, 32);
	amdgpu_ring_emit_wreg(ring, reg, v);
	amdgpu_fence_emit_polling(ring, &seq);
	amdgpu_ring_commit(ring);
	spin_unlock_irqrestore(&kiq->ring_lock, flags);

	r = amdgpu_fence_wait_polling(ring, seq, MAX_KIQ_REG_WAIT);

	/* Don't wait any longer in the GPU reset case: this path may be
	 * triggered from TTM, and ttm_bo_lock_delayed_workqueue() would
	 * never return if we kept waiting here, hanging gpu_recover().
	 *
	 * Also don't wait any longer when called from IRQ context.
	 */
	if (r < 1 && (adev->in_gpu_reset || in_interrupt()))
		goto failed_kiq_write;

	might_sleep();
	while (r < 1 && cnt++ < MAX_KIQ_REG_TRY) {
		msleep(MAX_KIQ_REG_BAILOUT_INTERVAL);
		r = amdgpu_fence_wait_polling(ring, seq, MAX_KIQ_REG_WAIT);
	}

	if (cnt > MAX_KIQ_REG_TRY)
		goto failed_kiq_write;

	return;

failed_kiq_write:
	pr_err("failed to write reg:%x\n", reg);
}

/**
 * amdgpu_virt_request_full_gpu() - request full gpu access
 * @adev: amdgpu device.
 * @init: is driver init time.
 * When starting to init/fini the driver, full gpu access must be requested first.
 * Return: Zero on success, otherwise an error code.
 */
int amdgpu_virt_request_full_gpu(struct amdgpu_device *adev, bool init)
{
	struct amdgpu_virt *virt = &adev->virt;
	int r;

	if (virt->ops && virt->ops->req_full_gpu) {
		r = virt->ops->req_full_gpu(adev, init);
		if (r)
			return r;

		adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
	}

	return 0;
}

/**
 * amdgpu_virt_release_full_gpu() - release full gpu access
 * @adev: amdgpu device.
 * @init: is driver init time.
 * When driver init/fini finishes, full gpu access must be released.
 * Return: Zero on success, otherwise an error code.
 */
int amdgpu_virt_release_full_gpu(struct amdgpu_device *adev, bool init)
{
	struct amdgpu_virt *virt = &adev->virt;
	int r;

	if (virt->ops && virt->ops->rel_full_gpu) {
		r = virt->ops->rel_full_gpu(adev, init);
		if (r)
			return r;

		adev->virt.caps |= AMDGPU_SRIOV_CAPS_RUNTIME;
	}

	return 0;
}

/**
 * amdgpu_virt_reset_gpu() - reset gpu
 * @adev: amdgpu device.
 * Send a reset command to the GPU hypervisor to reset the GPU that the VM is using.
 * Return: Zero on success, otherwise an error code.
 */
int amdgpu_virt_reset_gpu(struct amdgpu_device *adev)
{
	struct amdgpu_virt *virt = &adev->virt;
	int r;

	if (virt->ops && virt->ops->reset_gpu) {
		r = virt->ops->reset_gpu(adev);
		if (r)
			return r;

		adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
	}

	return 0;
}

/**
 * amdgpu_virt_wait_reset() - wait for gpu reset to complete
 * @adev: amdgpu device.
 * Wait for the GPU reset to complete.
 * Return: Zero on success, otherwise an error code.
 */
int amdgpu_virt_wait_reset(struct amdgpu_device *adev)
{
	struct amdgpu_virt *virt = &adev->virt;

	if (!virt->ops || !virt->ops->wait_reset)
		return -EINVAL;

	return virt->ops->wait_reset(adev);
}

/**
 * amdgpu_virt_alloc_mm_table() - alloc memory for mm table
 * @adev: amdgpu device.
 * The MM table is used by UVD and VCE for their initialization.
 * Return: Zero on success, otherwise an error code.
 */
int amdgpu_virt_alloc_mm_table(struct amdgpu_device *adev)
{
	int r;

	if (!amdgpu_sriov_vf(adev) || adev->virt.mm_table.gpu_addr)
		return 0;

	r = amdgpu_bo_create_kernel(adev, PAGE_SIZE, PAGE_SIZE,
				    AMDGPU_GEM_DOMAIN_VRAM,
				    &adev->virt.mm_table.bo,
				    &adev->virt.mm_table.gpu_addr,
				    (void *)&adev->virt.mm_table.cpu_addr);
	if (r) {
		DRM_ERROR("failed to alloc mm table and error = %d.\n", r);
		return r;
	}

	memset((void *)adev->virt.mm_table.cpu_addr, 0, PAGE_SIZE);
	DRM_INFO("MM table gpu addr = 0x%llx, cpu addr = %p.\n",
		 adev->virt.mm_table.gpu_addr,
		 adev->virt.mm_table.cpu_addr);
	return 0;
}

/**
 * amdgpu_virt_free_mm_table() - free mm table memory
 * @adev: amdgpu device.
 * Free the MM table memory.
 */
void amdgpu_virt_free_mm_table(struct amdgpu_device *adev)
{
	if (!amdgpu_sriov_vf(adev) || !adev->virt.mm_table.gpu_addr)
		return;

	amdgpu_bo_free_kernel(&adev->virt.mm_table.bo,
			      &adev->virt.mm_table.gpu_addr,
			      (void *)&adev->virt.mm_table.cpu_addr);
	adev->virt.mm_table.gpu_addr = 0;
}

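/**
 * amdgpu_virt_fw_reserve_get_checksum() - compute the pf2vf/vf2pf checksum
 * @obj: exchange structure to checksum.
 * @obj_size: size of the structure in bytes.
 * @key: checksum key shared with the host.
 * @chksum: checksum value already stored in the structure; its bytes are
 *          subtracted back out so the stored checksum does not count itself.
 * Return: the byte-sum checksum seeded with @key.
 */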
int amdgpu_virt_fw_reserve_get_checksum(void *obj,
					unsigned long obj_size,
					unsigned int key,
					unsigned int chksum)
{
	unsigned int ret = key;
	unsigned long i = 0;
	unsigned char *pos;

	pos = (unsigned char *)obj;
	/* calculate checksum */
	for (i = 0; i < obj_size; ++i)
		ret += *(pos + i);
	/* minus the chksum itself */
	pos = (unsigned char *)&chksum;
	for (i = 0; i < sizeof(chksum); ++i)
		ret -= *(pos + i);
	return ret;
}

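/**
 * amdgpu_virt_init_data_exchange() - set up the pf2vf/vf2pf data exchange region
 * @adev: amdgpu device.
 * Locates the pf2vf header in the firmware-reserved VRAM, validates its size
 * and checksum, then initializes the vf2pf area that follows it with the
 * driver version and a freshly computed checksum.
 */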
void amdgpu_virt_init_data_exchange(struct amdgpu_device *adev)
{
	uint32_t pf2vf_size = 0;
	uint32_t checksum = 0;
	uint32_t checkval;
	char *str;

	adev->virt.fw_reserve.p_pf2vf = NULL;
	adev->virt.fw_reserve.p_vf2pf = NULL;

	if (adev->fw_vram_usage.va != NULL) {
		adev->virt.fw_reserve.p_pf2vf =
			(struct amdgim_pf2vf_info_header *)(
			adev->fw_vram_usage.va + AMDGIM_DATAEXCHANGE_OFFSET);
		AMDGPU_FW_VRAM_PF2VF_READ(adev, header.size, &pf2vf_size);
		AMDGPU_FW_VRAM_PF2VF_READ(adev, checksum, &checksum);
		AMDGPU_FW_VRAM_PF2VF_READ(adev, feature_flags, &adev->virt.gim_feature);

		/* pf2vf message must be in 4K */
		if (pf2vf_size > 0 && pf2vf_size < 4096) {
			checkval = amdgpu_virt_fw_reserve_get_checksum(
				adev->virt.fw_reserve.p_pf2vf, pf2vf_size,
				adev->virt.fw_reserve.checksum_key, checksum);
			if (checkval == checksum) {
				adev->virt.fw_reserve.p_vf2pf =
					((void *)adev->virt.fw_reserve.p_pf2vf +
					pf2vf_size);
				memset((void *)adev->virt.fw_reserve.p_vf2pf, 0,
					sizeof(amdgim_vf2pf_info));
				AMDGPU_FW_VRAM_VF2PF_WRITE(adev, header.version,
					AMDGPU_FW_VRAM_VF2PF_VER);
				AMDGPU_FW_VRAM_VF2PF_WRITE(adev, header.size,
					sizeof(amdgim_vf2pf_info));
				AMDGPU_FW_VRAM_VF2PF_READ(adev, driver_version,
					&str);
#ifdef MODULE
				if (THIS_MODULE->version != NULL)
					strcpy(str, THIS_MODULE->version);
				else
#endif
					strcpy(str, "N/A");
				AMDGPU_FW_VRAM_VF2PF_WRITE(adev, driver_cert,
					0);
				AMDGPU_FW_VRAM_VF2PF_WRITE(adev, checksum,
					amdgpu_virt_fw_reserve_get_checksum(
					adev->virt.fw_reserve.p_vf2pf,
					pf2vf_size,
					adev->virt.fw_reserve.checksum_key, 0));
			}
		}
	}
}