vce_v3_0.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521
  1. /*
  2. * Copyright 2014 Advanced Micro Devices, Inc.
  3. * All Rights Reserved.
  4. *
  5. * Permission is hereby granted, free of charge, to any person obtaining a
  6. * copy of this software and associated documentation files (the
  7. * "Software"), to deal in the Software without restriction, including
  8. * without limitation the rights to use, copy, modify, merge, publish,
  9. * distribute, sub license, and/or sell copies of the Software, and to
  10. * permit persons to whom the Software is furnished to do so, subject to
  11. * the following conditions:
  12. *
  13. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  14. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  15. * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
  16. * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
  17. * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  18. * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
  19. * USE OR OTHER DEALINGS IN THE SOFTWARE.
  20. *
  21. * The above copyright notice and this permission notice (including the
  22. * next paragraph) shall be included in all copies or substantial portions
  23. * of the Software.
  24. *
  25. * Authors: Christian König <christian.koenig@amd.com>
  26. */
  27. #include <linux/firmware.h>
  28. #include <drm/drmP.h>
  29. #include "amdgpu.h"
  30. #include "amdgpu_vce.h"
  31. #include "vid.h"
  32. #include "vce/vce_3_0_d.h"
  33. #include "vce/vce_3_0_sh_mask.h"
  34. #include "oss/oss_2_0_d.h"
  35. #include "oss/oss_2_0_sh_mask.h"
  36. static void vce_v3_0_mc_resume(struct amdgpu_device *adev);
  37. static void vce_v3_0_set_ring_funcs(struct amdgpu_device *adev);
  38. static void vce_v3_0_set_irq_funcs(struct amdgpu_device *adev);
  39. /**
  40. * vce_v3_0_ring_get_rptr - get read pointer
  41. *
  42. * @ring: amdgpu_ring pointer
  43. *
  44. * Returns the current hardware read pointer
  45. */
  46. static uint32_t vce_v3_0_ring_get_rptr(struct amdgpu_ring *ring)
  47. {
  48. struct amdgpu_device *adev = ring->adev;
  49. if (ring == &adev->vce.ring[0])
  50. return RREG32(mmVCE_RB_RPTR);
  51. else
  52. return RREG32(mmVCE_RB_RPTR2);
  53. }
  54. /**
  55. * vce_v3_0_ring_get_wptr - get write pointer
  56. *
  57. * @ring: amdgpu_ring pointer
  58. *
  59. * Returns the current hardware write pointer
  60. */
  61. static uint32_t vce_v3_0_ring_get_wptr(struct amdgpu_ring *ring)
  62. {
  63. struct amdgpu_device *adev = ring->adev;
  64. if (ring == &adev->vce.ring[0])
  65. return RREG32(mmVCE_RB_WPTR);
  66. else
  67. return RREG32(mmVCE_RB_WPTR2);
  68. }
  69. /**
  70. * vce_v3_0_ring_set_wptr - set write pointer
  71. *
  72. * @ring: amdgpu_ring pointer
  73. *
  74. * Commits the write pointer to the hardware
  75. */
  76. static void vce_v3_0_ring_set_wptr(struct amdgpu_ring *ring)
  77. {
  78. struct amdgpu_device *adev = ring->adev;
  79. if (ring == &adev->vce.ring[0])
  80. WREG32(mmVCE_RB_WPTR, ring->wptr);
  81. else
  82. WREG32(mmVCE_RB_WPTR2, ring->wptr);
  83. }
  84. /**
  85. * vce_v3_0_start - start VCE block
  86. *
  87. * @adev: amdgpu_device pointer
  88. *
  89. * Setup and start the VCE block
  90. */
  91. static int vce_v3_0_start(struct amdgpu_device *adev)
  92. {
  93. struct amdgpu_ring *ring;
  94. int i, j, r;
  95. vce_v3_0_mc_resume(adev);
  96. /* set BUSY flag */
  97. WREG32_P(mmVCE_STATUS, 1, ~1);
  98. ring = &adev->vce.ring[0];
  99. WREG32(mmVCE_RB_RPTR, ring->wptr);
  100. WREG32(mmVCE_RB_WPTR, ring->wptr);
  101. WREG32(mmVCE_RB_BASE_LO, ring->gpu_addr);
  102. WREG32(mmVCE_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
  103. WREG32(mmVCE_RB_SIZE, ring->ring_size / 4);
  104. ring = &adev->vce.ring[1];
  105. WREG32(mmVCE_RB_RPTR2, ring->wptr);
  106. WREG32(mmVCE_RB_WPTR2, ring->wptr);
  107. WREG32(mmVCE_RB_BASE_LO2, ring->gpu_addr);
  108. WREG32(mmVCE_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
  109. WREG32(mmVCE_RB_SIZE2, ring->ring_size / 4);
  110. WREG32_P(mmVCE_VCPU_CNTL, VCE_VCPU_CNTL__CLK_EN_MASK, ~VCE_VCPU_CNTL__CLK_EN_MASK);
  111. WREG32_P(mmVCE_SOFT_RESET,
  112. VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK,
  113. ~VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK);
  114. mdelay(100);
  115. WREG32_P(mmVCE_SOFT_RESET, 0, ~VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK);
  116. for (i = 0; i < 10; ++i) {
  117. uint32_t status;
  118. for (j = 0; j < 100; ++j) {
  119. status = RREG32(mmVCE_STATUS);
  120. if (status & 2)
  121. break;
  122. mdelay(10);
  123. }
  124. r = 0;
  125. if (status & 2)
  126. break;
  127. DRM_ERROR("VCE not responding, trying to reset the ECPU!!!\n");
  128. WREG32_P(mmVCE_SOFT_RESET, VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK,
  129. ~VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK);
  130. mdelay(10);
  131. WREG32_P(mmVCE_SOFT_RESET, 0, ~VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK);
  132. mdelay(10);
  133. r = -1;
  134. }
  135. /* clear BUSY flag */
  136. WREG32_P(mmVCE_STATUS, 0, ~1);
  137. if (r) {
  138. DRM_ERROR("VCE not responding, giving up!!!\n");
  139. return r;
  140. }
  141. return 0;
  142. }
  143. static int vce_v3_0_early_init(struct amdgpu_device *adev)
  144. {
  145. vce_v3_0_set_ring_funcs(adev);
  146. vce_v3_0_set_irq_funcs(adev);
  147. return 0;
  148. }
  149. static int vce_v3_0_sw_init(struct amdgpu_device *adev)
  150. {
  151. struct amdgpu_ring *ring;
  152. int r;
  153. /* VCE */
  154. r = amdgpu_irq_add_id(adev, 167, &adev->vce.irq);
  155. if (r)
  156. return r;
  157. r = amdgpu_vce_sw_init(adev);
  158. if (r)
  159. return r;
  160. r = amdgpu_vce_resume(adev);
  161. if (r)
  162. return r;
  163. ring = &adev->vce.ring[0];
  164. sprintf(ring->name, "vce0");
  165. r = amdgpu_ring_init(adev, ring, 4096, VCE_CMD_NO_OP, 0xf,
  166. &adev->vce.irq, 0, AMDGPU_RING_TYPE_VCE);
  167. if (r)
  168. return r;
  169. ring = &adev->vce.ring[1];
  170. sprintf(ring->name, "vce1");
  171. r = amdgpu_ring_init(adev, ring, 4096, VCE_CMD_NO_OP, 0xf,
  172. &adev->vce.irq, 0, AMDGPU_RING_TYPE_VCE);
  173. if (r)
  174. return r;
  175. return r;
  176. }
  177. static int vce_v3_0_sw_fini(struct amdgpu_device *adev)
  178. {
  179. int r;
  180. r = amdgpu_vce_suspend(adev);
  181. if (r)
  182. return r;
  183. r = amdgpu_vce_sw_fini(adev);
  184. if (r)
  185. return r;
  186. return r;
  187. }
  188. static int vce_v3_0_hw_init(struct amdgpu_device *adev)
  189. {
  190. struct amdgpu_ring *ring;
  191. int r;
  192. r = vce_v3_0_start(adev);
  193. if (r)
  194. return r;
  195. ring = &adev->vce.ring[0];
  196. ring->ready = true;
  197. r = amdgpu_ring_test_ring(ring);
  198. if (r) {
  199. ring->ready = false;
  200. return r;
  201. }
  202. ring = &adev->vce.ring[1];
  203. ring->ready = true;
  204. r = amdgpu_ring_test_ring(ring);
  205. if (r) {
  206. ring->ready = false;
  207. return r;
  208. }
  209. DRM_INFO("VCE initialized successfully.\n");
  210. return 0;
  211. }
  212. static int vce_v3_0_hw_fini(struct amdgpu_device *adev)
  213. {
  214. // TODO
  215. return 0;
  216. }
  217. static int vce_v3_0_suspend(struct amdgpu_device *adev)
  218. {
  219. int r;
  220. r = vce_v3_0_hw_fini(adev);
  221. if (r)
  222. return r;
  223. r = amdgpu_vce_suspend(adev);
  224. if (r)
  225. return r;
  226. return r;
  227. }
  228. static int vce_v3_0_resume(struct amdgpu_device *adev)
  229. {
  230. int r;
  231. r = amdgpu_vce_resume(adev);
  232. if (r)
  233. return r;
  234. r = vce_v3_0_hw_init(adev);
  235. if (r)
  236. return r;
  237. return r;
  238. }
  239. static void vce_v3_0_mc_resume(struct amdgpu_device *adev)
  240. {
  241. uint32_t offset, size;
  242. WREG32_P(mmVCE_CLOCK_GATING_A, 0, ~(1 << 16));
  243. WREG32_P(mmVCE_UENC_CLOCK_GATING, 0x1FF000, ~0xFF9FF000);
  244. WREG32_P(mmVCE_UENC_REG_CLOCK_GATING, 0x3F, ~0x3F);
  245. WREG32(mmVCE_CLOCK_GATING_B, 0xf7);
  246. WREG32(mmVCE_LMI_CTRL, 0x00398000);
  247. WREG32_P(mmVCE_LMI_CACHE_CTRL, 0x0, ~0x1);
  248. WREG32(mmVCE_LMI_SWAP_CNTL, 0);
  249. WREG32(mmVCE_LMI_SWAP_CNTL1, 0);
  250. WREG32(mmVCE_LMI_VM_CTRL, 0);
  251. WREG32(mmVCE_LMI_VCPU_CACHE_40BIT_BAR, (adev->vce.gpu_addr >> 8));
  252. offset = AMDGPU_VCE_FIRMWARE_OFFSET;
  253. size = AMDGPU_GPU_PAGE_ALIGN(adev->vce.fw->size);
  254. WREG32(mmVCE_VCPU_CACHE_OFFSET0, offset & 0x7fffffff);
  255. WREG32(mmVCE_VCPU_CACHE_SIZE0, size);
  256. offset += size;
  257. size = AMDGPU_VCE_STACK_SIZE;
  258. WREG32(mmVCE_VCPU_CACHE_OFFSET1, offset & 0x7fffffff);
  259. WREG32(mmVCE_VCPU_CACHE_SIZE1, size);
  260. offset += size;
  261. size = AMDGPU_VCE_HEAP_SIZE;
  262. WREG32(mmVCE_VCPU_CACHE_OFFSET2, offset & 0x7fffffff);
  263. WREG32(mmVCE_VCPU_CACHE_SIZE2, size);
  264. WREG32_P(mmVCE_LMI_CTRL2, 0x0, ~0x100);
  265. WREG32_P(mmVCE_SYS_INT_EN, VCE_SYS_INT_EN__VCE_SYS_INT_TRAP_INTERRUPT_EN_MASK,
  266. ~VCE_SYS_INT_EN__VCE_SYS_INT_TRAP_INTERRUPT_EN_MASK);
  267. }
  268. static bool vce_v3_0_is_idle(struct amdgpu_device *adev)
  269. {
  270. return !(RREG32(mmSRBM_STATUS2) & SRBM_STATUS2__VCE_BUSY_MASK);
  271. }
  272. static int vce_v3_0_wait_for_idle(struct amdgpu_device *adev)
  273. {
  274. unsigned i;
  275. for (i = 0; i < adev->usec_timeout; i++) {
  276. if (!(RREG32(mmSRBM_STATUS2) & SRBM_STATUS2__VCE_BUSY_MASK))
  277. return 0;
  278. }
  279. return -ETIMEDOUT;
  280. }
  281. static int vce_v3_0_soft_reset(struct amdgpu_device *adev)
  282. {
  283. WREG32_P(mmSRBM_SOFT_RESET, SRBM_SOFT_RESET__SOFT_RESET_VCE_MASK,
  284. ~SRBM_SOFT_RESET__SOFT_RESET_VCE_MASK);
  285. mdelay(5);
  286. return vce_v3_0_start(adev);
  287. }
  288. static void vce_v3_0_print_status(struct amdgpu_device *adev)
  289. {
  290. dev_info(adev->dev, "VCE 3.0 registers\n");
  291. dev_info(adev->dev, " VCE_STATUS=0x%08X\n",
  292. RREG32(mmVCE_STATUS));
  293. dev_info(adev->dev, " VCE_VCPU_CNTL=0x%08X\n",
  294. RREG32(mmVCE_VCPU_CNTL));
  295. dev_info(adev->dev, " VCE_VCPU_CACHE_OFFSET0=0x%08X\n",
  296. RREG32(mmVCE_VCPU_CACHE_OFFSET0));
  297. dev_info(adev->dev, " VCE_VCPU_CACHE_SIZE0=0x%08X\n",
  298. RREG32(mmVCE_VCPU_CACHE_SIZE0));
  299. dev_info(adev->dev, " VCE_VCPU_CACHE_OFFSET1=0x%08X\n",
  300. RREG32(mmVCE_VCPU_CACHE_OFFSET1));
  301. dev_info(adev->dev, " VCE_VCPU_CACHE_SIZE1=0x%08X\n",
  302. RREG32(mmVCE_VCPU_CACHE_SIZE1));
  303. dev_info(adev->dev, " VCE_VCPU_CACHE_OFFSET2=0x%08X\n",
  304. RREG32(mmVCE_VCPU_CACHE_OFFSET2));
  305. dev_info(adev->dev, " VCE_VCPU_CACHE_SIZE2=0x%08X\n",
  306. RREG32(mmVCE_VCPU_CACHE_SIZE2));
  307. dev_info(adev->dev, " VCE_SOFT_RESET=0x%08X\n",
  308. RREG32(mmVCE_SOFT_RESET));
  309. dev_info(adev->dev, " VCE_RB_BASE_LO2=0x%08X\n",
  310. RREG32(mmVCE_RB_BASE_LO2));
  311. dev_info(adev->dev, " VCE_RB_BASE_HI2=0x%08X\n",
  312. RREG32(mmVCE_RB_BASE_HI2));
  313. dev_info(adev->dev, " VCE_RB_SIZE2=0x%08X\n",
  314. RREG32(mmVCE_RB_SIZE2));
  315. dev_info(adev->dev, " VCE_RB_RPTR2=0x%08X\n",
  316. RREG32(mmVCE_RB_RPTR2));
  317. dev_info(adev->dev, " VCE_RB_WPTR2=0x%08X\n",
  318. RREG32(mmVCE_RB_WPTR2));
  319. dev_info(adev->dev, " VCE_RB_BASE_LO=0x%08X\n",
  320. RREG32(mmVCE_RB_BASE_LO));
  321. dev_info(adev->dev, " VCE_RB_BASE_HI=0x%08X\n",
  322. RREG32(mmVCE_RB_BASE_HI));
  323. dev_info(adev->dev, " VCE_RB_SIZE=0x%08X\n",
  324. RREG32(mmVCE_RB_SIZE));
  325. dev_info(adev->dev, " VCE_RB_RPTR=0x%08X\n",
  326. RREG32(mmVCE_RB_RPTR));
  327. dev_info(adev->dev, " VCE_RB_WPTR=0x%08X\n",
  328. RREG32(mmVCE_RB_WPTR));
  329. dev_info(adev->dev, " VCE_CLOCK_GATING_A=0x%08X\n",
  330. RREG32(mmVCE_CLOCK_GATING_A));
  331. dev_info(adev->dev, " VCE_CLOCK_GATING_B=0x%08X\n",
  332. RREG32(mmVCE_CLOCK_GATING_B));
  333. dev_info(adev->dev, " VCE_UENC_CLOCK_GATING=0x%08X\n",
  334. RREG32(mmVCE_UENC_CLOCK_GATING));
  335. dev_info(adev->dev, " VCE_UENC_REG_CLOCK_GATING=0x%08X\n",
  336. RREG32(mmVCE_UENC_REG_CLOCK_GATING));
  337. dev_info(adev->dev, " VCE_SYS_INT_EN=0x%08X\n",
  338. RREG32(mmVCE_SYS_INT_EN));
  339. dev_info(adev->dev, " VCE_LMI_CTRL2=0x%08X\n",
  340. RREG32(mmVCE_LMI_CTRL2));
  341. dev_info(adev->dev, " VCE_LMI_CTRL=0x%08X\n",
  342. RREG32(mmVCE_LMI_CTRL));
  343. dev_info(adev->dev, " VCE_LMI_VM_CTRL=0x%08X\n",
  344. RREG32(mmVCE_LMI_VM_CTRL));
  345. dev_info(adev->dev, " VCE_LMI_SWAP_CNTL=0x%08X\n",
  346. RREG32(mmVCE_LMI_SWAP_CNTL));
  347. dev_info(adev->dev, " VCE_LMI_SWAP_CNTL1=0x%08X\n",
  348. RREG32(mmVCE_LMI_SWAP_CNTL1));
  349. dev_info(adev->dev, " VCE_LMI_CACHE_CTRL=0x%08X\n",
  350. RREG32(mmVCE_LMI_CACHE_CTRL));
  351. }
  352. static int vce_v3_0_set_interrupt_state(struct amdgpu_device *adev,
  353. struct amdgpu_irq_src *source,
  354. unsigned type,
  355. enum amdgpu_interrupt_state state)
  356. {
  357. uint32_t val = 0;
  358. if (state == AMDGPU_IRQ_STATE_ENABLE)
  359. val |= VCE_SYS_INT_EN__VCE_SYS_INT_TRAP_INTERRUPT_EN_MASK;
  360. WREG32_P(mmVCE_SYS_INT_EN, val, ~VCE_SYS_INT_EN__VCE_SYS_INT_TRAP_INTERRUPT_EN_MASK);
  361. return 0;
  362. }
  363. static int vce_v3_0_process_interrupt(struct amdgpu_device *adev,
  364. struct amdgpu_irq_src *source,
  365. struct amdgpu_iv_entry *entry)
  366. {
  367. DRM_DEBUG("IH: VCE\n");
  368. switch (entry->src_data) {
  369. case 0:
  370. amdgpu_fence_process(&adev->vce.ring[0]);
  371. break;
  372. case 1:
  373. amdgpu_fence_process(&adev->vce.ring[1]);
  374. break;
  375. default:
  376. DRM_ERROR("Unhandled interrupt: %d %d\n",
  377. entry->src_id, entry->src_data);
  378. break;
  379. }
  380. return 0;
  381. }
  382. static int vce_v3_0_set_clockgating_state(struct amdgpu_device *adev,
  383. enum amdgpu_clockgating_state state)
  384. {
  385. //TODO
  386. return 0;
  387. }
  388. static int vce_v3_0_set_powergating_state(struct amdgpu_device *adev,
  389. enum amdgpu_powergating_state state)
  390. {
  391. /* This doesn't actually powergate the VCE block.
  392. * That's done in the dpm code via the SMC. This
  393. * just re-inits the block as necessary. The actual
  394. * gating still happens in the dpm code. We should
  395. * revisit this when there is a cleaner line between
  396. * the smc and the hw blocks
  397. */
  398. if (state == AMDGPU_PG_STATE_GATE)
  399. /* XXX do we need a vce_v3_0_stop()? */
  400. return 0;
  401. else
  402. return vce_v3_0_start(adev);
  403. }
  404. const struct amdgpu_ip_funcs vce_v3_0_ip_funcs = {
  405. .early_init = vce_v3_0_early_init,
  406. .late_init = NULL,
  407. .sw_init = vce_v3_0_sw_init,
  408. .sw_fini = vce_v3_0_sw_fini,
  409. .hw_init = vce_v3_0_hw_init,
  410. .hw_fini = vce_v3_0_hw_fini,
  411. .suspend = vce_v3_0_suspend,
  412. .resume = vce_v3_0_resume,
  413. .is_idle = vce_v3_0_is_idle,
  414. .wait_for_idle = vce_v3_0_wait_for_idle,
  415. .soft_reset = vce_v3_0_soft_reset,
  416. .print_status = vce_v3_0_print_status,
  417. .set_clockgating_state = vce_v3_0_set_clockgating_state,
  418. .set_powergating_state = vce_v3_0_set_powergating_state,
  419. };
  420. static const struct amdgpu_ring_funcs vce_v3_0_ring_funcs = {
  421. .get_rptr = vce_v3_0_ring_get_rptr,
  422. .get_wptr = vce_v3_0_ring_get_wptr,
  423. .set_wptr = vce_v3_0_ring_set_wptr,
  424. .parse_cs = amdgpu_vce_ring_parse_cs,
  425. .emit_ib = amdgpu_vce_ring_emit_ib,
  426. .emit_fence = amdgpu_vce_ring_emit_fence,
  427. .emit_semaphore = amdgpu_vce_ring_emit_semaphore,
  428. .test_ring = amdgpu_vce_ring_test_ring,
  429. .test_ib = amdgpu_vce_ring_test_ib,
  430. .is_lockup = amdgpu_ring_test_lockup,
  431. };
  432. static void vce_v3_0_set_ring_funcs(struct amdgpu_device *adev)
  433. {
  434. adev->vce.ring[0].funcs = &vce_v3_0_ring_funcs;
  435. adev->vce.ring[1].funcs = &vce_v3_0_ring_funcs;
  436. }
  437. static const struct amdgpu_irq_src_funcs vce_v3_0_irq_funcs = {
  438. .set = vce_v3_0_set_interrupt_state,
  439. .process = vce_v3_0_process_interrupt,
  440. };
  441. static void vce_v3_0_set_irq_funcs(struct amdgpu_device *adev)
  442. {
  443. adev->vce.irq.num_types = 1;
  444. adev->vce.irq.funcs = &vce_v3_0_irq_funcs;
  445. };