uvd_v6_0.c 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921
  1. /*
  2. * Copyright 2014 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. * Authors: Christian König <christian.koenig@amd.com>
  23. */
  24. #include <linux/firmware.h>
  25. #include <drm/drmP.h>
  26. #include "amdgpu.h"
  27. #include "amdgpu_uvd.h"
  28. #include "vid.h"
  29. #include "uvd/uvd_6_0_d.h"
  30. #include "uvd/uvd_6_0_sh_mask.h"
  31. #include "oss/oss_2_0_d.h"
  32. #include "oss/oss_2_0_sh_mask.h"
  33. #include "vi.h"
  34. static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev);
  35. static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev);
  36. static int uvd_v6_0_start(struct amdgpu_device *adev);
  37. static void uvd_v6_0_stop(struct amdgpu_device *adev);
  38. static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev);
  39. /**
  40. * uvd_v6_0_ring_get_rptr - get read pointer
  41. *
  42. * @ring: amdgpu_ring pointer
  43. *
  44. * Returns the current hardware read pointer
  45. */
  46. static uint32_t uvd_v6_0_ring_get_rptr(struct amdgpu_ring *ring)
  47. {
  48. struct amdgpu_device *adev = ring->adev;
  49. return RREG32(mmUVD_RBC_RB_RPTR);
  50. }
  51. /**
  52. * uvd_v6_0_ring_get_wptr - get write pointer
  53. *
  54. * @ring: amdgpu_ring pointer
  55. *
  56. * Returns the current hardware write pointer
  57. */
  58. static uint32_t uvd_v6_0_ring_get_wptr(struct amdgpu_ring *ring)
  59. {
  60. struct amdgpu_device *adev = ring->adev;
  61. return RREG32(mmUVD_RBC_RB_WPTR);
  62. }
  63. /**
  64. * uvd_v6_0_ring_set_wptr - set write pointer
  65. *
  66. * @ring: amdgpu_ring pointer
  67. *
  68. * Commits the write pointer to the hardware
  69. */
  70. static void uvd_v6_0_ring_set_wptr(struct amdgpu_ring *ring)
  71. {
  72. struct amdgpu_device *adev = ring->adev;
  73. WREG32(mmUVD_RBC_RB_WPTR, ring->wptr);
  74. }
  75. static int uvd_v6_0_early_init(void *handle)
  76. {
  77. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  78. uvd_v6_0_set_ring_funcs(adev);
  79. uvd_v6_0_set_irq_funcs(adev);
  80. return 0;
  81. }
  82. static int uvd_v6_0_sw_init(void *handle)
  83. {
  84. struct amdgpu_ring *ring;
  85. int r;
  86. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  87. /* UVD TRAP */
  88. r = amdgpu_irq_add_id(adev, 124, &adev->uvd.irq);
  89. if (r)
  90. return r;
  91. r = amdgpu_uvd_sw_init(adev);
  92. if (r)
  93. return r;
  94. r = amdgpu_uvd_resume(adev);
  95. if (r)
  96. return r;
  97. ring = &adev->uvd.ring;
  98. sprintf(ring->name, "uvd");
  99. r = amdgpu_ring_init(adev, ring, 512, CP_PACKET2, 0xf,
  100. &adev->uvd.irq, 0, AMDGPU_RING_TYPE_UVD);
  101. return r;
  102. }
  103. static int uvd_v6_0_sw_fini(void *handle)
  104. {
  105. int r;
  106. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  107. r = amdgpu_uvd_suspend(adev);
  108. if (r)
  109. return r;
  110. r = amdgpu_uvd_sw_fini(adev);
  111. if (r)
  112. return r;
  113. return r;
  114. }
  115. /**
  116. * uvd_v6_0_hw_init - start and test UVD block
  117. *
  118. * @adev: amdgpu_device pointer
  119. *
  120. * Initialize the hardware, boot up the VCPU and do some testing
  121. */
  122. static int uvd_v6_0_hw_init(void *handle)
  123. {
  124. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  125. struct amdgpu_ring *ring = &adev->uvd.ring;
  126. uint32_t tmp;
  127. int r;
  128. r = uvd_v6_0_start(adev);
  129. if (r)
  130. goto done;
  131. ring->ready = true;
  132. r = amdgpu_ring_test_ring(ring);
  133. if (r) {
  134. ring->ready = false;
  135. goto done;
  136. }
  137. r = amdgpu_ring_alloc(ring, 10);
  138. if (r) {
  139. DRM_ERROR("amdgpu: ring failed to lock UVD ring (%d).\n", r);
  140. goto done;
  141. }
  142. tmp = PACKET0(mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL, 0);
  143. amdgpu_ring_write(ring, tmp);
  144. amdgpu_ring_write(ring, 0xFFFFF);
  145. tmp = PACKET0(mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL, 0);
  146. amdgpu_ring_write(ring, tmp);
  147. amdgpu_ring_write(ring, 0xFFFFF);
  148. tmp = PACKET0(mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL, 0);
  149. amdgpu_ring_write(ring, tmp);
  150. amdgpu_ring_write(ring, 0xFFFFF);
  151. /* Clear timeout status bits */
  152. amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_TIMEOUT_STATUS, 0));
  153. amdgpu_ring_write(ring, 0x8);
  154. amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_CNTL, 0));
  155. amdgpu_ring_write(ring, 3);
  156. amdgpu_ring_commit(ring);
  157. done:
  158. if (!r)
  159. DRM_INFO("UVD initialized successfully.\n");
  160. return r;
  161. }
  162. /**
  163. * uvd_v6_0_hw_fini - stop the hardware block
  164. *
  165. * @adev: amdgpu_device pointer
  166. *
  167. * Stop the UVD block, mark ring as not ready any more
  168. */
  169. static int uvd_v6_0_hw_fini(void *handle)
  170. {
  171. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  172. struct amdgpu_ring *ring = &adev->uvd.ring;
  173. uvd_v6_0_stop(adev);
  174. ring->ready = false;
  175. return 0;
  176. }
  177. static int uvd_v6_0_suspend(void *handle)
  178. {
  179. int r;
  180. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  181. r = uvd_v6_0_hw_fini(adev);
  182. if (r)
  183. return r;
  184. /* Skip this for APU for now */
  185. if (!(adev->flags & AMD_IS_APU)) {
  186. r = amdgpu_uvd_suspend(adev);
  187. if (r)
  188. return r;
  189. }
  190. return r;
  191. }
  192. static int uvd_v6_0_resume(void *handle)
  193. {
  194. int r;
  195. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  196. /* Skip this for APU for now */
  197. if (!(adev->flags & AMD_IS_APU)) {
  198. r = amdgpu_uvd_resume(adev);
  199. if (r)
  200. return r;
  201. }
  202. r = uvd_v6_0_hw_init(adev);
  203. if (r)
  204. return r;
  205. return r;
  206. }
  207. /**
  208. * uvd_v6_0_mc_resume - memory controller programming
  209. *
  210. * @adev: amdgpu_device pointer
  211. *
  212. * Let the UVD memory controller know it's offsets
  213. */
  214. static void uvd_v6_0_mc_resume(struct amdgpu_device *adev)
  215. {
  216. uint64_t offset;
  217. uint32_t size;
  218. /* programm memory controller bits 0-27 */
  219. WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  220. lower_32_bits(adev->uvd.gpu_addr));
  221. WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  222. upper_32_bits(adev->uvd.gpu_addr));
  223. offset = AMDGPU_UVD_FIRMWARE_OFFSET;
  224. size = AMDGPU_GPU_PAGE_ALIGN(adev->uvd.fw->size + 4);
  225. WREG32(mmUVD_VCPU_CACHE_OFFSET0, offset >> 3);
  226. WREG32(mmUVD_VCPU_CACHE_SIZE0, size);
  227. offset += size;
  228. size = AMDGPU_UVD_HEAP_SIZE;
  229. WREG32(mmUVD_VCPU_CACHE_OFFSET1, offset >> 3);
  230. WREG32(mmUVD_VCPU_CACHE_SIZE1, size);
  231. offset += size;
  232. size = AMDGPU_UVD_STACK_SIZE +
  233. (AMDGPU_UVD_SESSION_SIZE * adev->uvd.max_handles);
  234. WREG32(mmUVD_VCPU_CACHE_OFFSET2, offset >> 3);
  235. WREG32(mmUVD_VCPU_CACHE_SIZE2, size);
  236. WREG32(mmUVD_UDEC_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
  237. WREG32(mmUVD_UDEC_DB_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
  238. WREG32(mmUVD_UDEC_DBW_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
  239. WREG32(mmUVD_GP_SCRATCH4, adev->uvd.max_handles);
  240. }
  241. #if 0
  242. static void cz_set_uvd_clock_gating_branches(struct amdgpu_device *adev,
  243. bool enable)
  244. {
  245. u32 data, data1;
  246. data = RREG32(mmUVD_CGC_GATE);
  247. data1 = RREG32(mmUVD_SUVD_CGC_GATE);
  248. if (enable) {
  249. data |= UVD_CGC_GATE__SYS_MASK |
  250. UVD_CGC_GATE__UDEC_MASK |
  251. UVD_CGC_GATE__MPEG2_MASK |
  252. UVD_CGC_GATE__RBC_MASK |
  253. UVD_CGC_GATE__LMI_MC_MASK |
  254. UVD_CGC_GATE__IDCT_MASK |
  255. UVD_CGC_GATE__MPRD_MASK |
  256. UVD_CGC_GATE__MPC_MASK |
  257. UVD_CGC_GATE__LBSI_MASK |
  258. UVD_CGC_GATE__LRBBM_MASK |
  259. UVD_CGC_GATE__UDEC_RE_MASK |
  260. UVD_CGC_GATE__UDEC_CM_MASK |
  261. UVD_CGC_GATE__UDEC_IT_MASK |
  262. UVD_CGC_GATE__UDEC_DB_MASK |
  263. UVD_CGC_GATE__UDEC_MP_MASK |
  264. UVD_CGC_GATE__WCB_MASK |
  265. UVD_CGC_GATE__VCPU_MASK |
  266. UVD_CGC_GATE__SCPU_MASK;
  267. data1 |= UVD_SUVD_CGC_GATE__SRE_MASK |
  268. UVD_SUVD_CGC_GATE__SIT_MASK |
  269. UVD_SUVD_CGC_GATE__SMP_MASK |
  270. UVD_SUVD_CGC_GATE__SCM_MASK |
  271. UVD_SUVD_CGC_GATE__SDB_MASK |
  272. UVD_SUVD_CGC_GATE__SRE_H264_MASK |
  273. UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
  274. UVD_SUVD_CGC_GATE__SIT_H264_MASK |
  275. UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
  276. UVD_SUVD_CGC_GATE__SCM_H264_MASK |
  277. UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
  278. UVD_SUVD_CGC_GATE__SDB_H264_MASK |
  279. UVD_SUVD_CGC_GATE__SDB_HEVC_MASK;
  280. } else {
  281. data &= ~(UVD_CGC_GATE__SYS_MASK |
  282. UVD_CGC_GATE__UDEC_MASK |
  283. UVD_CGC_GATE__MPEG2_MASK |
  284. UVD_CGC_GATE__RBC_MASK |
  285. UVD_CGC_GATE__LMI_MC_MASK |
  286. UVD_CGC_GATE__LMI_UMC_MASK |
  287. UVD_CGC_GATE__IDCT_MASK |
  288. UVD_CGC_GATE__MPRD_MASK |
  289. UVD_CGC_GATE__MPC_MASK |
  290. UVD_CGC_GATE__LBSI_MASK |
  291. UVD_CGC_GATE__LRBBM_MASK |
  292. UVD_CGC_GATE__UDEC_RE_MASK |
  293. UVD_CGC_GATE__UDEC_CM_MASK |
  294. UVD_CGC_GATE__UDEC_IT_MASK |
  295. UVD_CGC_GATE__UDEC_DB_MASK |
  296. UVD_CGC_GATE__UDEC_MP_MASK |
  297. UVD_CGC_GATE__WCB_MASK |
  298. UVD_CGC_GATE__VCPU_MASK |
  299. UVD_CGC_GATE__SCPU_MASK);
  300. data1 &= ~(UVD_SUVD_CGC_GATE__SRE_MASK |
  301. UVD_SUVD_CGC_GATE__SIT_MASK |
  302. UVD_SUVD_CGC_GATE__SMP_MASK |
  303. UVD_SUVD_CGC_GATE__SCM_MASK |
  304. UVD_SUVD_CGC_GATE__SDB_MASK |
  305. UVD_SUVD_CGC_GATE__SRE_H264_MASK |
  306. UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
  307. UVD_SUVD_CGC_GATE__SIT_H264_MASK |
  308. UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
  309. UVD_SUVD_CGC_GATE__SCM_H264_MASK |
  310. UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
  311. UVD_SUVD_CGC_GATE__SDB_H264_MASK |
  312. UVD_SUVD_CGC_GATE__SDB_HEVC_MASK);
  313. }
  314. WREG32(mmUVD_CGC_GATE, data);
  315. WREG32(mmUVD_SUVD_CGC_GATE, data1);
  316. }
  317. #endif
  318. /**
  319. * uvd_v6_0_start - start UVD block
  320. *
  321. * @adev: amdgpu_device pointer
  322. *
  323. * Setup and start the UVD block
  324. */
  325. static int uvd_v6_0_start(struct amdgpu_device *adev)
  326. {
  327. struct amdgpu_ring *ring = &adev->uvd.ring;
  328. uint32_t rb_bufsz, tmp;
  329. uint32_t lmi_swap_cntl;
  330. uint32_t mp_swap_cntl;
  331. int i, j, r;
  332. /*disable DPG */
  333. WREG32_P(mmUVD_POWER_STATUS, 0, ~(1 << 2));
  334. /* disable byte swapping */
  335. lmi_swap_cntl = 0;
  336. mp_swap_cntl = 0;
  337. uvd_v6_0_mc_resume(adev);
  338. /* Set dynamic clock gating in S/W control mode */
  339. if (adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG) {
  340. uvd_v6_0_set_sw_clock_gating(adev);
  341. } else {
  342. /* disable clock gating */
  343. uint32_t data = RREG32(mmUVD_CGC_CTRL);
  344. data &= ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
  345. WREG32(mmUVD_CGC_CTRL, data);
  346. }
  347. /* disable interupt */
  348. WREG32_P(mmUVD_MASTINT_EN, 0, ~(1 << 1));
  349. /* stall UMC and register bus before resetting VCPU */
  350. WREG32_P(mmUVD_LMI_CTRL2, 1 << 8, ~(1 << 8));
  351. mdelay(1);
  352. /* put LMI, VCPU, RBC etc... into reset */
  353. WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
  354. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK | UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
  355. UVD_SOFT_RESET__RBC_SOFT_RESET_MASK | UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
  356. UVD_SOFT_RESET__CXW_SOFT_RESET_MASK | UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
  357. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
  358. mdelay(5);
  359. /* take UVD block out of reset */
  360. WREG32_P(mmSRBM_SOFT_RESET, 0, ~SRBM_SOFT_RESET__SOFT_RESET_UVD_MASK);
  361. mdelay(5);
  362. /* initialize UVD memory controller */
  363. WREG32(mmUVD_LMI_CTRL, 0x40 | (1 << 8) | (1 << 13) |
  364. (1 << 21) | (1 << 9) | (1 << 20));
  365. #ifdef __BIG_ENDIAN
  366. /* swap (8 in 32) RB and IB */
  367. lmi_swap_cntl = 0xa;
  368. mp_swap_cntl = 0;
  369. #endif
  370. WREG32(mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
  371. WREG32(mmUVD_MP_SWAP_CNTL, mp_swap_cntl);
  372. WREG32(mmUVD_MPC_SET_MUXA0, 0x40c2040);
  373. WREG32(mmUVD_MPC_SET_MUXA1, 0x0);
  374. WREG32(mmUVD_MPC_SET_MUXB0, 0x40c2040);
  375. WREG32(mmUVD_MPC_SET_MUXB1, 0x0);
  376. WREG32(mmUVD_MPC_SET_ALU, 0);
  377. WREG32(mmUVD_MPC_SET_MUX, 0x88);
  378. /* take all subblocks out of reset, except VCPU */
  379. WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  380. mdelay(5);
  381. /* enable VCPU clock */
  382. WREG32(mmUVD_VCPU_CNTL, 1 << 9);
  383. /* enable UMC */
  384. WREG32_P(mmUVD_LMI_CTRL2, 0, ~(1 << 8));
  385. /* boot up the VCPU */
  386. WREG32(mmUVD_SOFT_RESET, 0);
  387. mdelay(10);
  388. for (i = 0; i < 10; ++i) {
  389. uint32_t status;
  390. for (j = 0; j < 100; ++j) {
  391. status = RREG32(mmUVD_STATUS);
  392. if (status & 2)
  393. break;
  394. mdelay(10);
  395. }
  396. r = 0;
  397. if (status & 2)
  398. break;
  399. DRM_ERROR("UVD not responding, trying to reset the VCPU!!!\n");
  400. WREG32_P(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
  401. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  402. mdelay(10);
  403. WREG32_P(mmUVD_SOFT_RESET, 0,
  404. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  405. mdelay(10);
  406. r = -1;
  407. }
  408. if (r) {
  409. DRM_ERROR("UVD not responding, giving up!!!\n");
  410. return r;
  411. }
  412. /* enable master interrupt */
  413. WREG32_P(mmUVD_MASTINT_EN, 3 << 1, ~(3 << 1));
  414. /* clear the bit 4 of UVD_STATUS */
  415. WREG32_P(mmUVD_STATUS, 0, ~(2 << 1));
  416. rb_bufsz = order_base_2(ring->ring_size);
  417. tmp = 0;
  418. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
  419. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
  420. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  421. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
  422. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
  423. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
  424. /* force RBC into idle state */
  425. WREG32(mmUVD_RBC_RB_CNTL, tmp);
  426. /* set the write pointer delay */
  427. WREG32(mmUVD_RBC_RB_WPTR_CNTL, 0);
  428. /* set the wb address */
  429. WREG32(mmUVD_RBC_RB_RPTR_ADDR, (upper_32_bits(ring->gpu_addr) >> 2));
  430. /* programm the RB_BASE for ring buffer */
  431. WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
  432. lower_32_bits(ring->gpu_addr));
  433. WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
  434. upper_32_bits(ring->gpu_addr));
  435. /* Initialize the ring buffer's read and write pointers */
  436. WREG32(mmUVD_RBC_RB_RPTR, 0);
  437. ring->wptr = RREG32(mmUVD_RBC_RB_RPTR);
  438. WREG32(mmUVD_RBC_RB_WPTR, ring->wptr);
  439. WREG32_P(mmUVD_RBC_RB_CNTL, 0, ~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);
  440. return 0;
  441. }
  442. /**
  443. * uvd_v6_0_stop - stop UVD block
  444. *
  445. * @adev: amdgpu_device pointer
  446. *
  447. * stop the UVD block
  448. */
  449. static void uvd_v6_0_stop(struct amdgpu_device *adev)
  450. {
  451. /* force RBC into idle state */
  452. WREG32(mmUVD_RBC_RB_CNTL, 0x11010101);
  453. /* Stall UMC and register bus before resetting VCPU */
  454. WREG32_P(mmUVD_LMI_CTRL2, 1 << 8, ~(1 << 8));
  455. mdelay(1);
  456. /* put VCPU into reset */
  457. WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  458. mdelay(5);
  459. /* disable VCPU clock */
  460. WREG32(mmUVD_VCPU_CNTL, 0x0);
  461. /* Unstall UMC and register bus */
  462. WREG32_P(mmUVD_LMI_CTRL2, 0, ~(1 << 8));
  463. }
  464. /**
  465. * uvd_v6_0_ring_emit_fence - emit an fence & trap command
  466. *
  467. * @ring: amdgpu_ring pointer
  468. * @fence: fence to emit
  469. *
  470. * Write a fence and a trap command to the ring.
  471. */
  472. static void uvd_v6_0_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
  473. unsigned flags)
  474. {
  475. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  476. amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
  477. amdgpu_ring_write(ring, seq);
  478. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
  479. amdgpu_ring_write(ring, addr & 0xffffffff);
  480. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
  481. amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
  482. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
  483. amdgpu_ring_write(ring, 0);
  484. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
  485. amdgpu_ring_write(ring, 0);
  486. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
  487. amdgpu_ring_write(ring, 0);
  488. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
  489. amdgpu_ring_write(ring, 2);
  490. }
  491. /**
  492. * uvd_v6_0_ring_test_ring - register write test
  493. *
  494. * @ring: amdgpu_ring pointer
  495. *
  496. * Test if we can successfully write to the context register
  497. */
  498. static int uvd_v6_0_ring_test_ring(struct amdgpu_ring *ring)
  499. {
  500. struct amdgpu_device *adev = ring->adev;
  501. uint32_t tmp = 0;
  502. unsigned i;
  503. int r;
  504. WREG32(mmUVD_CONTEXT_ID, 0xCAFEDEAD);
  505. r = amdgpu_ring_alloc(ring, 3);
  506. if (r) {
  507. DRM_ERROR("amdgpu: cp failed to lock ring %d (%d).\n",
  508. ring->idx, r);
  509. return r;
  510. }
  511. amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
  512. amdgpu_ring_write(ring, 0xDEADBEEF);
  513. amdgpu_ring_commit(ring);
  514. for (i = 0; i < adev->usec_timeout; i++) {
  515. tmp = RREG32(mmUVD_CONTEXT_ID);
  516. if (tmp == 0xDEADBEEF)
  517. break;
  518. DRM_UDELAY(1);
  519. }
  520. if (i < adev->usec_timeout) {
  521. DRM_INFO("ring test on %d succeeded in %d usecs\n",
  522. ring->idx, i);
  523. } else {
  524. DRM_ERROR("amdgpu: ring %d test failed (0x%08X)\n",
  525. ring->idx, tmp);
  526. r = -EINVAL;
  527. }
  528. return r;
  529. }
  530. /**
  531. * uvd_v6_0_ring_emit_ib - execute indirect buffer
  532. *
  533. * @ring: amdgpu_ring pointer
  534. * @ib: indirect buffer to execute
  535. *
  536. * Write ring commands to execute the indirect buffer
  537. */
  538. static void uvd_v6_0_ring_emit_ib(struct amdgpu_ring *ring,
  539. struct amdgpu_ib *ib)
  540. {
  541. amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_LOW, 0));
  542. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  543. amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH, 0));
  544. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  545. amdgpu_ring_write(ring, PACKET0(mmUVD_RBC_IB_SIZE, 0));
  546. amdgpu_ring_write(ring, ib->length_dw);
  547. }
  548. /**
  549. * uvd_v6_0_ring_test_ib - test ib execution
  550. *
  551. * @ring: amdgpu_ring pointer
  552. *
  553. * Test if we can successfully execute an IB
  554. */
  555. static int uvd_v6_0_ring_test_ib(struct amdgpu_ring *ring)
  556. {
  557. struct fence *fence = NULL;
  558. int r;
  559. r = amdgpu_uvd_get_create_msg(ring, 1, NULL);
  560. if (r) {
  561. DRM_ERROR("amdgpu: failed to get create msg (%d).\n", r);
  562. goto error;
  563. }
  564. r = amdgpu_uvd_get_destroy_msg(ring, 1, true, &fence);
  565. if (r) {
  566. DRM_ERROR("amdgpu: failed to get destroy ib (%d).\n", r);
  567. goto error;
  568. }
  569. r = fence_wait(fence, false);
  570. if (r) {
  571. DRM_ERROR("amdgpu: fence wait failed (%d).\n", r);
  572. goto error;
  573. }
  574. DRM_INFO("ib test on ring %d succeeded\n", ring->idx);
  575. error:
  576. fence_put(fence);
  577. return r;
  578. }
  579. static bool uvd_v6_0_is_idle(void *handle)
  580. {
  581. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  582. return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
  583. }
  584. static int uvd_v6_0_wait_for_idle(void *handle)
  585. {
  586. unsigned i;
  587. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  588. for (i = 0; i < adev->usec_timeout; i++) {
  589. if (!(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK))
  590. return 0;
  591. }
  592. return -ETIMEDOUT;
  593. }
  594. static int uvd_v6_0_soft_reset(void *handle)
  595. {
  596. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  597. uvd_v6_0_stop(adev);
  598. WREG32_P(mmSRBM_SOFT_RESET, SRBM_SOFT_RESET__SOFT_RESET_UVD_MASK,
  599. ~SRBM_SOFT_RESET__SOFT_RESET_UVD_MASK);
  600. mdelay(5);
  601. return uvd_v6_0_start(adev);
  602. }
  603. static int uvd_v6_0_set_interrupt_state(struct amdgpu_device *adev,
  604. struct amdgpu_irq_src *source,
  605. unsigned type,
  606. enum amdgpu_interrupt_state state)
  607. {
  608. // TODO
  609. return 0;
  610. }
  611. static int uvd_v6_0_process_interrupt(struct amdgpu_device *adev,
  612. struct amdgpu_irq_src *source,
  613. struct amdgpu_iv_entry *entry)
  614. {
  615. DRM_DEBUG("IH: UVD TRAP\n");
  616. amdgpu_fence_process(&adev->uvd.ring);
  617. return 0;
  618. }
  619. static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev)
  620. {
  621. uint32_t data, data1, data2, suvd_flags;
  622. data = RREG32(mmUVD_CGC_CTRL);
  623. data1 = RREG32(mmUVD_SUVD_CGC_GATE);
  624. data2 = RREG32(mmUVD_SUVD_CGC_CTRL);
  625. data &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK |
  626. UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);
  627. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  628. UVD_SUVD_CGC_GATE__SIT_MASK |
  629. UVD_SUVD_CGC_GATE__SMP_MASK |
  630. UVD_SUVD_CGC_GATE__SCM_MASK |
  631. UVD_SUVD_CGC_GATE__SDB_MASK;
  632. data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
  633. (1 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_GATE_DLY_TIMER)) |
  634. (4 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_OFF_DELAY));
  635. data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
  636. UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
  637. UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
  638. UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
  639. UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
  640. UVD_CGC_CTRL__SYS_MODE_MASK |
  641. UVD_CGC_CTRL__UDEC_MODE_MASK |
  642. UVD_CGC_CTRL__MPEG2_MODE_MASK |
  643. UVD_CGC_CTRL__REGS_MODE_MASK |
  644. UVD_CGC_CTRL__RBC_MODE_MASK |
  645. UVD_CGC_CTRL__LMI_MC_MODE_MASK |
  646. UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
  647. UVD_CGC_CTRL__IDCT_MODE_MASK |
  648. UVD_CGC_CTRL__MPRD_MODE_MASK |
  649. UVD_CGC_CTRL__MPC_MODE_MASK |
  650. UVD_CGC_CTRL__LBSI_MODE_MASK |
  651. UVD_CGC_CTRL__LRBBM_MODE_MASK |
  652. UVD_CGC_CTRL__WCB_MODE_MASK |
  653. UVD_CGC_CTRL__VCPU_MODE_MASK |
  654. UVD_CGC_CTRL__JPEG_MODE_MASK |
  655. UVD_CGC_CTRL__SCPU_MODE_MASK |
  656. UVD_CGC_CTRL__JPEG2_MODE_MASK);
  657. data2 &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK |
  658. UVD_SUVD_CGC_CTRL__SIT_MODE_MASK |
  659. UVD_SUVD_CGC_CTRL__SMP_MODE_MASK |
  660. UVD_SUVD_CGC_CTRL__SCM_MODE_MASK |
  661. UVD_SUVD_CGC_CTRL__SDB_MODE_MASK);
  662. data1 |= suvd_flags;
  663. WREG32(mmUVD_CGC_CTRL, data);
  664. WREG32(mmUVD_CGC_GATE, 0);
  665. WREG32(mmUVD_SUVD_CGC_GATE, data1);
  666. WREG32(mmUVD_SUVD_CGC_CTRL, data2);
  667. }
  668. #if 0
  669. static void uvd_v6_0_set_hw_clock_gating(struct amdgpu_device *adev)
  670. {
  671. uint32_t data, data1, cgc_flags, suvd_flags;
  672. data = RREG32(mmUVD_CGC_GATE);
  673. data1 = RREG32(mmUVD_SUVD_CGC_GATE);
  674. cgc_flags = UVD_CGC_GATE__SYS_MASK |
  675. UVD_CGC_GATE__UDEC_MASK |
  676. UVD_CGC_GATE__MPEG2_MASK |
  677. UVD_CGC_GATE__RBC_MASK |
  678. UVD_CGC_GATE__LMI_MC_MASK |
  679. UVD_CGC_GATE__IDCT_MASK |
  680. UVD_CGC_GATE__MPRD_MASK |
  681. UVD_CGC_GATE__MPC_MASK |
  682. UVD_CGC_GATE__LBSI_MASK |
  683. UVD_CGC_GATE__LRBBM_MASK |
  684. UVD_CGC_GATE__UDEC_RE_MASK |
  685. UVD_CGC_GATE__UDEC_CM_MASK |
  686. UVD_CGC_GATE__UDEC_IT_MASK |
  687. UVD_CGC_GATE__UDEC_DB_MASK |
  688. UVD_CGC_GATE__UDEC_MP_MASK |
  689. UVD_CGC_GATE__WCB_MASK |
  690. UVD_CGC_GATE__VCPU_MASK |
  691. UVD_CGC_GATE__SCPU_MASK |
  692. UVD_CGC_GATE__JPEG_MASK |
  693. UVD_CGC_GATE__JPEG2_MASK;
  694. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  695. UVD_SUVD_CGC_GATE__SIT_MASK |
  696. UVD_SUVD_CGC_GATE__SMP_MASK |
  697. UVD_SUVD_CGC_GATE__SCM_MASK |
  698. UVD_SUVD_CGC_GATE__SDB_MASK;
  699. data |= cgc_flags;
  700. data1 |= suvd_flags;
  701. WREG32(mmUVD_CGC_GATE, data);
  702. WREG32(mmUVD_SUVD_CGC_GATE, data1);
  703. }
  704. #endif
  705. static int uvd_v6_0_set_clockgating_state(void *handle,
  706. enum amd_clockgating_state state)
  707. {
  708. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  709. bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
  710. static int curstate = -1;
  711. if (!(adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG))
  712. return 0;
  713. if (curstate == state)
  714. return 0;
  715. curstate = state;
  716. if (enable) {
  717. /* disable HW gating and enable Sw gating */
  718. uvd_v6_0_set_sw_clock_gating(adev);
  719. } else {
  720. /* wait for STATUS to clear */
  721. if (uvd_v6_0_wait_for_idle(handle))
  722. return -EBUSY;
  723. /* enable HW gates because UVD is idle */
  724. /* uvd_v6_0_set_hw_clock_gating(adev); */
  725. }
  726. return 0;
  727. }
  728. static int uvd_v6_0_set_powergating_state(void *handle,
  729. enum amd_powergating_state state)
  730. {
  731. /* This doesn't actually powergate the UVD block.
  732. * That's done in the dpm code via the SMC. This
  733. * just re-inits the block as necessary. The actual
  734. * gating still happens in the dpm code. We should
  735. * revisit this when there is a cleaner line between
  736. * the smc and the hw blocks
  737. */
  738. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  739. if (!(adev->pg_flags & AMD_PG_SUPPORT_UVD))
  740. return 0;
  741. if (state == AMD_PG_STATE_GATE) {
  742. uvd_v6_0_stop(adev);
  743. return 0;
  744. } else {
  745. return uvd_v6_0_start(adev);
  746. }
  747. }
  748. const struct amd_ip_funcs uvd_v6_0_ip_funcs = {
  749. .early_init = uvd_v6_0_early_init,
  750. .late_init = NULL,
  751. .sw_init = uvd_v6_0_sw_init,
  752. .sw_fini = uvd_v6_0_sw_fini,
  753. .hw_init = uvd_v6_0_hw_init,
  754. .hw_fini = uvd_v6_0_hw_fini,
  755. .suspend = uvd_v6_0_suspend,
  756. .resume = uvd_v6_0_resume,
  757. .is_idle = uvd_v6_0_is_idle,
  758. .wait_for_idle = uvd_v6_0_wait_for_idle,
  759. .soft_reset = uvd_v6_0_soft_reset,
  760. .set_clockgating_state = uvd_v6_0_set_clockgating_state,
  761. .set_powergating_state = uvd_v6_0_set_powergating_state,
  762. };
  763. static const struct amdgpu_ring_funcs uvd_v6_0_ring_funcs = {
  764. .get_rptr = uvd_v6_0_ring_get_rptr,
  765. .get_wptr = uvd_v6_0_ring_get_wptr,
  766. .set_wptr = uvd_v6_0_ring_set_wptr,
  767. .parse_cs = amdgpu_uvd_ring_parse_cs,
  768. .emit_ib = uvd_v6_0_ring_emit_ib,
  769. .emit_fence = uvd_v6_0_ring_emit_fence,
  770. .test_ring = uvd_v6_0_ring_test_ring,
  771. .test_ib = uvd_v6_0_ring_test_ib,
  772. .insert_nop = amdgpu_ring_insert_nop,
  773. .pad_ib = amdgpu_ring_generic_pad_ib,
  774. };
  775. static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev)
  776. {
  777. adev->uvd.ring.funcs = &uvd_v6_0_ring_funcs;
  778. }
  779. static const struct amdgpu_irq_src_funcs uvd_v6_0_irq_funcs = {
  780. .set = uvd_v6_0_set_interrupt_state,
  781. .process = uvd_v6_0_process_interrupt,
  782. };
  783. static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev)
  784. {
  785. adev->uvd.irq.num_types = 1;
  786. adev->uvd.irq.funcs = &uvd_v6_0_irq_funcs;
  787. }