uvd_v6_0.c 25 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983
  1. /*
  2. * Copyright 2014 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. * Authors: Christian König <christian.koenig@amd.com>
  23. */
  24. #include <linux/firmware.h>
  25. #include <drm/drmP.h>
  26. #include "amdgpu.h"
  27. #include "amdgpu_uvd.h"
  28. #include "vid.h"
  29. #include "uvd/uvd_6_0_d.h"
  30. #include "uvd/uvd_6_0_sh_mask.h"
  31. #include "oss/oss_2_0_d.h"
  32. #include "oss/oss_2_0_sh_mask.h"
  33. #include "smu/smu_7_1_3_d.h"
  34. #include "smu/smu_7_1_3_sh_mask.h"
  35. #include "bif/bif_5_1_d.h"
  36. #include "vi.h"
  37. static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev);
  38. static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev);
  39. static int uvd_v6_0_start(struct amdgpu_device *adev);
  40. static void uvd_v6_0_stop(struct amdgpu_device *adev);
  41. static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev);
  42. /**
  43. * uvd_v6_0_ring_get_rptr - get read pointer
  44. *
  45. * @ring: amdgpu_ring pointer
  46. *
  47. * Returns the current hardware read pointer
  48. */
  49. static uint32_t uvd_v6_0_ring_get_rptr(struct amdgpu_ring *ring)
  50. {
  51. struct amdgpu_device *adev = ring->adev;
  52. return RREG32(mmUVD_RBC_RB_RPTR);
  53. }
  54. /**
  55. * uvd_v6_0_ring_get_wptr - get write pointer
  56. *
  57. * @ring: amdgpu_ring pointer
  58. *
  59. * Returns the current hardware write pointer
  60. */
  61. static uint32_t uvd_v6_0_ring_get_wptr(struct amdgpu_ring *ring)
  62. {
  63. struct amdgpu_device *adev = ring->adev;
  64. return RREG32(mmUVD_RBC_RB_WPTR);
  65. }
  66. /**
  67. * uvd_v6_0_ring_set_wptr - set write pointer
  68. *
  69. * @ring: amdgpu_ring pointer
  70. *
  71. * Commits the write pointer to the hardware
  72. */
  73. static void uvd_v6_0_ring_set_wptr(struct amdgpu_ring *ring)
  74. {
  75. struct amdgpu_device *adev = ring->adev;
  76. WREG32(mmUVD_RBC_RB_WPTR, ring->wptr);
  77. }
  78. static int uvd_v6_0_early_init(void *handle)
  79. {
  80. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  81. uvd_v6_0_set_ring_funcs(adev);
  82. uvd_v6_0_set_irq_funcs(adev);
  83. return 0;
  84. }
  85. static int uvd_v6_0_sw_init(void *handle)
  86. {
  87. struct amdgpu_ring *ring;
  88. int r;
  89. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  90. /* UVD TRAP */
  91. r = amdgpu_irq_add_id(adev, 124, &adev->uvd.irq);
  92. if (r)
  93. return r;
  94. r = amdgpu_uvd_sw_init(adev);
  95. if (r)
  96. return r;
  97. r = amdgpu_uvd_resume(adev);
  98. if (r)
  99. return r;
  100. ring = &adev->uvd.ring;
  101. sprintf(ring->name, "uvd");
  102. r = amdgpu_ring_init(adev, ring, 512, CP_PACKET2, 0xf,
  103. &adev->uvd.irq, 0, AMDGPU_RING_TYPE_UVD);
  104. return r;
  105. }
  106. static int uvd_v6_0_sw_fini(void *handle)
  107. {
  108. int r;
  109. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  110. r = amdgpu_uvd_suspend(adev);
  111. if (r)
  112. return r;
  113. r = amdgpu_uvd_sw_fini(adev);
  114. if (r)
  115. return r;
  116. return r;
  117. }
  118. /**
  119. * uvd_v6_0_hw_init - start and test UVD block
  120. *
  121. * @adev: amdgpu_device pointer
  122. *
  123. * Initialize the hardware, boot up the VCPU and do some testing
  124. */
  125. static int uvd_v6_0_hw_init(void *handle)
  126. {
  127. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  128. struct amdgpu_ring *ring = &adev->uvd.ring;
  129. uint32_t tmp;
  130. int r;
  131. r = uvd_v6_0_start(adev);
  132. if (r)
  133. goto done;
  134. ring->ready = true;
  135. r = amdgpu_ring_test_ring(ring);
  136. if (r) {
  137. ring->ready = false;
  138. goto done;
  139. }
  140. r = amdgpu_ring_alloc(ring, 10);
  141. if (r) {
  142. DRM_ERROR("amdgpu: ring failed to lock UVD ring (%d).\n", r);
  143. goto done;
  144. }
  145. tmp = PACKET0(mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL, 0);
  146. amdgpu_ring_write(ring, tmp);
  147. amdgpu_ring_write(ring, 0xFFFFF);
  148. tmp = PACKET0(mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL, 0);
  149. amdgpu_ring_write(ring, tmp);
  150. amdgpu_ring_write(ring, 0xFFFFF);
  151. tmp = PACKET0(mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL, 0);
  152. amdgpu_ring_write(ring, tmp);
  153. amdgpu_ring_write(ring, 0xFFFFF);
  154. /* Clear timeout status bits */
  155. amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_TIMEOUT_STATUS, 0));
  156. amdgpu_ring_write(ring, 0x8);
  157. amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_CNTL, 0));
  158. amdgpu_ring_write(ring, 3);
  159. amdgpu_ring_commit(ring);
  160. done:
  161. if (!r)
  162. DRM_INFO("UVD initialized successfully.\n");
  163. return r;
  164. }
  165. /**
  166. * uvd_v6_0_hw_fini - stop the hardware block
  167. *
  168. * @adev: amdgpu_device pointer
  169. *
  170. * Stop the UVD block, mark ring as not ready any more
  171. */
  172. static int uvd_v6_0_hw_fini(void *handle)
  173. {
  174. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  175. struct amdgpu_ring *ring = &adev->uvd.ring;
  176. uvd_v6_0_stop(adev);
  177. ring->ready = false;
  178. return 0;
  179. }
  180. static int uvd_v6_0_suspend(void *handle)
  181. {
  182. int r;
  183. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  184. r = uvd_v6_0_hw_fini(adev);
  185. if (r)
  186. return r;
  187. /* Skip this for APU for now */
  188. if (!(adev->flags & AMD_IS_APU)) {
  189. r = amdgpu_uvd_suspend(adev);
  190. if (r)
  191. return r;
  192. }
  193. return r;
  194. }
  195. static int uvd_v6_0_resume(void *handle)
  196. {
  197. int r;
  198. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  199. /* Skip this for APU for now */
  200. if (!(adev->flags & AMD_IS_APU)) {
  201. r = amdgpu_uvd_resume(adev);
  202. if (r)
  203. return r;
  204. }
  205. r = uvd_v6_0_hw_init(adev);
  206. if (r)
  207. return r;
  208. return r;
  209. }
  210. /**
  211. * uvd_v6_0_mc_resume - memory controller programming
  212. *
  213. * @adev: amdgpu_device pointer
  214. *
  215. * Let the UVD memory controller know it's offsets
  216. */
  217. static void uvd_v6_0_mc_resume(struct amdgpu_device *adev)
  218. {
  219. uint64_t offset;
  220. uint32_t size;
  221. /* programm memory controller bits 0-27 */
  222. WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  223. lower_32_bits(adev->uvd.gpu_addr));
  224. WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  225. upper_32_bits(adev->uvd.gpu_addr));
  226. offset = AMDGPU_UVD_FIRMWARE_OFFSET;
  227. size = AMDGPU_GPU_PAGE_ALIGN(adev->uvd.fw->size + 4);
  228. WREG32(mmUVD_VCPU_CACHE_OFFSET0, offset >> 3);
  229. WREG32(mmUVD_VCPU_CACHE_SIZE0, size);
  230. offset += size;
  231. size = AMDGPU_UVD_HEAP_SIZE;
  232. WREG32(mmUVD_VCPU_CACHE_OFFSET1, offset >> 3);
  233. WREG32(mmUVD_VCPU_CACHE_SIZE1, size);
  234. offset += size;
  235. size = AMDGPU_UVD_STACK_SIZE +
  236. (AMDGPU_UVD_SESSION_SIZE * adev->uvd.max_handles);
  237. WREG32(mmUVD_VCPU_CACHE_OFFSET2, offset >> 3);
  238. WREG32(mmUVD_VCPU_CACHE_SIZE2, size);
  239. WREG32(mmUVD_UDEC_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
  240. WREG32(mmUVD_UDEC_DB_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
  241. WREG32(mmUVD_UDEC_DBW_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
  242. WREG32(mmUVD_GP_SCRATCH4, adev->uvd.max_handles);
  243. }
  244. #if 0
  245. static void cz_set_uvd_clock_gating_branches(struct amdgpu_device *adev,
  246. bool enable)
  247. {
  248. u32 data, data1;
  249. data = RREG32(mmUVD_CGC_GATE);
  250. data1 = RREG32(mmUVD_SUVD_CGC_GATE);
  251. if (enable) {
  252. data |= UVD_CGC_GATE__SYS_MASK |
  253. UVD_CGC_GATE__UDEC_MASK |
  254. UVD_CGC_GATE__MPEG2_MASK |
  255. UVD_CGC_GATE__RBC_MASK |
  256. UVD_CGC_GATE__LMI_MC_MASK |
  257. UVD_CGC_GATE__IDCT_MASK |
  258. UVD_CGC_GATE__MPRD_MASK |
  259. UVD_CGC_GATE__MPC_MASK |
  260. UVD_CGC_GATE__LBSI_MASK |
  261. UVD_CGC_GATE__LRBBM_MASK |
  262. UVD_CGC_GATE__UDEC_RE_MASK |
  263. UVD_CGC_GATE__UDEC_CM_MASK |
  264. UVD_CGC_GATE__UDEC_IT_MASK |
  265. UVD_CGC_GATE__UDEC_DB_MASK |
  266. UVD_CGC_GATE__UDEC_MP_MASK |
  267. UVD_CGC_GATE__WCB_MASK |
  268. UVD_CGC_GATE__VCPU_MASK |
  269. UVD_CGC_GATE__SCPU_MASK;
  270. data1 |= UVD_SUVD_CGC_GATE__SRE_MASK |
  271. UVD_SUVD_CGC_GATE__SIT_MASK |
  272. UVD_SUVD_CGC_GATE__SMP_MASK |
  273. UVD_SUVD_CGC_GATE__SCM_MASK |
  274. UVD_SUVD_CGC_GATE__SDB_MASK |
  275. UVD_SUVD_CGC_GATE__SRE_H264_MASK |
  276. UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
  277. UVD_SUVD_CGC_GATE__SIT_H264_MASK |
  278. UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
  279. UVD_SUVD_CGC_GATE__SCM_H264_MASK |
  280. UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
  281. UVD_SUVD_CGC_GATE__SDB_H264_MASK |
  282. UVD_SUVD_CGC_GATE__SDB_HEVC_MASK;
  283. } else {
  284. data &= ~(UVD_CGC_GATE__SYS_MASK |
  285. UVD_CGC_GATE__UDEC_MASK |
  286. UVD_CGC_GATE__MPEG2_MASK |
  287. UVD_CGC_GATE__RBC_MASK |
  288. UVD_CGC_GATE__LMI_MC_MASK |
  289. UVD_CGC_GATE__LMI_UMC_MASK |
  290. UVD_CGC_GATE__IDCT_MASK |
  291. UVD_CGC_GATE__MPRD_MASK |
  292. UVD_CGC_GATE__MPC_MASK |
  293. UVD_CGC_GATE__LBSI_MASK |
  294. UVD_CGC_GATE__LRBBM_MASK |
  295. UVD_CGC_GATE__UDEC_RE_MASK |
  296. UVD_CGC_GATE__UDEC_CM_MASK |
  297. UVD_CGC_GATE__UDEC_IT_MASK |
  298. UVD_CGC_GATE__UDEC_DB_MASK |
  299. UVD_CGC_GATE__UDEC_MP_MASK |
  300. UVD_CGC_GATE__WCB_MASK |
  301. UVD_CGC_GATE__VCPU_MASK |
  302. UVD_CGC_GATE__SCPU_MASK);
  303. data1 &= ~(UVD_SUVD_CGC_GATE__SRE_MASK |
  304. UVD_SUVD_CGC_GATE__SIT_MASK |
  305. UVD_SUVD_CGC_GATE__SMP_MASK |
  306. UVD_SUVD_CGC_GATE__SCM_MASK |
  307. UVD_SUVD_CGC_GATE__SDB_MASK |
  308. UVD_SUVD_CGC_GATE__SRE_H264_MASK |
  309. UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
  310. UVD_SUVD_CGC_GATE__SIT_H264_MASK |
  311. UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
  312. UVD_SUVD_CGC_GATE__SCM_H264_MASK |
  313. UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
  314. UVD_SUVD_CGC_GATE__SDB_H264_MASK |
  315. UVD_SUVD_CGC_GATE__SDB_HEVC_MASK);
  316. }
  317. WREG32(mmUVD_CGC_GATE, data);
  318. WREG32(mmUVD_SUVD_CGC_GATE, data1);
  319. }
  320. #endif
  321. /**
  322. * uvd_v6_0_start - start UVD block
  323. *
  324. * @adev: amdgpu_device pointer
  325. *
  326. * Setup and start the UVD block
  327. */
  328. static int uvd_v6_0_start(struct amdgpu_device *adev)
  329. {
  330. struct amdgpu_ring *ring = &adev->uvd.ring;
  331. uint32_t rb_bufsz, tmp;
  332. uint32_t lmi_swap_cntl;
  333. uint32_t mp_swap_cntl;
  334. int i, j, r;
  335. /* disable DPG */
  336. WREG32_P(mmUVD_POWER_STATUS, 0, ~UVD_POWER_STATUS__UVD_PG_MODE_MASK);
  337. /* disable byte swapping */
  338. lmi_swap_cntl = 0;
  339. mp_swap_cntl = 0;
  340. uvd_v6_0_mc_resume(adev);
  341. /* Set dynamic clock gating in S/W control mode */
  342. if (adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG) {
  343. uvd_v6_0_set_sw_clock_gating(adev);
  344. } else {
  345. /* disable clock gating */
  346. uint32_t data = RREG32(mmUVD_CGC_CTRL);
  347. data &= ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
  348. WREG32(mmUVD_CGC_CTRL, data);
  349. }
  350. /* disable interupt */
  351. WREG32_P(mmUVD_MASTINT_EN, 0, ~UVD_MASTINT_EN__VCPU_EN_MASK);
  352. /* stall UMC and register bus before resetting VCPU */
  353. WREG32_P(mmUVD_LMI_CTRL2, UVD_LMI_CTRL2__STALL_ARB_UMC_MASK, ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  354. mdelay(1);
  355. /* put LMI, VCPU, RBC etc... into reset */
  356. WREG32(mmUVD_SOFT_RESET,
  357. UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
  358. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
  359. UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
  360. UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
  361. UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
  362. UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
  363. UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
  364. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
  365. mdelay(5);
  366. /* take UVD block out of reset */
  367. WREG32_P(mmSRBM_SOFT_RESET, 0, ~SRBM_SOFT_RESET__SOFT_RESET_UVD_MASK);
  368. mdelay(5);
  369. /* initialize UVD memory controller */
  370. WREG32(mmUVD_LMI_CTRL,
  371. (0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  372. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  373. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  374. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  375. UVD_LMI_CTRL__REQ_MODE_MASK |
  376. UVD_LMI_CTRL__DISABLE_ON_FWV_FAIL_MASK);
  377. #ifdef __BIG_ENDIAN
  378. /* swap (8 in 32) RB and IB */
  379. lmi_swap_cntl = 0xa;
  380. mp_swap_cntl = 0;
  381. #endif
  382. WREG32(mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
  383. WREG32(mmUVD_MP_SWAP_CNTL, mp_swap_cntl);
  384. WREG32(mmUVD_MPC_SET_MUXA0, 0x40c2040);
  385. WREG32(mmUVD_MPC_SET_MUXA1, 0x0);
  386. WREG32(mmUVD_MPC_SET_MUXB0, 0x40c2040);
  387. WREG32(mmUVD_MPC_SET_MUXB1, 0x0);
  388. WREG32(mmUVD_MPC_SET_ALU, 0);
  389. WREG32(mmUVD_MPC_SET_MUX, 0x88);
  390. /* take all subblocks out of reset, except VCPU */
  391. WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  392. mdelay(5);
  393. /* enable VCPU clock */
  394. WREG32(mmUVD_VCPU_CNTL, UVD_VCPU_CNTL__CLK_EN_MASK);
  395. /* enable UMC */
  396. WREG32_P(mmUVD_LMI_CTRL2, 0, ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  397. /* boot up the VCPU */
  398. WREG32(mmUVD_SOFT_RESET, 0);
  399. mdelay(10);
  400. for (i = 0; i < 10; ++i) {
  401. uint32_t status;
  402. for (j = 0; j < 100; ++j) {
  403. status = RREG32(mmUVD_STATUS);
  404. if (status & 2)
  405. break;
  406. mdelay(10);
  407. }
  408. r = 0;
  409. if (status & 2)
  410. break;
  411. DRM_ERROR("UVD not responding, trying to reset the VCPU!!!\n");
  412. WREG32_P(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
  413. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  414. mdelay(10);
  415. WREG32_P(mmUVD_SOFT_RESET, 0,
  416. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  417. mdelay(10);
  418. r = -1;
  419. }
  420. if (r) {
  421. DRM_ERROR("UVD not responding, giving up!!!\n");
  422. return r;
  423. }
  424. /* enable master interrupt */
  425. WREG32_P(mmUVD_MASTINT_EN,
  426. (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
  427. ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
  428. /* clear the bit 4 of UVD_STATUS */
  429. WREG32_P(mmUVD_STATUS, 0, ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
  430. rb_bufsz = order_base_2(ring->ring_size);
  431. tmp = 0;
  432. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
  433. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
  434. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  435. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
  436. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
  437. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
  438. /* force RBC into idle state */
  439. WREG32(mmUVD_RBC_RB_CNTL, tmp);
  440. /* set the write pointer delay */
  441. WREG32(mmUVD_RBC_RB_WPTR_CNTL, 0);
  442. /* set the wb address */
  443. WREG32(mmUVD_RBC_RB_RPTR_ADDR, (upper_32_bits(ring->gpu_addr) >> 2));
  444. /* programm the RB_BASE for ring buffer */
  445. WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
  446. lower_32_bits(ring->gpu_addr));
  447. WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
  448. upper_32_bits(ring->gpu_addr));
  449. /* Initialize the ring buffer's read and write pointers */
  450. WREG32(mmUVD_RBC_RB_RPTR, 0);
  451. ring->wptr = RREG32(mmUVD_RBC_RB_RPTR);
  452. WREG32(mmUVD_RBC_RB_WPTR, ring->wptr);
  453. WREG32_P(mmUVD_RBC_RB_CNTL, 0, ~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);
  454. return 0;
  455. }
  456. /**
  457. * uvd_v6_0_stop - stop UVD block
  458. *
  459. * @adev: amdgpu_device pointer
  460. *
  461. * stop the UVD block
  462. */
  463. static void uvd_v6_0_stop(struct amdgpu_device *adev)
  464. {
  465. /* force RBC into idle state */
  466. WREG32(mmUVD_RBC_RB_CNTL, 0x11010101);
  467. /* Stall UMC and register bus before resetting VCPU */
  468. WREG32_P(mmUVD_LMI_CTRL2, 1 << 8, ~(1 << 8));
  469. mdelay(1);
  470. /* put VCPU into reset */
  471. WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  472. mdelay(5);
  473. /* disable VCPU clock */
  474. WREG32(mmUVD_VCPU_CNTL, 0x0);
  475. /* Unstall UMC and register bus */
  476. WREG32_P(mmUVD_LMI_CTRL2, 0, ~(1 << 8));
  477. }
  478. /**
  479. * uvd_v6_0_ring_emit_fence - emit an fence & trap command
  480. *
  481. * @ring: amdgpu_ring pointer
  482. * @fence: fence to emit
  483. *
  484. * Write a fence and a trap command to the ring.
  485. */
  486. static void uvd_v6_0_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
  487. unsigned flags)
  488. {
  489. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  490. amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
  491. amdgpu_ring_write(ring, seq);
  492. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
  493. amdgpu_ring_write(ring, addr & 0xffffffff);
  494. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
  495. amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
  496. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
  497. amdgpu_ring_write(ring, 0);
  498. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
  499. amdgpu_ring_write(ring, 0);
  500. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
  501. amdgpu_ring_write(ring, 0);
  502. amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
  503. amdgpu_ring_write(ring, 2);
  504. }
  505. /**
  506. * uvd_v6_0_ring_emit_hdp_flush - emit an hdp flush
  507. *
  508. * @ring: amdgpu_ring pointer
  509. *
  510. * Emits an hdp flush.
  511. */
  512. static void uvd_v6_0_ring_emit_hdp_flush(struct amdgpu_ring *ring)
  513. {
  514. amdgpu_ring_write(ring, PACKET0(mmHDP_MEM_COHERENCY_FLUSH_CNTL, 0));
  515. amdgpu_ring_write(ring, 0);
  516. }
  517. /**
  518. * uvd_v6_0_ring_hdp_invalidate - emit an hdp invalidate
  519. *
  520. * @ring: amdgpu_ring pointer
  521. *
  522. * Emits an hdp invalidate.
  523. */
  524. static void uvd_v6_0_ring_emit_hdp_invalidate(struct amdgpu_ring *ring)
  525. {
  526. amdgpu_ring_write(ring, PACKET0(mmHDP_DEBUG0, 0));
  527. amdgpu_ring_write(ring, 1);
  528. }
  529. /**
  530. * uvd_v6_0_ring_test_ring - register write test
  531. *
  532. * @ring: amdgpu_ring pointer
  533. *
  534. * Test if we can successfully write to the context register
  535. */
  536. static int uvd_v6_0_ring_test_ring(struct amdgpu_ring *ring)
  537. {
  538. struct amdgpu_device *adev = ring->adev;
  539. uint32_t tmp = 0;
  540. unsigned i;
  541. int r;
  542. WREG32(mmUVD_CONTEXT_ID, 0xCAFEDEAD);
  543. r = amdgpu_ring_alloc(ring, 3);
  544. if (r) {
  545. DRM_ERROR("amdgpu: cp failed to lock ring %d (%d).\n",
  546. ring->idx, r);
  547. return r;
  548. }
  549. amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
  550. amdgpu_ring_write(ring, 0xDEADBEEF);
  551. amdgpu_ring_commit(ring);
  552. for (i = 0; i < adev->usec_timeout; i++) {
  553. tmp = RREG32(mmUVD_CONTEXT_ID);
  554. if (tmp == 0xDEADBEEF)
  555. break;
  556. DRM_UDELAY(1);
  557. }
  558. if (i < adev->usec_timeout) {
  559. DRM_INFO("ring test on %d succeeded in %d usecs\n",
  560. ring->idx, i);
  561. } else {
  562. DRM_ERROR("amdgpu: ring %d test failed (0x%08X)\n",
  563. ring->idx, tmp);
  564. r = -EINVAL;
  565. }
  566. return r;
  567. }
  568. /**
  569. * uvd_v6_0_ring_emit_ib - execute indirect buffer
  570. *
  571. * @ring: amdgpu_ring pointer
  572. * @ib: indirect buffer to execute
  573. *
  574. * Write ring commands to execute the indirect buffer
  575. */
  576. static void uvd_v6_0_ring_emit_ib(struct amdgpu_ring *ring,
  577. struct amdgpu_ib *ib,
  578. unsigned vm_id, bool ctx_switch)
  579. {
  580. amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_LOW, 0));
  581. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  582. amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH, 0));
  583. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  584. amdgpu_ring_write(ring, PACKET0(mmUVD_RBC_IB_SIZE, 0));
  585. amdgpu_ring_write(ring, ib->length_dw);
  586. }
  587. /**
  588. * uvd_v6_0_ring_test_ib - test ib execution
  589. *
  590. * @ring: amdgpu_ring pointer
  591. *
  592. * Test if we can successfully execute an IB
  593. */
  594. static int uvd_v6_0_ring_test_ib(struct amdgpu_ring *ring)
  595. {
  596. struct fence *fence = NULL;
  597. int r;
  598. r = amdgpu_uvd_get_create_msg(ring, 1, NULL);
  599. if (r) {
  600. DRM_ERROR("amdgpu: failed to get create msg (%d).\n", r);
  601. goto error;
  602. }
  603. r = amdgpu_uvd_get_destroy_msg(ring, 1, true, &fence);
  604. if (r) {
  605. DRM_ERROR("amdgpu: failed to get destroy ib (%d).\n", r);
  606. goto error;
  607. }
  608. r = fence_wait(fence, false);
  609. if (r) {
  610. DRM_ERROR("amdgpu: fence wait failed (%d).\n", r);
  611. goto error;
  612. }
  613. DRM_INFO("ib test on ring %d succeeded\n", ring->idx);
  614. error:
  615. fence_put(fence);
  616. return r;
  617. }
  618. static bool uvd_v6_0_is_idle(void *handle)
  619. {
  620. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  621. return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
  622. }
  623. static int uvd_v6_0_wait_for_idle(void *handle)
  624. {
  625. unsigned i;
  626. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  627. for (i = 0; i < adev->usec_timeout; i++) {
  628. if (!(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK))
  629. return 0;
  630. }
  631. return -ETIMEDOUT;
  632. }
  633. static int uvd_v6_0_soft_reset(void *handle)
  634. {
  635. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  636. uvd_v6_0_stop(adev);
  637. WREG32_P(mmSRBM_SOFT_RESET, SRBM_SOFT_RESET__SOFT_RESET_UVD_MASK,
  638. ~SRBM_SOFT_RESET__SOFT_RESET_UVD_MASK);
  639. mdelay(5);
  640. return uvd_v6_0_start(adev);
  641. }
  642. static int uvd_v6_0_set_interrupt_state(struct amdgpu_device *adev,
  643. struct amdgpu_irq_src *source,
  644. unsigned type,
  645. enum amdgpu_interrupt_state state)
  646. {
  647. // TODO
  648. return 0;
  649. }
  650. static int uvd_v6_0_process_interrupt(struct amdgpu_device *adev,
  651. struct amdgpu_irq_src *source,
  652. struct amdgpu_iv_entry *entry)
  653. {
  654. DRM_DEBUG("IH: UVD TRAP\n");
  655. amdgpu_fence_process(&adev->uvd.ring);
  656. return 0;
  657. }
  658. static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev)
  659. {
  660. uint32_t data, data1, data2, suvd_flags;
  661. data = RREG32(mmUVD_CGC_CTRL);
  662. data1 = RREG32(mmUVD_SUVD_CGC_GATE);
  663. data2 = RREG32(mmUVD_SUVD_CGC_CTRL);
  664. data &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK |
  665. UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);
  666. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  667. UVD_SUVD_CGC_GATE__SIT_MASK |
  668. UVD_SUVD_CGC_GATE__SMP_MASK |
  669. UVD_SUVD_CGC_GATE__SCM_MASK |
  670. UVD_SUVD_CGC_GATE__SDB_MASK;
  671. data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
  672. (1 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_GATE_DLY_TIMER)) |
  673. (4 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_OFF_DELAY));
  674. data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
  675. UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
  676. UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
  677. UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
  678. UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
  679. UVD_CGC_CTRL__SYS_MODE_MASK |
  680. UVD_CGC_CTRL__UDEC_MODE_MASK |
  681. UVD_CGC_CTRL__MPEG2_MODE_MASK |
  682. UVD_CGC_CTRL__REGS_MODE_MASK |
  683. UVD_CGC_CTRL__RBC_MODE_MASK |
  684. UVD_CGC_CTRL__LMI_MC_MODE_MASK |
  685. UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
  686. UVD_CGC_CTRL__IDCT_MODE_MASK |
  687. UVD_CGC_CTRL__MPRD_MODE_MASK |
  688. UVD_CGC_CTRL__MPC_MODE_MASK |
  689. UVD_CGC_CTRL__LBSI_MODE_MASK |
  690. UVD_CGC_CTRL__LRBBM_MODE_MASK |
  691. UVD_CGC_CTRL__WCB_MODE_MASK |
  692. UVD_CGC_CTRL__VCPU_MODE_MASK |
  693. UVD_CGC_CTRL__JPEG_MODE_MASK |
  694. UVD_CGC_CTRL__SCPU_MODE_MASK |
  695. UVD_CGC_CTRL__JPEG2_MODE_MASK);
  696. data2 &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK |
  697. UVD_SUVD_CGC_CTRL__SIT_MODE_MASK |
  698. UVD_SUVD_CGC_CTRL__SMP_MODE_MASK |
  699. UVD_SUVD_CGC_CTRL__SCM_MODE_MASK |
  700. UVD_SUVD_CGC_CTRL__SDB_MODE_MASK);
  701. data1 |= suvd_flags;
  702. WREG32(mmUVD_CGC_CTRL, data);
  703. WREG32(mmUVD_CGC_GATE, 0);
  704. WREG32(mmUVD_SUVD_CGC_GATE, data1);
  705. WREG32(mmUVD_SUVD_CGC_CTRL, data2);
  706. }
  707. #if 0
  708. static void uvd_v6_0_set_hw_clock_gating(struct amdgpu_device *adev)
  709. {
  710. uint32_t data, data1, cgc_flags, suvd_flags;
  711. data = RREG32(mmUVD_CGC_GATE);
  712. data1 = RREG32(mmUVD_SUVD_CGC_GATE);
  713. cgc_flags = UVD_CGC_GATE__SYS_MASK |
  714. UVD_CGC_GATE__UDEC_MASK |
  715. UVD_CGC_GATE__MPEG2_MASK |
  716. UVD_CGC_GATE__RBC_MASK |
  717. UVD_CGC_GATE__LMI_MC_MASK |
  718. UVD_CGC_GATE__IDCT_MASK |
  719. UVD_CGC_GATE__MPRD_MASK |
  720. UVD_CGC_GATE__MPC_MASK |
  721. UVD_CGC_GATE__LBSI_MASK |
  722. UVD_CGC_GATE__LRBBM_MASK |
  723. UVD_CGC_GATE__UDEC_RE_MASK |
  724. UVD_CGC_GATE__UDEC_CM_MASK |
  725. UVD_CGC_GATE__UDEC_IT_MASK |
  726. UVD_CGC_GATE__UDEC_DB_MASK |
  727. UVD_CGC_GATE__UDEC_MP_MASK |
  728. UVD_CGC_GATE__WCB_MASK |
  729. UVD_CGC_GATE__VCPU_MASK |
  730. UVD_CGC_GATE__SCPU_MASK |
  731. UVD_CGC_GATE__JPEG_MASK |
  732. UVD_CGC_GATE__JPEG2_MASK;
  733. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  734. UVD_SUVD_CGC_GATE__SIT_MASK |
  735. UVD_SUVD_CGC_GATE__SMP_MASK |
  736. UVD_SUVD_CGC_GATE__SCM_MASK |
  737. UVD_SUVD_CGC_GATE__SDB_MASK;
  738. data |= cgc_flags;
  739. data1 |= suvd_flags;
  740. WREG32(mmUVD_CGC_GATE, data);
  741. WREG32(mmUVD_SUVD_CGC_GATE, data1);
  742. }
  743. #endif
  744. static void uvd_v6_set_bypass_mode(struct amdgpu_device *adev, bool enable)
  745. {
  746. u32 tmp = RREG32_SMC(ixGCK_DFS_BYPASS_CNTL);
  747. if (enable)
  748. tmp |= (GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
  749. GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
  750. else
  751. tmp &= ~(GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
  752. GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
  753. WREG32_SMC(ixGCK_DFS_BYPASS_CNTL, tmp);
  754. }
  755. static int uvd_v6_0_set_clockgating_state(void *handle,
  756. enum amd_clockgating_state state)
  757. {
  758. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  759. bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
  760. static int curstate = -1;
  761. if (adev->asic_type == CHIP_FIJI ||
  762. adev->asic_type == CHIP_POLARIS10)
  763. uvd_v6_set_bypass_mode(adev, enable);
  764. if (!(adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG))
  765. return 0;
  766. if (curstate == state)
  767. return 0;
  768. curstate = state;
  769. if (enable) {
  770. /* disable HW gating and enable Sw gating */
  771. uvd_v6_0_set_sw_clock_gating(adev);
  772. } else {
  773. /* wait for STATUS to clear */
  774. if (uvd_v6_0_wait_for_idle(handle))
  775. return -EBUSY;
  776. /* enable HW gates because UVD is idle */
  777. /* uvd_v6_0_set_hw_clock_gating(adev); */
  778. }
  779. return 0;
  780. }
  781. static int uvd_v6_0_set_powergating_state(void *handle,
  782. enum amd_powergating_state state)
  783. {
  784. /* This doesn't actually powergate the UVD block.
  785. * That's done in the dpm code via the SMC. This
  786. * just re-inits the block as necessary. The actual
  787. * gating still happens in the dpm code. We should
  788. * revisit this when there is a cleaner line between
  789. * the smc and the hw blocks
  790. */
  791. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  792. if (!(adev->pg_flags & AMD_PG_SUPPORT_UVD))
  793. return 0;
  794. if (state == AMD_PG_STATE_GATE) {
  795. uvd_v6_0_stop(adev);
  796. return 0;
  797. } else {
  798. return uvd_v6_0_start(adev);
  799. }
  800. }
  801. const struct amd_ip_funcs uvd_v6_0_ip_funcs = {
  802. .name = "uvd_v6_0",
  803. .early_init = uvd_v6_0_early_init,
  804. .late_init = NULL,
  805. .sw_init = uvd_v6_0_sw_init,
  806. .sw_fini = uvd_v6_0_sw_fini,
  807. .hw_init = uvd_v6_0_hw_init,
  808. .hw_fini = uvd_v6_0_hw_fini,
  809. .suspend = uvd_v6_0_suspend,
  810. .resume = uvd_v6_0_resume,
  811. .is_idle = uvd_v6_0_is_idle,
  812. .wait_for_idle = uvd_v6_0_wait_for_idle,
  813. .soft_reset = uvd_v6_0_soft_reset,
  814. .set_clockgating_state = uvd_v6_0_set_clockgating_state,
  815. .set_powergating_state = uvd_v6_0_set_powergating_state,
  816. };
  817. static const struct amdgpu_ring_funcs uvd_v6_0_ring_funcs = {
  818. .get_rptr = uvd_v6_0_ring_get_rptr,
  819. .get_wptr = uvd_v6_0_ring_get_wptr,
  820. .set_wptr = uvd_v6_0_ring_set_wptr,
  821. .parse_cs = amdgpu_uvd_ring_parse_cs,
  822. .emit_ib = uvd_v6_0_ring_emit_ib,
  823. .emit_fence = uvd_v6_0_ring_emit_fence,
  824. .emit_hdp_flush = uvd_v6_0_ring_emit_hdp_flush,
  825. .emit_hdp_invalidate = uvd_v6_0_ring_emit_hdp_invalidate,
  826. .test_ring = uvd_v6_0_ring_test_ring,
  827. .test_ib = uvd_v6_0_ring_test_ib,
  828. .insert_nop = amdgpu_ring_insert_nop,
  829. .pad_ib = amdgpu_ring_generic_pad_ib,
  830. };
  831. static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev)
  832. {
  833. adev->uvd.ring.funcs = &uvd_v6_0_ring_funcs;
  834. }
  835. static const struct amdgpu_irq_src_funcs uvd_v6_0_irq_funcs = {
  836. .set = uvd_v6_0_set_interrupt_state,
  837. .process = uvd_v6_0_process_interrupt,
  838. };
  839. static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev)
  840. {
  841. adev->uvd.irq.num_types = 1;
  842. adev->uvd.irq.funcs = &uvd_v6_0_irq_funcs;
  843. }