uvd_v7_0.c 53 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807
  1. /*
  2. * Copyright 2016 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include <linux/firmware.h>
  24. #include <drm/drmP.h>
  25. #include "amdgpu.h"
  26. #include "amdgpu_uvd.h"
  27. #include "soc15.h"
  28. #include "soc15d.h"
  29. #include "soc15_common.h"
  30. #include "mmsch_v1_0.h"
  31. #include "uvd/uvd_7_0_offset.h"
  32. #include "uvd/uvd_7_0_sh_mask.h"
  33. #include "vce/vce_4_0_offset.h"
  34. #include "vce/vce_4_0_default.h"
  35. #include "vce/vce_4_0_sh_mask.h"
  36. #include "nbif/nbif_6_1_offset.h"
  37. #include "hdp/hdp_4_0_offset.h"
  38. #include "mmhub/mmhub_1_0_offset.h"
  39. #include "mmhub/mmhub_1_0_sh_mask.h"
  40. static void uvd_v7_0_set_ring_funcs(struct amdgpu_device *adev);
  41. static void uvd_v7_0_set_enc_ring_funcs(struct amdgpu_device *adev);
  42. static void uvd_v7_0_set_irq_funcs(struct amdgpu_device *adev);
  43. static int uvd_v7_0_start(struct amdgpu_device *adev);
  44. static void uvd_v7_0_stop(struct amdgpu_device *adev);
  45. static int uvd_v7_0_sriov_start(struct amdgpu_device *adev);
  46. /**
  47. * uvd_v7_0_ring_get_rptr - get read pointer
  48. *
  49. * @ring: amdgpu_ring pointer
  50. *
  51. * Returns the current hardware read pointer
  52. */
  53. static uint64_t uvd_v7_0_ring_get_rptr(struct amdgpu_ring *ring)
  54. {
  55. struct amdgpu_device *adev = ring->adev;
  56. return RREG32_SOC15(UVD, ring->me, mmUVD_RBC_RB_RPTR);
  57. }
  58. /**
  59. * uvd_v7_0_enc_ring_get_rptr - get enc read pointer
  60. *
  61. * @ring: amdgpu_ring pointer
  62. *
  63. * Returns the current hardware enc read pointer
  64. */
  65. static uint64_t uvd_v7_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
  66. {
  67. struct amdgpu_device *adev = ring->adev;
  68. if (ring == &adev->uvd.inst[ring->me].ring_enc[0])
  69. return RREG32_SOC15(UVD, ring->me, mmUVD_RB_RPTR);
  70. else
  71. return RREG32_SOC15(UVD, ring->me, mmUVD_RB_RPTR2);
  72. }
  73. /**
  74. * uvd_v7_0_ring_get_wptr - get write pointer
  75. *
  76. * @ring: amdgpu_ring pointer
  77. *
  78. * Returns the current hardware write pointer
  79. */
  80. static uint64_t uvd_v7_0_ring_get_wptr(struct amdgpu_ring *ring)
  81. {
  82. struct amdgpu_device *adev = ring->adev;
  83. return RREG32_SOC15(UVD, ring->me, mmUVD_RBC_RB_WPTR);
  84. }
  85. /**
  86. * uvd_v7_0_enc_ring_get_wptr - get enc write pointer
  87. *
  88. * @ring: amdgpu_ring pointer
  89. *
  90. * Returns the current hardware enc write pointer
  91. */
  92. static uint64_t uvd_v7_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
  93. {
  94. struct amdgpu_device *adev = ring->adev;
  95. if (ring->use_doorbell)
  96. return adev->wb.wb[ring->wptr_offs];
  97. if (ring == &adev->uvd.inst[ring->me].ring_enc[0])
  98. return RREG32_SOC15(UVD, ring->me, mmUVD_RB_WPTR);
  99. else
  100. return RREG32_SOC15(UVD, ring->me, mmUVD_RB_WPTR2);
  101. }
  102. /**
  103. * uvd_v7_0_ring_set_wptr - set write pointer
  104. *
  105. * @ring: amdgpu_ring pointer
  106. *
  107. * Commits the write pointer to the hardware
  108. */
  109. static void uvd_v7_0_ring_set_wptr(struct amdgpu_ring *ring)
  110. {
  111. struct amdgpu_device *adev = ring->adev;
  112. WREG32_SOC15(UVD, ring->me, mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
  113. }
  114. /**
  115. * uvd_v7_0_enc_ring_set_wptr - set enc write pointer
  116. *
  117. * @ring: amdgpu_ring pointer
  118. *
  119. * Commits the enc write pointer to the hardware
  120. */
  121. static void uvd_v7_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
  122. {
  123. struct amdgpu_device *adev = ring->adev;
  124. if (ring->use_doorbell) {
  125. /* XXX check if swapping is necessary on BE */
  126. adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
  127. WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
  128. return;
  129. }
  130. if (ring == &adev->uvd.inst[ring->me].ring_enc[0])
  131. WREG32_SOC15(UVD, ring->me, mmUVD_RB_WPTR,
  132. lower_32_bits(ring->wptr));
  133. else
  134. WREG32_SOC15(UVD, ring->me, mmUVD_RB_WPTR2,
  135. lower_32_bits(ring->wptr));
  136. }
  137. /**
  138. * uvd_v7_0_enc_ring_test_ring - test if UVD ENC ring is working
  139. *
  140. * @ring: the engine to test on
  141. *
  142. */
  143. static int uvd_v7_0_enc_ring_test_ring(struct amdgpu_ring *ring)
  144. {
  145. struct amdgpu_device *adev = ring->adev;
  146. uint32_t rptr = amdgpu_ring_get_rptr(ring);
  147. unsigned i;
  148. int r;
  149. if (amdgpu_sriov_vf(adev))
  150. return 0;
  151. r = amdgpu_ring_alloc(ring, 16);
  152. if (r) {
  153. DRM_ERROR("amdgpu: uvd enc failed to lock (%d)ring %d (%d).\n",
  154. ring->me, ring->idx, r);
  155. return r;
  156. }
  157. amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
  158. amdgpu_ring_commit(ring);
  159. for (i = 0; i < adev->usec_timeout; i++) {
  160. if (amdgpu_ring_get_rptr(ring) != rptr)
  161. break;
  162. DRM_UDELAY(1);
  163. }
  164. if (i < adev->usec_timeout) {
  165. DRM_DEBUG("(%d)ring test on %d succeeded in %d usecs\n",
  166. ring->me, ring->idx, i);
  167. } else {
  168. DRM_ERROR("amdgpu: (%d)ring %d test failed\n",
  169. ring->me, ring->idx);
  170. r = -ETIMEDOUT;
  171. }
  172. return r;
  173. }
  174. /**
  175. * uvd_v7_0_enc_get_create_msg - generate a UVD ENC create msg
  176. *
  177. * @adev: amdgpu_device pointer
  178. * @ring: ring we should submit the msg to
  179. * @handle: session handle to use
  180. * @fence: optional fence to return
  181. *
  182. * Open up a stream for HW test
  183. */
  184. static int uvd_v7_0_enc_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
  185. struct dma_fence **fence)
  186. {
  187. const unsigned ib_size_dw = 16;
  188. struct amdgpu_job *job;
  189. struct amdgpu_ib *ib;
  190. struct dma_fence *f = NULL;
  191. uint64_t dummy;
  192. int i, r;
  193. r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
  194. if (r)
  195. return r;
  196. ib = &job->ibs[0];
  197. dummy = ib->gpu_addr + 1024;
  198. ib->length_dw = 0;
  199. ib->ptr[ib->length_dw++] = 0x00000018;
  200. ib->ptr[ib->length_dw++] = 0x00000001; /* session info */
  201. ib->ptr[ib->length_dw++] = handle;
  202. ib->ptr[ib->length_dw++] = 0x00000000;
  203. ib->ptr[ib->length_dw++] = upper_32_bits(dummy);
  204. ib->ptr[ib->length_dw++] = dummy;
  205. ib->ptr[ib->length_dw++] = 0x00000014;
  206. ib->ptr[ib->length_dw++] = 0x00000002; /* task info */
  207. ib->ptr[ib->length_dw++] = 0x0000001c;
  208. ib->ptr[ib->length_dw++] = 0x00000000;
  209. ib->ptr[ib->length_dw++] = 0x00000000;
  210. ib->ptr[ib->length_dw++] = 0x00000008;
  211. ib->ptr[ib->length_dw++] = 0x08000001; /* op initialize */
  212. for (i = ib->length_dw; i < ib_size_dw; ++i)
  213. ib->ptr[i] = 0x0;
  214. r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
  215. job->fence = dma_fence_get(f);
  216. if (r)
  217. goto err;
  218. amdgpu_job_free(job);
  219. if (fence)
  220. *fence = dma_fence_get(f);
  221. dma_fence_put(f);
  222. return 0;
  223. err:
  224. amdgpu_job_free(job);
  225. return r;
  226. }
  227. /**
  228. * uvd_v7_0_enc_get_destroy_msg - generate a UVD ENC destroy msg
  229. *
  230. * @adev: amdgpu_device pointer
  231. * @ring: ring we should submit the msg to
  232. * @handle: session handle to use
  233. * @fence: optional fence to return
  234. *
  235. * Close up a stream for HW test or if userspace failed to do so
  236. */
  237. int uvd_v7_0_enc_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle,
  238. bool direct, struct dma_fence **fence)
  239. {
  240. const unsigned ib_size_dw = 16;
  241. struct amdgpu_job *job;
  242. struct amdgpu_ib *ib;
  243. struct dma_fence *f = NULL;
  244. uint64_t dummy;
  245. int i, r;
  246. r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
  247. if (r)
  248. return r;
  249. ib = &job->ibs[0];
  250. dummy = ib->gpu_addr + 1024;
  251. ib->length_dw = 0;
  252. ib->ptr[ib->length_dw++] = 0x00000018;
  253. ib->ptr[ib->length_dw++] = 0x00000001;
  254. ib->ptr[ib->length_dw++] = handle;
  255. ib->ptr[ib->length_dw++] = 0x00000000;
  256. ib->ptr[ib->length_dw++] = upper_32_bits(dummy);
  257. ib->ptr[ib->length_dw++] = dummy;
  258. ib->ptr[ib->length_dw++] = 0x00000014;
  259. ib->ptr[ib->length_dw++] = 0x00000002;
  260. ib->ptr[ib->length_dw++] = 0x0000001c;
  261. ib->ptr[ib->length_dw++] = 0x00000000;
  262. ib->ptr[ib->length_dw++] = 0x00000000;
  263. ib->ptr[ib->length_dw++] = 0x00000008;
  264. ib->ptr[ib->length_dw++] = 0x08000002; /* op close session */
  265. for (i = ib->length_dw; i < ib_size_dw; ++i)
  266. ib->ptr[i] = 0x0;
  267. if (direct) {
  268. r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
  269. job->fence = dma_fence_get(f);
  270. if (r)
  271. goto err;
  272. amdgpu_job_free(job);
  273. } else {
  274. r = amdgpu_job_submit(job, ring, &ring->adev->vce.entity,
  275. AMDGPU_FENCE_OWNER_UNDEFINED, &f);
  276. if (r)
  277. goto err;
  278. }
  279. if (fence)
  280. *fence = dma_fence_get(f);
  281. dma_fence_put(f);
  282. return 0;
  283. err:
  284. amdgpu_job_free(job);
  285. return r;
  286. }
  287. /**
  288. * uvd_v7_0_enc_ring_test_ib - test if UVD ENC IBs are working
  289. *
  290. * @ring: the engine to test on
  291. *
  292. */
  293. static int uvd_v7_0_enc_ring_test_ib(struct amdgpu_ring *ring, long timeout)
  294. {
  295. struct dma_fence *fence = NULL;
  296. long r;
  297. r = uvd_v7_0_enc_get_create_msg(ring, 1, NULL);
  298. if (r) {
  299. DRM_ERROR("amdgpu: (%d)failed to get create msg (%ld).\n", ring->me, r);
  300. goto error;
  301. }
  302. r = uvd_v7_0_enc_get_destroy_msg(ring, 1, true, &fence);
  303. if (r) {
  304. DRM_ERROR("amdgpu: (%d)failed to get destroy ib (%ld).\n", ring->me, r);
  305. goto error;
  306. }
  307. r = dma_fence_wait_timeout(fence, false, timeout);
  308. if (r == 0) {
  309. DRM_ERROR("amdgpu: (%d)IB test timed out.\n", ring->me);
  310. r = -ETIMEDOUT;
  311. } else if (r < 0) {
  312. DRM_ERROR("amdgpu: (%d)fence wait failed (%ld).\n", ring->me, r);
  313. } else {
  314. DRM_DEBUG("ib test on (%d)ring %d succeeded\n", ring->me, ring->idx);
  315. r = 0;
  316. }
  317. error:
  318. dma_fence_put(fence);
  319. return r;
  320. }
  321. static int uvd_v7_0_early_init(void *handle)
  322. {
  323. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  324. adev->uvd.num_uvd_inst = 1;
  325. if (amdgpu_sriov_vf(adev))
  326. adev->uvd.num_enc_rings = 1;
  327. else
  328. adev->uvd.num_enc_rings = 2;
  329. uvd_v7_0_set_ring_funcs(adev);
  330. uvd_v7_0_set_enc_ring_funcs(adev);
  331. uvd_v7_0_set_irq_funcs(adev);
  332. return 0;
  333. }
  334. static int uvd_v7_0_sw_init(void *handle)
  335. {
  336. struct amdgpu_ring *ring;
  337. struct drm_sched_rq *rq;
  338. int i, j, r;
  339. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  340. for (j = 0; j < adev->uvd.num_uvd_inst; j++) {
  341. /* UVD TRAP */
  342. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_UVD, 124, &adev->uvd.inst[j].irq);
  343. if (r)
  344. return r;
  345. /* UVD ENC TRAP */
  346. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  347. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_UVD, i + 119, &adev->uvd.inst[j].irq);
  348. if (r)
  349. return r;
  350. }
  351. }
  352. r = amdgpu_uvd_sw_init(adev);
  353. if (r)
  354. return r;
  355. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  356. const struct common_firmware_header *hdr;
  357. hdr = (const struct common_firmware_header *)adev->uvd.fw->data;
  358. adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].ucode_id = AMDGPU_UCODE_ID_UVD;
  359. adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].fw = adev->uvd.fw;
  360. adev->firmware.fw_size +=
  361. ALIGN(le32_to_cpu(hdr->ucode_size_bytes), PAGE_SIZE);
  362. DRM_INFO("PSP loading UVD firmware\n");
  363. }
  364. for (j = 0; j < adev->uvd.num_uvd_inst; j++) {
  365. ring = &adev->uvd.inst[j].ring_enc[0];
  366. rq = &ring->sched.sched_rq[DRM_SCHED_PRIORITY_NORMAL];
  367. r = drm_sched_entity_init(&ring->sched, &adev->uvd.inst[j].entity_enc,
  368. rq, NULL);
  369. if (r) {
  370. DRM_ERROR("(%d)Failed setting up UVD ENC run queue.\n", j);
  371. return r;
  372. }
  373. }
  374. r = amdgpu_uvd_resume(adev);
  375. if (r)
  376. return r;
  377. for (j = 0; j < adev->uvd.num_uvd_inst; j++) {
  378. if (!amdgpu_sriov_vf(adev)) {
  379. ring = &adev->uvd.inst[j].ring;
  380. sprintf(ring->name, "uvd<%d>", j);
  381. r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.inst[j].irq, 0);
  382. if (r)
  383. return r;
  384. }
  385. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  386. ring = &adev->uvd.inst[j].ring_enc[i];
  387. sprintf(ring->name, "uvd_enc%d<%d>", i, j);
  388. if (amdgpu_sriov_vf(adev)) {
  389. ring->use_doorbell = true;
  390. /* currently only use the first enconding ring for
  391. * sriov, so set unused location for other unused rings.
  392. */
  393. if (i == 0)
  394. ring->doorbell_index = AMDGPU_DOORBELL64_UVD_RING0_1 * 2;
  395. else
  396. ring->doorbell_index = AMDGPU_DOORBELL64_UVD_RING2_3 * 2 + 1;
  397. }
  398. r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.inst[j].irq, 0);
  399. if (r)
  400. return r;
  401. }
  402. }
  403. r = amdgpu_virt_alloc_mm_table(adev);
  404. if (r)
  405. return r;
  406. return r;
  407. }
  408. static int uvd_v7_0_sw_fini(void *handle)
  409. {
  410. int i, j, r;
  411. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  412. amdgpu_virt_free_mm_table(adev);
  413. r = amdgpu_uvd_suspend(adev);
  414. if (r)
  415. return r;
  416. for (j = 0; j < adev->uvd.num_uvd_inst; ++j) {
  417. drm_sched_entity_fini(&adev->uvd.inst[j].ring_enc[0].sched, &adev->uvd.inst[j].entity_enc);
  418. for (i = 0; i < adev->uvd.num_enc_rings; ++i)
  419. amdgpu_ring_fini(&adev->uvd.inst[j].ring_enc[i]);
  420. }
  421. return amdgpu_uvd_sw_fini(adev);
  422. }
  423. /**
  424. * uvd_v7_0_hw_init - start and test UVD block
  425. *
  426. * @adev: amdgpu_device pointer
  427. *
  428. * Initialize the hardware, boot up the VCPU and do some testing
  429. */
  430. static int uvd_v7_0_hw_init(void *handle)
  431. {
  432. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  433. struct amdgpu_ring *ring;
  434. uint32_t tmp;
  435. int i, j, r;
  436. if (amdgpu_sriov_vf(adev))
  437. r = uvd_v7_0_sriov_start(adev);
  438. else
  439. r = uvd_v7_0_start(adev);
  440. if (r)
  441. goto done;
  442. for (j = 0; j < adev->uvd.num_uvd_inst; ++j) {
  443. ring = &adev->uvd.inst[j].ring;
  444. if (!amdgpu_sriov_vf(adev)) {
  445. ring->ready = true;
  446. r = amdgpu_ring_test_ring(ring);
  447. if (r) {
  448. ring->ready = false;
  449. goto done;
  450. }
  451. r = amdgpu_ring_alloc(ring, 10);
  452. if (r) {
  453. DRM_ERROR("amdgpu: (%d)ring failed to lock UVD ring (%d).\n", j, r);
  454. goto done;
  455. }
  456. tmp = PACKET0(SOC15_REG_OFFSET(UVD, j,
  457. mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL), 0);
  458. amdgpu_ring_write(ring, tmp);
  459. amdgpu_ring_write(ring, 0xFFFFF);
  460. tmp = PACKET0(SOC15_REG_OFFSET(UVD, j,
  461. mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL), 0);
  462. amdgpu_ring_write(ring, tmp);
  463. amdgpu_ring_write(ring, 0xFFFFF);
  464. tmp = PACKET0(SOC15_REG_OFFSET(UVD, j,
  465. mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL), 0);
  466. amdgpu_ring_write(ring, tmp);
  467. amdgpu_ring_write(ring, 0xFFFFF);
  468. /* Clear timeout status bits */
  469. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, j,
  470. mmUVD_SEMA_TIMEOUT_STATUS), 0));
  471. amdgpu_ring_write(ring, 0x8);
  472. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, j,
  473. mmUVD_SEMA_CNTL), 0));
  474. amdgpu_ring_write(ring, 3);
  475. amdgpu_ring_commit(ring);
  476. }
  477. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  478. ring = &adev->uvd.inst[j].ring_enc[i];
  479. ring->ready = true;
  480. r = amdgpu_ring_test_ring(ring);
  481. if (r) {
  482. ring->ready = false;
  483. goto done;
  484. }
  485. }
  486. }
  487. done:
  488. if (!r)
  489. DRM_INFO("UVD and UVD ENC initialized successfully.\n");
  490. return r;
  491. }
  492. /**
  493. * uvd_v7_0_hw_fini - stop the hardware block
  494. *
  495. * @adev: amdgpu_device pointer
  496. *
  497. * Stop the UVD block, mark ring as not ready any more
  498. */
  499. static int uvd_v7_0_hw_fini(void *handle)
  500. {
  501. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  502. int i;
  503. if (!amdgpu_sriov_vf(adev))
  504. uvd_v7_0_stop(adev);
  505. else {
  506. /* full access mode, so don't touch any UVD register */
  507. DRM_DEBUG("For SRIOV client, shouldn't do anything.\n");
  508. }
  509. for (i = 0; i < adev->uvd.num_uvd_inst; ++i)
  510. adev->uvd.inst[i].ring.ready = false;
  511. return 0;
  512. }
  513. static int uvd_v7_0_suspend(void *handle)
  514. {
  515. int r;
  516. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  517. r = uvd_v7_0_hw_fini(adev);
  518. if (r)
  519. return r;
  520. return amdgpu_uvd_suspend(adev);
  521. }
  522. static int uvd_v7_0_resume(void *handle)
  523. {
  524. int r;
  525. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  526. r = amdgpu_uvd_resume(adev);
  527. if (r)
  528. return r;
  529. return uvd_v7_0_hw_init(adev);
  530. }
  531. /**
  532. * uvd_v7_0_mc_resume - memory controller programming
  533. *
  534. * @adev: amdgpu_device pointer
  535. *
  536. * Let the UVD memory controller know it's offsets
  537. */
  538. static void uvd_v7_0_mc_resume(struct amdgpu_device *adev)
  539. {
  540. uint32_t size = AMDGPU_UVD_FIRMWARE_SIZE(adev);
  541. uint32_t offset;
  542. int i;
  543. for (i = 0; i < adev->uvd.num_uvd_inst; ++i) {
  544. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  545. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  546. lower_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  547. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  548. upper_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  549. offset = 0;
  550. } else {
  551. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  552. lower_32_bits(adev->uvd.inst[i].gpu_addr));
  553. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  554. upper_32_bits(adev->uvd.inst[i].gpu_addr));
  555. offset = size;
  556. }
  557. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_OFFSET0,
  558. AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
  559. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_SIZE0, size);
  560. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW,
  561. lower_32_bits(adev->uvd.inst[i].gpu_addr + offset));
  562. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH,
  563. upper_32_bits(adev->uvd.inst[i].gpu_addr + offset));
  564. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_OFFSET1, (1 << 21));
  565. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_SIZE1, AMDGPU_UVD_HEAP_SIZE);
  566. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW,
  567. lower_32_bits(adev->uvd.inst[i].gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  568. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH,
  569. upper_32_bits(adev->uvd.inst[i].gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  570. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_OFFSET2, (2 << 21));
  571. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_SIZE2,
  572. AMDGPU_UVD_STACK_SIZE + (AMDGPU_UVD_SESSION_SIZE * 40));
  573. WREG32_SOC15(UVD, i, mmUVD_UDEC_ADDR_CONFIG,
  574. adev->gfx.config.gb_addr_config);
  575. WREG32_SOC15(UVD, i, mmUVD_UDEC_DB_ADDR_CONFIG,
  576. adev->gfx.config.gb_addr_config);
  577. WREG32_SOC15(UVD, i, mmUVD_UDEC_DBW_ADDR_CONFIG,
  578. adev->gfx.config.gb_addr_config);
  579. WREG32_SOC15(UVD, i, mmUVD_GP_SCRATCH4, adev->uvd.max_handles);
  580. }
  581. }
  582. static int uvd_v7_0_mmsch_start(struct amdgpu_device *adev,
  583. struct amdgpu_mm_table *table)
  584. {
  585. uint32_t data = 0, loop;
  586. uint64_t addr = table->gpu_addr;
  587. struct mmsch_v1_0_init_header *header = (struct mmsch_v1_0_init_header *)table->cpu_addr;
  588. uint32_t size;
  589. int i;
  590. size = header->header_size + header->vce_table_size + header->uvd_table_size;
  591. /* 1, write to vce_mmsch_vf_ctx_addr_lo/hi register with GPU mc addr of memory descriptor location */
  592. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_ADDR_LO, lower_32_bits(addr));
  593. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_ADDR_HI, upper_32_bits(addr));
  594. /* 2, update vmid of descriptor */
  595. data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_VMID);
  596. data &= ~VCE_MMSCH_VF_VMID__VF_CTX_VMID_MASK;
  597. data |= (0 << VCE_MMSCH_VF_VMID__VF_CTX_VMID__SHIFT); /* use domain0 for MM scheduler */
  598. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_VMID, data);
  599. /* 3, notify mmsch about the size of this descriptor */
  600. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_SIZE, size);
  601. /* 4, set resp to zero */
  602. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP, 0);
  603. for (i = 0; i < adev->uvd.num_uvd_inst; ++i) {
  604. WDOORBELL32(adev->uvd.inst[i].ring_enc[0].doorbell_index, 0);
  605. adev->wb.wb[adev->uvd.inst[i].ring_enc[0].wptr_offs] = 0;
  606. adev->uvd.inst[i].ring_enc[0].wptr = 0;
  607. adev->uvd.inst[i].ring_enc[0].wptr_old = 0;
  608. }
  609. /* 5, kick off the initialization and wait until VCE_MMSCH_VF_MAILBOX_RESP becomes non-zero */
  610. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_HOST, 0x10000001);
  611. data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP);
  612. loop = 1000;
  613. while ((data & 0x10000002) != 0x10000002) {
  614. udelay(10);
  615. data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP);
  616. loop--;
  617. if (!loop)
  618. break;
  619. }
  620. if (!loop) {
  621. dev_err(adev->dev, "failed to init MMSCH, mmVCE_MMSCH_VF_MAILBOX_RESP = %x\n", data);
  622. return -EBUSY;
  623. }
  624. return 0;
  625. }
  626. static int uvd_v7_0_sriov_start(struct amdgpu_device *adev)
  627. {
  628. struct amdgpu_ring *ring;
  629. uint32_t offset, size, tmp;
  630. uint32_t table_size = 0;
  631. struct mmsch_v1_0_cmd_direct_write direct_wt = { {0} };
  632. struct mmsch_v1_0_cmd_direct_read_modify_write direct_rd_mod_wt = { {0} };
  633. struct mmsch_v1_0_cmd_direct_polling direct_poll = { {0} };
  634. struct mmsch_v1_0_cmd_end end = { {0} };
  635. uint32_t *init_table = adev->virt.mm_table.cpu_addr;
  636. struct mmsch_v1_0_init_header *header = (struct mmsch_v1_0_init_header *)init_table;
  637. uint8_t i = 0;
  638. direct_wt.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_WRITE;
  639. direct_rd_mod_wt.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_READ_MODIFY_WRITE;
  640. direct_poll.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_POLLING;
  641. end.cmd_header.command_type = MMSCH_COMMAND__END;
  642. if (header->uvd_table_offset == 0 && header->uvd_table_size == 0) {
  643. header->version = MMSCH_VERSION;
  644. header->header_size = sizeof(struct mmsch_v1_0_init_header) >> 2;
  645. if (header->vce_table_offset == 0 && header->vce_table_size == 0)
  646. header->uvd_table_offset = header->header_size;
  647. else
  648. header->uvd_table_offset = header->vce_table_size + header->vce_table_offset;
  649. init_table += header->uvd_table_offset;
  650. for (i = 0; i < adev->uvd.num_uvd_inst; ++i) {
  651. ring = &adev->uvd.inst[i].ring;
  652. ring->wptr = 0;
  653. size = AMDGPU_GPU_PAGE_ALIGN(adev->uvd.fw->size + 4);
  654. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_STATUS),
  655. 0xFFFFFFFF, 0x00000004);
  656. /* mc resume*/
  657. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  658. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
  659. lower_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  660. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
  661. upper_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  662. offset = 0;
  663. } else {
  664. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
  665. lower_32_bits(adev->uvd.inst[i].gpu_addr));
  666. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
  667. upper_32_bits(adev->uvd.inst[i].gpu_addr));
  668. offset = size;
  669. }
  670. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_OFFSET0),
  671. AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
  672. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_SIZE0), size);
  673. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW),
  674. lower_32_bits(adev->uvd.inst[i].gpu_addr + offset));
  675. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH),
  676. upper_32_bits(adev->uvd.inst[i].gpu_addr + offset));
  677. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_OFFSET1), (1 << 21));
  678. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_SIZE1), AMDGPU_UVD_HEAP_SIZE);
  679. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW),
  680. lower_32_bits(adev->uvd.inst[i].gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  681. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH),
  682. upper_32_bits(adev->uvd.inst[i].gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  683. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_OFFSET2), (2 << 21));
  684. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_SIZE2),
  685. AMDGPU_UVD_STACK_SIZE + (AMDGPU_UVD_SESSION_SIZE * 40));
  686. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_GP_SCRATCH4), adev->uvd.max_handles);
  687. /* mc resume end*/
  688. /* disable clock gating */
  689. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_CGC_CTRL),
  690. ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK, 0);
  691. /* disable interupt */
  692. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_MASTINT_EN),
  693. ~UVD_MASTINT_EN__VCPU_EN_MASK, 0);
  694. /* stall UMC and register bus before resetting VCPU */
  695. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL2),
  696. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  697. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  698. /* put LMI, VCPU, RBC etc... into reset */
  699. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_SOFT_RESET),
  700. (uint32_t)(UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
  701. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
  702. UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
  703. UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
  704. UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
  705. UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
  706. UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
  707. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK));
  708. /* initialize UVD memory controller */
  709. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL),
  710. (uint32_t)((0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  711. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  712. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  713. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  714. UVD_LMI_CTRL__REQ_MODE_MASK |
  715. 0x00100000L));
  716. /* take all subblocks out of reset, except VCPU */
  717. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_SOFT_RESET),
  718. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  719. /* enable VCPU clock */
  720. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CNTL),
  721. UVD_VCPU_CNTL__CLK_EN_MASK);
  722. /* enable master interrupt */
  723. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_MASTINT_EN),
  724. ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
  725. (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
  726. /* clear the bit 4 of UVD_STATUS */
  727. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_STATUS),
  728. ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT), 0);
  729. /* force RBC into idle state */
  730. size = order_base_2(ring->ring_size);
  731. tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, size);
  732. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  733. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_RBC_RB_CNTL), tmp);
  734. ring = &adev->uvd.inst[i].ring_enc[0];
  735. ring->wptr = 0;
  736. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_RB_BASE_LO), ring->gpu_addr);
  737. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_RB_BASE_HI), upper_32_bits(ring->gpu_addr));
  738. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_RB_SIZE), ring->ring_size / 4);
  739. /* boot up the VCPU */
  740. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_SOFT_RESET), 0);
  741. /* enable UMC */
  742. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL2),
  743. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK, 0);
  744. MMSCH_V1_0_INSERT_DIRECT_POLL(SOC15_REG_OFFSET(UVD, i, mmUVD_STATUS), 0x02, 0x02);
  745. }
  746. /* add end packet */
  747. memcpy((void *)init_table, &end, sizeof(struct mmsch_v1_0_cmd_end));
  748. table_size += sizeof(struct mmsch_v1_0_cmd_end) / 4;
  749. header->uvd_table_size = table_size;
  750. }
  751. return uvd_v7_0_mmsch_start(adev, &adev->virt.mm_table);
  752. }
  753. /**
  754. * uvd_v7_0_start - start UVD block
  755. *
  756. * @adev: amdgpu_device pointer
  757. *
  758. * Setup and start the UVD block
  759. */
  760. static int uvd_v7_0_start(struct amdgpu_device *adev)
  761. {
  762. struct amdgpu_ring *ring;
  763. uint32_t rb_bufsz, tmp;
  764. uint32_t lmi_swap_cntl;
  765. uint32_t mp_swap_cntl;
  766. int i, j, k, r;
  767. for (k = 0; k < adev->uvd.num_uvd_inst; ++k) {
  768. /* disable DPG */
  769. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_POWER_STATUS), 0,
  770. ~UVD_POWER_STATUS__UVD_PG_MODE_MASK);
  771. }
  772. /* disable byte swapping */
  773. lmi_swap_cntl = 0;
  774. mp_swap_cntl = 0;
  775. uvd_v7_0_mc_resume(adev);
  776. for (k = 0; k < adev->uvd.num_uvd_inst; ++k) {
  777. ring = &adev->uvd.inst[k].ring;
  778. /* disable clock gating */
  779. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_CGC_CTRL), 0,
  780. ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK);
  781. /* disable interupt */
  782. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_MASTINT_EN), 0,
  783. ~UVD_MASTINT_EN__VCPU_EN_MASK);
  784. /* stall UMC and register bus before resetting VCPU */
  785. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_LMI_CTRL2),
  786. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  787. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  788. mdelay(1);
  789. /* put LMI, VCPU, RBC etc... into reset */
  790. WREG32_SOC15(UVD, k, mmUVD_SOFT_RESET,
  791. UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
  792. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
  793. UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
  794. UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
  795. UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
  796. UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
  797. UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
  798. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
  799. mdelay(5);
  800. /* initialize UVD memory controller */
  801. WREG32_SOC15(UVD, k, mmUVD_LMI_CTRL,
  802. (0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  803. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  804. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  805. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  806. UVD_LMI_CTRL__REQ_MODE_MASK |
  807. 0x00100000L);
  808. #ifdef __BIG_ENDIAN
  809. /* swap (8 in 32) RB and IB */
  810. lmi_swap_cntl = 0xa;
  811. mp_swap_cntl = 0;
  812. #endif
  813. WREG32_SOC15(UVD, k, mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
  814. WREG32_SOC15(UVD, k, mmUVD_MP_SWAP_CNTL, mp_swap_cntl);
  815. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUXA0, 0x40c2040);
  816. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUXA1, 0x0);
  817. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUXB0, 0x40c2040);
  818. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUXB1, 0x0);
  819. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_ALU, 0);
  820. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUX, 0x88);
  821. /* take all subblocks out of reset, except VCPU */
  822. WREG32_SOC15(UVD, k, mmUVD_SOFT_RESET,
  823. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  824. mdelay(5);
  825. /* enable VCPU clock */
  826. WREG32_SOC15(UVD, k, mmUVD_VCPU_CNTL,
  827. UVD_VCPU_CNTL__CLK_EN_MASK);
  828. /* enable UMC */
  829. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_LMI_CTRL2), 0,
  830. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  831. /* boot up the VCPU */
  832. WREG32_SOC15(UVD, k, mmUVD_SOFT_RESET, 0);
  833. mdelay(10);
  834. for (i = 0; i < 10; ++i) {
  835. uint32_t status;
  836. for (j = 0; j < 100; ++j) {
  837. status = RREG32_SOC15(UVD, k, mmUVD_STATUS);
  838. if (status & 2)
  839. break;
  840. mdelay(10);
  841. }
  842. r = 0;
  843. if (status & 2)
  844. break;
  845. DRM_ERROR("UVD(%d) not responding, trying to reset the VCPU!!!\n", k);
  846. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_SOFT_RESET),
  847. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
  848. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  849. mdelay(10);
  850. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_SOFT_RESET), 0,
  851. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  852. mdelay(10);
  853. r = -1;
  854. }
  855. if (r) {
  856. DRM_ERROR("UVD(%d) not responding, giving up!!!\n", k);
  857. return r;
  858. }
  859. /* enable master interrupt */
  860. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_MASTINT_EN),
  861. (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
  862. ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
  863. /* clear the bit 4 of UVD_STATUS */
  864. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_STATUS), 0,
  865. ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
  866. /* force RBC into idle state */
  867. rb_bufsz = order_base_2(ring->ring_size);
  868. tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
  869. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
  870. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  871. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
  872. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
  873. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
  874. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_CNTL, tmp);
  875. /* set the write pointer delay */
  876. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_WPTR_CNTL, 0);
  877. /* set the wb address */
  878. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_RPTR_ADDR,
  879. (upper_32_bits(ring->gpu_addr) >> 2));
  880. /* programm the RB_BASE for ring buffer */
  881. WREG32_SOC15(UVD, k, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
  882. lower_32_bits(ring->gpu_addr));
  883. WREG32_SOC15(UVD, k, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
  884. upper_32_bits(ring->gpu_addr));
  885. /* Initialize the ring buffer's read and write pointers */
  886. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_RPTR, 0);
  887. ring->wptr = RREG32_SOC15(UVD, k, mmUVD_RBC_RB_RPTR);
  888. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_WPTR,
  889. lower_32_bits(ring->wptr));
  890. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_RBC_RB_CNTL), 0,
  891. ~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);
  892. ring = &adev->uvd.inst[k].ring_enc[0];
  893. WREG32_SOC15(UVD, k, mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
  894. WREG32_SOC15(UVD, k, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
  895. WREG32_SOC15(UVD, k, mmUVD_RB_BASE_LO, ring->gpu_addr);
  896. WREG32_SOC15(UVD, k, mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
  897. WREG32_SOC15(UVD, k, mmUVD_RB_SIZE, ring->ring_size / 4);
  898. ring = &adev->uvd.inst[k].ring_enc[1];
  899. WREG32_SOC15(UVD, k, mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
  900. WREG32_SOC15(UVD, k, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
  901. WREG32_SOC15(UVD, k, mmUVD_RB_BASE_LO2, ring->gpu_addr);
  902. WREG32_SOC15(UVD, k, mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
  903. WREG32_SOC15(UVD, k, mmUVD_RB_SIZE2, ring->ring_size / 4);
  904. }
  905. return 0;
  906. }
  907. /**
  908. * uvd_v7_0_stop - stop UVD block
  909. *
  910. * @adev: amdgpu_device pointer
  911. *
  912. * stop the UVD block
  913. */
  914. static void uvd_v7_0_stop(struct amdgpu_device *adev)
  915. {
  916. uint8_t i = 0;
  917. for (i = 0; i < adev->uvd.num_uvd_inst; ++i) {
  918. /* force RBC into idle state */
  919. WREG32_SOC15(UVD, i, mmUVD_RBC_RB_CNTL, 0x11010101);
  920. /* Stall UMC and register bus before resetting VCPU */
  921. WREG32_P(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL2),
  922. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  923. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  924. mdelay(1);
  925. /* put VCPU into reset */
  926. WREG32_SOC15(UVD, i, mmUVD_SOFT_RESET,
  927. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  928. mdelay(5);
  929. /* disable VCPU clock */
  930. WREG32_SOC15(UVD, i, mmUVD_VCPU_CNTL, 0x0);
  931. /* Unstall UMC and register bus */
  932. WREG32_P(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL2), 0,
  933. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  934. }
  935. }
  936. /**
  937. * uvd_v7_0_ring_emit_fence - emit an fence & trap command
  938. *
  939. * @ring: amdgpu_ring pointer
  940. * @fence: fence to emit
  941. *
  942. * Write a fence and a trap command to the ring.
  943. */
  944. static void uvd_v7_0_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
  945. unsigned flags)
  946. {
  947. struct amdgpu_device *adev = ring->adev;
  948. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  949. amdgpu_ring_write(ring,
  950. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_CONTEXT_ID), 0));
  951. amdgpu_ring_write(ring, seq);
  952. amdgpu_ring_write(ring,
  953. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA0), 0));
  954. amdgpu_ring_write(ring, addr & 0xffffffff);
  955. amdgpu_ring_write(ring,
  956. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA1), 0));
  957. amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
  958. amdgpu_ring_write(ring,
  959. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_CMD), 0));
  960. amdgpu_ring_write(ring, 0);
  961. amdgpu_ring_write(ring,
  962. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA0), 0));
  963. amdgpu_ring_write(ring, 0);
  964. amdgpu_ring_write(ring,
  965. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA1), 0));
  966. amdgpu_ring_write(ring, 0);
  967. amdgpu_ring_write(ring,
  968. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_CMD), 0));
  969. amdgpu_ring_write(ring, 2);
  970. }
  971. /**
  972. * uvd_v7_0_enc_ring_emit_fence - emit an enc fence & trap command
  973. *
  974. * @ring: amdgpu_ring pointer
  975. * @fence: fence to emit
  976. *
  977. * Write enc a fence and a trap command to the ring.
  978. */
  979. static void uvd_v7_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
  980. u64 seq, unsigned flags)
  981. {
  982. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  983. amdgpu_ring_write(ring, HEVC_ENC_CMD_FENCE);
  984. amdgpu_ring_write(ring, addr);
  985. amdgpu_ring_write(ring, upper_32_bits(addr));
  986. amdgpu_ring_write(ring, seq);
  987. amdgpu_ring_write(ring, HEVC_ENC_CMD_TRAP);
  988. }
  989. /**
  990. * uvd_v7_0_ring_emit_hdp_flush - skip HDP flushing
  991. *
  992. * @ring: amdgpu_ring pointer
  993. */
  994. static void uvd_v7_0_ring_emit_hdp_flush(struct amdgpu_ring *ring)
  995. {
  996. /* The firmware doesn't seem to like touching registers at this point. */
  997. }
  998. /**
  999. * uvd_v7_0_ring_test_ring - register write test
  1000. *
  1001. * @ring: amdgpu_ring pointer
  1002. *
  1003. * Test if we can successfully write to the context register
  1004. */
  1005. static int uvd_v7_0_ring_test_ring(struct amdgpu_ring *ring)
  1006. {
  1007. struct amdgpu_device *adev = ring->adev;
  1008. uint32_t tmp = 0;
  1009. unsigned i;
  1010. int r;
  1011. WREG32_SOC15(UVD, ring->me, mmUVD_CONTEXT_ID, 0xCAFEDEAD);
  1012. r = amdgpu_ring_alloc(ring, 3);
  1013. if (r) {
  1014. DRM_ERROR("amdgpu: (%d)cp failed to lock ring %d (%d).\n",
  1015. ring->me, ring->idx, r);
  1016. return r;
  1017. }
  1018. amdgpu_ring_write(ring,
  1019. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_CONTEXT_ID), 0));
  1020. amdgpu_ring_write(ring, 0xDEADBEEF);
  1021. amdgpu_ring_commit(ring);
  1022. for (i = 0; i < adev->usec_timeout; i++) {
  1023. tmp = RREG32_SOC15(UVD, ring->me, mmUVD_CONTEXT_ID);
  1024. if (tmp == 0xDEADBEEF)
  1025. break;
  1026. DRM_UDELAY(1);
  1027. }
  1028. if (i < adev->usec_timeout) {
  1029. DRM_DEBUG("(%d)ring test on %d succeeded in %d usecs\n",
  1030. ring->me, ring->idx, i);
  1031. } else {
  1032. DRM_ERROR("(%d)amdgpu: ring %d test failed (0x%08X)\n",
  1033. ring->me, ring->idx, tmp);
  1034. r = -EINVAL;
  1035. }
  1036. return r;
  1037. }
  1038. /**
  1039. * uvd_v7_0_ring_emit_ib - execute indirect buffer
  1040. *
  1041. * @ring: amdgpu_ring pointer
  1042. * @ib: indirect buffer to execute
  1043. *
  1044. * Write ring commands to execute the indirect buffer
  1045. */
  1046. static void uvd_v7_0_ring_emit_ib(struct amdgpu_ring *ring,
  1047. struct amdgpu_ib *ib,
  1048. unsigned vmid, bool ctx_switch)
  1049. {
  1050. struct amdgpu_device *adev = ring->adev;
  1051. amdgpu_ring_write(ring,
  1052. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_LMI_RBC_IB_VMID), 0));
  1053. amdgpu_ring_write(ring, vmid);
  1054. amdgpu_ring_write(ring,
  1055. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_LMI_RBC_IB_64BIT_BAR_LOW), 0));
  1056. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  1057. amdgpu_ring_write(ring,
  1058. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH), 0));
  1059. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  1060. amdgpu_ring_write(ring,
  1061. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_RBC_IB_SIZE), 0));
  1062. amdgpu_ring_write(ring, ib->length_dw);
  1063. }
  1064. /**
  1065. * uvd_v7_0_enc_ring_emit_ib - enc execute indirect buffer
  1066. *
  1067. * @ring: amdgpu_ring pointer
  1068. * @ib: indirect buffer to execute
  1069. *
  1070. * Write enc ring commands to execute the indirect buffer
  1071. */
  1072. static void uvd_v7_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
  1073. struct amdgpu_ib *ib, unsigned int vmid, bool ctx_switch)
  1074. {
  1075. amdgpu_ring_write(ring, HEVC_ENC_CMD_IB_VM);
  1076. amdgpu_ring_write(ring, vmid);
  1077. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  1078. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  1079. amdgpu_ring_write(ring, ib->length_dw);
  1080. }
  1081. static void uvd_v7_0_ring_emit_wreg(struct amdgpu_ring *ring,
  1082. uint32_t reg, uint32_t val)
  1083. {
  1084. struct amdgpu_device *adev = ring->adev;
  1085. amdgpu_ring_write(ring,
  1086. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA0), 0));
  1087. amdgpu_ring_write(ring, reg << 2);
  1088. amdgpu_ring_write(ring,
  1089. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA1), 0));
  1090. amdgpu_ring_write(ring, val);
  1091. amdgpu_ring_write(ring,
  1092. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_CMD), 0));
  1093. amdgpu_ring_write(ring, 8);
  1094. }
  1095. static void uvd_v7_0_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
  1096. uint32_t val, uint32_t mask)
  1097. {
  1098. struct amdgpu_device *adev = ring->adev;
  1099. amdgpu_ring_write(ring,
  1100. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA0), 0));
  1101. amdgpu_ring_write(ring, reg << 2);
  1102. amdgpu_ring_write(ring,
  1103. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA1), 0));
  1104. amdgpu_ring_write(ring, val);
  1105. amdgpu_ring_write(ring,
  1106. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GP_SCRATCH8), 0));
  1107. amdgpu_ring_write(ring, mask);
  1108. amdgpu_ring_write(ring,
  1109. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_CMD), 0));
  1110. amdgpu_ring_write(ring, 12);
  1111. }
  1112. static void uvd_v7_0_ring_emit_vm_flush(struct amdgpu_ring *ring,
  1113. unsigned vmid, uint64_t pd_addr)
  1114. {
  1115. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  1116. uint32_t data0, data1, mask;
  1117. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  1118. /* wait for reg writes */
  1119. data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
  1120. data1 = lower_32_bits(pd_addr);
  1121. mask = 0xffffffff;
  1122. uvd_v7_0_ring_emit_reg_wait(ring, data0, data1, mask);
  1123. }
  1124. static void uvd_v7_0_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
  1125. {
  1126. int i;
  1127. struct amdgpu_device *adev = ring->adev;
  1128. for (i = 0; i < count; i++)
  1129. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_NO_OP), 0));
  1130. }
  1131. static void uvd_v7_0_enc_ring_insert_end(struct amdgpu_ring *ring)
  1132. {
  1133. amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
  1134. }
  1135. static void uvd_v7_0_enc_ring_emit_reg_wait(struct amdgpu_ring *ring,
  1136. uint32_t reg, uint32_t val,
  1137. uint32_t mask)
  1138. {
  1139. amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WAIT);
  1140. amdgpu_ring_write(ring, reg << 2);
  1141. amdgpu_ring_write(ring, mask);
  1142. amdgpu_ring_write(ring, val);
  1143. }
  1144. static void uvd_v7_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
  1145. unsigned int vmid, uint64_t pd_addr)
  1146. {
  1147. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  1148. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  1149. /* wait for reg writes */
  1150. uvd_v7_0_enc_ring_emit_reg_wait(ring, hub->ctx0_ptb_addr_lo32 + vmid * 2,
  1151. lower_32_bits(pd_addr), 0xffffffff);
  1152. }
  1153. static void uvd_v7_0_enc_ring_emit_wreg(struct amdgpu_ring *ring,
  1154. uint32_t reg, uint32_t val)
  1155. {
  1156. amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WRITE);
  1157. amdgpu_ring_write(ring, reg << 2);
  1158. amdgpu_ring_write(ring, val);
  1159. }
  1160. #if 0
  1161. static bool uvd_v7_0_is_idle(void *handle)
  1162. {
  1163. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1164. return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
  1165. }
  1166. static int uvd_v7_0_wait_for_idle(void *handle)
  1167. {
  1168. unsigned i;
  1169. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1170. for (i = 0; i < adev->usec_timeout; i++) {
  1171. if (uvd_v7_0_is_idle(handle))
  1172. return 0;
  1173. }
  1174. return -ETIMEDOUT;
  1175. }
  1176. #define AMDGPU_UVD_STATUS_BUSY_MASK 0xfd
  1177. static bool uvd_v7_0_check_soft_reset(void *handle)
  1178. {
  1179. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1180. u32 srbm_soft_reset = 0;
  1181. u32 tmp = RREG32(mmSRBM_STATUS);
  1182. if (REG_GET_FIELD(tmp, SRBM_STATUS, UVD_RQ_PENDING) ||
  1183. REG_GET_FIELD(tmp, SRBM_STATUS, UVD_BUSY) ||
  1184. (RREG32_SOC15(UVD, ring->me, mmUVD_STATUS) &
  1185. AMDGPU_UVD_STATUS_BUSY_MASK))
  1186. srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset,
  1187. SRBM_SOFT_RESET, SOFT_RESET_UVD, 1);
  1188. if (srbm_soft_reset) {
  1189. adev->uvd.inst[ring->me].srbm_soft_reset = srbm_soft_reset;
  1190. return true;
  1191. } else {
  1192. adev->uvd.inst[ring->me].srbm_soft_reset = 0;
  1193. return false;
  1194. }
  1195. }
  1196. static int uvd_v7_0_pre_soft_reset(void *handle)
  1197. {
  1198. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1199. if (!adev->uvd.inst[ring->me].srbm_soft_reset)
  1200. return 0;
  1201. uvd_v7_0_stop(adev);
  1202. return 0;
  1203. }
  1204. static int uvd_v7_0_soft_reset(void *handle)
  1205. {
  1206. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1207. u32 srbm_soft_reset;
  1208. if (!adev->uvd.inst[ring->me].srbm_soft_reset)
  1209. return 0;
  1210. srbm_soft_reset = adev->uvd.inst[ring->me].srbm_soft_reset;
  1211. if (srbm_soft_reset) {
  1212. u32 tmp;
  1213. tmp = RREG32(mmSRBM_SOFT_RESET);
  1214. tmp |= srbm_soft_reset;
  1215. dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
  1216. WREG32(mmSRBM_SOFT_RESET, tmp);
  1217. tmp = RREG32(mmSRBM_SOFT_RESET);
  1218. udelay(50);
  1219. tmp &= ~srbm_soft_reset;
  1220. WREG32(mmSRBM_SOFT_RESET, tmp);
  1221. tmp = RREG32(mmSRBM_SOFT_RESET);
  1222. /* Wait a little for things to settle down */
  1223. udelay(50);
  1224. }
  1225. return 0;
  1226. }
  1227. static int uvd_v7_0_post_soft_reset(void *handle)
  1228. {
  1229. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1230. if (!adev->uvd.inst[ring->me].srbm_soft_reset)
  1231. return 0;
  1232. mdelay(5);
  1233. return uvd_v7_0_start(adev);
  1234. }
  1235. #endif
  1236. static int uvd_v7_0_set_interrupt_state(struct amdgpu_device *adev,
  1237. struct amdgpu_irq_src *source,
  1238. unsigned type,
  1239. enum amdgpu_interrupt_state state)
  1240. {
  1241. // TODO
  1242. return 0;
  1243. }
  1244. static int uvd_v7_0_process_interrupt(struct amdgpu_device *adev,
  1245. struct amdgpu_irq_src *source,
  1246. struct amdgpu_iv_entry *entry)
  1247. {
  1248. uint32_t ip_instance;
  1249. switch (entry->client_id) {
  1250. case SOC15_IH_CLIENTID_UVD:
  1251. ip_instance = 0;
  1252. break;
  1253. default:
  1254. DRM_ERROR("Unhandled client id: %d\n", entry->client_id);
  1255. return 0;
  1256. }
  1257. DRM_DEBUG("IH: UVD TRAP\n");
  1258. switch (entry->src_id) {
  1259. case 124:
  1260. amdgpu_fence_process(&adev->uvd.inst[ip_instance].ring);
  1261. break;
  1262. case 119:
  1263. amdgpu_fence_process(&adev->uvd.inst[ip_instance].ring_enc[0]);
  1264. break;
  1265. case 120:
  1266. if (!amdgpu_sriov_vf(adev))
  1267. amdgpu_fence_process(&adev->uvd.inst[ip_instance].ring_enc[1]);
  1268. break;
  1269. default:
  1270. DRM_ERROR("Unhandled interrupt: %d %d\n",
  1271. entry->src_id, entry->src_data[0]);
  1272. break;
  1273. }
  1274. return 0;
  1275. }
  1276. #if 0
  1277. static void uvd_v7_0_set_sw_clock_gating(struct amdgpu_device *adev)
  1278. {
  1279. uint32_t data, data1, data2, suvd_flags;
  1280. data = RREG32_SOC15(UVD, ring->me, mmUVD_CGC_CTRL);
  1281. data1 = RREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_GATE);
  1282. data2 = RREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_CTRL);
  1283. data &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK |
  1284. UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);
  1285. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  1286. UVD_SUVD_CGC_GATE__SIT_MASK |
  1287. UVD_SUVD_CGC_GATE__SMP_MASK |
  1288. UVD_SUVD_CGC_GATE__SCM_MASK |
  1289. UVD_SUVD_CGC_GATE__SDB_MASK;
  1290. data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
  1291. (1 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_GATE_DLY_TIMER)) |
  1292. (4 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_OFF_DELAY));
  1293. data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
  1294. UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
  1295. UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
  1296. UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
  1297. UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
  1298. UVD_CGC_CTRL__SYS_MODE_MASK |
  1299. UVD_CGC_CTRL__UDEC_MODE_MASK |
  1300. UVD_CGC_CTRL__MPEG2_MODE_MASK |
  1301. UVD_CGC_CTRL__REGS_MODE_MASK |
  1302. UVD_CGC_CTRL__RBC_MODE_MASK |
  1303. UVD_CGC_CTRL__LMI_MC_MODE_MASK |
  1304. UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
  1305. UVD_CGC_CTRL__IDCT_MODE_MASK |
  1306. UVD_CGC_CTRL__MPRD_MODE_MASK |
  1307. UVD_CGC_CTRL__MPC_MODE_MASK |
  1308. UVD_CGC_CTRL__LBSI_MODE_MASK |
  1309. UVD_CGC_CTRL__LRBBM_MODE_MASK |
  1310. UVD_CGC_CTRL__WCB_MODE_MASK |
  1311. UVD_CGC_CTRL__VCPU_MODE_MASK |
  1312. UVD_CGC_CTRL__JPEG_MODE_MASK |
  1313. UVD_CGC_CTRL__JPEG2_MODE_MASK |
  1314. UVD_CGC_CTRL__SCPU_MODE_MASK);
  1315. data2 &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK |
  1316. UVD_SUVD_CGC_CTRL__SIT_MODE_MASK |
  1317. UVD_SUVD_CGC_CTRL__SMP_MODE_MASK |
  1318. UVD_SUVD_CGC_CTRL__SCM_MODE_MASK |
  1319. UVD_SUVD_CGC_CTRL__SDB_MODE_MASK);
  1320. data1 |= suvd_flags;
  1321. WREG32_SOC15(UVD, ring->me, mmUVD_CGC_CTRL, data);
  1322. WREG32_SOC15(UVD, ring->me, mmUVD_CGC_GATE, 0);
  1323. WREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_GATE, data1);
  1324. WREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_CTRL, data2);
  1325. }
  1326. static void uvd_v7_0_set_hw_clock_gating(struct amdgpu_device *adev)
  1327. {
  1328. uint32_t data, data1, cgc_flags, suvd_flags;
  1329. data = RREG32_SOC15(UVD, ring->me, mmUVD_CGC_GATE);
  1330. data1 = RREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_GATE);
  1331. cgc_flags = UVD_CGC_GATE__SYS_MASK |
  1332. UVD_CGC_GATE__UDEC_MASK |
  1333. UVD_CGC_GATE__MPEG2_MASK |
  1334. UVD_CGC_GATE__RBC_MASK |
  1335. UVD_CGC_GATE__LMI_MC_MASK |
  1336. UVD_CGC_GATE__IDCT_MASK |
  1337. UVD_CGC_GATE__MPRD_MASK |
  1338. UVD_CGC_GATE__MPC_MASK |
  1339. UVD_CGC_GATE__LBSI_MASK |
  1340. UVD_CGC_GATE__LRBBM_MASK |
  1341. UVD_CGC_GATE__UDEC_RE_MASK |
  1342. UVD_CGC_GATE__UDEC_CM_MASK |
  1343. UVD_CGC_GATE__UDEC_IT_MASK |
  1344. UVD_CGC_GATE__UDEC_DB_MASK |
  1345. UVD_CGC_GATE__UDEC_MP_MASK |
  1346. UVD_CGC_GATE__WCB_MASK |
  1347. UVD_CGC_GATE__VCPU_MASK |
  1348. UVD_CGC_GATE__SCPU_MASK |
  1349. UVD_CGC_GATE__JPEG_MASK |
  1350. UVD_CGC_GATE__JPEG2_MASK;
  1351. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  1352. UVD_SUVD_CGC_GATE__SIT_MASK |
  1353. UVD_SUVD_CGC_GATE__SMP_MASK |
  1354. UVD_SUVD_CGC_GATE__SCM_MASK |
  1355. UVD_SUVD_CGC_GATE__SDB_MASK;
  1356. data |= cgc_flags;
  1357. data1 |= suvd_flags;
  1358. WREG32_SOC15(UVD, ring->me, mmUVD_CGC_GATE, data);
  1359. WREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_GATE, data1);
  1360. }
  1361. static void uvd_v7_0_set_bypass_mode(struct amdgpu_device *adev, bool enable)
  1362. {
  1363. u32 tmp = RREG32_SMC(ixGCK_DFS_BYPASS_CNTL);
  1364. if (enable)
  1365. tmp |= (GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
  1366. GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
  1367. else
  1368. tmp &= ~(GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
  1369. GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
  1370. WREG32_SMC(ixGCK_DFS_BYPASS_CNTL, tmp);
  1371. }
  1372. static int uvd_v7_0_set_clockgating_state(void *handle,
  1373. enum amd_clockgating_state state)
  1374. {
  1375. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1376. bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
  1377. uvd_v7_0_set_bypass_mode(adev, enable);
  1378. if (!(adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG))
  1379. return 0;
  1380. if (enable) {
  1381. /* disable HW gating and enable Sw gating */
  1382. uvd_v7_0_set_sw_clock_gating(adev);
  1383. } else {
  1384. /* wait for STATUS to clear */
  1385. if (uvd_v7_0_wait_for_idle(handle))
  1386. return -EBUSY;
  1387. /* enable HW gates because UVD is idle */
  1388. /* uvd_v7_0_set_hw_clock_gating(adev); */
  1389. }
  1390. return 0;
  1391. }
  1392. static int uvd_v7_0_set_powergating_state(void *handle,
  1393. enum amd_powergating_state state)
  1394. {
  1395. /* This doesn't actually powergate the UVD block.
  1396. * That's done in the dpm code via the SMC. This
  1397. * just re-inits the block as necessary. The actual
  1398. * gating still happens in the dpm code. We should
  1399. * revisit this when there is a cleaner line between
  1400. * the smc and the hw blocks
  1401. */
  1402. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1403. if (!(adev->pg_flags & AMD_PG_SUPPORT_UVD))
  1404. return 0;
  1405. WREG32_SOC15(UVD, ring->me, mmUVD_POWER_STATUS, UVD_POWER_STATUS__UVD_PG_EN_MASK);
  1406. if (state == AMD_PG_STATE_GATE) {
  1407. uvd_v7_0_stop(adev);
  1408. return 0;
  1409. } else {
  1410. return uvd_v7_0_start(adev);
  1411. }
  1412. }
  1413. #endif
  1414. static int uvd_v7_0_set_clockgating_state(void *handle,
  1415. enum amd_clockgating_state state)
  1416. {
  1417. /* needed for driver unload*/
  1418. return 0;
  1419. }
  1420. const struct amd_ip_funcs uvd_v7_0_ip_funcs = {
  1421. .name = "uvd_v7_0",
  1422. .early_init = uvd_v7_0_early_init,
  1423. .late_init = NULL,
  1424. .sw_init = uvd_v7_0_sw_init,
  1425. .sw_fini = uvd_v7_0_sw_fini,
  1426. .hw_init = uvd_v7_0_hw_init,
  1427. .hw_fini = uvd_v7_0_hw_fini,
  1428. .suspend = uvd_v7_0_suspend,
  1429. .resume = uvd_v7_0_resume,
  1430. .is_idle = NULL /* uvd_v7_0_is_idle */,
  1431. .wait_for_idle = NULL /* uvd_v7_0_wait_for_idle */,
  1432. .check_soft_reset = NULL /* uvd_v7_0_check_soft_reset */,
  1433. .pre_soft_reset = NULL /* uvd_v7_0_pre_soft_reset */,
  1434. .soft_reset = NULL /* uvd_v7_0_soft_reset */,
  1435. .post_soft_reset = NULL /* uvd_v7_0_post_soft_reset */,
  1436. .set_clockgating_state = uvd_v7_0_set_clockgating_state,
  1437. .set_powergating_state = NULL /* uvd_v7_0_set_powergating_state */,
  1438. };
  1439. static const struct amdgpu_ring_funcs uvd_v7_0_ring_vm_funcs = {
  1440. .type = AMDGPU_RING_TYPE_UVD,
  1441. .align_mask = 0xf,
  1442. .nop = PACKET0(0x81ff, 0),
  1443. .support_64bit_ptrs = false,
  1444. .vmhub = AMDGPU_MMHUB,
  1445. .get_rptr = uvd_v7_0_ring_get_rptr,
  1446. .get_wptr = uvd_v7_0_ring_get_wptr,
  1447. .set_wptr = uvd_v7_0_ring_set_wptr,
  1448. .emit_frame_size =
  1449. 6 + /* hdp invalidate */
  1450. SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
  1451. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
  1452. 8 + /* uvd_v7_0_ring_emit_vm_flush */
  1453. 14 + 14, /* uvd_v7_0_ring_emit_fence x2 vm fence */
  1454. .emit_ib_size = 8, /* uvd_v7_0_ring_emit_ib */
  1455. .emit_ib = uvd_v7_0_ring_emit_ib,
  1456. .emit_fence = uvd_v7_0_ring_emit_fence,
  1457. .emit_vm_flush = uvd_v7_0_ring_emit_vm_flush,
  1458. .emit_hdp_flush = uvd_v7_0_ring_emit_hdp_flush,
  1459. .test_ring = uvd_v7_0_ring_test_ring,
  1460. .test_ib = amdgpu_uvd_ring_test_ib,
  1461. .insert_nop = uvd_v7_0_ring_insert_nop,
  1462. .pad_ib = amdgpu_ring_generic_pad_ib,
  1463. .begin_use = amdgpu_uvd_ring_begin_use,
  1464. .end_use = amdgpu_uvd_ring_end_use,
  1465. .emit_wreg = uvd_v7_0_ring_emit_wreg,
  1466. .emit_reg_wait = uvd_v7_0_ring_emit_reg_wait,
  1467. .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
  1468. };
  1469. static const struct amdgpu_ring_funcs uvd_v7_0_enc_ring_vm_funcs = {
  1470. .type = AMDGPU_RING_TYPE_UVD_ENC,
  1471. .align_mask = 0x3f,
  1472. .nop = HEVC_ENC_CMD_NO_OP,
  1473. .support_64bit_ptrs = false,
  1474. .vmhub = AMDGPU_MMHUB,
  1475. .get_rptr = uvd_v7_0_enc_ring_get_rptr,
  1476. .get_wptr = uvd_v7_0_enc_ring_get_wptr,
  1477. .set_wptr = uvd_v7_0_enc_ring_set_wptr,
  1478. .emit_frame_size =
  1479. 3 + 3 + /* hdp flush / invalidate */
  1480. SOC15_FLUSH_GPU_TLB_NUM_WREG * 3 +
  1481. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 4 +
  1482. 4 + /* uvd_v7_0_enc_ring_emit_vm_flush */
  1483. 5 + 5 + /* uvd_v7_0_enc_ring_emit_fence x2 vm fence */
  1484. 1, /* uvd_v7_0_enc_ring_insert_end */
  1485. .emit_ib_size = 5, /* uvd_v7_0_enc_ring_emit_ib */
  1486. .emit_ib = uvd_v7_0_enc_ring_emit_ib,
  1487. .emit_fence = uvd_v7_0_enc_ring_emit_fence,
  1488. .emit_vm_flush = uvd_v7_0_enc_ring_emit_vm_flush,
  1489. .test_ring = uvd_v7_0_enc_ring_test_ring,
  1490. .test_ib = uvd_v7_0_enc_ring_test_ib,
  1491. .insert_nop = amdgpu_ring_insert_nop,
  1492. .insert_end = uvd_v7_0_enc_ring_insert_end,
  1493. .pad_ib = amdgpu_ring_generic_pad_ib,
  1494. .begin_use = amdgpu_uvd_ring_begin_use,
  1495. .end_use = amdgpu_uvd_ring_end_use,
  1496. .emit_wreg = uvd_v7_0_enc_ring_emit_wreg,
  1497. .emit_reg_wait = uvd_v7_0_enc_ring_emit_reg_wait,
  1498. .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
  1499. };
  1500. static void uvd_v7_0_set_ring_funcs(struct amdgpu_device *adev)
  1501. {
  1502. int i;
  1503. for (i = 0; i < adev->uvd.num_uvd_inst; i++) {
  1504. adev->uvd.inst[i].ring.funcs = &uvd_v7_0_ring_vm_funcs;
  1505. adev->uvd.inst[i].ring.me = i;
  1506. DRM_INFO("UVD(%d) is enabled in VM mode\n", i);
  1507. }
  1508. }
  1509. static void uvd_v7_0_set_enc_ring_funcs(struct amdgpu_device *adev)
  1510. {
  1511. int i, j;
  1512. for (j = 0; j < adev->uvd.num_uvd_inst; j++) {
  1513. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  1514. adev->uvd.inst[j].ring_enc[i].funcs = &uvd_v7_0_enc_ring_vm_funcs;
  1515. adev->uvd.inst[j].ring_enc[i].me = j;
  1516. }
  1517. DRM_INFO("UVD(%d) ENC is enabled in VM mode\n", j);
  1518. }
  1519. }
  1520. static const struct amdgpu_irq_src_funcs uvd_v7_0_irq_funcs = {
  1521. .set = uvd_v7_0_set_interrupt_state,
  1522. .process = uvd_v7_0_process_interrupt,
  1523. };
  1524. static void uvd_v7_0_set_irq_funcs(struct amdgpu_device *adev)
  1525. {
  1526. int i;
  1527. for (i = 0; i < adev->uvd.num_uvd_inst; i++) {
  1528. adev->uvd.inst[i].irq.num_types = adev->uvd.num_enc_rings + 1;
  1529. adev->uvd.inst[i].irq.funcs = &uvd_v7_0_irq_funcs;
  1530. }
  1531. }
  1532. const struct amdgpu_ip_block_version uvd_v7_0_ip_block =
  1533. {
  1534. .type = AMD_IP_BLOCK_TYPE_UVD,
  1535. .major = 7,
  1536. .minor = 0,
  1537. .rev = 0,
  1538. .funcs = &uvd_v7_0_ip_funcs,
  1539. };