uvd_v7_0.c 53 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822
  1. /*
  2. * Copyright 2016 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include <linux/firmware.h>
  24. #include <drm/drmP.h>
  25. #include "amdgpu.h"
  26. #include "amdgpu_uvd.h"
  27. #include "soc15.h"
  28. #include "soc15d.h"
  29. #include "soc15_common.h"
  30. #include "mmsch_v1_0.h"
  31. #include "uvd/uvd_7_0_offset.h"
  32. #include "uvd/uvd_7_0_sh_mask.h"
  33. #include "vce/vce_4_0_offset.h"
  34. #include "vce/vce_4_0_default.h"
  35. #include "vce/vce_4_0_sh_mask.h"
  36. #include "nbif/nbif_6_1_offset.h"
  37. #include "hdp/hdp_4_0_offset.h"
  38. #include "mmhub/mmhub_1_0_offset.h"
  39. #include "mmhub/mmhub_1_0_sh_mask.h"
  40. #define UVD7_MAX_HW_INSTANCES_VEGA20 2
  41. static void uvd_v7_0_set_ring_funcs(struct amdgpu_device *adev);
  42. static void uvd_v7_0_set_enc_ring_funcs(struct amdgpu_device *adev);
  43. static void uvd_v7_0_set_irq_funcs(struct amdgpu_device *adev);
  44. static int uvd_v7_0_start(struct amdgpu_device *adev);
  45. static void uvd_v7_0_stop(struct amdgpu_device *adev);
  46. static int uvd_v7_0_sriov_start(struct amdgpu_device *adev);
  47. static int amdgpu_ih_clientid_uvds[] = {
  48. SOC15_IH_CLIENTID_UVD,
  49. SOC15_IH_CLIENTID_UVD1
  50. };
  51. /**
  52. * uvd_v7_0_ring_get_rptr - get read pointer
  53. *
  54. * @ring: amdgpu_ring pointer
  55. *
  56. * Returns the current hardware read pointer
  57. */
  58. static uint64_t uvd_v7_0_ring_get_rptr(struct amdgpu_ring *ring)
  59. {
  60. struct amdgpu_device *adev = ring->adev;
  61. return RREG32_SOC15(UVD, ring->me, mmUVD_RBC_RB_RPTR);
  62. }
  63. /**
  64. * uvd_v7_0_enc_ring_get_rptr - get enc read pointer
  65. *
  66. * @ring: amdgpu_ring pointer
  67. *
  68. * Returns the current hardware enc read pointer
  69. */
  70. static uint64_t uvd_v7_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
  71. {
  72. struct amdgpu_device *adev = ring->adev;
  73. if (ring == &adev->uvd.inst[ring->me].ring_enc[0])
  74. return RREG32_SOC15(UVD, ring->me, mmUVD_RB_RPTR);
  75. else
  76. return RREG32_SOC15(UVD, ring->me, mmUVD_RB_RPTR2);
  77. }
  78. /**
  79. * uvd_v7_0_ring_get_wptr - get write pointer
  80. *
  81. * @ring: amdgpu_ring pointer
  82. *
  83. * Returns the current hardware write pointer
  84. */
  85. static uint64_t uvd_v7_0_ring_get_wptr(struct amdgpu_ring *ring)
  86. {
  87. struct amdgpu_device *adev = ring->adev;
  88. return RREG32_SOC15(UVD, ring->me, mmUVD_RBC_RB_WPTR);
  89. }
  90. /**
  91. * uvd_v7_0_enc_ring_get_wptr - get enc write pointer
  92. *
  93. * @ring: amdgpu_ring pointer
  94. *
  95. * Returns the current hardware enc write pointer
  96. */
  97. static uint64_t uvd_v7_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
  98. {
  99. struct amdgpu_device *adev = ring->adev;
  100. if (ring->use_doorbell)
  101. return adev->wb.wb[ring->wptr_offs];
  102. if (ring == &adev->uvd.inst[ring->me].ring_enc[0])
  103. return RREG32_SOC15(UVD, ring->me, mmUVD_RB_WPTR);
  104. else
  105. return RREG32_SOC15(UVD, ring->me, mmUVD_RB_WPTR2);
  106. }
  107. /**
  108. * uvd_v7_0_ring_set_wptr - set write pointer
  109. *
  110. * @ring: amdgpu_ring pointer
  111. *
  112. * Commits the write pointer to the hardware
  113. */
  114. static void uvd_v7_0_ring_set_wptr(struct amdgpu_ring *ring)
  115. {
  116. struct amdgpu_device *adev = ring->adev;
  117. WREG32_SOC15(UVD, ring->me, mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
  118. }
  119. /**
  120. * uvd_v7_0_enc_ring_set_wptr - set enc write pointer
  121. *
  122. * @ring: amdgpu_ring pointer
  123. *
  124. * Commits the enc write pointer to the hardware
  125. */
  126. static void uvd_v7_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
  127. {
  128. struct amdgpu_device *adev = ring->adev;
  129. if (ring->use_doorbell) {
  130. /* XXX check if swapping is necessary on BE */
  131. adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
  132. WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
  133. return;
  134. }
  135. if (ring == &adev->uvd.inst[ring->me].ring_enc[0])
  136. WREG32_SOC15(UVD, ring->me, mmUVD_RB_WPTR,
  137. lower_32_bits(ring->wptr));
  138. else
  139. WREG32_SOC15(UVD, ring->me, mmUVD_RB_WPTR2,
  140. lower_32_bits(ring->wptr));
  141. }
  142. /**
  143. * uvd_v7_0_enc_ring_test_ring - test if UVD ENC ring is working
  144. *
  145. * @ring: the engine to test on
  146. *
  147. */
  148. static int uvd_v7_0_enc_ring_test_ring(struct amdgpu_ring *ring)
  149. {
  150. struct amdgpu_device *adev = ring->adev;
  151. uint32_t rptr = amdgpu_ring_get_rptr(ring);
  152. unsigned i;
  153. int r;
  154. if (amdgpu_sriov_vf(adev))
  155. return 0;
  156. r = amdgpu_ring_alloc(ring, 16);
  157. if (r) {
  158. DRM_ERROR("amdgpu: uvd enc failed to lock (%d)ring %d (%d).\n",
  159. ring->me, ring->idx, r);
  160. return r;
  161. }
  162. amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
  163. amdgpu_ring_commit(ring);
  164. for (i = 0; i < adev->usec_timeout; i++) {
  165. if (amdgpu_ring_get_rptr(ring) != rptr)
  166. break;
  167. DRM_UDELAY(1);
  168. }
  169. if (i < adev->usec_timeout) {
  170. DRM_DEBUG("(%d)ring test on %d succeeded in %d usecs\n",
  171. ring->me, ring->idx, i);
  172. } else {
  173. DRM_ERROR("amdgpu: (%d)ring %d test failed\n",
  174. ring->me, ring->idx);
  175. r = -ETIMEDOUT;
  176. }
  177. return r;
  178. }
  179. /**
  180. * uvd_v7_0_enc_get_create_msg - generate a UVD ENC create msg
  181. *
  182. * @adev: amdgpu_device pointer
  183. * @ring: ring we should submit the msg to
  184. * @handle: session handle to use
  185. * @fence: optional fence to return
  186. *
  187. * Open up a stream for HW test
  188. */
  189. static int uvd_v7_0_enc_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
  190. struct dma_fence **fence)
  191. {
  192. const unsigned ib_size_dw = 16;
  193. struct amdgpu_job *job;
  194. struct amdgpu_ib *ib;
  195. struct dma_fence *f = NULL;
  196. uint64_t dummy;
  197. int i, r;
  198. r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
  199. if (r)
  200. return r;
  201. ib = &job->ibs[0];
  202. dummy = ib->gpu_addr + 1024;
  203. ib->length_dw = 0;
  204. ib->ptr[ib->length_dw++] = 0x00000018;
  205. ib->ptr[ib->length_dw++] = 0x00000001; /* session info */
  206. ib->ptr[ib->length_dw++] = handle;
  207. ib->ptr[ib->length_dw++] = 0x00000000;
  208. ib->ptr[ib->length_dw++] = upper_32_bits(dummy);
  209. ib->ptr[ib->length_dw++] = dummy;
  210. ib->ptr[ib->length_dw++] = 0x00000014;
  211. ib->ptr[ib->length_dw++] = 0x00000002; /* task info */
  212. ib->ptr[ib->length_dw++] = 0x0000001c;
  213. ib->ptr[ib->length_dw++] = 0x00000000;
  214. ib->ptr[ib->length_dw++] = 0x00000000;
  215. ib->ptr[ib->length_dw++] = 0x00000008;
  216. ib->ptr[ib->length_dw++] = 0x08000001; /* op initialize */
  217. for (i = ib->length_dw; i < ib_size_dw; ++i)
  218. ib->ptr[i] = 0x0;
  219. r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
  220. job->fence = dma_fence_get(f);
  221. if (r)
  222. goto err;
  223. amdgpu_job_free(job);
  224. if (fence)
  225. *fence = dma_fence_get(f);
  226. dma_fence_put(f);
  227. return 0;
  228. err:
  229. amdgpu_job_free(job);
  230. return r;
  231. }
  232. /**
  233. * uvd_v7_0_enc_get_destroy_msg - generate a UVD ENC destroy msg
  234. *
  235. * @adev: amdgpu_device pointer
  236. * @ring: ring we should submit the msg to
  237. * @handle: session handle to use
  238. * @fence: optional fence to return
  239. *
  240. * Close up a stream for HW test or if userspace failed to do so
  241. */
  242. int uvd_v7_0_enc_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle,
  243. bool direct, struct dma_fence **fence)
  244. {
  245. const unsigned ib_size_dw = 16;
  246. struct amdgpu_job *job;
  247. struct amdgpu_ib *ib;
  248. struct dma_fence *f = NULL;
  249. uint64_t dummy;
  250. int i, r;
  251. r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
  252. if (r)
  253. return r;
  254. ib = &job->ibs[0];
  255. dummy = ib->gpu_addr + 1024;
  256. ib->length_dw = 0;
  257. ib->ptr[ib->length_dw++] = 0x00000018;
  258. ib->ptr[ib->length_dw++] = 0x00000001;
  259. ib->ptr[ib->length_dw++] = handle;
  260. ib->ptr[ib->length_dw++] = 0x00000000;
  261. ib->ptr[ib->length_dw++] = upper_32_bits(dummy);
  262. ib->ptr[ib->length_dw++] = dummy;
  263. ib->ptr[ib->length_dw++] = 0x00000014;
  264. ib->ptr[ib->length_dw++] = 0x00000002;
  265. ib->ptr[ib->length_dw++] = 0x0000001c;
  266. ib->ptr[ib->length_dw++] = 0x00000000;
  267. ib->ptr[ib->length_dw++] = 0x00000000;
  268. ib->ptr[ib->length_dw++] = 0x00000008;
  269. ib->ptr[ib->length_dw++] = 0x08000002; /* op close session */
  270. for (i = ib->length_dw; i < ib_size_dw; ++i)
  271. ib->ptr[i] = 0x0;
  272. if (direct) {
  273. r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
  274. job->fence = dma_fence_get(f);
  275. if (r)
  276. goto err;
  277. amdgpu_job_free(job);
  278. } else {
  279. r = amdgpu_job_submit(job, ring, &ring->adev->vce.entity,
  280. AMDGPU_FENCE_OWNER_UNDEFINED, &f);
  281. if (r)
  282. goto err;
  283. }
  284. if (fence)
  285. *fence = dma_fence_get(f);
  286. dma_fence_put(f);
  287. return 0;
  288. err:
  289. amdgpu_job_free(job);
  290. return r;
  291. }
  292. /**
  293. * uvd_v7_0_enc_ring_test_ib - test if UVD ENC IBs are working
  294. *
  295. * @ring: the engine to test on
  296. *
  297. */
  298. static int uvd_v7_0_enc_ring_test_ib(struct amdgpu_ring *ring, long timeout)
  299. {
  300. struct dma_fence *fence = NULL;
  301. long r;
  302. r = uvd_v7_0_enc_get_create_msg(ring, 1, NULL);
  303. if (r) {
  304. DRM_ERROR("amdgpu: (%d)failed to get create msg (%ld).\n", ring->me, r);
  305. goto error;
  306. }
  307. r = uvd_v7_0_enc_get_destroy_msg(ring, 1, true, &fence);
  308. if (r) {
  309. DRM_ERROR("amdgpu: (%d)failed to get destroy ib (%ld).\n", ring->me, r);
  310. goto error;
  311. }
  312. r = dma_fence_wait_timeout(fence, false, timeout);
  313. if (r == 0) {
  314. DRM_ERROR("amdgpu: (%d)IB test timed out.\n", ring->me);
  315. r = -ETIMEDOUT;
  316. } else if (r < 0) {
  317. DRM_ERROR("amdgpu: (%d)fence wait failed (%ld).\n", ring->me, r);
  318. } else {
  319. DRM_DEBUG("ib test on (%d)ring %d succeeded\n", ring->me, ring->idx);
  320. r = 0;
  321. }
  322. error:
  323. dma_fence_put(fence);
  324. return r;
  325. }
  326. static int uvd_v7_0_early_init(void *handle)
  327. {
  328. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  329. if (adev->asic_type == CHIP_VEGA20)
  330. adev->uvd.num_uvd_inst = UVD7_MAX_HW_INSTANCES_VEGA20;
  331. else
  332. adev->uvd.num_uvd_inst = 1;
  333. if (amdgpu_sriov_vf(adev))
  334. adev->uvd.num_enc_rings = 1;
  335. else
  336. adev->uvd.num_enc_rings = 2;
  337. uvd_v7_0_set_ring_funcs(adev);
  338. uvd_v7_0_set_enc_ring_funcs(adev);
  339. uvd_v7_0_set_irq_funcs(adev);
  340. return 0;
  341. }
  342. static int uvd_v7_0_sw_init(void *handle)
  343. {
  344. struct amdgpu_ring *ring;
  345. struct drm_sched_rq *rq;
  346. int i, j, r;
  347. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  348. for (j = 0; j < adev->uvd.num_uvd_inst; j++) {
  349. /* UVD TRAP */
  350. r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_uvds[j], 124, &adev->uvd.inst[j].irq);
  351. if (r)
  352. return r;
  353. /* UVD ENC TRAP */
  354. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  355. r = amdgpu_irq_add_id(adev, amdgpu_ih_clientid_uvds[j], i + 119, &adev->uvd.inst[j].irq);
  356. if (r)
  357. return r;
  358. }
  359. }
  360. r = amdgpu_uvd_sw_init(adev);
  361. if (r)
  362. return r;
  363. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  364. const struct common_firmware_header *hdr;
  365. hdr = (const struct common_firmware_header *)adev->uvd.fw->data;
  366. adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].ucode_id = AMDGPU_UCODE_ID_UVD;
  367. adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].fw = adev->uvd.fw;
  368. adev->firmware.fw_size +=
  369. ALIGN(le32_to_cpu(hdr->ucode_size_bytes), PAGE_SIZE);
  370. DRM_INFO("PSP loading UVD firmware\n");
  371. }
  372. for (j = 0; j < adev->uvd.num_uvd_inst; j++) {
  373. ring = &adev->uvd.inst[j].ring_enc[0];
  374. rq = &ring->sched.sched_rq[DRM_SCHED_PRIORITY_NORMAL];
  375. r = drm_sched_entity_init(&ring->sched, &adev->uvd.inst[j].entity_enc,
  376. rq, NULL);
  377. if (r) {
  378. DRM_ERROR("(%d)Failed setting up UVD ENC run queue.\n", j);
  379. return r;
  380. }
  381. }
  382. r = amdgpu_uvd_resume(adev);
  383. if (r)
  384. return r;
  385. for (j = 0; j < adev->uvd.num_uvd_inst; j++) {
  386. if (!amdgpu_sriov_vf(adev)) {
  387. ring = &adev->uvd.inst[j].ring;
  388. sprintf(ring->name, "uvd<%d>", j);
  389. r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.inst[j].irq, 0);
  390. if (r)
  391. return r;
  392. }
  393. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  394. ring = &adev->uvd.inst[j].ring_enc[i];
  395. sprintf(ring->name, "uvd_enc%d<%d>", i, j);
  396. if (amdgpu_sriov_vf(adev)) {
  397. ring->use_doorbell = true;
  398. /* currently only use the first enconding ring for
  399. * sriov, so set unused location for other unused rings.
  400. */
  401. if (i == 0)
  402. ring->doorbell_index = AMDGPU_DOORBELL64_UVD_RING0_1 * 2;
  403. else
  404. ring->doorbell_index = AMDGPU_DOORBELL64_UVD_RING2_3 * 2 + 1;
  405. }
  406. r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.inst[j].irq, 0);
  407. if (r)
  408. return r;
  409. }
  410. }
  411. r = amdgpu_virt_alloc_mm_table(adev);
  412. if (r)
  413. return r;
  414. return r;
  415. }
  416. static int uvd_v7_0_sw_fini(void *handle)
  417. {
  418. int i, j, r;
  419. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  420. amdgpu_virt_free_mm_table(adev);
  421. r = amdgpu_uvd_suspend(adev);
  422. if (r)
  423. return r;
  424. for (j = 0; j < adev->uvd.num_uvd_inst; ++j) {
  425. drm_sched_entity_fini(&adev->uvd.inst[j].ring_enc[0].sched, &adev->uvd.inst[j].entity_enc);
  426. for (i = 0; i < adev->uvd.num_enc_rings; ++i)
  427. amdgpu_ring_fini(&adev->uvd.inst[j].ring_enc[i]);
  428. }
  429. return amdgpu_uvd_sw_fini(adev);
  430. }
  431. /**
  432. * uvd_v7_0_hw_init - start and test UVD block
  433. *
  434. * @adev: amdgpu_device pointer
  435. *
  436. * Initialize the hardware, boot up the VCPU and do some testing
  437. */
  438. static int uvd_v7_0_hw_init(void *handle)
  439. {
  440. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  441. struct amdgpu_ring *ring;
  442. uint32_t tmp;
  443. int i, j, r;
  444. if (amdgpu_sriov_vf(adev))
  445. r = uvd_v7_0_sriov_start(adev);
  446. else
  447. r = uvd_v7_0_start(adev);
  448. if (r)
  449. goto done;
  450. for (j = 0; j < adev->uvd.num_uvd_inst; ++j) {
  451. ring = &adev->uvd.inst[j].ring;
  452. if (!amdgpu_sriov_vf(adev)) {
  453. ring->ready = true;
  454. r = amdgpu_ring_test_ring(ring);
  455. if (r) {
  456. ring->ready = false;
  457. goto done;
  458. }
  459. r = amdgpu_ring_alloc(ring, 10);
  460. if (r) {
  461. DRM_ERROR("amdgpu: (%d)ring failed to lock UVD ring (%d).\n", j, r);
  462. goto done;
  463. }
  464. tmp = PACKET0(SOC15_REG_OFFSET(UVD, j,
  465. mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL), 0);
  466. amdgpu_ring_write(ring, tmp);
  467. amdgpu_ring_write(ring, 0xFFFFF);
  468. tmp = PACKET0(SOC15_REG_OFFSET(UVD, j,
  469. mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL), 0);
  470. amdgpu_ring_write(ring, tmp);
  471. amdgpu_ring_write(ring, 0xFFFFF);
  472. tmp = PACKET0(SOC15_REG_OFFSET(UVD, j,
  473. mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL), 0);
  474. amdgpu_ring_write(ring, tmp);
  475. amdgpu_ring_write(ring, 0xFFFFF);
  476. /* Clear timeout status bits */
  477. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, j,
  478. mmUVD_SEMA_TIMEOUT_STATUS), 0));
  479. amdgpu_ring_write(ring, 0x8);
  480. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, j,
  481. mmUVD_SEMA_CNTL), 0));
  482. amdgpu_ring_write(ring, 3);
  483. amdgpu_ring_commit(ring);
  484. }
  485. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  486. ring = &adev->uvd.inst[j].ring_enc[i];
  487. ring->ready = true;
  488. r = amdgpu_ring_test_ring(ring);
  489. if (r) {
  490. ring->ready = false;
  491. goto done;
  492. }
  493. }
  494. }
  495. done:
  496. if (!r)
  497. DRM_INFO("UVD and UVD ENC initialized successfully.\n");
  498. return r;
  499. }
  500. /**
  501. * uvd_v7_0_hw_fini - stop the hardware block
  502. *
  503. * @adev: amdgpu_device pointer
  504. *
  505. * Stop the UVD block, mark ring as not ready any more
  506. */
  507. static int uvd_v7_0_hw_fini(void *handle)
  508. {
  509. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  510. int i;
  511. if (!amdgpu_sriov_vf(adev))
  512. uvd_v7_0_stop(adev);
  513. else {
  514. /* full access mode, so don't touch any UVD register */
  515. DRM_DEBUG("For SRIOV client, shouldn't do anything.\n");
  516. }
  517. for (i = 0; i < adev->uvd.num_uvd_inst; ++i)
  518. adev->uvd.inst[i].ring.ready = false;
  519. return 0;
  520. }
  521. static int uvd_v7_0_suspend(void *handle)
  522. {
  523. int r;
  524. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  525. r = uvd_v7_0_hw_fini(adev);
  526. if (r)
  527. return r;
  528. return amdgpu_uvd_suspend(adev);
  529. }
  530. static int uvd_v7_0_resume(void *handle)
  531. {
  532. int r;
  533. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  534. r = amdgpu_uvd_resume(adev);
  535. if (r)
  536. return r;
  537. return uvd_v7_0_hw_init(adev);
  538. }
  539. /**
  540. * uvd_v7_0_mc_resume - memory controller programming
  541. *
  542. * @adev: amdgpu_device pointer
  543. *
  544. * Let the UVD memory controller know it's offsets
  545. */
  546. static void uvd_v7_0_mc_resume(struct amdgpu_device *adev)
  547. {
  548. uint32_t size = AMDGPU_UVD_FIRMWARE_SIZE(adev);
  549. uint32_t offset;
  550. int i;
  551. for (i = 0; i < adev->uvd.num_uvd_inst; ++i) {
  552. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  553. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  554. lower_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  555. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  556. upper_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  557. offset = 0;
  558. } else {
  559. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  560. lower_32_bits(adev->uvd.inst[i].gpu_addr));
  561. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  562. upper_32_bits(adev->uvd.inst[i].gpu_addr));
  563. offset = size;
  564. }
  565. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_OFFSET0,
  566. AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
  567. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_SIZE0, size);
  568. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW,
  569. lower_32_bits(adev->uvd.inst[i].gpu_addr + offset));
  570. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH,
  571. upper_32_bits(adev->uvd.inst[i].gpu_addr + offset));
  572. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_OFFSET1, (1 << 21));
  573. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_SIZE1, AMDGPU_UVD_HEAP_SIZE);
  574. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW,
  575. lower_32_bits(adev->uvd.inst[i].gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  576. WREG32_SOC15(UVD, i, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH,
  577. upper_32_bits(adev->uvd.inst[i].gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  578. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_OFFSET2, (2 << 21));
  579. WREG32_SOC15(UVD, i, mmUVD_VCPU_CACHE_SIZE2,
  580. AMDGPU_UVD_STACK_SIZE + (AMDGPU_UVD_SESSION_SIZE * 40));
  581. WREG32_SOC15(UVD, i, mmUVD_UDEC_ADDR_CONFIG,
  582. adev->gfx.config.gb_addr_config);
  583. WREG32_SOC15(UVD, i, mmUVD_UDEC_DB_ADDR_CONFIG,
  584. adev->gfx.config.gb_addr_config);
  585. WREG32_SOC15(UVD, i, mmUVD_UDEC_DBW_ADDR_CONFIG,
  586. adev->gfx.config.gb_addr_config);
  587. WREG32_SOC15(UVD, i, mmUVD_GP_SCRATCH4, adev->uvd.max_handles);
  588. }
  589. }
  590. static int uvd_v7_0_mmsch_start(struct amdgpu_device *adev,
  591. struct amdgpu_mm_table *table)
  592. {
  593. uint32_t data = 0, loop;
  594. uint64_t addr = table->gpu_addr;
  595. struct mmsch_v1_0_init_header *header = (struct mmsch_v1_0_init_header *)table->cpu_addr;
  596. uint32_t size;
  597. int i;
  598. size = header->header_size + header->vce_table_size + header->uvd_table_size;
  599. /* 1, write to vce_mmsch_vf_ctx_addr_lo/hi register with GPU mc addr of memory descriptor location */
  600. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_ADDR_LO, lower_32_bits(addr));
  601. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_ADDR_HI, upper_32_bits(addr));
  602. /* 2, update vmid of descriptor */
  603. data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_VMID);
  604. data &= ~VCE_MMSCH_VF_VMID__VF_CTX_VMID_MASK;
  605. data |= (0 << VCE_MMSCH_VF_VMID__VF_CTX_VMID__SHIFT); /* use domain0 for MM scheduler */
  606. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_VMID, data);
  607. /* 3, notify mmsch about the size of this descriptor */
  608. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_SIZE, size);
  609. /* 4, set resp to zero */
  610. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP, 0);
  611. for (i = 0; i < adev->uvd.num_uvd_inst; ++i) {
  612. WDOORBELL32(adev->uvd.inst[i].ring_enc[0].doorbell_index, 0);
  613. adev->wb.wb[adev->uvd.inst[i].ring_enc[0].wptr_offs] = 0;
  614. adev->uvd.inst[i].ring_enc[0].wptr = 0;
  615. adev->uvd.inst[i].ring_enc[0].wptr_old = 0;
  616. }
  617. /* 5, kick off the initialization and wait until VCE_MMSCH_VF_MAILBOX_RESP becomes non-zero */
  618. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_HOST, 0x10000001);
  619. data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP);
  620. loop = 1000;
  621. while ((data & 0x10000002) != 0x10000002) {
  622. udelay(10);
  623. data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP);
  624. loop--;
  625. if (!loop)
  626. break;
  627. }
  628. if (!loop) {
  629. dev_err(adev->dev, "failed to init MMSCH, mmVCE_MMSCH_VF_MAILBOX_RESP = %x\n", data);
  630. return -EBUSY;
  631. }
  632. return 0;
  633. }
  634. static int uvd_v7_0_sriov_start(struct amdgpu_device *adev)
  635. {
  636. struct amdgpu_ring *ring;
  637. uint32_t offset, size, tmp;
  638. uint32_t table_size = 0;
  639. struct mmsch_v1_0_cmd_direct_write direct_wt = { {0} };
  640. struct mmsch_v1_0_cmd_direct_read_modify_write direct_rd_mod_wt = { {0} };
  641. struct mmsch_v1_0_cmd_direct_polling direct_poll = { {0} };
  642. struct mmsch_v1_0_cmd_end end = { {0} };
  643. uint32_t *init_table = adev->virt.mm_table.cpu_addr;
  644. struct mmsch_v1_0_init_header *header = (struct mmsch_v1_0_init_header *)init_table;
  645. uint8_t i = 0;
  646. direct_wt.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_WRITE;
  647. direct_rd_mod_wt.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_READ_MODIFY_WRITE;
  648. direct_poll.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_POLLING;
  649. end.cmd_header.command_type = MMSCH_COMMAND__END;
  650. if (header->uvd_table_offset == 0 && header->uvd_table_size == 0) {
  651. header->version = MMSCH_VERSION;
  652. header->header_size = sizeof(struct mmsch_v1_0_init_header) >> 2;
  653. if (header->vce_table_offset == 0 && header->vce_table_size == 0)
  654. header->uvd_table_offset = header->header_size;
  655. else
  656. header->uvd_table_offset = header->vce_table_size + header->vce_table_offset;
  657. init_table += header->uvd_table_offset;
  658. for (i = 0; i < adev->uvd.num_uvd_inst; ++i) {
  659. ring = &adev->uvd.inst[i].ring;
  660. ring->wptr = 0;
  661. size = AMDGPU_GPU_PAGE_ALIGN(adev->uvd.fw->size + 4);
  662. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_STATUS),
  663. 0xFFFFFFFF, 0x00000004);
  664. /* mc resume*/
  665. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  666. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
  667. lower_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  668. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
  669. upper_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  670. offset = 0;
  671. } else {
  672. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
  673. lower_32_bits(adev->uvd.inst[i].gpu_addr));
  674. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
  675. upper_32_bits(adev->uvd.inst[i].gpu_addr));
  676. offset = size;
  677. }
  678. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_OFFSET0),
  679. AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
  680. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_SIZE0), size);
  681. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW),
  682. lower_32_bits(adev->uvd.inst[i].gpu_addr + offset));
  683. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH),
  684. upper_32_bits(adev->uvd.inst[i].gpu_addr + offset));
  685. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_OFFSET1), (1 << 21));
  686. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_SIZE1), AMDGPU_UVD_HEAP_SIZE);
  687. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW),
  688. lower_32_bits(adev->uvd.inst[i].gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  689. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH),
  690. upper_32_bits(adev->uvd.inst[i].gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  691. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_OFFSET2), (2 << 21));
  692. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CACHE_SIZE2),
  693. AMDGPU_UVD_STACK_SIZE + (AMDGPU_UVD_SESSION_SIZE * 40));
  694. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_GP_SCRATCH4), adev->uvd.max_handles);
  695. /* mc resume end*/
  696. /* disable clock gating */
  697. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_CGC_CTRL),
  698. ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK, 0);
  699. /* disable interupt */
  700. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_MASTINT_EN),
  701. ~UVD_MASTINT_EN__VCPU_EN_MASK, 0);
  702. /* stall UMC and register bus before resetting VCPU */
  703. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL2),
  704. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  705. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  706. /* put LMI, VCPU, RBC etc... into reset */
  707. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_SOFT_RESET),
  708. (uint32_t)(UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
  709. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
  710. UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
  711. UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
  712. UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
  713. UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
  714. UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
  715. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK));
  716. /* initialize UVD memory controller */
  717. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL),
  718. (uint32_t)((0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  719. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  720. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  721. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  722. UVD_LMI_CTRL__REQ_MODE_MASK |
  723. 0x00100000L));
  724. /* take all subblocks out of reset, except VCPU */
  725. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_SOFT_RESET),
  726. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  727. /* enable VCPU clock */
  728. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_VCPU_CNTL),
  729. UVD_VCPU_CNTL__CLK_EN_MASK);
  730. /* enable master interrupt */
  731. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_MASTINT_EN),
  732. ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
  733. (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
  734. /* clear the bit 4 of UVD_STATUS */
  735. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_STATUS),
  736. ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT), 0);
  737. /* force RBC into idle state */
  738. size = order_base_2(ring->ring_size);
  739. tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, size);
  740. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  741. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_RBC_RB_CNTL), tmp);
  742. ring = &adev->uvd.inst[i].ring_enc[0];
  743. ring->wptr = 0;
  744. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_RB_BASE_LO), ring->gpu_addr);
  745. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_RB_BASE_HI), upper_32_bits(ring->gpu_addr));
  746. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_RB_SIZE), ring->ring_size / 4);
  747. /* boot up the VCPU */
  748. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_SOFT_RESET), 0);
  749. /* enable UMC */
  750. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL2),
  751. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK, 0);
  752. MMSCH_V1_0_INSERT_DIRECT_POLL(SOC15_REG_OFFSET(UVD, i, mmUVD_STATUS), 0x02, 0x02);
  753. }
  754. /* add end packet */
  755. memcpy((void *)init_table, &end, sizeof(struct mmsch_v1_0_cmd_end));
  756. table_size += sizeof(struct mmsch_v1_0_cmd_end) / 4;
  757. header->uvd_table_size = table_size;
  758. }
  759. return uvd_v7_0_mmsch_start(adev, &adev->virt.mm_table);
  760. }
  761. /**
  762. * uvd_v7_0_start - start UVD block
  763. *
  764. * @adev: amdgpu_device pointer
  765. *
  766. * Setup and start the UVD block
  767. */
  768. static int uvd_v7_0_start(struct amdgpu_device *adev)
  769. {
  770. struct amdgpu_ring *ring;
  771. uint32_t rb_bufsz, tmp;
  772. uint32_t lmi_swap_cntl;
  773. uint32_t mp_swap_cntl;
  774. int i, j, k, r;
  775. for (k = 0; k < adev->uvd.num_uvd_inst; ++k) {
  776. /* disable DPG */
  777. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_POWER_STATUS), 0,
  778. ~UVD_POWER_STATUS__UVD_PG_MODE_MASK);
  779. }
  780. /* disable byte swapping */
  781. lmi_swap_cntl = 0;
  782. mp_swap_cntl = 0;
  783. uvd_v7_0_mc_resume(adev);
  784. for (k = 0; k < adev->uvd.num_uvd_inst; ++k) {
  785. ring = &adev->uvd.inst[k].ring;
  786. /* disable clock gating */
  787. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_CGC_CTRL), 0,
  788. ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK);
  789. /* disable interupt */
  790. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_MASTINT_EN), 0,
  791. ~UVD_MASTINT_EN__VCPU_EN_MASK);
  792. /* stall UMC and register bus before resetting VCPU */
  793. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_LMI_CTRL2),
  794. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  795. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  796. mdelay(1);
  797. /* put LMI, VCPU, RBC etc... into reset */
  798. WREG32_SOC15(UVD, k, mmUVD_SOFT_RESET,
  799. UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
  800. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
  801. UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
  802. UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
  803. UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
  804. UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
  805. UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
  806. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
  807. mdelay(5);
  808. /* initialize UVD memory controller */
  809. WREG32_SOC15(UVD, k, mmUVD_LMI_CTRL,
  810. (0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  811. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  812. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  813. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  814. UVD_LMI_CTRL__REQ_MODE_MASK |
  815. 0x00100000L);
  816. #ifdef __BIG_ENDIAN
  817. /* swap (8 in 32) RB and IB */
  818. lmi_swap_cntl = 0xa;
  819. mp_swap_cntl = 0;
  820. #endif
  821. WREG32_SOC15(UVD, k, mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
  822. WREG32_SOC15(UVD, k, mmUVD_MP_SWAP_CNTL, mp_swap_cntl);
  823. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUXA0, 0x40c2040);
  824. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUXA1, 0x0);
  825. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUXB0, 0x40c2040);
  826. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUXB1, 0x0);
  827. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_ALU, 0);
  828. WREG32_SOC15(UVD, k, mmUVD_MPC_SET_MUX, 0x88);
  829. /* take all subblocks out of reset, except VCPU */
  830. WREG32_SOC15(UVD, k, mmUVD_SOFT_RESET,
  831. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  832. mdelay(5);
  833. /* enable VCPU clock */
  834. WREG32_SOC15(UVD, k, mmUVD_VCPU_CNTL,
  835. UVD_VCPU_CNTL__CLK_EN_MASK);
  836. /* enable UMC */
  837. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_LMI_CTRL2), 0,
  838. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  839. /* boot up the VCPU */
  840. WREG32_SOC15(UVD, k, mmUVD_SOFT_RESET, 0);
  841. mdelay(10);
  842. for (i = 0; i < 10; ++i) {
  843. uint32_t status;
  844. for (j = 0; j < 100; ++j) {
  845. status = RREG32_SOC15(UVD, k, mmUVD_STATUS);
  846. if (status & 2)
  847. break;
  848. mdelay(10);
  849. }
  850. r = 0;
  851. if (status & 2)
  852. break;
  853. DRM_ERROR("UVD(%d) not responding, trying to reset the VCPU!!!\n", k);
  854. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_SOFT_RESET),
  855. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
  856. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  857. mdelay(10);
  858. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_SOFT_RESET), 0,
  859. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  860. mdelay(10);
  861. r = -1;
  862. }
  863. if (r) {
  864. DRM_ERROR("UVD(%d) not responding, giving up!!!\n", k);
  865. return r;
  866. }
  867. /* enable master interrupt */
  868. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_MASTINT_EN),
  869. (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
  870. ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
  871. /* clear the bit 4 of UVD_STATUS */
  872. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_STATUS), 0,
  873. ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
  874. /* force RBC into idle state */
  875. rb_bufsz = order_base_2(ring->ring_size);
  876. tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
  877. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
  878. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  879. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
  880. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
  881. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
  882. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_CNTL, tmp);
  883. /* set the write pointer delay */
  884. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_WPTR_CNTL, 0);
  885. /* set the wb address */
  886. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_RPTR_ADDR,
  887. (upper_32_bits(ring->gpu_addr) >> 2));
  888. /* programm the RB_BASE for ring buffer */
  889. WREG32_SOC15(UVD, k, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
  890. lower_32_bits(ring->gpu_addr));
  891. WREG32_SOC15(UVD, k, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
  892. upper_32_bits(ring->gpu_addr));
  893. /* Initialize the ring buffer's read and write pointers */
  894. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_RPTR, 0);
  895. ring->wptr = RREG32_SOC15(UVD, k, mmUVD_RBC_RB_RPTR);
  896. WREG32_SOC15(UVD, k, mmUVD_RBC_RB_WPTR,
  897. lower_32_bits(ring->wptr));
  898. WREG32_P(SOC15_REG_OFFSET(UVD, k, mmUVD_RBC_RB_CNTL), 0,
  899. ~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);
  900. ring = &adev->uvd.inst[k].ring_enc[0];
  901. WREG32_SOC15(UVD, k, mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
  902. WREG32_SOC15(UVD, k, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
  903. WREG32_SOC15(UVD, k, mmUVD_RB_BASE_LO, ring->gpu_addr);
  904. WREG32_SOC15(UVD, k, mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
  905. WREG32_SOC15(UVD, k, mmUVD_RB_SIZE, ring->ring_size / 4);
  906. ring = &adev->uvd.inst[k].ring_enc[1];
  907. WREG32_SOC15(UVD, k, mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
  908. WREG32_SOC15(UVD, k, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
  909. WREG32_SOC15(UVD, k, mmUVD_RB_BASE_LO2, ring->gpu_addr);
  910. WREG32_SOC15(UVD, k, mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
  911. WREG32_SOC15(UVD, k, mmUVD_RB_SIZE2, ring->ring_size / 4);
  912. }
  913. return 0;
  914. }
  915. /**
  916. * uvd_v7_0_stop - stop UVD block
  917. *
  918. * @adev: amdgpu_device pointer
  919. *
  920. * stop the UVD block
  921. */
  922. static void uvd_v7_0_stop(struct amdgpu_device *adev)
  923. {
  924. uint8_t i = 0;
  925. for (i = 0; i < adev->uvd.num_uvd_inst; ++i) {
  926. /* force RBC into idle state */
  927. WREG32_SOC15(UVD, i, mmUVD_RBC_RB_CNTL, 0x11010101);
  928. /* Stall UMC and register bus before resetting VCPU */
  929. WREG32_P(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL2),
  930. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  931. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  932. mdelay(1);
  933. /* put VCPU into reset */
  934. WREG32_SOC15(UVD, i, mmUVD_SOFT_RESET,
  935. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  936. mdelay(5);
  937. /* disable VCPU clock */
  938. WREG32_SOC15(UVD, i, mmUVD_VCPU_CNTL, 0x0);
  939. /* Unstall UMC and register bus */
  940. WREG32_P(SOC15_REG_OFFSET(UVD, i, mmUVD_LMI_CTRL2), 0,
  941. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  942. }
  943. }
  944. /**
  945. * uvd_v7_0_ring_emit_fence - emit an fence & trap command
  946. *
  947. * @ring: amdgpu_ring pointer
  948. * @fence: fence to emit
  949. *
  950. * Write a fence and a trap command to the ring.
  951. */
  952. static void uvd_v7_0_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
  953. unsigned flags)
  954. {
  955. struct amdgpu_device *adev = ring->adev;
  956. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  957. amdgpu_ring_write(ring,
  958. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_CONTEXT_ID), 0));
  959. amdgpu_ring_write(ring, seq);
  960. amdgpu_ring_write(ring,
  961. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA0), 0));
  962. amdgpu_ring_write(ring, addr & 0xffffffff);
  963. amdgpu_ring_write(ring,
  964. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA1), 0));
  965. amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
  966. amdgpu_ring_write(ring,
  967. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_CMD), 0));
  968. amdgpu_ring_write(ring, 0);
  969. amdgpu_ring_write(ring,
  970. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA0), 0));
  971. amdgpu_ring_write(ring, 0);
  972. amdgpu_ring_write(ring,
  973. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA1), 0));
  974. amdgpu_ring_write(ring, 0);
  975. amdgpu_ring_write(ring,
  976. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_CMD), 0));
  977. amdgpu_ring_write(ring, 2);
  978. }
  979. /**
  980. * uvd_v7_0_enc_ring_emit_fence - emit an enc fence & trap command
  981. *
  982. * @ring: amdgpu_ring pointer
  983. * @fence: fence to emit
  984. *
  985. * Write enc a fence and a trap command to the ring.
  986. */
  987. static void uvd_v7_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
  988. u64 seq, unsigned flags)
  989. {
  990. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  991. amdgpu_ring_write(ring, HEVC_ENC_CMD_FENCE);
  992. amdgpu_ring_write(ring, addr);
  993. amdgpu_ring_write(ring, upper_32_bits(addr));
  994. amdgpu_ring_write(ring, seq);
  995. amdgpu_ring_write(ring, HEVC_ENC_CMD_TRAP);
  996. }
  997. /**
  998. * uvd_v7_0_ring_emit_hdp_flush - skip HDP flushing
  999. *
  1000. * @ring: amdgpu_ring pointer
  1001. */
  1002. static void uvd_v7_0_ring_emit_hdp_flush(struct amdgpu_ring *ring)
  1003. {
  1004. /* The firmware doesn't seem to like touching registers at this point. */
  1005. }
  1006. /**
  1007. * uvd_v7_0_ring_test_ring - register write test
  1008. *
  1009. * @ring: amdgpu_ring pointer
  1010. *
  1011. * Test if we can successfully write to the context register
  1012. */
  1013. static int uvd_v7_0_ring_test_ring(struct amdgpu_ring *ring)
  1014. {
  1015. struct amdgpu_device *adev = ring->adev;
  1016. uint32_t tmp = 0;
  1017. unsigned i;
  1018. int r;
  1019. WREG32_SOC15(UVD, ring->me, mmUVD_CONTEXT_ID, 0xCAFEDEAD);
  1020. r = amdgpu_ring_alloc(ring, 3);
  1021. if (r) {
  1022. DRM_ERROR("amdgpu: (%d)cp failed to lock ring %d (%d).\n",
  1023. ring->me, ring->idx, r);
  1024. return r;
  1025. }
  1026. amdgpu_ring_write(ring,
  1027. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_CONTEXT_ID), 0));
  1028. amdgpu_ring_write(ring, 0xDEADBEEF);
  1029. amdgpu_ring_commit(ring);
  1030. for (i = 0; i < adev->usec_timeout; i++) {
  1031. tmp = RREG32_SOC15(UVD, ring->me, mmUVD_CONTEXT_ID);
  1032. if (tmp == 0xDEADBEEF)
  1033. break;
  1034. DRM_UDELAY(1);
  1035. }
  1036. if (i < adev->usec_timeout) {
  1037. DRM_DEBUG("(%d)ring test on %d succeeded in %d usecs\n",
  1038. ring->me, ring->idx, i);
  1039. } else {
  1040. DRM_ERROR("(%d)amdgpu: ring %d test failed (0x%08X)\n",
  1041. ring->me, ring->idx, tmp);
  1042. r = -EINVAL;
  1043. }
  1044. return r;
  1045. }
  1046. /**
  1047. * uvd_v7_0_ring_emit_ib - execute indirect buffer
  1048. *
  1049. * @ring: amdgpu_ring pointer
  1050. * @ib: indirect buffer to execute
  1051. *
  1052. * Write ring commands to execute the indirect buffer
  1053. */
  1054. static void uvd_v7_0_ring_emit_ib(struct amdgpu_ring *ring,
  1055. struct amdgpu_ib *ib,
  1056. unsigned vmid, bool ctx_switch)
  1057. {
  1058. struct amdgpu_device *adev = ring->adev;
  1059. amdgpu_ring_write(ring,
  1060. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_LMI_RBC_IB_VMID), 0));
  1061. amdgpu_ring_write(ring, vmid);
  1062. amdgpu_ring_write(ring,
  1063. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_LMI_RBC_IB_64BIT_BAR_LOW), 0));
  1064. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  1065. amdgpu_ring_write(ring,
  1066. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH), 0));
  1067. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  1068. amdgpu_ring_write(ring,
  1069. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_RBC_IB_SIZE), 0));
  1070. amdgpu_ring_write(ring, ib->length_dw);
  1071. }
  1072. /**
  1073. * uvd_v7_0_enc_ring_emit_ib - enc execute indirect buffer
  1074. *
  1075. * @ring: amdgpu_ring pointer
  1076. * @ib: indirect buffer to execute
  1077. *
  1078. * Write enc ring commands to execute the indirect buffer
  1079. */
  1080. static void uvd_v7_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
  1081. struct amdgpu_ib *ib, unsigned int vmid, bool ctx_switch)
  1082. {
  1083. amdgpu_ring_write(ring, HEVC_ENC_CMD_IB_VM);
  1084. amdgpu_ring_write(ring, vmid);
  1085. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  1086. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  1087. amdgpu_ring_write(ring, ib->length_dw);
  1088. }
  1089. static void uvd_v7_0_ring_emit_wreg(struct amdgpu_ring *ring,
  1090. uint32_t reg, uint32_t val)
  1091. {
  1092. struct amdgpu_device *adev = ring->adev;
  1093. amdgpu_ring_write(ring,
  1094. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA0), 0));
  1095. amdgpu_ring_write(ring, reg << 2);
  1096. amdgpu_ring_write(ring,
  1097. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA1), 0));
  1098. amdgpu_ring_write(ring, val);
  1099. amdgpu_ring_write(ring,
  1100. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_CMD), 0));
  1101. amdgpu_ring_write(ring, 8);
  1102. }
  1103. static void uvd_v7_0_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
  1104. uint32_t val, uint32_t mask)
  1105. {
  1106. struct amdgpu_device *adev = ring->adev;
  1107. amdgpu_ring_write(ring,
  1108. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA0), 0));
  1109. amdgpu_ring_write(ring, reg << 2);
  1110. amdgpu_ring_write(ring,
  1111. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_DATA1), 0));
  1112. amdgpu_ring_write(ring, val);
  1113. amdgpu_ring_write(ring,
  1114. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GP_SCRATCH8), 0));
  1115. amdgpu_ring_write(ring, mask);
  1116. amdgpu_ring_write(ring,
  1117. PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_GPCOM_VCPU_CMD), 0));
  1118. amdgpu_ring_write(ring, 12);
  1119. }
  1120. static void uvd_v7_0_ring_emit_vm_flush(struct amdgpu_ring *ring,
  1121. unsigned vmid, uint64_t pd_addr)
  1122. {
  1123. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  1124. uint32_t data0, data1, mask;
  1125. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  1126. /* wait for reg writes */
  1127. data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
  1128. data1 = lower_32_bits(pd_addr);
  1129. mask = 0xffffffff;
  1130. uvd_v7_0_ring_emit_reg_wait(ring, data0, data1, mask);
  1131. }
  1132. static void uvd_v7_0_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
  1133. {
  1134. struct amdgpu_device *adev = ring->adev;
  1135. int i;
  1136. WARN_ON(ring->wptr % 2 || count % 2);
  1137. for (i = 0; i < count / 2; i++) {
  1138. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, ring->me, mmUVD_NO_OP), 0));
  1139. amdgpu_ring_write(ring, 0);
  1140. }
  1141. }
  1142. static void uvd_v7_0_enc_ring_insert_end(struct amdgpu_ring *ring)
  1143. {
  1144. amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
  1145. }
  1146. static void uvd_v7_0_enc_ring_emit_reg_wait(struct amdgpu_ring *ring,
  1147. uint32_t reg, uint32_t val,
  1148. uint32_t mask)
  1149. {
  1150. amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WAIT);
  1151. amdgpu_ring_write(ring, reg << 2);
  1152. amdgpu_ring_write(ring, mask);
  1153. amdgpu_ring_write(ring, val);
  1154. }
  1155. static void uvd_v7_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
  1156. unsigned int vmid, uint64_t pd_addr)
  1157. {
  1158. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  1159. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  1160. /* wait for reg writes */
  1161. uvd_v7_0_enc_ring_emit_reg_wait(ring, hub->ctx0_ptb_addr_lo32 + vmid * 2,
  1162. lower_32_bits(pd_addr), 0xffffffff);
  1163. }
  1164. static void uvd_v7_0_enc_ring_emit_wreg(struct amdgpu_ring *ring,
  1165. uint32_t reg, uint32_t val)
  1166. {
  1167. amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WRITE);
  1168. amdgpu_ring_write(ring, reg << 2);
  1169. amdgpu_ring_write(ring, val);
  1170. }
  1171. #if 0
  1172. static bool uvd_v7_0_is_idle(void *handle)
  1173. {
  1174. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1175. return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
  1176. }
  1177. static int uvd_v7_0_wait_for_idle(void *handle)
  1178. {
  1179. unsigned i;
  1180. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1181. for (i = 0; i < adev->usec_timeout; i++) {
  1182. if (uvd_v7_0_is_idle(handle))
  1183. return 0;
  1184. }
  1185. return -ETIMEDOUT;
  1186. }
  1187. #define AMDGPU_UVD_STATUS_BUSY_MASK 0xfd
  1188. static bool uvd_v7_0_check_soft_reset(void *handle)
  1189. {
  1190. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1191. u32 srbm_soft_reset = 0;
  1192. u32 tmp = RREG32(mmSRBM_STATUS);
  1193. if (REG_GET_FIELD(tmp, SRBM_STATUS, UVD_RQ_PENDING) ||
  1194. REG_GET_FIELD(tmp, SRBM_STATUS, UVD_BUSY) ||
  1195. (RREG32_SOC15(UVD, ring->me, mmUVD_STATUS) &
  1196. AMDGPU_UVD_STATUS_BUSY_MASK))
  1197. srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset,
  1198. SRBM_SOFT_RESET, SOFT_RESET_UVD, 1);
  1199. if (srbm_soft_reset) {
  1200. adev->uvd.inst[ring->me].srbm_soft_reset = srbm_soft_reset;
  1201. return true;
  1202. } else {
  1203. adev->uvd.inst[ring->me].srbm_soft_reset = 0;
  1204. return false;
  1205. }
  1206. }
  1207. static int uvd_v7_0_pre_soft_reset(void *handle)
  1208. {
  1209. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1210. if (!adev->uvd.inst[ring->me].srbm_soft_reset)
  1211. return 0;
  1212. uvd_v7_0_stop(adev);
  1213. return 0;
  1214. }
  1215. static int uvd_v7_0_soft_reset(void *handle)
  1216. {
  1217. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1218. u32 srbm_soft_reset;
  1219. if (!adev->uvd.inst[ring->me].srbm_soft_reset)
  1220. return 0;
  1221. srbm_soft_reset = adev->uvd.inst[ring->me].srbm_soft_reset;
  1222. if (srbm_soft_reset) {
  1223. u32 tmp;
  1224. tmp = RREG32(mmSRBM_SOFT_RESET);
  1225. tmp |= srbm_soft_reset;
  1226. dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
  1227. WREG32(mmSRBM_SOFT_RESET, tmp);
  1228. tmp = RREG32(mmSRBM_SOFT_RESET);
  1229. udelay(50);
  1230. tmp &= ~srbm_soft_reset;
  1231. WREG32(mmSRBM_SOFT_RESET, tmp);
  1232. tmp = RREG32(mmSRBM_SOFT_RESET);
  1233. /* Wait a little for things to settle down */
  1234. udelay(50);
  1235. }
  1236. return 0;
  1237. }
  1238. static int uvd_v7_0_post_soft_reset(void *handle)
  1239. {
  1240. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1241. if (!adev->uvd.inst[ring->me].srbm_soft_reset)
  1242. return 0;
  1243. mdelay(5);
  1244. return uvd_v7_0_start(adev);
  1245. }
  1246. #endif
  1247. static int uvd_v7_0_set_interrupt_state(struct amdgpu_device *adev,
  1248. struct amdgpu_irq_src *source,
  1249. unsigned type,
  1250. enum amdgpu_interrupt_state state)
  1251. {
  1252. // TODO
  1253. return 0;
  1254. }
  1255. static int uvd_v7_0_process_interrupt(struct amdgpu_device *adev,
  1256. struct amdgpu_irq_src *source,
  1257. struct amdgpu_iv_entry *entry)
  1258. {
  1259. uint32_t ip_instance;
  1260. switch (entry->client_id) {
  1261. case SOC15_IH_CLIENTID_UVD:
  1262. ip_instance = 0;
  1263. break;
  1264. case SOC15_IH_CLIENTID_UVD1:
  1265. ip_instance = 1;
  1266. break;
  1267. default:
  1268. DRM_ERROR("Unhandled client id: %d\n", entry->client_id);
  1269. return 0;
  1270. }
  1271. DRM_DEBUG("IH: UVD TRAP\n");
  1272. switch (entry->src_id) {
  1273. case 124:
  1274. amdgpu_fence_process(&adev->uvd.inst[ip_instance].ring);
  1275. break;
  1276. case 119:
  1277. amdgpu_fence_process(&adev->uvd.inst[ip_instance].ring_enc[0]);
  1278. break;
  1279. case 120:
  1280. if (!amdgpu_sriov_vf(adev))
  1281. amdgpu_fence_process(&adev->uvd.inst[ip_instance].ring_enc[1]);
  1282. break;
  1283. default:
  1284. DRM_ERROR("Unhandled interrupt: %d %d\n",
  1285. entry->src_id, entry->src_data[0]);
  1286. break;
  1287. }
  1288. return 0;
  1289. }
  1290. #if 0
  1291. static void uvd_v7_0_set_sw_clock_gating(struct amdgpu_device *adev)
  1292. {
  1293. uint32_t data, data1, data2, suvd_flags;
  1294. data = RREG32_SOC15(UVD, ring->me, mmUVD_CGC_CTRL);
  1295. data1 = RREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_GATE);
  1296. data2 = RREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_CTRL);
  1297. data &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK |
  1298. UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);
  1299. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  1300. UVD_SUVD_CGC_GATE__SIT_MASK |
  1301. UVD_SUVD_CGC_GATE__SMP_MASK |
  1302. UVD_SUVD_CGC_GATE__SCM_MASK |
  1303. UVD_SUVD_CGC_GATE__SDB_MASK;
  1304. data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
  1305. (1 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_GATE_DLY_TIMER)) |
  1306. (4 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_OFF_DELAY));
  1307. data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
  1308. UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
  1309. UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
  1310. UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
  1311. UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
  1312. UVD_CGC_CTRL__SYS_MODE_MASK |
  1313. UVD_CGC_CTRL__UDEC_MODE_MASK |
  1314. UVD_CGC_CTRL__MPEG2_MODE_MASK |
  1315. UVD_CGC_CTRL__REGS_MODE_MASK |
  1316. UVD_CGC_CTRL__RBC_MODE_MASK |
  1317. UVD_CGC_CTRL__LMI_MC_MODE_MASK |
  1318. UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
  1319. UVD_CGC_CTRL__IDCT_MODE_MASK |
  1320. UVD_CGC_CTRL__MPRD_MODE_MASK |
  1321. UVD_CGC_CTRL__MPC_MODE_MASK |
  1322. UVD_CGC_CTRL__LBSI_MODE_MASK |
  1323. UVD_CGC_CTRL__LRBBM_MODE_MASK |
  1324. UVD_CGC_CTRL__WCB_MODE_MASK |
  1325. UVD_CGC_CTRL__VCPU_MODE_MASK |
  1326. UVD_CGC_CTRL__JPEG_MODE_MASK |
  1327. UVD_CGC_CTRL__JPEG2_MODE_MASK |
  1328. UVD_CGC_CTRL__SCPU_MODE_MASK);
  1329. data2 &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK |
  1330. UVD_SUVD_CGC_CTRL__SIT_MODE_MASK |
  1331. UVD_SUVD_CGC_CTRL__SMP_MODE_MASK |
  1332. UVD_SUVD_CGC_CTRL__SCM_MODE_MASK |
  1333. UVD_SUVD_CGC_CTRL__SDB_MODE_MASK);
  1334. data1 |= suvd_flags;
  1335. WREG32_SOC15(UVD, ring->me, mmUVD_CGC_CTRL, data);
  1336. WREG32_SOC15(UVD, ring->me, mmUVD_CGC_GATE, 0);
  1337. WREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_GATE, data1);
  1338. WREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_CTRL, data2);
  1339. }
  1340. static void uvd_v7_0_set_hw_clock_gating(struct amdgpu_device *adev)
  1341. {
  1342. uint32_t data, data1, cgc_flags, suvd_flags;
  1343. data = RREG32_SOC15(UVD, ring->me, mmUVD_CGC_GATE);
  1344. data1 = RREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_GATE);
  1345. cgc_flags = UVD_CGC_GATE__SYS_MASK |
  1346. UVD_CGC_GATE__UDEC_MASK |
  1347. UVD_CGC_GATE__MPEG2_MASK |
  1348. UVD_CGC_GATE__RBC_MASK |
  1349. UVD_CGC_GATE__LMI_MC_MASK |
  1350. UVD_CGC_GATE__IDCT_MASK |
  1351. UVD_CGC_GATE__MPRD_MASK |
  1352. UVD_CGC_GATE__MPC_MASK |
  1353. UVD_CGC_GATE__LBSI_MASK |
  1354. UVD_CGC_GATE__LRBBM_MASK |
  1355. UVD_CGC_GATE__UDEC_RE_MASK |
  1356. UVD_CGC_GATE__UDEC_CM_MASK |
  1357. UVD_CGC_GATE__UDEC_IT_MASK |
  1358. UVD_CGC_GATE__UDEC_DB_MASK |
  1359. UVD_CGC_GATE__UDEC_MP_MASK |
  1360. UVD_CGC_GATE__WCB_MASK |
  1361. UVD_CGC_GATE__VCPU_MASK |
  1362. UVD_CGC_GATE__SCPU_MASK |
  1363. UVD_CGC_GATE__JPEG_MASK |
  1364. UVD_CGC_GATE__JPEG2_MASK;
  1365. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  1366. UVD_SUVD_CGC_GATE__SIT_MASK |
  1367. UVD_SUVD_CGC_GATE__SMP_MASK |
  1368. UVD_SUVD_CGC_GATE__SCM_MASK |
  1369. UVD_SUVD_CGC_GATE__SDB_MASK;
  1370. data |= cgc_flags;
  1371. data1 |= suvd_flags;
  1372. WREG32_SOC15(UVD, ring->me, mmUVD_CGC_GATE, data);
  1373. WREG32_SOC15(UVD, ring->me, mmUVD_SUVD_CGC_GATE, data1);
  1374. }
  1375. static void uvd_v7_0_set_bypass_mode(struct amdgpu_device *adev, bool enable)
  1376. {
  1377. u32 tmp = RREG32_SMC(ixGCK_DFS_BYPASS_CNTL);
  1378. if (enable)
  1379. tmp |= (GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
  1380. GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
  1381. else
  1382. tmp &= ~(GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
  1383. GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
  1384. WREG32_SMC(ixGCK_DFS_BYPASS_CNTL, tmp);
  1385. }
  1386. static int uvd_v7_0_set_clockgating_state(void *handle,
  1387. enum amd_clockgating_state state)
  1388. {
  1389. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1390. bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
  1391. uvd_v7_0_set_bypass_mode(adev, enable);
  1392. if (!(adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG))
  1393. return 0;
  1394. if (enable) {
  1395. /* disable HW gating and enable Sw gating */
  1396. uvd_v7_0_set_sw_clock_gating(adev);
  1397. } else {
  1398. /* wait for STATUS to clear */
  1399. if (uvd_v7_0_wait_for_idle(handle))
  1400. return -EBUSY;
  1401. /* enable HW gates because UVD is idle */
  1402. /* uvd_v7_0_set_hw_clock_gating(adev); */
  1403. }
  1404. return 0;
  1405. }
  1406. static int uvd_v7_0_set_powergating_state(void *handle,
  1407. enum amd_powergating_state state)
  1408. {
  1409. /* This doesn't actually powergate the UVD block.
  1410. * That's done in the dpm code via the SMC. This
  1411. * just re-inits the block as necessary. The actual
  1412. * gating still happens in the dpm code. We should
  1413. * revisit this when there is a cleaner line between
  1414. * the smc and the hw blocks
  1415. */
  1416. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1417. if (!(adev->pg_flags & AMD_PG_SUPPORT_UVD))
  1418. return 0;
  1419. WREG32_SOC15(UVD, ring->me, mmUVD_POWER_STATUS, UVD_POWER_STATUS__UVD_PG_EN_MASK);
  1420. if (state == AMD_PG_STATE_GATE) {
  1421. uvd_v7_0_stop(adev);
  1422. return 0;
  1423. } else {
  1424. return uvd_v7_0_start(adev);
  1425. }
  1426. }
  1427. #endif
  1428. static int uvd_v7_0_set_clockgating_state(void *handle,
  1429. enum amd_clockgating_state state)
  1430. {
  1431. /* needed for driver unload*/
  1432. return 0;
  1433. }
  1434. const struct amd_ip_funcs uvd_v7_0_ip_funcs = {
  1435. .name = "uvd_v7_0",
  1436. .early_init = uvd_v7_0_early_init,
  1437. .late_init = NULL,
  1438. .sw_init = uvd_v7_0_sw_init,
  1439. .sw_fini = uvd_v7_0_sw_fini,
  1440. .hw_init = uvd_v7_0_hw_init,
  1441. .hw_fini = uvd_v7_0_hw_fini,
  1442. .suspend = uvd_v7_0_suspend,
  1443. .resume = uvd_v7_0_resume,
  1444. .is_idle = NULL /* uvd_v7_0_is_idle */,
  1445. .wait_for_idle = NULL /* uvd_v7_0_wait_for_idle */,
  1446. .check_soft_reset = NULL /* uvd_v7_0_check_soft_reset */,
  1447. .pre_soft_reset = NULL /* uvd_v7_0_pre_soft_reset */,
  1448. .soft_reset = NULL /* uvd_v7_0_soft_reset */,
  1449. .post_soft_reset = NULL /* uvd_v7_0_post_soft_reset */,
  1450. .set_clockgating_state = uvd_v7_0_set_clockgating_state,
  1451. .set_powergating_state = NULL /* uvd_v7_0_set_powergating_state */,
  1452. };
  1453. static const struct amdgpu_ring_funcs uvd_v7_0_ring_vm_funcs = {
  1454. .type = AMDGPU_RING_TYPE_UVD,
  1455. .align_mask = 0xf,
  1456. .support_64bit_ptrs = false,
  1457. .vmhub = AMDGPU_MMHUB,
  1458. .get_rptr = uvd_v7_0_ring_get_rptr,
  1459. .get_wptr = uvd_v7_0_ring_get_wptr,
  1460. .set_wptr = uvd_v7_0_ring_set_wptr,
  1461. .emit_frame_size =
  1462. 6 + /* hdp invalidate */
  1463. SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
  1464. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
  1465. 8 + /* uvd_v7_0_ring_emit_vm_flush */
  1466. 14 + 14, /* uvd_v7_0_ring_emit_fence x2 vm fence */
  1467. .emit_ib_size = 8, /* uvd_v7_0_ring_emit_ib */
  1468. .emit_ib = uvd_v7_0_ring_emit_ib,
  1469. .emit_fence = uvd_v7_0_ring_emit_fence,
  1470. .emit_vm_flush = uvd_v7_0_ring_emit_vm_flush,
  1471. .emit_hdp_flush = uvd_v7_0_ring_emit_hdp_flush,
  1472. .test_ring = uvd_v7_0_ring_test_ring,
  1473. .test_ib = amdgpu_uvd_ring_test_ib,
  1474. .insert_nop = uvd_v7_0_ring_insert_nop,
  1475. .pad_ib = amdgpu_ring_generic_pad_ib,
  1476. .begin_use = amdgpu_uvd_ring_begin_use,
  1477. .end_use = amdgpu_uvd_ring_end_use,
  1478. .emit_wreg = uvd_v7_0_ring_emit_wreg,
  1479. .emit_reg_wait = uvd_v7_0_ring_emit_reg_wait,
  1480. .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
  1481. };
  1482. static const struct amdgpu_ring_funcs uvd_v7_0_enc_ring_vm_funcs = {
  1483. .type = AMDGPU_RING_TYPE_UVD_ENC,
  1484. .align_mask = 0x3f,
  1485. .nop = HEVC_ENC_CMD_NO_OP,
  1486. .support_64bit_ptrs = false,
  1487. .vmhub = AMDGPU_MMHUB,
  1488. .get_rptr = uvd_v7_0_enc_ring_get_rptr,
  1489. .get_wptr = uvd_v7_0_enc_ring_get_wptr,
  1490. .set_wptr = uvd_v7_0_enc_ring_set_wptr,
  1491. .emit_frame_size =
  1492. 3 + 3 + /* hdp flush / invalidate */
  1493. SOC15_FLUSH_GPU_TLB_NUM_WREG * 3 +
  1494. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 4 +
  1495. 4 + /* uvd_v7_0_enc_ring_emit_vm_flush */
  1496. 5 + 5 + /* uvd_v7_0_enc_ring_emit_fence x2 vm fence */
  1497. 1, /* uvd_v7_0_enc_ring_insert_end */
  1498. .emit_ib_size = 5, /* uvd_v7_0_enc_ring_emit_ib */
  1499. .emit_ib = uvd_v7_0_enc_ring_emit_ib,
  1500. .emit_fence = uvd_v7_0_enc_ring_emit_fence,
  1501. .emit_vm_flush = uvd_v7_0_enc_ring_emit_vm_flush,
  1502. .test_ring = uvd_v7_0_enc_ring_test_ring,
  1503. .test_ib = uvd_v7_0_enc_ring_test_ib,
  1504. .insert_nop = amdgpu_ring_insert_nop,
  1505. .insert_end = uvd_v7_0_enc_ring_insert_end,
  1506. .pad_ib = amdgpu_ring_generic_pad_ib,
  1507. .begin_use = amdgpu_uvd_ring_begin_use,
  1508. .end_use = amdgpu_uvd_ring_end_use,
  1509. .emit_wreg = uvd_v7_0_enc_ring_emit_wreg,
  1510. .emit_reg_wait = uvd_v7_0_enc_ring_emit_reg_wait,
  1511. .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
  1512. };
  1513. static void uvd_v7_0_set_ring_funcs(struct amdgpu_device *adev)
  1514. {
  1515. int i;
  1516. for (i = 0; i < adev->uvd.num_uvd_inst; i++) {
  1517. adev->uvd.inst[i].ring.funcs = &uvd_v7_0_ring_vm_funcs;
  1518. adev->uvd.inst[i].ring.me = i;
  1519. DRM_INFO("UVD(%d) is enabled in VM mode\n", i);
  1520. }
  1521. }
  1522. static void uvd_v7_0_set_enc_ring_funcs(struct amdgpu_device *adev)
  1523. {
  1524. int i, j;
  1525. for (j = 0; j < adev->uvd.num_uvd_inst; j++) {
  1526. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  1527. adev->uvd.inst[j].ring_enc[i].funcs = &uvd_v7_0_enc_ring_vm_funcs;
  1528. adev->uvd.inst[j].ring_enc[i].me = j;
  1529. }
  1530. DRM_INFO("UVD(%d) ENC is enabled in VM mode\n", j);
  1531. }
  1532. }
  1533. static const struct amdgpu_irq_src_funcs uvd_v7_0_irq_funcs = {
  1534. .set = uvd_v7_0_set_interrupt_state,
  1535. .process = uvd_v7_0_process_interrupt,
  1536. };
  1537. static void uvd_v7_0_set_irq_funcs(struct amdgpu_device *adev)
  1538. {
  1539. int i;
  1540. for (i = 0; i < adev->uvd.num_uvd_inst; i++) {
  1541. adev->uvd.inst[i].irq.num_types = adev->uvd.num_enc_rings + 1;
  1542. adev->uvd.inst[i].irq.funcs = &uvd_v7_0_irq_funcs;
  1543. }
  1544. }
  1545. const struct amdgpu_ip_block_version uvd_v7_0_ip_block =
  1546. {
  1547. .type = AMD_IP_BLOCK_TYPE_UVD,
  1548. .major = 7,
  1549. .minor = 0,
  1550. .rev = 0,
  1551. .funcs = &uvd_v7_0_ip_funcs,
  1552. };