uvd_v7_0.c 50 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741
  1. /*
  2. * Copyright 2016 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include <linux/firmware.h>
  24. #include <drm/drmP.h>
  25. #include "amdgpu.h"
  26. #include "amdgpu_uvd.h"
  27. #include "soc15.h"
  28. #include "soc15d.h"
  29. #include "soc15_common.h"
  30. #include "mmsch_v1_0.h"
  31. #include "uvd/uvd_7_0_offset.h"
  32. #include "uvd/uvd_7_0_sh_mask.h"
  33. #include "vce/vce_4_0_offset.h"
  34. #include "vce/vce_4_0_default.h"
  35. #include "vce/vce_4_0_sh_mask.h"
  36. #include "nbif/nbif_6_1_offset.h"
  37. #include "hdp/hdp_4_0_offset.h"
  38. #include "mmhub/mmhub_1_0_offset.h"
  39. #include "mmhub/mmhub_1_0_sh_mask.h"
  40. static void uvd_v7_0_set_ring_funcs(struct amdgpu_device *adev);
  41. static void uvd_v7_0_set_enc_ring_funcs(struct amdgpu_device *adev);
  42. static void uvd_v7_0_set_irq_funcs(struct amdgpu_device *adev);
  43. static int uvd_v7_0_start(struct amdgpu_device *adev);
  44. static void uvd_v7_0_stop(struct amdgpu_device *adev);
  45. static int uvd_v7_0_sriov_start(struct amdgpu_device *adev);
  46. /**
  47. * uvd_v7_0_ring_get_rptr - get read pointer
  48. *
  49. * @ring: amdgpu_ring pointer
  50. *
  51. * Returns the current hardware read pointer
  52. */
  53. static uint64_t uvd_v7_0_ring_get_rptr(struct amdgpu_ring *ring)
  54. {
  55. struct amdgpu_device *adev = ring->adev;
  56. return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
  57. }
  58. /**
  59. * uvd_v7_0_enc_ring_get_rptr - get enc read pointer
  60. *
  61. * @ring: amdgpu_ring pointer
  62. *
  63. * Returns the current hardware enc read pointer
  64. */
  65. static uint64_t uvd_v7_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
  66. {
  67. struct amdgpu_device *adev = ring->adev;
  68. if (ring == &adev->uvd.ring_enc[0])
  69. return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR);
  70. else
  71. return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2);
  72. }
  73. /**
  74. * uvd_v7_0_ring_get_wptr - get write pointer
  75. *
  76. * @ring: amdgpu_ring pointer
  77. *
  78. * Returns the current hardware write pointer
  79. */
  80. static uint64_t uvd_v7_0_ring_get_wptr(struct amdgpu_ring *ring)
  81. {
  82. struct amdgpu_device *adev = ring->adev;
  83. return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR);
  84. }
  85. /**
  86. * uvd_v7_0_enc_ring_get_wptr - get enc write pointer
  87. *
  88. * @ring: amdgpu_ring pointer
  89. *
  90. * Returns the current hardware enc write pointer
  91. */
  92. static uint64_t uvd_v7_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
  93. {
  94. struct amdgpu_device *adev = ring->adev;
  95. if (ring->use_doorbell)
  96. return adev->wb.wb[ring->wptr_offs];
  97. if (ring == &adev->uvd.ring_enc[0])
  98. return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR);
  99. else
  100. return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2);
  101. }
  102. /**
  103. * uvd_v7_0_ring_set_wptr - set write pointer
  104. *
  105. * @ring: amdgpu_ring pointer
  106. *
  107. * Commits the write pointer to the hardware
  108. */
  109. static void uvd_v7_0_ring_set_wptr(struct amdgpu_ring *ring)
  110. {
  111. struct amdgpu_device *adev = ring->adev;
  112. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
  113. }
  114. /**
  115. * uvd_v7_0_enc_ring_set_wptr - set enc write pointer
  116. *
  117. * @ring: amdgpu_ring pointer
  118. *
  119. * Commits the enc write pointer to the hardware
  120. */
  121. static void uvd_v7_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
  122. {
  123. struct amdgpu_device *adev = ring->adev;
  124. if (ring->use_doorbell) {
  125. /* XXX check if swapping is necessary on BE */
  126. adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
  127. WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
  128. return;
  129. }
  130. if (ring == &adev->uvd.ring_enc[0])
  131. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR,
  132. lower_32_bits(ring->wptr));
  133. else
  134. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2,
  135. lower_32_bits(ring->wptr));
  136. }
  137. /**
  138. * uvd_v7_0_enc_ring_test_ring - test if UVD ENC ring is working
  139. *
  140. * @ring: the engine to test on
  141. *
  142. */
  143. static int uvd_v7_0_enc_ring_test_ring(struct amdgpu_ring *ring)
  144. {
  145. struct amdgpu_device *adev = ring->adev;
  146. uint32_t rptr = amdgpu_ring_get_rptr(ring);
  147. unsigned i;
  148. int r;
  149. if (amdgpu_sriov_vf(adev))
  150. return 0;
  151. r = amdgpu_ring_alloc(ring, 16);
  152. if (r) {
  153. DRM_ERROR("amdgpu: uvd enc failed to lock ring %d (%d).\n",
  154. ring->idx, r);
  155. return r;
  156. }
  157. amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
  158. amdgpu_ring_commit(ring);
  159. for (i = 0; i < adev->usec_timeout; i++) {
  160. if (amdgpu_ring_get_rptr(ring) != rptr)
  161. break;
  162. DRM_UDELAY(1);
  163. }
  164. if (i < adev->usec_timeout) {
  165. DRM_DEBUG("ring test on %d succeeded in %d usecs\n",
  166. ring->idx, i);
  167. } else {
  168. DRM_ERROR("amdgpu: ring %d test failed\n",
  169. ring->idx);
  170. r = -ETIMEDOUT;
  171. }
  172. return r;
  173. }
  174. /**
  175. * uvd_v7_0_enc_get_create_msg - generate a UVD ENC create msg
  176. *
  177. * @adev: amdgpu_device pointer
  178. * @ring: ring we should submit the msg to
  179. * @handle: session handle to use
  180. * @fence: optional fence to return
  181. *
  182. * Open up a stream for HW test
  183. */
  184. static int uvd_v7_0_enc_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
  185. struct dma_fence **fence)
  186. {
  187. const unsigned ib_size_dw = 16;
  188. struct amdgpu_job *job;
  189. struct amdgpu_ib *ib;
  190. struct dma_fence *f = NULL;
  191. uint64_t dummy;
  192. int i, r;
  193. r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
  194. if (r)
  195. return r;
  196. ib = &job->ibs[0];
  197. dummy = ib->gpu_addr + 1024;
  198. ib->length_dw = 0;
  199. ib->ptr[ib->length_dw++] = 0x00000018;
  200. ib->ptr[ib->length_dw++] = 0x00000001; /* session info */
  201. ib->ptr[ib->length_dw++] = handle;
  202. ib->ptr[ib->length_dw++] = 0x00000000;
  203. ib->ptr[ib->length_dw++] = upper_32_bits(dummy);
  204. ib->ptr[ib->length_dw++] = dummy;
  205. ib->ptr[ib->length_dw++] = 0x00000014;
  206. ib->ptr[ib->length_dw++] = 0x00000002; /* task info */
  207. ib->ptr[ib->length_dw++] = 0x0000001c;
  208. ib->ptr[ib->length_dw++] = 0x00000000;
  209. ib->ptr[ib->length_dw++] = 0x00000000;
  210. ib->ptr[ib->length_dw++] = 0x00000008;
  211. ib->ptr[ib->length_dw++] = 0x08000001; /* op initialize */
  212. for (i = ib->length_dw; i < ib_size_dw; ++i)
  213. ib->ptr[i] = 0x0;
  214. r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
  215. job->fence = dma_fence_get(f);
  216. if (r)
  217. goto err;
  218. amdgpu_job_free(job);
  219. if (fence)
  220. *fence = dma_fence_get(f);
  221. dma_fence_put(f);
  222. return 0;
  223. err:
  224. amdgpu_job_free(job);
  225. return r;
  226. }
  227. /**
  228. * uvd_v7_0_enc_get_destroy_msg - generate a UVD ENC destroy msg
  229. *
  230. * @adev: amdgpu_device pointer
  231. * @ring: ring we should submit the msg to
  232. * @handle: session handle to use
  233. * @fence: optional fence to return
  234. *
  235. * Close up a stream for HW test or if userspace failed to do so
  236. */
  237. int uvd_v7_0_enc_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle,
  238. bool direct, struct dma_fence **fence)
  239. {
  240. const unsigned ib_size_dw = 16;
  241. struct amdgpu_job *job;
  242. struct amdgpu_ib *ib;
  243. struct dma_fence *f = NULL;
  244. uint64_t dummy;
  245. int i, r;
  246. r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
  247. if (r)
  248. return r;
  249. ib = &job->ibs[0];
  250. dummy = ib->gpu_addr + 1024;
  251. ib->length_dw = 0;
  252. ib->ptr[ib->length_dw++] = 0x00000018;
  253. ib->ptr[ib->length_dw++] = 0x00000001;
  254. ib->ptr[ib->length_dw++] = handle;
  255. ib->ptr[ib->length_dw++] = 0x00000000;
  256. ib->ptr[ib->length_dw++] = upper_32_bits(dummy);
  257. ib->ptr[ib->length_dw++] = dummy;
  258. ib->ptr[ib->length_dw++] = 0x00000014;
  259. ib->ptr[ib->length_dw++] = 0x00000002;
  260. ib->ptr[ib->length_dw++] = 0x0000001c;
  261. ib->ptr[ib->length_dw++] = 0x00000000;
  262. ib->ptr[ib->length_dw++] = 0x00000000;
  263. ib->ptr[ib->length_dw++] = 0x00000008;
  264. ib->ptr[ib->length_dw++] = 0x08000002; /* op close session */
  265. for (i = ib->length_dw; i < ib_size_dw; ++i)
  266. ib->ptr[i] = 0x0;
  267. if (direct) {
  268. r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
  269. job->fence = dma_fence_get(f);
  270. if (r)
  271. goto err;
  272. amdgpu_job_free(job);
  273. } else {
  274. r = amdgpu_job_submit(job, ring, &ring->adev->vce.entity,
  275. AMDGPU_FENCE_OWNER_UNDEFINED, &f);
  276. if (r)
  277. goto err;
  278. }
  279. if (fence)
  280. *fence = dma_fence_get(f);
  281. dma_fence_put(f);
  282. return 0;
  283. err:
  284. amdgpu_job_free(job);
  285. return r;
  286. }
  287. /**
  288. * uvd_v7_0_enc_ring_test_ib - test if UVD ENC IBs are working
  289. *
  290. * @ring: the engine to test on
  291. *
  292. */
  293. static int uvd_v7_0_enc_ring_test_ib(struct amdgpu_ring *ring, long timeout)
  294. {
  295. struct dma_fence *fence = NULL;
  296. long r;
  297. r = uvd_v7_0_enc_get_create_msg(ring, 1, NULL);
  298. if (r) {
  299. DRM_ERROR("amdgpu: failed to get create msg (%ld).\n", r);
  300. goto error;
  301. }
  302. r = uvd_v7_0_enc_get_destroy_msg(ring, 1, true, &fence);
  303. if (r) {
  304. DRM_ERROR("amdgpu: failed to get destroy ib (%ld).\n", r);
  305. goto error;
  306. }
  307. r = dma_fence_wait_timeout(fence, false, timeout);
  308. if (r == 0) {
  309. DRM_ERROR("amdgpu: IB test timed out.\n");
  310. r = -ETIMEDOUT;
  311. } else if (r < 0) {
  312. DRM_ERROR("amdgpu: fence wait failed (%ld).\n", r);
  313. } else {
  314. DRM_DEBUG("ib test on ring %d succeeded\n", ring->idx);
  315. r = 0;
  316. }
  317. error:
  318. dma_fence_put(fence);
  319. return r;
  320. }
  321. static int uvd_v7_0_early_init(void *handle)
  322. {
  323. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  324. if (amdgpu_sriov_vf(adev))
  325. adev->uvd.num_enc_rings = 1;
  326. else
  327. adev->uvd.num_enc_rings = 2;
  328. uvd_v7_0_set_ring_funcs(adev);
  329. uvd_v7_0_set_enc_ring_funcs(adev);
  330. uvd_v7_0_set_irq_funcs(adev);
  331. return 0;
  332. }
  333. static int uvd_v7_0_sw_init(void *handle)
  334. {
  335. struct amdgpu_ring *ring;
  336. struct drm_sched_rq *rq;
  337. int i, r;
  338. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  339. /* UVD TRAP */
  340. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_UVD, 124, &adev->uvd.irq);
  341. if (r)
  342. return r;
  343. /* UVD ENC TRAP */
  344. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  345. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_UVD, i + 119, &adev->uvd.irq);
  346. if (r)
  347. return r;
  348. }
  349. r = amdgpu_uvd_sw_init(adev);
  350. if (r)
  351. return r;
  352. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  353. const struct common_firmware_header *hdr;
  354. hdr = (const struct common_firmware_header *)adev->uvd.fw->data;
  355. adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].ucode_id = AMDGPU_UCODE_ID_UVD;
  356. adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].fw = adev->uvd.fw;
  357. adev->firmware.fw_size +=
  358. ALIGN(le32_to_cpu(hdr->ucode_size_bytes), PAGE_SIZE);
  359. DRM_INFO("PSP loading UVD firmware\n");
  360. }
  361. ring = &adev->uvd.ring_enc[0];
  362. rq = &ring->sched.sched_rq[DRM_SCHED_PRIORITY_NORMAL];
  363. r = drm_sched_entity_init(&ring->sched, &adev->uvd.entity_enc,
  364. rq, amdgpu_sched_jobs, NULL);
  365. if (r) {
  366. DRM_ERROR("Failed setting up UVD ENC run queue.\n");
  367. return r;
  368. }
  369. r = amdgpu_uvd_resume(adev);
  370. if (r)
  371. return r;
  372. if (!amdgpu_sriov_vf(adev)) {
  373. ring = &adev->uvd.ring;
  374. sprintf(ring->name, "uvd");
  375. r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.irq, 0);
  376. if (r)
  377. return r;
  378. }
  379. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  380. ring = &adev->uvd.ring_enc[i];
  381. sprintf(ring->name, "uvd_enc%d", i);
  382. if (amdgpu_sriov_vf(adev)) {
  383. ring->use_doorbell = true;
  384. /* currently only use the first enconding ring for
  385. * sriov, so set unused location for other unused rings.
  386. */
  387. if (i == 0)
  388. ring->doorbell_index = AMDGPU_DOORBELL64_UVD_RING0_1 * 2;
  389. else
  390. ring->doorbell_index = AMDGPU_DOORBELL64_UVD_RING2_3 * 2 + 1;
  391. }
  392. r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.irq, 0);
  393. if (r)
  394. return r;
  395. }
  396. r = amdgpu_virt_alloc_mm_table(adev);
  397. if (r)
  398. return r;
  399. return r;
  400. }
  401. static int uvd_v7_0_sw_fini(void *handle)
  402. {
  403. int i, r;
  404. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  405. amdgpu_virt_free_mm_table(adev);
  406. r = amdgpu_uvd_suspend(adev);
  407. if (r)
  408. return r;
  409. drm_sched_entity_fini(&adev->uvd.ring_enc[0].sched, &adev->uvd.entity_enc);
  410. for (i = 0; i < adev->uvd.num_enc_rings; ++i)
  411. amdgpu_ring_fini(&adev->uvd.ring_enc[i]);
  412. return amdgpu_uvd_sw_fini(adev);
  413. }
  414. /**
  415. * uvd_v7_0_hw_init - start and test UVD block
  416. *
  417. * @adev: amdgpu_device pointer
  418. *
  419. * Initialize the hardware, boot up the VCPU and do some testing
  420. */
  421. static int uvd_v7_0_hw_init(void *handle)
  422. {
  423. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  424. struct amdgpu_ring *ring = &adev->uvd.ring;
  425. uint32_t tmp;
  426. int i, r;
  427. if (amdgpu_sriov_vf(adev))
  428. r = uvd_v7_0_sriov_start(adev);
  429. else
  430. r = uvd_v7_0_start(adev);
  431. if (r)
  432. goto done;
  433. if (!amdgpu_sriov_vf(adev)) {
  434. ring->ready = true;
  435. r = amdgpu_ring_test_ring(ring);
  436. if (r) {
  437. ring->ready = false;
  438. goto done;
  439. }
  440. r = amdgpu_ring_alloc(ring, 10);
  441. if (r) {
  442. DRM_ERROR("amdgpu: ring failed to lock UVD ring (%d).\n", r);
  443. goto done;
  444. }
  445. tmp = PACKET0(SOC15_REG_OFFSET(UVD, 0,
  446. mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL), 0);
  447. amdgpu_ring_write(ring, tmp);
  448. amdgpu_ring_write(ring, 0xFFFFF);
  449. tmp = PACKET0(SOC15_REG_OFFSET(UVD, 0,
  450. mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL), 0);
  451. amdgpu_ring_write(ring, tmp);
  452. amdgpu_ring_write(ring, 0xFFFFF);
  453. tmp = PACKET0(SOC15_REG_OFFSET(UVD, 0,
  454. mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL), 0);
  455. amdgpu_ring_write(ring, tmp);
  456. amdgpu_ring_write(ring, 0xFFFFF);
  457. /* Clear timeout status bits */
  458. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, 0,
  459. mmUVD_SEMA_TIMEOUT_STATUS), 0));
  460. amdgpu_ring_write(ring, 0x8);
  461. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, 0,
  462. mmUVD_SEMA_CNTL), 0));
  463. amdgpu_ring_write(ring, 3);
  464. amdgpu_ring_commit(ring);
  465. }
  466. for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
  467. ring = &adev->uvd.ring_enc[i];
  468. ring->ready = true;
  469. r = amdgpu_ring_test_ring(ring);
  470. if (r) {
  471. ring->ready = false;
  472. goto done;
  473. }
  474. }
  475. done:
  476. if (!r)
  477. DRM_INFO("UVD and UVD ENC initialized successfully.\n");
  478. return r;
  479. }
  480. /**
  481. * uvd_v7_0_hw_fini - stop the hardware block
  482. *
  483. * @adev: amdgpu_device pointer
  484. *
  485. * Stop the UVD block, mark ring as not ready any more
  486. */
  487. static int uvd_v7_0_hw_fini(void *handle)
  488. {
  489. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  490. struct amdgpu_ring *ring = &adev->uvd.ring;
  491. if (!amdgpu_sriov_vf(adev))
  492. uvd_v7_0_stop(adev);
  493. else {
  494. /* full access mode, so don't touch any UVD register */
  495. DRM_DEBUG("For SRIOV client, shouldn't do anything.\n");
  496. }
  497. ring->ready = false;
  498. return 0;
  499. }
  500. static int uvd_v7_0_suspend(void *handle)
  501. {
  502. int r;
  503. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  504. r = uvd_v7_0_hw_fini(adev);
  505. if (r)
  506. return r;
  507. return amdgpu_uvd_suspend(adev);
  508. }
  509. static int uvd_v7_0_resume(void *handle)
  510. {
  511. int r;
  512. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  513. r = amdgpu_uvd_resume(adev);
  514. if (r)
  515. return r;
  516. return uvd_v7_0_hw_init(adev);
  517. }
  518. /**
  519. * uvd_v7_0_mc_resume - memory controller programming
  520. *
  521. * @adev: amdgpu_device pointer
  522. *
  523. * Let the UVD memory controller know it's offsets
  524. */
  525. static void uvd_v7_0_mc_resume(struct amdgpu_device *adev)
  526. {
  527. uint32_t size = AMDGPU_UVD_FIRMWARE_SIZE(adev);
  528. uint32_t offset;
  529. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  530. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  531. lower_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  532. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  533. upper_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  534. offset = 0;
  535. } else {
  536. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  537. lower_32_bits(adev->uvd.gpu_addr));
  538. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  539. upper_32_bits(adev->uvd.gpu_addr));
  540. offset = size;
  541. }
  542. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0,
  543. AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
  544. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE0, size);
  545. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW,
  546. lower_32_bits(adev->uvd.gpu_addr + offset));
  547. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH,
  548. upper_32_bits(adev->uvd.gpu_addr + offset));
  549. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET1, (1 << 21));
  550. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE1, AMDGPU_UVD_HEAP_SIZE);
  551. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW,
  552. lower_32_bits(adev->uvd.gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  553. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH,
  554. upper_32_bits(adev->uvd.gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  555. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET2, (2 << 21));
  556. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE2,
  557. AMDGPU_UVD_STACK_SIZE + (AMDGPU_UVD_SESSION_SIZE * 40));
  558. WREG32_SOC15(UVD, 0, mmUVD_UDEC_ADDR_CONFIG,
  559. adev->gfx.config.gb_addr_config);
  560. WREG32_SOC15(UVD, 0, mmUVD_UDEC_DB_ADDR_CONFIG,
  561. adev->gfx.config.gb_addr_config);
  562. WREG32_SOC15(UVD, 0, mmUVD_UDEC_DBW_ADDR_CONFIG,
  563. adev->gfx.config.gb_addr_config);
  564. WREG32_SOC15(UVD, 0, mmUVD_GP_SCRATCH4, adev->uvd.max_handles);
  565. }
  566. static int uvd_v7_0_mmsch_start(struct amdgpu_device *adev,
  567. struct amdgpu_mm_table *table)
  568. {
  569. uint32_t data = 0, loop;
  570. uint64_t addr = table->gpu_addr;
  571. struct mmsch_v1_0_init_header *header = (struct mmsch_v1_0_init_header *)table->cpu_addr;
  572. uint32_t size;
  573. size = header->header_size + header->vce_table_size + header->uvd_table_size;
  574. /* 1, write to vce_mmsch_vf_ctx_addr_lo/hi register with GPU mc addr of memory descriptor location */
  575. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_ADDR_LO, lower_32_bits(addr));
  576. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_ADDR_HI, upper_32_bits(addr));
  577. /* 2, update vmid of descriptor */
  578. data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_VMID);
  579. data &= ~VCE_MMSCH_VF_VMID__VF_CTX_VMID_MASK;
  580. data |= (0 << VCE_MMSCH_VF_VMID__VF_CTX_VMID__SHIFT); /* use domain0 for MM scheduler */
  581. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_VMID, data);
  582. /* 3, notify mmsch about the size of this descriptor */
  583. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_SIZE, size);
  584. /* 4, set resp to zero */
  585. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP, 0);
  586. WDOORBELL32(adev->uvd.ring_enc[0].doorbell_index, 0);
  587. adev->wb.wb[adev->uvd.ring_enc[0].wptr_offs] = 0;
  588. adev->uvd.ring_enc[0].wptr = 0;
  589. adev->uvd.ring_enc[0].wptr_old = 0;
  590. /* 5, kick off the initialization and wait until VCE_MMSCH_VF_MAILBOX_RESP becomes non-zero */
  591. WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_HOST, 0x10000001);
  592. data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP);
  593. loop = 1000;
  594. while ((data & 0x10000002) != 0x10000002) {
  595. udelay(10);
  596. data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP);
  597. loop--;
  598. if (!loop)
  599. break;
  600. }
  601. if (!loop) {
  602. dev_err(adev->dev, "failed to init MMSCH, mmVCE_MMSCH_VF_MAILBOX_RESP = %x\n", data);
  603. return -EBUSY;
  604. }
  605. return 0;
  606. }
  607. static int uvd_v7_0_sriov_start(struct amdgpu_device *adev)
  608. {
  609. struct amdgpu_ring *ring;
  610. uint32_t offset, size, tmp;
  611. uint32_t table_size = 0;
  612. struct mmsch_v1_0_cmd_direct_write direct_wt = { {0} };
  613. struct mmsch_v1_0_cmd_direct_read_modify_write direct_rd_mod_wt = { {0} };
  614. struct mmsch_v1_0_cmd_direct_polling direct_poll = { {0} };
  615. struct mmsch_v1_0_cmd_end end = { {0} };
  616. uint32_t *init_table = adev->virt.mm_table.cpu_addr;
  617. struct mmsch_v1_0_init_header *header = (struct mmsch_v1_0_init_header *)init_table;
  618. direct_wt.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_WRITE;
  619. direct_rd_mod_wt.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_READ_MODIFY_WRITE;
  620. direct_poll.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_POLLING;
  621. end.cmd_header.command_type = MMSCH_COMMAND__END;
  622. if (header->uvd_table_offset == 0 && header->uvd_table_size == 0) {
  623. header->version = MMSCH_VERSION;
  624. header->header_size = sizeof(struct mmsch_v1_0_init_header) >> 2;
  625. if (header->vce_table_offset == 0 && header->vce_table_size == 0)
  626. header->uvd_table_offset = header->header_size;
  627. else
  628. header->uvd_table_offset = header->vce_table_size + header->vce_table_offset;
  629. init_table += header->uvd_table_offset;
  630. ring = &adev->uvd.ring;
  631. ring->wptr = 0;
  632. size = AMDGPU_GPU_PAGE_ALIGN(adev->uvd.fw->size + 4);
  633. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS),
  634. 0xFFFFFFFF, 0x00000004);
  635. /* mc resume*/
  636. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  637. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
  638. lower_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  639. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
  640. upper_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
  641. offset = 0;
  642. } else {
  643. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
  644. lower_32_bits(adev->uvd.gpu_addr));
  645. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
  646. upper_32_bits(adev->uvd.gpu_addr));
  647. offset = size;
  648. }
  649. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0),
  650. AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
  651. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_SIZE0), size);
  652. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW),
  653. lower_32_bits(adev->uvd.gpu_addr + offset));
  654. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH),
  655. upper_32_bits(adev->uvd.gpu_addr + offset));
  656. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_OFFSET1), (1 << 21));
  657. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_SIZE1), AMDGPU_UVD_HEAP_SIZE);
  658. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW),
  659. lower_32_bits(adev->uvd.gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  660. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH),
  661. upper_32_bits(adev->uvd.gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
  662. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_OFFSET2), (2 << 21));
  663. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_SIZE2),
  664. AMDGPU_UVD_STACK_SIZE + (AMDGPU_UVD_SESSION_SIZE * 40));
  665. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_GP_SCRATCH4), adev->uvd.max_handles);
  666. /* mc resume end*/
  667. /* disable clock gating */
  668. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_CGC_CTRL),
  669. ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK, 0);
  670. /* disable interupt */
  671. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
  672. ~UVD_MASTINT_EN__VCPU_EN_MASK, 0);
  673. /* stall UMC and register bus before resetting VCPU */
  674. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
  675. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  676. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  677. /* put LMI, VCPU, RBC etc... into reset */
  678. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
  679. (uint32_t)(UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
  680. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
  681. UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
  682. UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
  683. UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
  684. UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
  685. UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
  686. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK));
  687. /* initialize UVD memory controller */
  688. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL),
  689. (uint32_t)((0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  690. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  691. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  692. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  693. UVD_LMI_CTRL__REQ_MODE_MASK |
  694. 0x00100000L));
  695. /* take all subblocks out of reset, except VCPU */
  696. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
  697. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  698. /* enable VCPU clock */
  699. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CNTL),
  700. UVD_VCPU_CNTL__CLK_EN_MASK);
  701. /* enable master interrupt */
  702. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
  703. ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
  704. (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
  705. /* clear the bit 4 of UVD_STATUS */
  706. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS),
  707. ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT), 0);
  708. /* force RBC into idle state */
  709. size = order_base_2(ring->ring_size);
  710. tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, size);
  711. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  712. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_RB_CNTL), tmp);
  713. ring = &adev->uvd.ring_enc[0];
  714. ring->wptr = 0;
  715. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_RB_BASE_LO), ring->gpu_addr);
  716. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_RB_BASE_HI), upper_32_bits(ring->gpu_addr));
  717. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_RB_SIZE), ring->ring_size / 4);
  718. /* boot up the VCPU */
  719. MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0);
  720. /* enable UMC */
  721. MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
  722. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK, 0);
  723. MMSCH_V1_0_INSERT_DIRECT_POLL(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS), 0x02, 0x02);
  724. /* add end packet */
  725. memcpy((void *)init_table, &end, sizeof(struct mmsch_v1_0_cmd_end));
  726. table_size += sizeof(struct mmsch_v1_0_cmd_end) / 4;
  727. header->uvd_table_size = table_size;
  728. }
  729. return uvd_v7_0_mmsch_start(adev, &adev->virt.mm_table);
  730. }
  731. /**
  732. * uvd_v7_0_start - start UVD block
  733. *
  734. * @adev: amdgpu_device pointer
  735. *
  736. * Setup and start the UVD block
  737. */
  738. static int uvd_v7_0_start(struct amdgpu_device *adev)
  739. {
  740. struct amdgpu_ring *ring = &adev->uvd.ring;
  741. uint32_t rb_bufsz, tmp;
  742. uint32_t lmi_swap_cntl;
  743. uint32_t mp_swap_cntl;
  744. int i, j, r;
  745. /* disable DPG */
  746. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_POWER_STATUS), 0,
  747. ~UVD_POWER_STATUS__UVD_PG_MODE_MASK);
  748. /* disable byte swapping */
  749. lmi_swap_cntl = 0;
  750. mp_swap_cntl = 0;
  751. uvd_v7_0_mc_resume(adev);
  752. /* disable clock gating */
  753. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_CGC_CTRL), 0,
  754. ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK);
  755. /* disable interupt */
  756. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN), 0,
  757. ~UVD_MASTINT_EN__VCPU_EN_MASK);
  758. /* stall UMC and register bus before resetting VCPU */
  759. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
  760. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  761. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  762. mdelay(1);
  763. /* put LMI, VCPU, RBC etc... into reset */
  764. WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
  765. UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
  766. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
  767. UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
  768. UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
  769. UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
  770. UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
  771. UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
  772. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
  773. mdelay(5);
  774. /* initialize UVD memory controller */
  775. WREG32_SOC15(UVD, 0, mmUVD_LMI_CTRL,
  776. (0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  777. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  778. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  779. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  780. UVD_LMI_CTRL__REQ_MODE_MASK |
  781. 0x00100000L);
  782. #ifdef __BIG_ENDIAN
  783. /* swap (8 in 32) RB and IB */
  784. lmi_swap_cntl = 0xa;
  785. mp_swap_cntl = 0;
  786. #endif
  787. WREG32_SOC15(UVD, 0, mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
  788. WREG32_SOC15(UVD, 0, mmUVD_MP_SWAP_CNTL, mp_swap_cntl);
  789. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA0, 0x40c2040);
  790. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA1, 0x0);
  791. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB0, 0x40c2040);
  792. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB1, 0x0);
  793. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_ALU, 0);
  794. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUX, 0x88);
  795. /* take all subblocks out of reset, except VCPU */
  796. WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
  797. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  798. mdelay(5);
  799. /* enable VCPU clock */
  800. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CNTL,
  801. UVD_VCPU_CNTL__CLK_EN_MASK);
  802. /* enable UMC */
  803. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
  804. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  805. /* boot up the VCPU */
  806. WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET, 0);
  807. mdelay(10);
  808. for (i = 0; i < 10; ++i) {
  809. uint32_t status;
  810. for (j = 0; j < 100; ++j) {
  811. status = RREG32_SOC15(UVD, 0, mmUVD_STATUS);
  812. if (status & 2)
  813. break;
  814. mdelay(10);
  815. }
  816. r = 0;
  817. if (status & 2)
  818. break;
  819. DRM_ERROR("UVD not responding, trying to reset the VCPU!!!\n");
  820. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
  821. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
  822. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  823. mdelay(10);
  824. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0,
  825. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  826. mdelay(10);
  827. r = -1;
  828. }
  829. if (r) {
  830. DRM_ERROR("UVD not responding, giving up!!!\n");
  831. return r;
  832. }
  833. /* enable master interrupt */
  834. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
  835. (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
  836. ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
  837. /* clear the bit 4 of UVD_STATUS */
  838. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS), 0,
  839. ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
  840. /* force RBC into idle state */
  841. rb_bufsz = order_base_2(ring->ring_size);
  842. tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
  843. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
  844. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  845. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
  846. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
  847. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
  848. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, tmp);
  849. /* set the write pointer delay */
  850. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR_CNTL, 0);
  851. /* set the wb address */
  852. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR_ADDR,
  853. (upper_32_bits(ring->gpu_addr) >> 2));
  854. /* programm the RB_BASE for ring buffer */
  855. WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
  856. lower_32_bits(ring->gpu_addr));
  857. WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
  858. upper_32_bits(ring->gpu_addr));
  859. /* Initialize the ring buffer's read and write pointers */
  860. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR, 0);
  861. ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
  862. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR,
  863. lower_32_bits(ring->wptr));
  864. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_RB_CNTL), 0,
  865. ~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);
  866. ring = &adev->uvd.ring_enc[0];
  867. WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
  868. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
  869. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO, ring->gpu_addr);
  870. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
  871. WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE, ring->ring_size / 4);
  872. ring = &adev->uvd.ring_enc[1];
  873. WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
  874. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
  875. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO2, ring->gpu_addr);
  876. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
  877. WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE2, ring->ring_size / 4);
  878. return 0;
  879. }
  880. /**
  881. * uvd_v7_0_stop - stop UVD block
  882. *
  883. * @adev: amdgpu_device pointer
  884. *
  885. * stop the UVD block
  886. */
  887. static void uvd_v7_0_stop(struct amdgpu_device *adev)
  888. {
  889. /* force RBC into idle state */
  890. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, 0x11010101);
  891. /* Stall UMC and register bus before resetting VCPU */
  892. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
  893. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  894. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  895. mdelay(1);
  896. /* put VCPU into reset */
  897. WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
  898. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  899. mdelay(5);
  900. /* disable VCPU clock */
  901. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CNTL, 0x0);
  902. /* Unstall UMC and register bus */
  903. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
  904. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  905. }
  906. /**
  907. * uvd_v7_0_ring_emit_fence - emit an fence & trap command
  908. *
  909. * @ring: amdgpu_ring pointer
  910. * @fence: fence to emit
  911. *
  912. * Write a fence and a trap command to the ring.
  913. */
  914. static void uvd_v7_0_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
  915. unsigned flags)
  916. {
  917. struct amdgpu_device *adev = ring->adev;
  918. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  919. amdgpu_ring_write(ring,
  920. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_CONTEXT_ID), 0));
  921. amdgpu_ring_write(ring, seq);
  922. amdgpu_ring_write(ring,
  923. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  924. amdgpu_ring_write(ring, addr & 0xffffffff);
  925. amdgpu_ring_write(ring,
  926. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  927. amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
  928. amdgpu_ring_write(ring,
  929. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  930. amdgpu_ring_write(ring, 0);
  931. amdgpu_ring_write(ring,
  932. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  933. amdgpu_ring_write(ring, 0);
  934. amdgpu_ring_write(ring,
  935. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  936. amdgpu_ring_write(ring, 0);
  937. amdgpu_ring_write(ring,
  938. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  939. amdgpu_ring_write(ring, 2);
  940. }
  941. /**
  942. * uvd_v7_0_enc_ring_emit_fence - emit an enc fence & trap command
  943. *
  944. * @ring: amdgpu_ring pointer
  945. * @fence: fence to emit
  946. *
  947. * Write enc a fence and a trap command to the ring.
  948. */
  949. static void uvd_v7_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
  950. u64 seq, unsigned flags)
  951. {
  952. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  953. amdgpu_ring_write(ring, HEVC_ENC_CMD_FENCE);
  954. amdgpu_ring_write(ring, addr);
  955. amdgpu_ring_write(ring, upper_32_bits(addr));
  956. amdgpu_ring_write(ring, seq);
  957. amdgpu_ring_write(ring, HEVC_ENC_CMD_TRAP);
  958. }
  959. /**
  960. * uvd_v7_0_ring_test_ring - register write test
  961. *
  962. * @ring: amdgpu_ring pointer
  963. *
  964. * Test if we can successfully write to the context register
  965. */
  966. static int uvd_v7_0_ring_test_ring(struct amdgpu_ring *ring)
  967. {
  968. struct amdgpu_device *adev = ring->adev;
  969. uint32_t tmp = 0;
  970. unsigned i;
  971. int r;
  972. WREG32_SOC15(UVD, 0, mmUVD_CONTEXT_ID, 0xCAFEDEAD);
  973. r = amdgpu_ring_alloc(ring, 3);
  974. if (r) {
  975. DRM_ERROR("amdgpu: cp failed to lock ring %d (%d).\n",
  976. ring->idx, r);
  977. return r;
  978. }
  979. amdgpu_ring_write(ring,
  980. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_CONTEXT_ID), 0));
  981. amdgpu_ring_write(ring, 0xDEADBEEF);
  982. amdgpu_ring_commit(ring);
  983. for (i = 0; i < adev->usec_timeout; i++) {
  984. tmp = RREG32_SOC15(UVD, 0, mmUVD_CONTEXT_ID);
  985. if (tmp == 0xDEADBEEF)
  986. break;
  987. DRM_UDELAY(1);
  988. }
  989. if (i < adev->usec_timeout) {
  990. DRM_DEBUG("ring test on %d succeeded in %d usecs\n",
  991. ring->idx, i);
  992. } else {
  993. DRM_ERROR("amdgpu: ring %d test failed (0x%08X)\n",
  994. ring->idx, tmp);
  995. r = -EINVAL;
  996. }
  997. return r;
  998. }
  999. /**
  1000. * uvd_v7_0_ring_emit_ib - execute indirect buffer
  1001. *
  1002. * @ring: amdgpu_ring pointer
  1003. * @ib: indirect buffer to execute
  1004. *
  1005. * Write ring commands to execute the indirect buffer
  1006. */
  1007. static void uvd_v7_0_ring_emit_ib(struct amdgpu_ring *ring,
  1008. struct amdgpu_ib *ib,
  1009. unsigned vmid, bool ctx_switch)
  1010. {
  1011. struct amdgpu_device *adev = ring->adev;
  1012. amdgpu_ring_write(ring,
  1013. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_VMID), 0));
  1014. amdgpu_ring_write(ring, vmid);
  1015. amdgpu_ring_write(ring,
  1016. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_LOW), 0));
  1017. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  1018. amdgpu_ring_write(ring,
  1019. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH), 0));
  1020. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  1021. amdgpu_ring_write(ring,
  1022. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_IB_SIZE), 0));
  1023. amdgpu_ring_write(ring, ib->length_dw);
  1024. }
  1025. /**
  1026. * uvd_v7_0_enc_ring_emit_ib - enc execute indirect buffer
  1027. *
  1028. * @ring: amdgpu_ring pointer
  1029. * @ib: indirect buffer to execute
  1030. *
  1031. * Write enc ring commands to execute the indirect buffer
  1032. */
  1033. static void uvd_v7_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
  1034. struct amdgpu_ib *ib, unsigned int vmid, bool ctx_switch)
  1035. {
  1036. amdgpu_ring_write(ring, HEVC_ENC_CMD_IB_VM);
  1037. amdgpu_ring_write(ring, vmid);
  1038. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  1039. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  1040. amdgpu_ring_write(ring, ib->length_dw);
  1041. }
  1042. static void uvd_v7_0_ring_emit_wreg(struct amdgpu_ring *ring,
  1043. uint32_t reg, uint32_t val)
  1044. {
  1045. struct amdgpu_device *adev = ring->adev;
  1046. amdgpu_ring_write(ring,
  1047. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  1048. amdgpu_ring_write(ring, reg << 2);
  1049. amdgpu_ring_write(ring,
  1050. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  1051. amdgpu_ring_write(ring, val);
  1052. amdgpu_ring_write(ring,
  1053. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  1054. amdgpu_ring_write(ring, 8);
  1055. }
  1056. static void uvd_v7_0_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
  1057. uint32_t val, uint32_t mask)
  1058. {
  1059. struct amdgpu_device *adev = ring->adev;
  1060. amdgpu_ring_write(ring,
  1061. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  1062. amdgpu_ring_write(ring, reg << 2);
  1063. amdgpu_ring_write(ring,
  1064. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  1065. amdgpu_ring_write(ring, val);
  1066. amdgpu_ring_write(ring,
  1067. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GP_SCRATCH8), 0));
  1068. amdgpu_ring_write(ring, mask);
  1069. amdgpu_ring_write(ring,
  1070. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  1071. amdgpu_ring_write(ring, 12);
  1072. }
  1073. static void uvd_v7_0_ring_emit_vm_flush(struct amdgpu_ring *ring,
  1074. unsigned vmid, uint64_t pd_addr)
  1075. {
  1076. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  1077. uint32_t data0, data1, mask;
  1078. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  1079. /* wait for reg writes */
  1080. data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
  1081. data1 = lower_32_bits(pd_addr);
  1082. mask = 0xffffffff;
  1083. uvd_v7_0_ring_emit_reg_wait(ring, data0, data1, mask);
  1084. }
  1085. static void uvd_v7_0_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
  1086. {
  1087. int i;
  1088. struct amdgpu_device *adev = ring->adev;
  1089. for (i = 0; i < count; i++)
  1090. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_NO_OP), 0));
  1091. }
  1092. static void uvd_v7_0_enc_ring_insert_end(struct amdgpu_ring *ring)
  1093. {
  1094. amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
  1095. }
  1096. static void uvd_v7_0_enc_ring_emit_reg_wait(struct amdgpu_ring *ring,
  1097. uint32_t reg, uint32_t val,
  1098. uint32_t mask)
  1099. {
  1100. amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WAIT);
  1101. amdgpu_ring_write(ring, reg << 2);
  1102. amdgpu_ring_write(ring, mask);
  1103. amdgpu_ring_write(ring, val);
  1104. }
  1105. static void uvd_v7_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
  1106. unsigned int vmid, uint64_t pd_addr)
  1107. {
  1108. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  1109. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  1110. /* wait for reg writes */
  1111. uvd_v7_0_enc_ring_emit_reg_wait(ring, hub->ctx0_ptb_addr_lo32 + vmid * 2,
  1112. lower_32_bits(pd_addr), 0xffffffff);
  1113. }
  1114. static void uvd_v7_0_enc_ring_emit_wreg(struct amdgpu_ring *ring,
  1115. uint32_t reg, uint32_t val)
  1116. {
  1117. amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WRITE);
  1118. amdgpu_ring_write(ring, reg << 2);
  1119. amdgpu_ring_write(ring, val);
  1120. }
  1121. #if 0
  1122. static bool uvd_v7_0_is_idle(void *handle)
  1123. {
  1124. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1125. return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
  1126. }
  1127. static int uvd_v7_0_wait_for_idle(void *handle)
  1128. {
  1129. unsigned i;
  1130. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1131. for (i = 0; i < adev->usec_timeout; i++) {
  1132. if (uvd_v7_0_is_idle(handle))
  1133. return 0;
  1134. }
  1135. return -ETIMEDOUT;
  1136. }
  1137. #define AMDGPU_UVD_STATUS_BUSY_MASK 0xfd
  1138. static bool uvd_v7_0_check_soft_reset(void *handle)
  1139. {
  1140. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1141. u32 srbm_soft_reset = 0;
  1142. u32 tmp = RREG32(mmSRBM_STATUS);
  1143. if (REG_GET_FIELD(tmp, SRBM_STATUS, UVD_RQ_PENDING) ||
  1144. REG_GET_FIELD(tmp, SRBM_STATUS, UVD_BUSY) ||
  1145. (RREG32_SOC15(UVD, 0, mmUVD_STATUS) &
  1146. AMDGPU_UVD_STATUS_BUSY_MASK))
  1147. srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset,
  1148. SRBM_SOFT_RESET, SOFT_RESET_UVD, 1);
  1149. if (srbm_soft_reset) {
  1150. adev->uvd.srbm_soft_reset = srbm_soft_reset;
  1151. return true;
  1152. } else {
  1153. adev->uvd.srbm_soft_reset = 0;
  1154. return false;
  1155. }
  1156. }
  1157. static int uvd_v7_0_pre_soft_reset(void *handle)
  1158. {
  1159. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1160. if (!adev->uvd.srbm_soft_reset)
  1161. return 0;
  1162. uvd_v7_0_stop(adev);
  1163. return 0;
  1164. }
  1165. static int uvd_v7_0_soft_reset(void *handle)
  1166. {
  1167. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1168. u32 srbm_soft_reset;
  1169. if (!adev->uvd.srbm_soft_reset)
  1170. return 0;
  1171. srbm_soft_reset = adev->uvd.srbm_soft_reset;
  1172. if (srbm_soft_reset) {
  1173. u32 tmp;
  1174. tmp = RREG32(mmSRBM_SOFT_RESET);
  1175. tmp |= srbm_soft_reset;
  1176. dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
  1177. WREG32(mmSRBM_SOFT_RESET, tmp);
  1178. tmp = RREG32(mmSRBM_SOFT_RESET);
  1179. udelay(50);
  1180. tmp &= ~srbm_soft_reset;
  1181. WREG32(mmSRBM_SOFT_RESET, tmp);
  1182. tmp = RREG32(mmSRBM_SOFT_RESET);
  1183. /* Wait a little for things to settle down */
  1184. udelay(50);
  1185. }
  1186. return 0;
  1187. }
  1188. static int uvd_v7_0_post_soft_reset(void *handle)
  1189. {
  1190. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1191. if (!adev->uvd.srbm_soft_reset)
  1192. return 0;
  1193. mdelay(5);
  1194. return uvd_v7_0_start(adev);
  1195. }
  1196. #endif
  1197. static int uvd_v7_0_set_interrupt_state(struct amdgpu_device *adev,
  1198. struct amdgpu_irq_src *source,
  1199. unsigned type,
  1200. enum amdgpu_interrupt_state state)
  1201. {
  1202. // TODO
  1203. return 0;
  1204. }
  1205. static int uvd_v7_0_process_interrupt(struct amdgpu_device *adev,
  1206. struct amdgpu_irq_src *source,
  1207. struct amdgpu_iv_entry *entry)
  1208. {
  1209. DRM_DEBUG("IH: UVD TRAP\n");
  1210. switch (entry->src_id) {
  1211. case 124:
  1212. amdgpu_fence_process(&adev->uvd.ring);
  1213. break;
  1214. case 119:
  1215. amdgpu_fence_process(&adev->uvd.ring_enc[0]);
  1216. break;
  1217. case 120:
  1218. if (!amdgpu_sriov_vf(adev))
  1219. amdgpu_fence_process(&adev->uvd.ring_enc[1]);
  1220. break;
  1221. default:
  1222. DRM_ERROR("Unhandled interrupt: %d %d\n",
  1223. entry->src_id, entry->src_data[0]);
  1224. break;
  1225. }
  1226. return 0;
  1227. }
  1228. #if 0
  1229. static void uvd_v7_0_set_sw_clock_gating(struct amdgpu_device *adev)
  1230. {
  1231. uint32_t data, data1, data2, suvd_flags;
  1232. data = RREG32_SOC15(UVD, 0, mmUVD_CGC_CTRL);
  1233. data1 = RREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_GATE);
  1234. data2 = RREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_CTRL);
  1235. data &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK |
  1236. UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);
  1237. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  1238. UVD_SUVD_CGC_GATE__SIT_MASK |
  1239. UVD_SUVD_CGC_GATE__SMP_MASK |
  1240. UVD_SUVD_CGC_GATE__SCM_MASK |
  1241. UVD_SUVD_CGC_GATE__SDB_MASK;
  1242. data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
  1243. (1 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_GATE_DLY_TIMER)) |
  1244. (4 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_OFF_DELAY));
  1245. data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
  1246. UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
  1247. UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
  1248. UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
  1249. UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
  1250. UVD_CGC_CTRL__SYS_MODE_MASK |
  1251. UVD_CGC_CTRL__UDEC_MODE_MASK |
  1252. UVD_CGC_CTRL__MPEG2_MODE_MASK |
  1253. UVD_CGC_CTRL__REGS_MODE_MASK |
  1254. UVD_CGC_CTRL__RBC_MODE_MASK |
  1255. UVD_CGC_CTRL__LMI_MC_MODE_MASK |
  1256. UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
  1257. UVD_CGC_CTRL__IDCT_MODE_MASK |
  1258. UVD_CGC_CTRL__MPRD_MODE_MASK |
  1259. UVD_CGC_CTRL__MPC_MODE_MASK |
  1260. UVD_CGC_CTRL__LBSI_MODE_MASK |
  1261. UVD_CGC_CTRL__LRBBM_MODE_MASK |
  1262. UVD_CGC_CTRL__WCB_MODE_MASK |
  1263. UVD_CGC_CTRL__VCPU_MODE_MASK |
  1264. UVD_CGC_CTRL__JPEG_MODE_MASK |
  1265. UVD_CGC_CTRL__JPEG2_MODE_MASK |
  1266. UVD_CGC_CTRL__SCPU_MODE_MASK);
  1267. data2 &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK |
  1268. UVD_SUVD_CGC_CTRL__SIT_MODE_MASK |
  1269. UVD_SUVD_CGC_CTRL__SMP_MODE_MASK |
  1270. UVD_SUVD_CGC_CTRL__SCM_MODE_MASK |
  1271. UVD_SUVD_CGC_CTRL__SDB_MODE_MASK);
  1272. data1 |= suvd_flags;
  1273. WREG32_SOC15(UVD, 0, mmUVD_CGC_CTRL, data);
  1274. WREG32_SOC15(UVD, 0, mmUVD_CGC_GATE, 0);
  1275. WREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_GATE, data1);
  1276. WREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_CTRL, data2);
  1277. }
  1278. static void uvd_v7_0_set_hw_clock_gating(struct amdgpu_device *adev)
  1279. {
  1280. uint32_t data, data1, cgc_flags, suvd_flags;
  1281. data = RREG32_SOC15(UVD, 0, mmUVD_CGC_GATE);
  1282. data1 = RREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_GATE);
  1283. cgc_flags = UVD_CGC_GATE__SYS_MASK |
  1284. UVD_CGC_GATE__UDEC_MASK |
  1285. UVD_CGC_GATE__MPEG2_MASK |
  1286. UVD_CGC_GATE__RBC_MASK |
  1287. UVD_CGC_GATE__LMI_MC_MASK |
  1288. UVD_CGC_GATE__IDCT_MASK |
  1289. UVD_CGC_GATE__MPRD_MASK |
  1290. UVD_CGC_GATE__MPC_MASK |
  1291. UVD_CGC_GATE__LBSI_MASK |
  1292. UVD_CGC_GATE__LRBBM_MASK |
  1293. UVD_CGC_GATE__UDEC_RE_MASK |
  1294. UVD_CGC_GATE__UDEC_CM_MASK |
  1295. UVD_CGC_GATE__UDEC_IT_MASK |
  1296. UVD_CGC_GATE__UDEC_DB_MASK |
  1297. UVD_CGC_GATE__UDEC_MP_MASK |
  1298. UVD_CGC_GATE__WCB_MASK |
  1299. UVD_CGC_GATE__VCPU_MASK |
  1300. UVD_CGC_GATE__SCPU_MASK |
  1301. UVD_CGC_GATE__JPEG_MASK |
  1302. UVD_CGC_GATE__JPEG2_MASK;
  1303. suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
  1304. UVD_SUVD_CGC_GATE__SIT_MASK |
  1305. UVD_SUVD_CGC_GATE__SMP_MASK |
  1306. UVD_SUVD_CGC_GATE__SCM_MASK |
  1307. UVD_SUVD_CGC_GATE__SDB_MASK;
  1308. data |= cgc_flags;
  1309. data1 |= suvd_flags;
  1310. WREG32_SOC15(UVD, 0, mmUVD_CGC_GATE, data);
  1311. WREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_GATE, data1);
  1312. }
  1313. static void uvd_v7_0_set_bypass_mode(struct amdgpu_device *adev, bool enable)
  1314. {
  1315. u32 tmp = RREG32_SMC(ixGCK_DFS_BYPASS_CNTL);
  1316. if (enable)
  1317. tmp |= (GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
  1318. GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
  1319. else
  1320. tmp &= ~(GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
  1321. GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
  1322. WREG32_SMC(ixGCK_DFS_BYPASS_CNTL, tmp);
  1323. }
  1324. static int uvd_v7_0_set_clockgating_state(void *handle,
  1325. enum amd_clockgating_state state)
  1326. {
  1327. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1328. bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
  1329. uvd_v7_0_set_bypass_mode(adev, enable);
  1330. if (!(adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG))
  1331. return 0;
  1332. if (enable) {
  1333. /* disable HW gating and enable Sw gating */
  1334. uvd_v7_0_set_sw_clock_gating(adev);
  1335. } else {
  1336. /* wait for STATUS to clear */
  1337. if (uvd_v7_0_wait_for_idle(handle))
  1338. return -EBUSY;
  1339. /* enable HW gates because UVD is idle */
  1340. /* uvd_v7_0_set_hw_clock_gating(adev); */
  1341. }
  1342. return 0;
  1343. }
  1344. static int uvd_v7_0_set_powergating_state(void *handle,
  1345. enum amd_powergating_state state)
  1346. {
  1347. /* This doesn't actually powergate the UVD block.
  1348. * That's done in the dpm code via the SMC. This
  1349. * just re-inits the block as necessary. The actual
  1350. * gating still happens in the dpm code. We should
  1351. * revisit this when there is a cleaner line between
  1352. * the smc and the hw blocks
  1353. */
  1354. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1355. if (!(adev->pg_flags & AMD_PG_SUPPORT_UVD))
  1356. return 0;
  1357. WREG32_SOC15(UVD, 0, mmUVD_POWER_STATUS, UVD_POWER_STATUS__UVD_PG_EN_MASK);
  1358. if (state == AMD_PG_STATE_GATE) {
  1359. uvd_v7_0_stop(adev);
  1360. return 0;
  1361. } else {
  1362. return uvd_v7_0_start(adev);
  1363. }
  1364. }
  1365. #endif
  1366. static int uvd_v7_0_set_clockgating_state(void *handle,
  1367. enum amd_clockgating_state state)
  1368. {
  1369. /* needed for driver unload*/
  1370. return 0;
  1371. }
  1372. const struct amd_ip_funcs uvd_v7_0_ip_funcs = {
  1373. .name = "uvd_v7_0",
  1374. .early_init = uvd_v7_0_early_init,
  1375. .late_init = NULL,
  1376. .sw_init = uvd_v7_0_sw_init,
  1377. .sw_fini = uvd_v7_0_sw_fini,
  1378. .hw_init = uvd_v7_0_hw_init,
  1379. .hw_fini = uvd_v7_0_hw_fini,
  1380. .suspend = uvd_v7_0_suspend,
  1381. .resume = uvd_v7_0_resume,
  1382. .is_idle = NULL /* uvd_v7_0_is_idle */,
  1383. .wait_for_idle = NULL /* uvd_v7_0_wait_for_idle */,
  1384. .check_soft_reset = NULL /* uvd_v7_0_check_soft_reset */,
  1385. .pre_soft_reset = NULL /* uvd_v7_0_pre_soft_reset */,
  1386. .soft_reset = NULL /* uvd_v7_0_soft_reset */,
  1387. .post_soft_reset = NULL /* uvd_v7_0_post_soft_reset */,
  1388. .set_clockgating_state = uvd_v7_0_set_clockgating_state,
  1389. .set_powergating_state = NULL /* uvd_v7_0_set_powergating_state */,
  1390. };
  1391. static const struct amdgpu_ring_funcs uvd_v7_0_ring_vm_funcs = {
  1392. .type = AMDGPU_RING_TYPE_UVD,
  1393. .align_mask = 0xf,
  1394. .nop = PACKET0(0x81ff, 0),
  1395. .support_64bit_ptrs = false,
  1396. .vmhub = AMDGPU_MMHUB,
  1397. .get_rptr = uvd_v7_0_ring_get_rptr,
  1398. .get_wptr = uvd_v7_0_ring_get_wptr,
  1399. .set_wptr = uvd_v7_0_ring_set_wptr,
  1400. .emit_frame_size =
  1401. 6 + 6 + /* hdp flush / invalidate */
  1402. SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
  1403. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
  1404. 8 + /* uvd_v7_0_ring_emit_vm_flush */
  1405. 14 + 14, /* uvd_v7_0_ring_emit_fence x2 vm fence */
  1406. .emit_ib_size = 8, /* uvd_v7_0_ring_emit_ib */
  1407. .emit_ib = uvd_v7_0_ring_emit_ib,
  1408. .emit_fence = uvd_v7_0_ring_emit_fence,
  1409. .emit_vm_flush = uvd_v7_0_ring_emit_vm_flush,
  1410. .test_ring = uvd_v7_0_ring_test_ring,
  1411. .test_ib = amdgpu_uvd_ring_test_ib,
  1412. .insert_nop = uvd_v7_0_ring_insert_nop,
  1413. .pad_ib = amdgpu_ring_generic_pad_ib,
  1414. .begin_use = amdgpu_uvd_ring_begin_use,
  1415. .end_use = amdgpu_uvd_ring_end_use,
  1416. .emit_wreg = uvd_v7_0_ring_emit_wreg,
  1417. .emit_reg_wait = uvd_v7_0_ring_emit_reg_wait,
  1418. };
  1419. static const struct amdgpu_ring_funcs uvd_v7_0_enc_ring_vm_funcs = {
  1420. .type = AMDGPU_RING_TYPE_UVD_ENC,
  1421. .align_mask = 0x3f,
  1422. .nop = HEVC_ENC_CMD_NO_OP,
  1423. .support_64bit_ptrs = false,
  1424. .vmhub = AMDGPU_MMHUB,
  1425. .get_rptr = uvd_v7_0_enc_ring_get_rptr,
  1426. .get_wptr = uvd_v7_0_enc_ring_get_wptr,
  1427. .set_wptr = uvd_v7_0_enc_ring_set_wptr,
  1428. .emit_frame_size =
  1429. 3 + 3 + /* hdp flush / invalidate */
  1430. SOC15_FLUSH_GPU_TLB_NUM_WREG * 3 +
  1431. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 4 +
  1432. 4 + /* uvd_v7_0_enc_ring_emit_vm_flush */
  1433. 5 + 5 + /* uvd_v7_0_enc_ring_emit_fence x2 vm fence */
  1434. 1, /* uvd_v7_0_enc_ring_insert_end */
  1435. .emit_ib_size = 5, /* uvd_v7_0_enc_ring_emit_ib */
  1436. .emit_ib = uvd_v7_0_enc_ring_emit_ib,
  1437. .emit_fence = uvd_v7_0_enc_ring_emit_fence,
  1438. .emit_vm_flush = uvd_v7_0_enc_ring_emit_vm_flush,
  1439. .test_ring = uvd_v7_0_enc_ring_test_ring,
  1440. .test_ib = uvd_v7_0_enc_ring_test_ib,
  1441. .insert_nop = amdgpu_ring_insert_nop,
  1442. .insert_end = uvd_v7_0_enc_ring_insert_end,
  1443. .pad_ib = amdgpu_ring_generic_pad_ib,
  1444. .begin_use = amdgpu_uvd_ring_begin_use,
  1445. .end_use = amdgpu_uvd_ring_end_use,
  1446. .emit_wreg = uvd_v7_0_enc_ring_emit_wreg,
  1447. .emit_reg_wait = uvd_v7_0_enc_ring_emit_reg_wait,
  1448. };
  1449. static void uvd_v7_0_set_ring_funcs(struct amdgpu_device *adev)
  1450. {
  1451. adev->uvd.ring.funcs = &uvd_v7_0_ring_vm_funcs;
  1452. DRM_INFO("UVD is enabled in VM mode\n");
  1453. }
  1454. static void uvd_v7_0_set_enc_ring_funcs(struct amdgpu_device *adev)
  1455. {
  1456. int i;
  1457. for (i = 0; i < adev->uvd.num_enc_rings; ++i)
  1458. adev->uvd.ring_enc[i].funcs = &uvd_v7_0_enc_ring_vm_funcs;
  1459. DRM_INFO("UVD ENC is enabled in VM mode\n");
  1460. }
  1461. static const struct amdgpu_irq_src_funcs uvd_v7_0_irq_funcs = {
  1462. .set = uvd_v7_0_set_interrupt_state,
  1463. .process = uvd_v7_0_process_interrupt,
  1464. };
  1465. static void uvd_v7_0_set_irq_funcs(struct amdgpu_device *adev)
  1466. {
  1467. adev->uvd.irq.num_types = adev->uvd.num_enc_rings + 1;
  1468. adev->uvd.irq.funcs = &uvd_v7_0_irq_funcs;
  1469. }
  1470. const struct amdgpu_ip_block_version uvd_v7_0_ip_block =
  1471. {
  1472. .type = AMD_IP_BLOCK_TYPE_UVD,
  1473. .major = 7,
  1474. .minor = 0,
  1475. .rev = 0,
  1476. .funcs = &uvd_v7_0_ip_funcs,
  1477. };