/*
 * Copyright 2016 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */

#include <linux/firmware.h>
#include <drm/drmP.h>
#include "amdgpu.h"
#include "amdgpu_uvd.h"
#include "soc15d.h"
#include "soc15_common.h"
#include "mmsch_v1_0.h"

#include "soc15ip.h"
#include "uvd/uvd_7_0_offset.h"
#include "uvd/uvd_7_0_sh_mask.h"
#include "vce/vce_4_0_offset.h"
#include "vce/vce_4_0_default.h"
#include "vce/vce_4_0_sh_mask.h"
#include "nbif/nbif_6_1_offset.h"
#include "hdp/hdp_4_0_offset.h"
#include "mmhub/mmhub_1_0_offset.h"
#include "mmhub/mmhub_1_0_sh_mask.h"

static void uvd_v7_0_set_ring_funcs(struct amdgpu_device *adev);
static void uvd_v7_0_set_enc_ring_funcs(struct amdgpu_device *adev);
static void uvd_v7_0_set_irq_funcs(struct amdgpu_device *adev);
static int uvd_v7_0_start(struct amdgpu_device *adev);
static void uvd_v7_0_stop(struct amdgpu_device *adev);
static int uvd_v7_0_sriov_start(struct amdgpu_device *adev);
/**
 * uvd_v7_0_ring_get_rptr - get read pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Returns the current hardware read pointer
 */
static uint64_t uvd_v7_0_ring_get_rptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
}

/**
 * uvd_v7_0_enc_ring_get_rptr - get enc read pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Returns the current hardware enc read pointer
 */
static uint64_t uvd_v7_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	if (ring == &adev->uvd.ring_enc[0])
		return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR);
	else
		return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2);
}

/**
 * uvd_v7_0_ring_get_wptr - get write pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Returns the current hardware write pointer
 */
static uint64_t uvd_v7_0_ring_get_wptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR);
}

/**
 * uvd_v7_0_enc_ring_get_wptr - get enc write pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Returns the current hardware enc write pointer
 */
static uint64_t uvd_v7_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	if (ring->use_doorbell)
		return adev->wb.wb[ring->wptr_offs];

	if (ring == &adev->uvd.ring_enc[0])
		return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR);
	else
		return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2);
}

/**
 * uvd_v7_0_ring_set_wptr - set write pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Commits the write pointer to the hardware
 */
static void uvd_v7_0_ring_set_wptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
}

/**
 * uvd_v7_0_enc_ring_set_wptr - set enc write pointer
 *
 * @ring: amdgpu_ring pointer
 *
 * Commits the enc write pointer to the hardware
 */
static void uvd_v7_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;

	if (ring->use_doorbell) {
		/* XXX check if swapping is necessary on BE */
		adev->wb.wb[ring->wptr_offs] = lower_32_bits(ring->wptr);
		WDOORBELL32(ring->doorbell_index, lower_32_bits(ring->wptr));
		return;
	}

	if (ring == &adev->uvd.ring_enc[0])
		WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR,
			lower_32_bits(ring->wptr));
	else
		WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2,
			lower_32_bits(ring->wptr));
}

/**
 * uvd_v7_0_enc_ring_test_ring - test if UVD ENC ring is working
 *
 * @ring: the engine to test on
 *
 */
static int uvd_v7_0_enc_ring_test_ring(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;
	uint32_t rptr = amdgpu_ring_get_rptr(ring);
	unsigned i;
	int r;

	if (amdgpu_sriov_vf(adev))
		return 0;

	r = amdgpu_ring_alloc(ring, 16);
	if (r) {
		DRM_ERROR("amdgpu: uvd enc failed to lock ring %d (%d).\n",
			  ring->idx, r);
		return r;
	}
	amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
	amdgpu_ring_commit(ring);

	for (i = 0; i < adev->usec_timeout; i++) {
		if (amdgpu_ring_get_rptr(ring) != rptr)
			break;
		DRM_UDELAY(1);
	}

	if (i < adev->usec_timeout) {
		DRM_DEBUG("ring test on %d succeeded in %d usecs\n",
			  ring->idx, i);
	} else {
		DRM_ERROR("amdgpu: ring %d test failed\n",
			  ring->idx);
		r = -ETIMEDOUT;
	}

	return r;
}
/**
 * uvd_v7_0_enc_get_create_msg - generate a UVD ENC create msg
 *
 * @adev: amdgpu_device pointer
 * @ring: ring we should submit the msg to
 * @handle: session handle to use
 * @fence: optional fence to return
 *
 * Open up a stream for HW test
 */
static int uvd_v7_0_enc_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
					struct dma_fence **fence)
{
	const unsigned ib_size_dw = 16;
	struct amdgpu_job *job;
	struct amdgpu_ib *ib;
	struct dma_fence *f = NULL;
	uint64_t dummy;
	int i, r;

	r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
	if (r)
		return r;

	ib = &job->ibs[0];
	dummy = ib->gpu_addr + 1024;

	ib->length_dw = 0;
	ib->ptr[ib->length_dw++] = 0x00000018;
	ib->ptr[ib->length_dw++] = 0x00000001; /* session info */
	ib->ptr[ib->length_dw++] = handle;
	ib->ptr[ib->length_dw++] = 0x00000000;
	ib->ptr[ib->length_dw++] = upper_32_bits(dummy);
	ib->ptr[ib->length_dw++] = dummy;

	ib->ptr[ib->length_dw++] = 0x00000014;
	ib->ptr[ib->length_dw++] = 0x00000002; /* task info */
	ib->ptr[ib->length_dw++] = 0x0000001c;
	ib->ptr[ib->length_dw++] = 0x00000000;
	ib->ptr[ib->length_dw++] = 0x00000000;

	ib->ptr[ib->length_dw++] = 0x00000008;
	ib->ptr[ib->length_dw++] = 0x08000001; /* op initialize */

	for (i = ib->length_dw; i < ib_size_dw; ++i)
		ib->ptr[i] = 0x0;

	r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
	job->fence = dma_fence_get(f);
	if (r)
		goto err;

	amdgpu_job_free(job);
	if (fence)
		*fence = dma_fence_get(f);
	dma_fence_put(f);
	return 0;

err:
	amdgpu_job_free(job);
	return r;
}

/**
 * uvd_v7_0_enc_get_destroy_msg - generate a UVD ENC destroy msg
 *
 * @adev: amdgpu_device pointer
 * @ring: ring we should submit the msg to
 * @handle: session handle to use
 * @fence: optional fence to return
 *
 * Close up a stream for HW test or if userspace failed to do so
 */
int uvd_v7_0_enc_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle,
				 bool direct, struct dma_fence **fence)
{
	const unsigned ib_size_dw = 16;
	struct amdgpu_job *job;
	struct amdgpu_ib *ib;
	struct dma_fence *f = NULL;
	uint64_t dummy;
	int i, r;

	r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
	if (r)
		return r;

	ib = &job->ibs[0];
	dummy = ib->gpu_addr + 1024;

	ib->length_dw = 0;
	ib->ptr[ib->length_dw++] = 0x00000018;
	ib->ptr[ib->length_dw++] = 0x00000001;
	ib->ptr[ib->length_dw++] = handle;
	ib->ptr[ib->length_dw++] = 0x00000000;
	ib->ptr[ib->length_dw++] = upper_32_bits(dummy);
	ib->ptr[ib->length_dw++] = dummy;

	ib->ptr[ib->length_dw++] = 0x00000014;
	ib->ptr[ib->length_dw++] = 0x00000002;
	ib->ptr[ib->length_dw++] = 0x0000001c;
	ib->ptr[ib->length_dw++] = 0x00000000;
	ib->ptr[ib->length_dw++] = 0x00000000;

	ib->ptr[ib->length_dw++] = 0x00000008;
	ib->ptr[ib->length_dw++] = 0x08000002; /* op close session */

	for (i = ib->length_dw; i < ib_size_dw; ++i)
		ib->ptr[i] = 0x0;

	if (direct) {
		r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
		job->fence = dma_fence_get(f);
		if (r)
			goto err;

		amdgpu_job_free(job);
	} else {
		r = amdgpu_job_submit(job, ring, &ring->adev->vce.entity,
				      AMDGPU_FENCE_OWNER_UNDEFINED, &f);
		if (r)
			goto err;
	}

	if (fence)
		*fence = dma_fence_get(f);
	dma_fence_put(f);
	return 0;

err:
	amdgpu_job_free(job);
	return r;
}

/**
 * uvd_v7_0_enc_ring_test_ib - test if UVD ENC IBs are working
 *
 * @ring: the engine to test on
 *
 */
static int uvd_v7_0_enc_ring_test_ib(struct amdgpu_ring *ring, long timeout)
{
	struct dma_fence *fence = NULL;
	long r;

	r = uvd_v7_0_enc_get_create_msg(ring, 1, NULL);
	if (r) {
		DRM_ERROR("amdgpu: failed to get create msg (%ld).\n", r);
		goto error;
	}

	r = uvd_v7_0_enc_get_destroy_msg(ring, 1, true, &fence);
	if (r) {
		DRM_ERROR("amdgpu: failed to get destroy ib (%ld).\n", r);
		goto error;
	}

	r = dma_fence_wait_timeout(fence, false, timeout);
	if (r == 0) {
		DRM_ERROR("amdgpu: IB test timed out.\n");
		r = -ETIMEDOUT;
	} else if (r < 0) {
		DRM_ERROR("amdgpu: fence wait failed (%ld).\n", r);
	} else {
		DRM_DEBUG("ib test on ring %d succeeded\n", ring->idx);
		r = 0;
	}
error:
	dma_fence_put(fence);
	return r;
}
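
/*
 * IP block callbacks. early_init runs before any hardware is touched:
 * pick the number of ENC rings (one under SR-IOV, two otherwise) and
 * install the ring, ENC ring and IRQ function tables.
 */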
static int uvd_v7_0_early_init(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	if (amdgpu_sriov_vf(adev))
		adev->uvd.num_enc_rings = 1;
	else
		adev->uvd.num_enc_rings = 2;
	uvd_v7_0_set_ring_funcs(adev);
	uvd_v7_0_set_enc_ring_funcs(adev);
	uvd_v7_0_set_irq_funcs(adev);

	return 0;
}
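
/*
 * sw_init: register the UVD and UVD ENC interrupt sources, hand the
 * firmware to the PSP when PSP loading is used, create the ENC scheduler
 * entity and initialize the decode and encode rings.
 */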
static int uvd_v7_0_sw_init(void *handle)
{
	struct amdgpu_ring *ring;
	struct amd_sched_rq *rq;
	int i, r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	/* UVD TRAP */
	r = amdgpu_irq_add_id(adev, AMDGPU_IH_CLIENTID_UVD, 124, &adev->uvd.irq);
	if (r)
		return r;

	/* UVD ENC TRAP */
	for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
		r = amdgpu_irq_add_id(adev, AMDGPU_IH_CLIENTID_UVD, i + 119, &adev->uvd.irq);
		if (r)
			return r;
	}

	r = amdgpu_uvd_sw_init(adev);
	if (r)
		return r;

	if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
		const struct common_firmware_header *hdr;

		hdr = (const struct common_firmware_header *)adev->uvd.fw->data;
		adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].ucode_id = AMDGPU_UCODE_ID_UVD;
		adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].fw = adev->uvd.fw;
		adev->firmware.fw_size +=
			ALIGN(le32_to_cpu(hdr->ucode_size_bytes), PAGE_SIZE);
		DRM_INFO("PSP loading UVD firmware\n");
	}

	ring = &adev->uvd.ring_enc[0];
	rq = &ring->sched.sched_rq[AMD_SCHED_PRIORITY_NORMAL];
	r = amd_sched_entity_init(&ring->sched, &adev->uvd.entity_enc,
				  rq, amdgpu_sched_jobs, NULL);
	if (r) {
		DRM_ERROR("Failed setting up UVD ENC run queue.\n");
		return r;
	}

	r = amdgpu_uvd_resume(adev);
	if (r)
		return r;

	if (!amdgpu_sriov_vf(adev)) {
		ring = &adev->uvd.ring;
		sprintf(ring->name, "uvd");
		r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.irq, 0);
		if (r)
			return r;
	}

	for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
		ring = &adev->uvd.ring_enc[i];
		sprintf(ring->name, "uvd_enc%d", i);
		if (amdgpu_sriov_vf(adev)) {
			ring->use_doorbell = true;

			/* currently only use the first encoding ring for
			 * sriov, so set unused locations for the other
			 * unused rings.
			 */
			if (i == 0)
				ring->doorbell_index = AMDGPU_DOORBELL64_UVD_RING0_1 * 2;
			else
				ring->doorbell_index = AMDGPU_DOORBELL64_UVD_RING2_3 * 2 + 1;
		}
		r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.irq, 0);
		if (r)
			return r;
	}

	r = amdgpu_virt_alloc_mm_table(adev);
	if (r)
		return r;

	return r;
}
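
/* sw_fini: tear down in the reverse order of sw_init. */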
static int uvd_v7_0_sw_fini(void *handle)
{
	int i, r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	amdgpu_virt_free_mm_table(adev);

	r = amdgpu_uvd_suspend(adev);
	if (r)
		return r;

	amd_sched_entity_fini(&adev->uvd.ring_enc[0].sched, &adev->uvd.entity_enc);

	for (i = 0; i < adev->uvd.num_enc_rings; ++i)
		amdgpu_ring_fini(&adev->uvd.ring_enc[i]);

	return amdgpu_uvd_sw_fini(adev);
}
/**
 * uvd_v7_0_hw_init - start and test UVD block
 *
 * @adev: amdgpu_device pointer
 *
 * Initialize the hardware, boot up the VCPU and do some testing
 */
static int uvd_v7_0_hw_init(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	struct amdgpu_ring *ring = &adev->uvd.ring;
	uint32_t tmp;
	int i, r;

	if (amdgpu_sriov_vf(adev))
		r = uvd_v7_0_sriov_start(adev);
	else
		r = uvd_v7_0_start(adev);
	if (r)
		goto done;

	if (!amdgpu_sriov_vf(adev)) {
		ring->ready = true;
		r = amdgpu_ring_test_ring(ring);
		if (r) {
			ring->ready = false;
			goto done;
		}

		r = amdgpu_ring_alloc(ring, 10);
		if (r) {
			DRM_ERROR("amdgpu: ring failed to lock UVD ring (%d).\n", r);
			goto done;
		}

		tmp = PACKET0(SOC15_REG_OFFSET(UVD, 0,
			mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL), 0);
		amdgpu_ring_write(ring, tmp);
		amdgpu_ring_write(ring, 0xFFFFF);

		tmp = PACKET0(SOC15_REG_OFFSET(UVD, 0,
			mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL), 0);
		amdgpu_ring_write(ring, tmp);
		amdgpu_ring_write(ring, 0xFFFFF);

		tmp = PACKET0(SOC15_REG_OFFSET(UVD, 0,
			mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL), 0);
		amdgpu_ring_write(ring, tmp);
		amdgpu_ring_write(ring, 0xFFFFF);

		/* Clear timeout status bits */
		amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, 0,
			mmUVD_SEMA_TIMEOUT_STATUS), 0));
		amdgpu_ring_write(ring, 0x8);

		amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, 0,
			mmUVD_SEMA_CNTL), 0));
		amdgpu_ring_write(ring, 3);

		amdgpu_ring_commit(ring);
	}

	for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
		ring = &adev->uvd.ring_enc[i];
		ring->ready = true;
		r = amdgpu_ring_test_ring(ring);
		if (r) {
			ring->ready = false;
			goto done;
		}
	}

done:
	if (!r)
		DRM_INFO("UVD and UVD ENC initialized successfully.\n");

	return r;
}

/**
 * uvd_v7_0_hw_fini - stop the hardware block
 *
 * @adev: amdgpu_device pointer
 *
 * Stop the UVD block, mark ring as not ready any more
 */
static int uvd_v7_0_hw_fini(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	struct amdgpu_ring *ring = &adev->uvd.ring;

	if (!amdgpu_sriov_vf(adev))
		uvd_v7_0_stop(adev);
	else {
		/* full access mode, so don't touch any UVD register */
		DRM_DEBUG("For SRIOV client, shouldn't do anything.\n");
	}

	ring->ready = false;

	return 0;
}
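
/* suspend: stop the hardware first, then let the common UVD code save state. */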
static int uvd_v7_0_suspend(void *handle)
{
	int r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	r = uvd_v7_0_hw_fini(adev);
	if (r)
		return r;

	return amdgpu_uvd_suspend(adev);
}
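
/* resume: restore UVD state, then bring the hardware back up. */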
static int uvd_v7_0_resume(void *handle)
{
	int r;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	r = amdgpu_uvd_resume(adev);
	if (r)
		return r;

	return uvd_v7_0_hw_init(adev);
}
/**
 * uvd_v7_0_mc_resume - memory controller programming
 *
 * @adev: amdgpu_device pointer
 *
 * Let the UVD memory controller know its offsets
 */
static void uvd_v7_0_mc_resume(struct amdgpu_device *adev)
{
	uint32_t size = AMDGPU_UVD_FIRMWARE_SIZE(adev);
	uint32_t offset;

	if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
		WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
			lower_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
		WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
			upper_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
		offset = 0;
	} else {
		WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
			lower_32_bits(adev->uvd.gpu_addr));
		WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
			upper_32_bits(adev->uvd.gpu_addr));
		offset = size;
	}

	WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0,
			AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
	WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE0, size);

	WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW,
			lower_32_bits(adev->uvd.gpu_addr + offset));
	WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH,
			upper_32_bits(adev->uvd.gpu_addr + offset));
	WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET1, (1 << 21));
	WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE1, AMDGPU_UVD_HEAP_SIZE);

	WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW,
			lower_32_bits(adev->uvd.gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
	WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH,
			upper_32_bits(adev->uvd.gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
	WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET2, (2 << 21));
	WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE2,
			AMDGPU_UVD_STACK_SIZE + (AMDGPU_UVD_SESSION_SIZE * 40));

	WREG32_SOC15(UVD, 0, mmUVD_UDEC_ADDR_CONFIG,
			adev->gfx.config.gb_addr_config);
	WREG32_SOC15(UVD, 0, mmUVD_UDEC_DB_ADDR_CONFIG,
			adev->gfx.config.gb_addr_config);
	WREG32_SOC15(UVD, 0, mmUVD_UDEC_DBW_ADDR_CONFIG,
			adev->gfx.config.gb_addr_config);

	WREG32_SOC15(UVD, 0, mmUVD_GP_SCRATCH4, adev->uvd.max_handles);
}
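
/*
 * Hand the prepared init table to the MMSCH (multimedia scheduler) under
 * SR-IOV: point it at the descriptor, kick off initialization via the
 * mailbox and poll the response register until it reports completion.
 */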
static int uvd_v7_0_mmsch_start(struct amdgpu_device *adev,
				struct amdgpu_mm_table *table)
{
	uint32_t data = 0, loop;
	uint64_t addr = table->gpu_addr;
	struct mmsch_v1_0_init_header *header = (struct mmsch_v1_0_init_header *)table->cpu_addr;
	uint32_t size;

	size = header->header_size + header->vce_table_size + header->uvd_table_size;

	/* 1, write to vce_mmsch_vf_ctx_addr_lo/hi register with GPU mc addr of memory descriptor location */
	WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_ADDR_LO, lower_32_bits(addr));
	WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_ADDR_HI, upper_32_bits(addr));

	/* 2, update vmid of descriptor */
	data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_VMID);
	data &= ~VCE_MMSCH_VF_VMID__VF_CTX_VMID_MASK;
	data |= (0 << VCE_MMSCH_VF_VMID__VF_CTX_VMID__SHIFT); /* use domain0 for MM scheduler */
	WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_VMID, data);

	/* 3, notify mmsch about the size of this descriptor */
	WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_CTX_SIZE, size);

	/* 4, set resp to zero */
	WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP, 0);

	WDOORBELL32(adev->uvd.ring_enc[0].doorbell_index, 0);
	adev->wb.wb[adev->uvd.ring_enc[0].wptr_offs] = 0;
	adev->uvd.ring_enc[0].wptr = 0;
	adev->uvd.ring_enc[0].wptr_old = 0;

	/* 5, kick off the initialization and wait until VCE_MMSCH_VF_MAILBOX_RESP becomes non-zero */
	WREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_HOST, 0x10000001);

	data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP);
	loop = 1000;
	while ((data & 0x10000002) != 0x10000002) {
		udelay(10);
		data = RREG32_SOC15(VCE, 0, mmVCE_MMSCH_VF_MAILBOX_RESP);
		loop--;
		if (!loop)
			break;
	}

	if (!loop) {
		dev_err(adev->dev, "failed to init MMSCH, mmVCE_MMSCH_VF_MAILBOX_RESP = %x\n", data);
		return -EBUSY;
	}

	return 0;
}
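
/*
 * SR-IOV start path: instead of programming the UVD registers directly,
 * build a table of register writes/polls in the shared mm table and let
 * the MMSCH replay it (see uvd_v7_0_mmsch_start above).
 */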
static int uvd_v7_0_sriov_start(struct amdgpu_device *adev)
{
	struct amdgpu_ring *ring;
	uint32_t offset, size, tmp;
	uint32_t table_size = 0;
	struct mmsch_v1_0_cmd_direct_write direct_wt = { {0} };
	struct mmsch_v1_0_cmd_direct_read_modify_write direct_rd_mod_wt = { {0} };
	struct mmsch_v1_0_cmd_direct_polling direct_poll = { {0} };
	struct mmsch_v1_0_cmd_end end = { {0} };
	uint32_t *init_table = adev->virt.mm_table.cpu_addr;
	struct mmsch_v1_0_init_header *header = (struct mmsch_v1_0_init_header *)init_table;

	direct_wt.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_WRITE;
	direct_rd_mod_wt.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_READ_MODIFY_WRITE;
	direct_poll.cmd_header.command_type = MMSCH_COMMAND__DIRECT_REG_POLLING;
	end.cmd_header.command_type = MMSCH_COMMAND__END;

	if (header->uvd_table_offset == 0 && header->uvd_table_size == 0) {
		header->version = MMSCH_VERSION;
		header->header_size = sizeof(struct mmsch_v1_0_init_header) >> 2;

		if (header->vce_table_offset == 0 && header->vce_table_size == 0)
			header->uvd_table_offset = header->header_size;
		else
			header->uvd_table_offset = header->vce_table_size + header->vce_table_offset;

		init_table += header->uvd_table_offset;

		ring = &adev->uvd.ring;
		ring->wptr = 0;
		size = AMDGPU_GPU_PAGE_ALIGN(adev->uvd.fw->size + 4);

		MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS),
						   0xFFFFFFFF, 0x00000004);
		/* mc resume*/
		if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
			MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
						    lower_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
			MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
						    upper_32_bits(adev->firmware.ucode[AMDGPU_UCODE_ID_UVD].mc_addr));
			offset = 0;
		} else {
			MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW),
						    lower_32_bits(adev->uvd.gpu_addr));
			MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH),
						    upper_32_bits(adev->uvd.gpu_addr));
			offset = size;
		}

		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0),
					    AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_SIZE0), size);

		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW),
					    lower_32_bits(adev->uvd.gpu_addr + offset));
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH),
					    upper_32_bits(adev->uvd.gpu_addr + offset));
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_OFFSET1), (1 << 21));
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_SIZE1), AMDGPU_UVD_HEAP_SIZE);

		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW),
					    lower_32_bits(adev->uvd.gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH),
					    upper_32_bits(adev->uvd.gpu_addr + offset + AMDGPU_UVD_HEAP_SIZE));
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_OFFSET2), (2 << 21));
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CACHE_SIZE2),
					    AMDGPU_UVD_STACK_SIZE + (AMDGPU_UVD_SESSION_SIZE * 40));

		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_GP_SCRATCH4), adev->uvd.max_handles);
		/* mc resume end*/

		/* disable clock gating */
		MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_CGC_CTRL),
						   ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK, 0);

		/* disable interrupt */
		MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
						   ~UVD_MASTINT_EN__VCPU_EN_MASK, 0);

		/* stall UMC and register bus before resetting VCPU */
		MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
						   ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
						   UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);

		/* put LMI, VCPU, RBC etc... into reset */
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
					    (uint32_t)(UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
						       UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
						       UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
						       UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
						       UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
						       UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
						       UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
						       UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK));

		/* initialize UVD memory controller */
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL),
					    (uint32_t)((0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
						       UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
						       UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
						       UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
						       UVD_LMI_CTRL__REQ_MODE_MASK |
						       0x00100000L));

		/* take all subblocks out of reset, except VCPU */
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
					    UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);

		/* enable VCPU clock */
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CNTL),
					    UVD_VCPU_CNTL__CLK_EN_MASK);

		/* enable master interrupt */
		MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
						   ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
						   (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));

		/* clear the bit 4 of UVD_STATUS */
		MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS),
						   ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT), 0);

		/* force RBC into idle state */
		size = order_base_2(ring->ring_size);
		tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, size);
		tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_RB_CNTL), tmp);

		ring = &adev->uvd.ring_enc[0];
		ring->wptr = 0;
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_RB_BASE_LO), ring->gpu_addr);
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_RB_BASE_HI), upper_32_bits(ring->gpu_addr));
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_RB_SIZE), ring->ring_size / 4);

		/* boot up the VCPU */
		MMSCH_V1_0_INSERT_DIRECT_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0);

		/* enable UMC */
		MMSCH_V1_0_INSERT_DIRECT_RD_MOD_WT(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
						   ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK, 0);

		MMSCH_V1_0_INSERT_DIRECT_POLL(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS), 0x02, 0x02);

		/* add end packet */
		memcpy((void *)init_table, &end, sizeof(struct mmsch_v1_0_cmd_end));
		table_size += sizeof(struct mmsch_v1_0_cmd_end) / 4;
		header->uvd_table_size = table_size;
	}
	return uvd_v7_0_mmsch_start(adev, &adev->virt.mm_table);
}
/**
 * uvd_v7_0_start - start UVD block
 *
 * @adev: amdgpu_device pointer
 *
 * Setup and start the UVD block
 */
static int uvd_v7_0_start(struct amdgpu_device *adev)
{
	struct amdgpu_ring *ring = &adev->uvd.ring;
	uint32_t rb_bufsz, tmp;
	uint32_t lmi_swap_cntl;
	uint32_t mp_swap_cntl;
	int i, j, r;

	/* disable DPG */
	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_POWER_STATUS), 0,
			~UVD_POWER_STATUS__UVD_PG_MODE_MASK);

	/* disable byte swapping */
	lmi_swap_cntl = 0;
	mp_swap_cntl = 0;

	uvd_v7_0_mc_resume(adev);

	/* disable clock gating */
	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_CGC_CTRL), 0,
			~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK);

	/* disable interrupt */
	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN), 0,
			~UVD_MASTINT_EN__VCPU_EN_MASK);

	/* stall UMC and register bus before resetting VCPU */
	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
			UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
			~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
	mdelay(1);

	/* put LMI, VCPU, RBC etc... into reset */
	WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
		UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
		UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
		UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
		UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
		UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
		UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
		UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
		UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
	mdelay(5);

	/* initialize UVD memory controller */
	WREG32_SOC15(UVD, 0, mmUVD_LMI_CTRL,
		(0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
		UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
		UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
		UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
		UVD_LMI_CTRL__REQ_MODE_MASK |
		0x00100000L);

#ifdef __BIG_ENDIAN
	/* swap (8 in 32) RB and IB */
	lmi_swap_cntl = 0xa;
	mp_swap_cntl = 0;
#endif
	WREG32_SOC15(UVD, 0, mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
	WREG32_SOC15(UVD, 0, mmUVD_MP_SWAP_CNTL, mp_swap_cntl);

	WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA0, 0x40c2040);
	WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA1, 0x0);
	WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB0, 0x40c2040);
	WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB1, 0x0);
	WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_ALU, 0);
	WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUX, 0x88);

	/* take all subblocks out of reset, except VCPU */
	WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
			UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
	mdelay(5);

	/* enable VCPU clock */
	WREG32_SOC15(UVD, 0, mmUVD_VCPU_CNTL,
			UVD_VCPU_CNTL__CLK_EN_MASK);

	/* enable UMC */
	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
			~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);

	/* boot up the VCPU */
	WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET, 0);
	mdelay(10);

	for (i = 0; i < 10; ++i) {
		uint32_t status;

		for (j = 0; j < 100; ++j) {
			status = RREG32_SOC15(UVD, 0, mmUVD_STATUS);
			if (status & 2)
				break;
			mdelay(10);
		}
		r = 0;
		if (status & 2)
			break;

		DRM_ERROR("UVD not responding, trying to reset the VCPU!!!\n");
		WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
				UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
				~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
		mdelay(10);
		WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0,
				~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
		mdelay(10);
		r = -1;
	}

	if (r) {
		DRM_ERROR("UVD not responding, giving up!!!\n");
		return r;
	}
	/* enable master interrupt */
	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
		(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
		~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));

	/* clear the bit 4 of UVD_STATUS */
	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS), 0,
			~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));

	/* force RBC into idle state */
	rb_bufsz = order_base_2(ring->ring_size);
	tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
	WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, tmp);

	/* set the write pointer delay */
	WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR_CNTL, 0);

	/* set the wb address */
	WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR_ADDR,
			(upper_32_bits(ring->gpu_addr) >> 2));

	/* program the RB_BASE for ring buffer */
	WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
			lower_32_bits(ring->gpu_addr));
	WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
			upper_32_bits(ring->gpu_addr));

	/* Initialize the ring buffer's read and write pointers */
	WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR, 0);

	ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
	WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR,
			lower_32_bits(ring->wptr));

	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_RB_CNTL), 0,
			~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);

	ring = &adev->uvd.ring_enc[0];
	WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
	WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
	WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO, ring->gpu_addr);
	WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
	WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE, ring->ring_size / 4);

	ring = &adev->uvd.ring_enc[1];
	WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
	WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
	WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO2, ring->gpu_addr);
	WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
	WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE2, ring->ring_size / 4);

	return 0;
}
/**
 * uvd_v7_0_stop - stop UVD block
 *
 * @adev: amdgpu_device pointer
 *
 * stop the UVD block
 */
static void uvd_v7_0_stop(struct amdgpu_device *adev)
{
	/* force RBC into idle state */
	WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, 0x11010101);

	/* Stall UMC and register bus before resetting VCPU */
	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
			UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
			~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
	mdelay(1);

	/* put VCPU into reset */
	WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
			UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
	mdelay(5);

	/* disable VCPU clock */
	WREG32_SOC15(UVD, 0, mmUVD_VCPU_CNTL, 0x0);

	/* Unstall UMC and register bus */
	WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
			~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
}
/**
 * uvd_v7_0_ring_emit_fence - emit a fence & trap command
 *
 * @ring: amdgpu_ring pointer
 * @fence: fence to emit
 *
 * Write a fence and a trap command to the ring.
 */
static void uvd_v7_0_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
				     unsigned flags)
{
	WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);

	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_CONTEXT_ID), 0));
	amdgpu_ring_write(ring, seq);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
	amdgpu_ring_write(ring, addr & 0xffffffff);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
	amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
	amdgpu_ring_write(ring, 0);

	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
	amdgpu_ring_write(ring, 0);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
	amdgpu_ring_write(ring, 0);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
	amdgpu_ring_write(ring, 2);
}

/**
 * uvd_v7_0_enc_ring_emit_fence - emit an enc fence & trap command
 *
 * @ring: amdgpu_ring pointer
 * @fence: fence to emit
 *
 * Write an enc fence and a trap command to the ring.
 */
static void uvd_v7_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
					 u64 seq, unsigned flags)
{
	WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);

	amdgpu_ring_write(ring, HEVC_ENC_CMD_FENCE);
	amdgpu_ring_write(ring, addr);
	amdgpu_ring_write(ring, upper_32_bits(addr));
	amdgpu_ring_write(ring, seq);
	amdgpu_ring_write(ring, HEVC_ENC_CMD_TRAP);
}
/**
 * uvd_v7_0_ring_emit_hdp_flush - emit an hdp flush
 *
 * @ring: amdgpu_ring pointer
 *
 * Emits an hdp flush.
 */
static void uvd_v7_0_ring_emit_hdp_flush(struct amdgpu_ring *ring)
{
	amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(NBIF, 0,
		mmHDP_MEM_COHERENCY_FLUSH_CNTL), 0));
	amdgpu_ring_write(ring, 0);
}

/**
 * uvd_v7_0_ring_emit_hdp_invalidate - emit an hdp invalidate
 *
 * @ring: amdgpu_ring pointer
 *
 * Emits an hdp invalidate.
 */
static void uvd_v7_0_ring_emit_hdp_invalidate(struct amdgpu_ring *ring)
{
	amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(HDP, 0, mmHDP_READ_CACHE_INVALIDATE), 0));
	amdgpu_ring_write(ring, 1);
}
/**
 * uvd_v7_0_ring_test_ring - register write test
 *
 * @ring: amdgpu_ring pointer
 *
 * Test if we can successfully write to the context register
 */
static int uvd_v7_0_ring_test_ring(struct amdgpu_ring *ring)
{
	struct amdgpu_device *adev = ring->adev;
	uint32_t tmp = 0;
	unsigned i;
	int r;

	WREG32_SOC15(UVD, 0, mmUVD_CONTEXT_ID, 0xCAFEDEAD);
	r = amdgpu_ring_alloc(ring, 3);
	if (r) {
		DRM_ERROR("amdgpu: cp failed to lock ring %d (%d).\n",
			  ring->idx, r);
		return r;
	}
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_CONTEXT_ID), 0));
	amdgpu_ring_write(ring, 0xDEADBEEF);
	amdgpu_ring_commit(ring);
	for (i = 0; i < adev->usec_timeout; i++) {
		tmp = RREG32_SOC15(UVD, 0, mmUVD_CONTEXT_ID);
		if (tmp == 0xDEADBEEF)
			break;
		DRM_UDELAY(1);
	}

	if (i < adev->usec_timeout) {
		DRM_DEBUG("ring test on %d succeeded in %d usecs\n",
			  ring->idx, i);
	} else {
		DRM_ERROR("amdgpu: ring %d test failed (0x%08X)\n",
			  ring->idx, tmp);
		r = -EINVAL;
	}
	return r;
}

/**
 * uvd_v7_0_ring_emit_ib - execute indirect buffer
 *
 * @ring: amdgpu_ring pointer
 * @ib: indirect buffer to execute
 *
 * Write ring commands to execute the indirect buffer
 */
static void uvd_v7_0_ring_emit_ib(struct amdgpu_ring *ring,
				  struct amdgpu_ib *ib,
				  unsigned vm_id, bool ctx_switch)
{
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_VMID), 0));
	amdgpu_ring_write(ring, vm_id);

	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_LOW), 0));
	amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH), 0));
	amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_IB_SIZE), 0));
	amdgpu_ring_write(ring, ib->length_dw);
}

/**
 * uvd_v7_0_enc_ring_emit_ib - enc execute indirect buffer
 *
 * @ring: amdgpu_ring pointer
 * @ib: indirect buffer to execute
 *
 * Write enc ring commands to execute the indirect buffer
 */
static void uvd_v7_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
		struct amdgpu_ib *ib, unsigned int vm_id, bool ctx_switch)
{
	amdgpu_ring_write(ring, HEVC_ENC_CMD_IB_VM);
	amdgpu_ring_write(ring, vm_id);
	amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
	amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
	amdgpu_ring_write(ring, ib->length_dw);
}
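
/*
 * Helpers used by the decode-ring VM flush below: emit a register write
 * or a masked register wait as GPCOM packets through the VCPU DATA/CMD
 * registers.
 */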
static void uvd_v7_0_vm_reg_write(struct amdgpu_ring *ring,
				uint32_t data0, uint32_t data1)
{
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
	amdgpu_ring_write(ring, data0);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
	amdgpu_ring_write(ring, data1);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
	amdgpu_ring_write(ring, 8);
}

static void uvd_v7_0_vm_reg_wait(struct amdgpu_ring *ring,
				uint32_t data0, uint32_t data1, uint32_t mask)
{
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
	amdgpu_ring_write(ring, data0);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
	amdgpu_ring_write(ring, data1);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GP_SCRATCH8), 0));
	amdgpu_ring_write(ring, mask);
	amdgpu_ring_write(ring,
		PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
	amdgpu_ring_write(ring, 12);
}
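
/*
 * Emit a VM flush on the decode ring: write the page directory address
 * into the VM hub context registers, wait for it to stick, then request
 * a TLB invalidation and wait for the ack.
 */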
static void uvd_v7_0_ring_emit_vm_flush(struct amdgpu_ring *ring,
					unsigned vm_id, uint64_t pd_addr)
{
	struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
	uint32_t req = ring->adev->gart.gart_funcs->get_invalidate_req(vm_id);
	uint32_t data0, data1, mask;
	unsigned eng = ring->vm_inv_eng;

	pd_addr = amdgpu_gart_get_vm_pde(ring->adev, pd_addr);
	pd_addr |= AMDGPU_PTE_VALID;

	data0 = (hub->ctx0_ptb_addr_hi32 + vm_id * 2) << 2;
	data1 = upper_32_bits(pd_addr);
	uvd_v7_0_vm_reg_write(ring, data0, data1);

	data0 = (hub->ctx0_ptb_addr_lo32 + vm_id * 2) << 2;
	data1 = lower_32_bits(pd_addr);
	uvd_v7_0_vm_reg_write(ring, data0, data1);

	data0 = (hub->ctx0_ptb_addr_lo32 + vm_id * 2) << 2;
	data1 = lower_32_bits(pd_addr);
	mask = 0xffffffff;
	uvd_v7_0_vm_reg_wait(ring, data0, data1, mask);

	/* flush TLB */
	data0 = (hub->vm_inv_eng0_req + eng) << 2;
	data1 = req;
	uvd_v7_0_vm_reg_write(ring, data0, data1);

	/* wait for flush */
	data0 = (hub->vm_inv_eng0_ack + eng) << 2;
	data1 = 1 << vm_id;
	mask = 1 << vm_id;
	uvd_v7_0_vm_reg_wait(ring, data0, data1, mask);
}

static void uvd_v7_0_enc_ring_insert_end(struct amdgpu_ring *ring)
{
	amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
}

static void uvd_v7_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
					    unsigned int vm_id, uint64_t pd_addr)
{
	struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
	uint32_t req = ring->adev->gart.gart_funcs->get_invalidate_req(vm_id);
	unsigned eng = ring->vm_inv_eng;

	pd_addr = amdgpu_gart_get_vm_pde(ring->adev, pd_addr);
	pd_addr |= AMDGPU_PTE_VALID;

	amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WRITE);
	amdgpu_ring_write(ring, (hub->ctx0_ptb_addr_hi32 + vm_id * 2) << 2);
	amdgpu_ring_write(ring, upper_32_bits(pd_addr));

	amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WRITE);
	amdgpu_ring_write(ring, (hub->ctx0_ptb_addr_lo32 + vm_id * 2) << 2);
	amdgpu_ring_write(ring, lower_32_bits(pd_addr));

	amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WAIT);
	amdgpu_ring_write(ring, (hub->ctx0_ptb_addr_lo32 + vm_id * 2) << 2);
	amdgpu_ring_write(ring, 0xffffffff);
	amdgpu_ring_write(ring, lower_32_bits(pd_addr));

	/* flush TLB */
	amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WRITE);
	amdgpu_ring_write(ring, (hub->vm_inv_eng0_req + eng) << 2);
	amdgpu_ring_write(ring, req);

	/* wait for flush */
	amdgpu_ring_write(ring, HEVC_ENC_CMD_REG_WAIT);
	amdgpu_ring_write(ring, (hub->vm_inv_eng0_ack + eng) << 2);
	amdgpu_ring_write(ring, 1 << vm_id);
	amdgpu_ring_write(ring, 1 << vm_id);
}
#if 0
static bool uvd_v7_0_is_idle(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
}

static int uvd_v7_0_wait_for_idle(void *handle)
{
	unsigned i;
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	for (i = 0; i < adev->usec_timeout; i++) {
		if (uvd_v7_0_is_idle(handle))
			return 0;
	}
	return -ETIMEDOUT;
}

#define AMDGPU_UVD_STATUS_BUSY_MASK 0xfd
static bool uvd_v7_0_check_soft_reset(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	u32 srbm_soft_reset = 0;
	u32 tmp = RREG32(mmSRBM_STATUS);

	if (REG_GET_FIELD(tmp, SRBM_STATUS, UVD_RQ_PENDING) ||
	    REG_GET_FIELD(tmp, SRBM_STATUS, UVD_BUSY) ||
	    (RREG32_SOC15(UVD, 0, mmUVD_STATUS) &
		    AMDGPU_UVD_STATUS_BUSY_MASK))
		srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset,
				SRBM_SOFT_RESET, SOFT_RESET_UVD, 1);

	if (srbm_soft_reset) {
		adev->uvd.srbm_soft_reset = srbm_soft_reset;
		return true;
	} else {
		adev->uvd.srbm_soft_reset = 0;
		return false;
	}
}

static int uvd_v7_0_pre_soft_reset(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	if (!adev->uvd.srbm_soft_reset)
		return 0;

	uvd_v7_0_stop(adev);
	return 0;
}

static int uvd_v7_0_soft_reset(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	u32 srbm_soft_reset;

	if (!adev->uvd.srbm_soft_reset)
		return 0;
	srbm_soft_reset = adev->uvd.srbm_soft_reset;

	if (srbm_soft_reset) {
		u32 tmp;

		tmp = RREG32(mmSRBM_SOFT_RESET);
		tmp |= srbm_soft_reset;
		dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
		WREG32(mmSRBM_SOFT_RESET, tmp);
		tmp = RREG32(mmSRBM_SOFT_RESET);

		udelay(50);

		tmp &= ~srbm_soft_reset;
		WREG32(mmSRBM_SOFT_RESET, tmp);
		tmp = RREG32(mmSRBM_SOFT_RESET);

		/* Wait a little for things to settle down */
		udelay(50);
	}

	return 0;
}

static int uvd_v7_0_post_soft_reset(void *handle)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	if (!adev->uvd.srbm_soft_reset)
		return 0;

	mdelay(5);

	return uvd_v7_0_start(adev);
}
#endif
static int uvd_v7_0_set_interrupt_state(struct amdgpu_device *adev,
					struct amdgpu_irq_src *source,
					unsigned type,
					enum amdgpu_interrupt_state state)
{
	// TODO
	return 0;
}
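
/*
 * UVD trap handler: src_id 124 is the decode ring, 119 and 120 are the
 * two ENC rings (ENC ring 1 is not used under SR-IOV).
 */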
static int uvd_v7_0_process_interrupt(struct amdgpu_device *adev,
				      struct amdgpu_irq_src *source,
				      struct amdgpu_iv_entry *entry)
{
	DRM_DEBUG("IH: UVD TRAP\n");

	switch (entry->src_id) {
	case 124:
		amdgpu_fence_process(&adev->uvd.ring);
		break;
	case 119:
		amdgpu_fence_process(&adev->uvd.ring_enc[0]);
		break;
	case 120:
		if (!amdgpu_sriov_vf(adev))
			amdgpu_fence_process(&adev->uvd.ring_enc[1]);
		break;
	default:
		DRM_ERROR("Unhandled interrupt: %d %d\n",
			  entry->src_id, entry->src_data[0]);
		break;
	}

	return 0;
}
#if 0
static void uvd_v7_0_set_sw_clock_gating(struct amdgpu_device *adev)
{
	uint32_t data, data1, data2, suvd_flags;

	data = RREG32_SOC15(UVD, 0, mmUVD_CGC_CTRL);
	data1 = RREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_GATE);
	data2 = RREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_CTRL);

	data &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK |
		  UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);

	suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
		     UVD_SUVD_CGC_GATE__SIT_MASK |
		     UVD_SUVD_CGC_GATE__SMP_MASK |
		     UVD_SUVD_CGC_GATE__SCM_MASK |
		     UVD_SUVD_CGC_GATE__SDB_MASK;

	data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
		(1 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_GATE_DLY_TIMER)) |
		(4 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_OFF_DELAY));

	data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
		  UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
		  UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
		  UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
		  UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
		  UVD_CGC_CTRL__SYS_MODE_MASK |
		  UVD_CGC_CTRL__UDEC_MODE_MASK |
		  UVD_CGC_CTRL__MPEG2_MODE_MASK |
		  UVD_CGC_CTRL__REGS_MODE_MASK |
		  UVD_CGC_CTRL__RBC_MODE_MASK |
		  UVD_CGC_CTRL__LMI_MC_MODE_MASK |
		  UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
		  UVD_CGC_CTRL__IDCT_MODE_MASK |
		  UVD_CGC_CTRL__MPRD_MODE_MASK |
		  UVD_CGC_CTRL__MPC_MODE_MASK |
		  UVD_CGC_CTRL__LBSI_MODE_MASK |
		  UVD_CGC_CTRL__LRBBM_MODE_MASK |
		  UVD_CGC_CTRL__WCB_MODE_MASK |
		  UVD_CGC_CTRL__VCPU_MODE_MASK |
		  UVD_CGC_CTRL__JPEG_MODE_MASK |
		  UVD_CGC_CTRL__JPEG2_MODE_MASK |
		  UVD_CGC_CTRL__SCPU_MODE_MASK);
	data2 &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK |
		   UVD_SUVD_CGC_CTRL__SIT_MODE_MASK |
		   UVD_SUVD_CGC_CTRL__SMP_MODE_MASK |
		   UVD_SUVD_CGC_CTRL__SCM_MODE_MASK |
		   UVD_SUVD_CGC_CTRL__SDB_MODE_MASK);
	data1 |= suvd_flags;

	WREG32_SOC15(UVD, 0, mmUVD_CGC_CTRL, data);
	WREG32_SOC15(UVD, 0, mmUVD_CGC_GATE, 0);
	WREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_GATE, data1);
	WREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_CTRL, data2);
}

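/**
 * uvd_v7_0_set_hw_clock_gating - enable hardware-controlled clock gating
 *
 * @adev: amdgpu_device pointer
 *
 * Sets the coarse CGC gate bits and the SUVD gate bits so the listed
 * UVD sub-blocks can be clock gated by the hardware.
 */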
static void uvd_v7_0_set_hw_clock_gating(struct amdgpu_device *adev)
{
	uint32_t data, data1, cgc_flags, suvd_flags;

	data = RREG32_SOC15(UVD, 0, mmUVD_CGC_GATE);
	data1 = RREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_GATE);

	cgc_flags = UVD_CGC_GATE__SYS_MASK |
		    UVD_CGC_GATE__UDEC_MASK |
		    UVD_CGC_GATE__MPEG2_MASK |
		    UVD_CGC_GATE__RBC_MASK |
		    UVD_CGC_GATE__LMI_MC_MASK |
		    UVD_CGC_GATE__IDCT_MASK |
		    UVD_CGC_GATE__MPRD_MASK |
		    UVD_CGC_GATE__MPC_MASK |
		    UVD_CGC_GATE__LBSI_MASK |
		    UVD_CGC_GATE__LRBBM_MASK |
		    UVD_CGC_GATE__UDEC_RE_MASK |
		    UVD_CGC_GATE__UDEC_CM_MASK |
		    UVD_CGC_GATE__UDEC_IT_MASK |
		    UVD_CGC_GATE__UDEC_DB_MASK |
		    UVD_CGC_GATE__UDEC_MP_MASK |
		    UVD_CGC_GATE__WCB_MASK |
		    UVD_CGC_GATE__VCPU_MASK |
		    UVD_CGC_GATE__SCPU_MASK |
		    UVD_CGC_GATE__JPEG_MASK |
		    UVD_CGC_GATE__JPEG2_MASK;

	suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
		     UVD_SUVD_CGC_GATE__SIT_MASK |
		     UVD_SUVD_CGC_GATE__SMP_MASK |
		     UVD_SUVD_CGC_GATE__SCM_MASK |
		     UVD_SUVD_CGC_GATE__SDB_MASK;

	data |= cgc_flags;
	data1 |= suvd_flags;

	WREG32_SOC15(UVD, 0, mmUVD_CGC_GATE, data);
	WREG32_SOC15(UVD, 0, mmUVD_SUVD_CGC_GATE, data1);
}

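/**
 * uvd_v7_0_set_bypass_mode - toggle the DCLK/VCLK DFS bypass
 *
 * @adev: amdgpu_device pointer
 * @enable: enable or disable bypass
 *
 * Sets or clears the BYPASSDCLK and BYPASSVCLK bits in GCK_DFS_BYPASS_CNTL.
 */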
static void uvd_v7_0_set_bypass_mode(struct amdgpu_device *adev, bool enable)
{
	u32 tmp = RREG32_SMC(ixGCK_DFS_BYPASS_CNTL);

	if (enable)
		tmp |= (GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
			GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);
	else
		tmp &= ~(GCK_DFS_BYPASS_CNTL__BYPASSDCLK_MASK |
			 GCK_DFS_BYPASS_CNTL__BYPASSVCLK_MASK);

	WREG32_SMC(ixGCK_DFS_BYPASS_CNTL, tmp);
}

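/*
 * When gating is requested this selects SW-controlled clock gating; when
 * ungating it only waits for the block to go idle (the HW gating call is
 * left commented out).
 */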
static int uvd_v7_0_set_clockgating_state(void *handle,
					  enum amd_clockgating_state state)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
	bool enable = (state == AMD_CG_STATE_GATE);

	uvd_v7_0_set_bypass_mode(adev, enable);

	if (!(adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG))
		return 0;

	if (enable) {
		/* disable HW gating and enable SW gating */
		uvd_v7_0_set_sw_clock_gating(adev);
	} else {
		/* wait for STATUS to clear */
		if (uvd_v7_0_wait_for_idle(handle))
			return -EBUSY;

		/* enable HW gates because UVD is idle */
		/* uvd_v7_0_set_hw_clock_gating(adev); */
	}

	return 0;
}

static int uvd_v7_0_set_powergating_state(void *handle,
					  enum amd_powergating_state state)
{
	/* This doesn't actually powergate the UVD block.
	 * That's done in the dpm code via the SMC.  This
	 * function only re-inits the block as necessary; the
	 * actual gating still happens in the dpm code.  We
	 * should revisit this when there is a cleaner line
	 * between the SMC and the hw blocks.
	 */
	struct amdgpu_device *adev = (struct amdgpu_device *)handle;

	if (!(adev->pg_flags & AMD_PG_SUPPORT_UVD))
		return 0;

	WREG32_SOC15(UVD, 0, mmUVD_POWER_STATUS, UVD_POWER_STATUS__UVD_PG_EN_MASK);

	if (state == AMD_PG_STATE_GATE) {
		uvd_v7_0_stop(adev);
		return 0;
	} else {
		return uvd_v7_0_start(adev);
	}
}
#endif

static int uvd_v7_0_set_clockgating_state(void *handle,
					  enum amd_clockgating_state state)
{
	/* needed for driver unload */
	return 0;
}

const struct amd_ip_funcs uvd_v7_0_ip_funcs = {
	.name = "uvd_v7_0",
	.early_init = uvd_v7_0_early_init,
	.late_init = NULL,
	.sw_init = uvd_v7_0_sw_init,
	.sw_fini = uvd_v7_0_sw_fini,
	.hw_init = uvd_v7_0_hw_init,
	.hw_fini = uvd_v7_0_hw_fini,
	.suspend = uvd_v7_0_suspend,
	.resume = uvd_v7_0_resume,
	.is_idle = NULL /* uvd_v7_0_is_idle */,
	.wait_for_idle = NULL /* uvd_v7_0_wait_for_idle */,
	.check_soft_reset = NULL /* uvd_v7_0_check_soft_reset */,
	.pre_soft_reset = NULL /* uvd_v7_0_pre_soft_reset */,
	.soft_reset = NULL /* uvd_v7_0_soft_reset */,
	.post_soft_reset = NULL /* uvd_v7_0_post_soft_reset */,
	.set_clockgating_state = uvd_v7_0_set_clockgating_state,
	.set_powergating_state = NULL /* uvd_v7_0_set_powergating_state */,
};

static const struct amdgpu_ring_funcs uvd_v7_0_ring_vm_funcs = {
	.type = AMDGPU_RING_TYPE_UVD,
	.align_mask = 0xf,
	.nop = PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_NO_OP), 0),
	.support_64bit_ptrs = false,
	.vmhub = AMDGPU_MMHUB,
	.get_rptr = uvd_v7_0_ring_get_rptr,
	.get_wptr = uvd_v7_0_ring_get_wptr,
	.set_wptr = uvd_v7_0_ring_set_wptr,
	.emit_frame_size =
		2 + /* uvd_v7_0_ring_emit_hdp_flush */
		2 + /* uvd_v7_0_ring_emit_hdp_invalidate */
		34 + /* uvd_v7_0_ring_emit_vm_flush */
		14 + 14, /* uvd_v7_0_ring_emit_fence x2 vm fence */
	.emit_ib_size = 8, /* uvd_v7_0_ring_emit_ib */
	.emit_ib = uvd_v7_0_ring_emit_ib,
	.emit_fence = uvd_v7_0_ring_emit_fence,
	.emit_vm_flush = uvd_v7_0_ring_emit_vm_flush,
	.emit_hdp_flush = uvd_v7_0_ring_emit_hdp_flush,
	.emit_hdp_invalidate = uvd_v7_0_ring_emit_hdp_invalidate,
	.test_ring = uvd_v7_0_ring_test_ring,
	.test_ib = amdgpu_uvd_ring_test_ib,
	.insert_nop = amdgpu_ring_insert_nop,
	.pad_ib = amdgpu_ring_generic_pad_ib,
	.begin_use = amdgpu_uvd_ring_begin_use,
	.end_use = amdgpu_uvd_ring_end_use,
};

static const struct amdgpu_ring_funcs uvd_v7_0_enc_ring_vm_funcs = {
	.type = AMDGPU_RING_TYPE_UVD_ENC,
	.align_mask = 0x3f,
	.nop = HEVC_ENC_CMD_NO_OP,
	.support_64bit_ptrs = false,
	.vmhub = AMDGPU_MMHUB,
	.get_rptr = uvd_v7_0_enc_ring_get_rptr,
	.get_wptr = uvd_v7_0_enc_ring_get_wptr,
	.set_wptr = uvd_v7_0_enc_ring_set_wptr,
	.emit_frame_size =
		17 + /* uvd_v7_0_enc_ring_emit_vm_flush */
		5 + 5 + /* uvd_v7_0_enc_ring_emit_fence x2 vm fence */
		1, /* uvd_v7_0_enc_ring_insert_end */
	.emit_ib_size = 5, /* uvd_v7_0_enc_ring_emit_ib */
	.emit_ib = uvd_v7_0_enc_ring_emit_ib,
	.emit_fence = uvd_v7_0_enc_ring_emit_fence,
	.emit_vm_flush = uvd_v7_0_enc_ring_emit_vm_flush,
	.test_ring = uvd_v7_0_enc_ring_test_ring,
	.test_ib = uvd_v7_0_enc_ring_test_ib,
	.insert_nop = amdgpu_ring_insert_nop,
	.insert_end = uvd_v7_0_enc_ring_insert_end,
	.pad_ib = amdgpu_ring_generic_pad_ib,
	.begin_use = amdgpu_uvd_ring_begin_use,
	.end_use = amdgpu_uvd_ring_end_use,
};

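/* Install the VM-mode ring functions on the decode and encode rings. */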
static void uvd_v7_0_set_ring_funcs(struct amdgpu_device *adev)
{
	adev->uvd.ring.funcs = &uvd_v7_0_ring_vm_funcs;
	DRM_INFO("UVD is enabled in VM mode\n");
}

static void uvd_v7_0_set_enc_ring_funcs(struct amdgpu_device *adev)
{
	int i;

	for (i = 0; i < adev->uvd.num_enc_rings; ++i)
		adev->uvd.ring_enc[i].funcs = &uvd_v7_0_enc_ring_vm_funcs;

	DRM_INFO("UVD ENC is enabled in VM mode\n");
}

static const struct amdgpu_irq_src_funcs uvd_v7_0_irq_funcs = {
	.set = uvd_v7_0_set_interrupt_state,
	.process = uvd_v7_0_process_interrupt,
};

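/* One interrupt type per encode ring plus one for the decode ring. */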
static void uvd_v7_0_set_irq_funcs(struct amdgpu_device *adev)
{
	adev->uvd.irq.num_types = adev->uvd.num_enc_rings + 1;
	adev->uvd.irq.funcs = &uvd_v7_0_irq_funcs;
}

const struct amdgpu_ip_block_version uvd_v7_0_ip_block =
{
	.type = AMD_IP_BLOCK_TYPE_UVD,
	.major = 7,
	.minor = 0,
	.rev = 0,
	.funcs = &uvd_v7_0_ip_funcs,
};