vcn_v1_0.c 68 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180
  1. /*
  2. * Copyright 2016 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include <linux/firmware.h>
  24. #include <drm/drmP.h>
  25. #include "amdgpu.h"
  26. #include "amdgpu_vcn.h"
  27. #include "soc15.h"
  28. #include "soc15d.h"
  29. #include "soc15_common.h"
  30. #include "vcn/vcn_1_0_offset.h"
  31. #include "vcn/vcn_1_0_sh_mask.h"
  32. #include "hdp/hdp_4_0_offset.h"
  33. #include "mmhub/mmhub_9_1_offset.h"
  34. #include "mmhub/mmhub_9_1_sh_mask.h"
  35. #include "ivsrcid/vcn/irqsrcs_vcn_1_0.h"
/*
 * Register offsets, and their matching *_BASE_IDX selectors, that are
 * defined locally in this file.
 */
#define mmUVD_RBC_XX_IB_REG_CHECK 0x05ab
#define mmUVD_RBC_XX_IB_REG_CHECK_BASE_IDX 1
#define mmUVD_REG_XX_MASK 0x05ac
#define mmUVD_REG_XX_MASK_BASE_IDX 1

/* Forward declarations of file-local (static) functions. */
static int vcn_v1_0_stop(struct amdgpu_device *adev);
static void vcn_v1_0_set_dec_ring_funcs(struct amdgpu_device *adev);
static void vcn_v1_0_set_enc_ring_funcs(struct amdgpu_device *adev);
static void vcn_v1_0_set_jpeg_ring_funcs(struct amdgpu_device *adev);
static void vcn_v1_0_set_irq_funcs(struct amdgpu_device *adev);
static void vcn_v1_0_jpeg_ring_set_patch_ring(struct amdgpu_ring *ring, uint32_t ptr);
static int vcn_v1_0_set_powergating_state(void *handle, enum amd_powergating_state state);
  47. /**
  48. * vcn_v1_0_early_init - set function pointers
  49. *
  50. * @handle: amdgpu_device pointer
  51. *
  52. * Set ring and irq function pointers
  53. */
  54. static int vcn_v1_0_early_init(void *handle)
  55. {
  56. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  57. adev->vcn.num_enc_rings = 2;
  58. vcn_v1_0_set_dec_ring_funcs(adev);
  59. vcn_v1_0_set_enc_ring_funcs(adev);
  60. vcn_v1_0_set_jpeg_ring_funcs(adev);
  61. vcn_v1_0_set_irq_funcs(adev);
  62. return 0;
  63. }
  64. /**
  65. * vcn_v1_0_sw_init - sw init for VCN block
  66. *
  67. * @handle: amdgpu_device pointer
  68. *
  69. * Load firmware and sw initialization
  70. */
  71. static int vcn_v1_0_sw_init(void *handle)
  72. {
  73. struct amdgpu_ring *ring;
  74. int i, r;
  75. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  76. /* VCN DEC TRAP */
  77. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN, VCN_1_0__SRCID__UVD_SYSTEM_MESSAGE_INTERRUPT, &adev->vcn.irq);
  78. if (r)
  79. return r;
  80. /* VCN ENC TRAP */
  81. for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
  82. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN, i + VCN_1_0__SRCID__UVD_ENC_GENERAL_PURPOSE,
  83. &adev->vcn.irq);
  84. if (r)
  85. return r;
  86. }
  87. /* VCN JPEG TRAP */
  88. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN, 126, &adev->vcn.irq);
  89. if (r)
  90. return r;
  91. r = amdgpu_vcn_sw_init(adev);
  92. if (r)
  93. return r;
  94. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  95. const struct common_firmware_header *hdr;
  96. hdr = (const struct common_firmware_header *)adev->vcn.fw->data;
  97. adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].ucode_id = AMDGPU_UCODE_ID_VCN;
  98. adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].fw = adev->vcn.fw;
  99. adev->firmware.fw_size +=
  100. ALIGN(le32_to_cpu(hdr->ucode_size_bytes), PAGE_SIZE);
  101. DRM_INFO("PSP loading VCN firmware\n");
  102. }
  103. r = amdgpu_vcn_resume(adev);
  104. if (r)
  105. return r;
  106. ring = &adev->vcn.ring_dec;
  107. sprintf(ring->name, "vcn_dec");
  108. r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.irq, 0);
  109. if (r)
  110. return r;
  111. for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
  112. ring = &adev->vcn.ring_enc[i];
  113. sprintf(ring->name, "vcn_enc%d", i);
  114. r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.irq, 0);
  115. if (r)
  116. return r;
  117. }
  118. ring = &adev->vcn.ring_jpeg;
  119. sprintf(ring->name, "vcn_jpeg");
  120. r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.irq, 0);
  121. if (r)
  122. return r;
  123. return r;
  124. }
  125. /**
  126. * vcn_v1_0_sw_fini - sw fini for VCN block
  127. *
  128. * @handle: amdgpu_device pointer
  129. *
  130. * VCN suspend and free up sw allocation
  131. */
  132. static int vcn_v1_0_sw_fini(void *handle)
  133. {
  134. int r;
  135. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  136. r = amdgpu_vcn_suspend(adev);
  137. if (r)
  138. return r;
  139. r = amdgpu_vcn_sw_fini(adev);
  140. return r;
  141. }
  142. /**
  143. * vcn_v1_0_hw_init - start and test VCN block
  144. *
  145. * @handle: amdgpu_device pointer
  146. *
  147. * Initialize the hardware, boot up the VCPU and do some testing
  148. */
  149. static int vcn_v1_0_hw_init(void *handle)
  150. {
  151. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  152. struct amdgpu_ring *ring = &adev->vcn.ring_dec;
  153. int i, r;
  154. ring->ready = true;
  155. r = amdgpu_ring_test_ring(ring);
  156. if (r) {
  157. ring->ready = false;
  158. goto done;
  159. }
  160. for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
  161. ring = &adev->vcn.ring_enc[i];
  162. ring->ready = true;
  163. r = amdgpu_ring_test_ring(ring);
  164. if (r) {
  165. ring->ready = false;
  166. goto done;
  167. }
  168. }
  169. ring = &adev->vcn.ring_jpeg;
  170. ring->ready = true;
  171. r = amdgpu_ring_test_ring(ring);
  172. if (r) {
  173. ring->ready = false;
  174. goto done;
  175. }
  176. done:
  177. if (!r)
  178. DRM_INFO("VCN decode and encode initialized successfully(under %s).\n",
  179. (adev->pg_flags & AMD_PG_SUPPORT_VCN_DPG)?"DPG Mode":"SPG Mode");
  180. return r;
  181. }
  182. /**
  183. * vcn_v1_0_hw_fini - stop the hardware block
  184. *
  185. * @handle: amdgpu_device pointer
  186. *
  187. * Stop the VCN block, mark ring as not ready any more
  188. */
  189. static int vcn_v1_0_hw_fini(void *handle)
  190. {
  191. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  192. struct amdgpu_ring *ring = &adev->vcn.ring_dec;
  193. if (RREG32_SOC15(VCN, 0, mmUVD_STATUS))
  194. vcn_v1_0_set_powergating_state(adev, AMD_PG_STATE_GATE);
  195. ring->ready = false;
  196. return 0;
  197. }
  198. /**
  199. * vcn_v1_0_suspend - suspend VCN block
  200. *
  201. * @handle: amdgpu_device pointer
  202. *
  203. * HW fini and suspend VCN block
  204. */
  205. static int vcn_v1_0_suspend(void *handle)
  206. {
  207. int r;
  208. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  209. r = vcn_v1_0_hw_fini(adev);
  210. if (r)
  211. return r;
  212. r = amdgpu_vcn_suspend(adev);
  213. return r;
  214. }
  215. /**
  216. * vcn_v1_0_resume - resume VCN block
  217. *
  218. * @handle: amdgpu_device pointer
  219. *
  220. * Resume firmware and hw init VCN block
  221. */
  222. static int vcn_v1_0_resume(void *handle)
  223. {
  224. int r;
  225. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  226. r = amdgpu_vcn_resume(adev);
  227. if (r)
  228. return r;
  229. r = vcn_v1_0_hw_init(adev);
  230. return r;
  231. }
  232. /**
  233. * vcn_v1_0_mc_resume_spg_mode - memory controller programming
  234. *
  235. * @adev: amdgpu_device pointer
  236. *
  237. * Let the VCN memory controller know it's offsets
  238. */
  239. static void vcn_v1_0_mc_resume_spg_mode(struct amdgpu_device *adev)
  240. {
  241. uint32_t size = AMDGPU_GPU_PAGE_ALIGN(adev->vcn.fw->size + 4);
  242. uint32_t offset;
  243. /* cache window 0: fw */
  244. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  245. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  246. (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_lo));
  247. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  248. (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_hi));
  249. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0, 0);
  250. offset = 0;
  251. } else {
  252. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  253. lower_32_bits(adev->vcn.gpu_addr));
  254. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  255. upper_32_bits(adev->vcn.gpu_addr));
  256. offset = size;
  257. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0,
  258. AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
  259. }
  260. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE0, size);
  261. /* cache window 1: stack */
  262. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW,
  263. lower_32_bits(adev->vcn.gpu_addr + offset));
  264. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH,
  265. upper_32_bits(adev->vcn.gpu_addr + offset));
  266. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET1, 0);
  267. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE1, AMDGPU_VCN_STACK_SIZE);
  268. /* cache window 2: context */
  269. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW,
  270. lower_32_bits(adev->vcn.gpu_addr + offset + AMDGPU_VCN_STACK_SIZE));
  271. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH,
  272. upper_32_bits(adev->vcn.gpu_addr + offset + AMDGPU_VCN_STACK_SIZE));
  273. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET2, 0);
  274. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE2, AMDGPU_VCN_CONTEXT_SIZE);
  275. WREG32_SOC15(UVD, 0, mmUVD_UDEC_ADDR_CONFIG,
  276. adev->gfx.config.gb_addr_config);
  277. WREG32_SOC15(UVD, 0, mmUVD_UDEC_DB_ADDR_CONFIG,
  278. adev->gfx.config.gb_addr_config);
  279. WREG32_SOC15(UVD, 0, mmUVD_UDEC_DBW_ADDR_CONFIG,
  280. adev->gfx.config.gb_addr_config);
  281. WREG32_SOC15(UVD, 0, mmUVD_UDEC_DBW_UV_ADDR_CONFIG,
  282. adev->gfx.config.gb_addr_config);
  283. WREG32_SOC15(UVD, 0, mmUVD_MIF_CURR_ADDR_CONFIG,
  284. adev->gfx.config.gb_addr_config);
  285. WREG32_SOC15(UVD, 0, mmUVD_MIF_CURR_UV_ADDR_CONFIG,
  286. adev->gfx.config.gb_addr_config);
  287. WREG32_SOC15(UVD, 0, mmUVD_MIF_RECON1_ADDR_CONFIG,
  288. adev->gfx.config.gb_addr_config);
  289. WREG32_SOC15(UVD, 0, mmUVD_MIF_RECON1_UV_ADDR_CONFIG,
  290. adev->gfx.config.gb_addr_config);
  291. WREG32_SOC15(UVD, 0, mmUVD_MIF_REF_ADDR_CONFIG,
  292. adev->gfx.config.gb_addr_config);
  293. WREG32_SOC15(UVD, 0, mmUVD_MIF_REF_UV_ADDR_CONFIG,
  294. adev->gfx.config.gb_addr_config);
  295. WREG32_SOC15(UVD, 0, mmUVD_JPEG_ADDR_CONFIG,
  296. adev->gfx.config.gb_addr_config);
  297. WREG32_SOC15(UVD, 0, mmUVD_JPEG_UV_ADDR_CONFIG,
  298. adev->gfx.config.gb_addr_config);
  299. }
  300. static void vcn_v1_0_mc_resume_dpg_mode(struct amdgpu_device *adev)
  301. {
  302. uint32_t size = AMDGPU_GPU_PAGE_ALIGN(adev->vcn.fw->size + 4);
  303. uint32_t offset;
  304. /* cache window 0: fw */
  305. if (adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) {
  306. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  307. (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_lo),
  308. 0xFFFFFFFF, 0);
  309. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  310. (adev->firmware.ucode[AMDGPU_UCODE_ID_VCN].tmr_mc_addr_hi),
  311. 0xFFFFFFFF, 0);
  312. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0, 0,
  313. 0xFFFFFFFF, 0);
  314. offset = 0;
  315. } else {
  316. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  317. lower_32_bits(adev->vcn.gpu_addr), 0xFFFFFFFF, 0);
  318. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  319. upper_32_bits(adev->vcn.gpu_addr), 0xFFFFFFFF, 0);
  320. offset = size;
  321. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0,
  322. AMDGPU_UVD_FIRMWARE_OFFSET >> 3, 0xFFFFFFFF, 0);
  323. }
  324. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_VCPU_CACHE_SIZE0, size, 0xFFFFFFFF, 0);
  325. /* cache window 1: stack */
  326. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW,
  327. lower_32_bits(adev->vcn.gpu_addr + offset), 0xFFFFFFFF, 0);
  328. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH,
  329. upper_32_bits(adev->vcn.gpu_addr + offset), 0xFFFFFFFF, 0);
  330. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_VCPU_CACHE_OFFSET1, 0,
  331. 0xFFFFFFFF, 0);
  332. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_VCPU_CACHE_SIZE1, AMDGPU_VCN_STACK_SIZE,
  333. 0xFFFFFFFF, 0);
  334. /* cache window 2: context */
  335. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW,
  336. lower_32_bits(adev->vcn.gpu_addr + offset + AMDGPU_VCN_STACK_SIZE),
  337. 0xFFFFFFFF, 0);
  338. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH,
  339. upper_32_bits(adev->vcn.gpu_addr + offset + AMDGPU_VCN_STACK_SIZE),
  340. 0xFFFFFFFF, 0);
  341. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_VCPU_CACHE_OFFSET2, 0, 0xFFFFFFFF, 0);
  342. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_VCPU_CACHE_SIZE2, AMDGPU_VCN_CONTEXT_SIZE,
  343. 0xFFFFFFFF, 0);
  344. /* VCN global tiling registers */
  345. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_UDEC_ADDR_CONFIG,
  346. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  347. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_UDEC_DB_ADDR_CONFIG,
  348. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  349. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_UDEC_DBW_ADDR_CONFIG,
  350. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  351. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_UDEC_DBW_UV_ADDR_CONFIG,
  352. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  353. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MIF_CURR_ADDR_CONFIG,
  354. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  355. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MIF_CURR_UV_ADDR_CONFIG,
  356. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  357. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MIF_RECON1_ADDR_CONFIG,
  358. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  359. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MIF_RECON1_UV_ADDR_CONFIG,
  360. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  361. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MIF_REF_ADDR_CONFIG,
  362. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  363. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MIF_REF_UV_ADDR_CONFIG,
  364. adev->gfx.config.gb_addr_config, 0xFFFFFFFF, 0);
  365. }
  366. /**
  367. * vcn_v1_0_disable_clock_gating - disable VCN clock gating
  368. *
  369. * @adev: amdgpu_device pointer
  370. * @sw: enable SW clock gating
  371. *
  372. * Disable clock gating for VCN block
  373. */
  374. static void vcn_v1_0_disable_clock_gating(struct amdgpu_device *adev)
  375. {
  376. uint32_t data;
  377. /* JPEG disable CGC */
  378. data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL);
  379. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  380. data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  381. else
  382. data &= ~JPEG_CGC_CTRL__DYN_CLOCK_MODE_MASK;
  383. data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  384. data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  385. WREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL, data);
  386. data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE);
  387. data &= ~(JPEG_CGC_GATE__JPEG_MASK | JPEG_CGC_GATE__JPEG2_MASK);
  388. WREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE, data);
  389. /* UVD disable CGC */
  390. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
  391. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  392. data |= 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  393. else
  394. data &= ~ UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
  395. data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  396. data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  397. WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
  398. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_GATE);
  399. data &= ~(UVD_CGC_GATE__SYS_MASK
  400. | UVD_CGC_GATE__UDEC_MASK
  401. | UVD_CGC_GATE__MPEG2_MASK
  402. | UVD_CGC_GATE__REGS_MASK
  403. | UVD_CGC_GATE__RBC_MASK
  404. | UVD_CGC_GATE__LMI_MC_MASK
  405. | UVD_CGC_GATE__LMI_UMC_MASK
  406. | UVD_CGC_GATE__IDCT_MASK
  407. | UVD_CGC_GATE__MPRD_MASK
  408. | UVD_CGC_GATE__MPC_MASK
  409. | UVD_CGC_GATE__LBSI_MASK
  410. | UVD_CGC_GATE__LRBBM_MASK
  411. | UVD_CGC_GATE__UDEC_RE_MASK
  412. | UVD_CGC_GATE__UDEC_CM_MASK
  413. | UVD_CGC_GATE__UDEC_IT_MASK
  414. | UVD_CGC_GATE__UDEC_DB_MASK
  415. | UVD_CGC_GATE__UDEC_MP_MASK
  416. | UVD_CGC_GATE__WCB_MASK
  417. | UVD_CGC_GATE__VCPU_MASK
  418. | UVD_CGC_GATE__SCPU_MASK);
  419. WREG32_SOC15(VCN, 0, mmUVD_CGC_GATE, data);
  420. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
  421. data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK
  422. | UVD_CGC_CTRL__UDEC_CM_MODE_MASK
  423. | UVD_CGC_CTRL__UDEC_IT_MODE_MASK
  424. | UVD_CGC_CTRL__UDEC_DB_MODE_MASK
  425. | UVD_CGC_CTRL__UDEC_MP_MODE_MASK
  426. | UVD_CGC_CTRL__SYS_MODE_MASK
  427. | UVD_CGC_CTRL__UDEC_MODE_MASK
  428. | UVD_CGC_CTRL__MPEG2_MODE_MASK
  429. | UVD_CGC_CTRL__REGS_MODE_MASK
  430. | UVD_CGC_CTRL__RBC_MODE_MASK
  431. | UVD_CGC_CTRL__LMI_MC_MODE_MASK
  432. | UVD_CGC_CTRL__LMI_UMC_MODE_MASK
  433. | UVD_CGC_CTRL__IDCT_MODE_MASK
  434. | UVD_CGC_CTRL__MPRD_MODE_MASK
  435. | UVD_CGC_CTRL__MPC_MODE_MASK
  436. | UVD_CGC_CTRL__LBSI_MODE_MASK
  437. | UVD_CGC_CTRL__LRBBM_MODE_MASK
  438. | UVD_CGC_CTRL__WCB_MODE_MASK
  439. | UVD_CGC_CTRL__VCPU_MODE_MASK
  440. | UVD_CGC_CTRL__SCPU_MODE_MASK);
  441. WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
  442. /* turn on */
  443. data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_GATE);
  444. data |= (UVD_SUVD_CGC_GATE__SRE_MASK
  445. | UVD_SUVD_CGC_GATE__SIT_MASK
  446. | UVD_SUVD_CGC_GATE__SMP_MASK
  447. | UVD_SUVD_CGC_GATE__SCM_MASK
  448. | UVD_SUVD_CGC_GATE__SDB_MASK
  449. | UVD_SUVD_CGC_GATE__SRE_H264_MASK
  450. | UVD_SUVD_CGC_GATE__SRE_HEVC_MASK
  451. | UVD_SUVD_CGC_GATE__SIT_H264_MASK
  452. | UVD_SUVD_CGC_GATE__SIT_HEVC_MASK
  453. | UVD_SUVD_CGC_GATE__SCM_H264_MASK
  454. | UVD_SUVD_CGC_GATE__SCM_HEVC_MASK
  455. | UVD_SUVD_CGC_GATE__SDB_H264_MASK
  456. | UVD_SUVD_CGC_GATE__SDB_HEVC_MASK
  457. | UVD_SUVD_CGC_GATE__SCLR_MASK
  458. | UVD_SUVD_CGC_GATE__UVD_SC_MASK
  459. | UVD_SUVD_CGC_GATE__ENT_MASK
  460. | UVD_SUVD_CGC_GATE__SIT_HEVC_DEC_MASK
  461. | UVD_SUVD_CGC_GATE__SIT_HEVC_ENC_MASK
  462. | UVD_SUVD_CGC_GATE__SITE_MASK
  463. | UVD_SUVD_CGC_GATE__SRE_VP9_MASK
  464. | UVD_SUVD_CGC_GATE__SCM_VP9_MASK
  465. | UVD_SUVD_CGC_GATE__SIT_VP9_DEC_MASK
  466. | UVD_SUVD_CGC_GATE__SDB_VP9_MASK
  467. | UVD_SUVD_CGC_GATE__IME_HEVC_MASK);
  468. WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_GATE, data);
  469. data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL);
  470. data &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK
  471. | UVD_SUVD_CGC_CTRL__SIT_MODE_MASK
  472. | UVD_SUVD_CGC_CTRL__SMP_MODE_MASK
  473. | UVD_SUVD_CGC_CTRL__SCM_MODE_MASK
  474. | UVD_SUVD_CGC_CTRL__SDB_MODE_MASK
  475. | UVD_SUVD_CGC_CTRL__SCLR_MODE_MASK
  476. | UVD_SUVD_CGC_CTRL__UVD_SC_MODE_MASK
  477. | UVD_SUVD_CGC_CTRL__ENT_MODE_MASK
  478. | UVD_SUVD_CGC_CTRL__IME_MODE_MASK
  479. | UVD_SUVD_CGC_CTRL__SITE_MODE_MASK);
  480. WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL, data);
  481. }
  482. /**
  483. * vcn_v1_0_enable_clock_gating - enable VCN clock gating
  484. *
  485. * @adev: amdgpu_device pointer
  486. * @sw: enable SW clock gating
  487. *
  488. * Enable clock gating for VCN block
  489. */
  490. static void vcn_v1_0_enable_clock_gating(struct amdgpu_device *adev)
  491. {
  492. uint32_t data = 0;
  493. /* enable JPEG CGC */
  494. data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL);
  495. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  496. data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  497. else
  498. data |= 0 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  499. data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  500. data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  501. WREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL, data);
  502. data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE);
  503. data |= (JPEG_CGC_GATE__JPEG_MASK | JPEG_CGC_GATE__JPEG2_MASK);
  504. WREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE, data);
  505. /* enable UVD CGC */
  506. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
  507. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  508. data |= 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  509. else
  510. data |= 0 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  511. data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  512. data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  513. WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
  514. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
  515. data |= (UVD_CGC_CTRL__UDEC_RE_MODE_MASK
  516. | UVD_CGC_CTRL__UDEC_CM_MODE_MASK
  517. | UVD_CGC_CTRL__UDEC_IT_MODE_MASK
  518. | UVD_CGC_CTRL__UDEC_DB_MODE_MASK
  519. | UVD_CGC_CTRL__UDEC_MP_MODE_MASK
  520. | UVD_CGC_CTRL__SYS_MODE_MASK
  521. | UVD_CGC_CTRL__UDEC_MODE_MASK
  522. | UVD_CGC_CTRL__MPEG2_MODE_MASK
  523. | UVD_CGC_CTRL__REGS_MODE_MASK
  524. | UVD_CGC_CTRL__RBC_MODE_MASK
  525. | UVD_CGC_CTRL__LMI_MC_MODE_MASK
  526. | UVD_CGC_CTRL__LMI_UMC_MODE_MASK
  527. | UVD_CGC_CTRL__IDCT_MODE_MASK
  528. | UVD_CGC_CTRL__MPRD_MODE_MASK
  529. | UVD_CGC_CTRL__MPC_MODE_MASK
  530. | UVD_CGC_CTRL__LBSI_MODE_MASK
  531. | UVD_CGC_CTRL__LRBBM_MODE_MASK
  532. | UVD_CGC_CTRL__WCB_MODE_MASK
  533. | UVD_CGC_CTRL__VCPU_MODE_MASK
  534. | UVD_CGC_CTRL__SCPU_MODE_MASK);
  535. WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
  536. data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL);
  537. data |= (UVD_SUVD_CGC_CTRL__SRE_MODE_MASK
  538. | UVD_SUVD_CGC_CTRL__SIT_MODE_MASK
  539. | UVD_SUVD_CGC_CTRL__SMP_MODE_MASK
  540. | UVD_SUVD_CGC_CTRL__SCM_MODE_MASK
  541. | UVD_SUVD_CGC_CTRL__SDB_MODE_MASK
  542. | UVD_SUVD_CGC_CTRL__SCLR_MODE_MASK
  543. | UVD_SUVD_CGC_CTRL__UVD_SC_MODE_MASK
  544. | UVD_SUVD_CGC_CTRL__ENT_MODE_MASK
  545. | UVD_SUVD_CGC_CTRL__IME_MODE_MASK
  546. | UVD_SUVD_CGC_CTRL__SITE_MODE_MASK);
  547. WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL, data);
  548. }
  549. static void vcn_v1_0_clock_gating_dpg_mode(struct amdgpu_device *adev, uint8_t sram_sel)
  550. {
  551. uint32_t reg_data = 0;
  552. /* disable JPEG CGC */
  553. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  554. reg_data = 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  555. else
  556. reg_data = 0 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  557. reg_data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  558. reg_data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  559. WREG32_SOC15_DPG_MODE(UVD, 0, mmJPEG_CGC_CTRL, reg_data, 0xFFFFFFFF, sram_sel);
  560. WREG32_SOC15_DPG_MODE(UVD, 0, mmJPEG_CGC_GATE, 0, 0xFFFFFFFF, sram_sel);
  561. /* enable sw clock gating control */
  562. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  563. reg_data = 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  564. else
  565. reg_data = 0 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  566. reg_data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  567. reg_data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  568. reg_data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
  569. UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
  570. UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
  571. UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
  572. UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
  573. UVD_CGC_CTRL__SYS_MODE_MASK |
  574. UVD_CGC_CTRL__UDEC_MODE_MASK |
  575. UVD_CGC_CTRL__MPEG2_MODE_MASK |
  576. UVD_CGC_CTRL__REGS_MODE_MASK |
  577. UVD_CGC_CTRL__RBC_MODE_MASK |
  578. UVD_CGC_CTRL__LMI_MC_MODE_MASK |
  579. UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
  580. UVD_CGC_CTRL__IDCT_MODE_MASK |
  581. UVD_CGC_CTRL__MPRD_MODE_MASK |
  582. UVD_CGC_CTRL__MPC_MODE_MASK |
  583. UVD_CGC_CTRL__LBSI_MODE_MASK |
  584. UVD_CGC_CTRL__LRBBM_MODE_MASK |
  585. UVD_CGC_CTRL__WCB_MODE_MASK |
  586. UVD_CGC_CTRL__VCPU_MODE_MASK |
  587. UVD_CGC_CTRL__SCPU_MODE_MASK);
  588. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_CGC_CTRL, reg_data, 0xFFFFFFFF, sram_sel);
  589. /* turn off clock gating */
  590. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_CGC_GATE, 0, 0xFFFFFFFF, sram_sel);
  591. /* turn on SUVD clock gating */
  592. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_SUVD_CGC_GATE, 1, 0xFFFFFFFF, sram_sel);
  593. /* turn on sw mode in UVD_SUVD_CGC_CTRL */
  594. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_SUVD_CGC_CTRL, 0, 0xFFFFFFFF, sram_sel);
  595. }
  596. static void vcn_1_0_disable_static_power_gating(struct amdgpu_device *adev)
  597. {
  598. uint32_t data = 0;
  599. int ret;
  600. if (adev->pg_flags & AMD_PG_SUPPORT_VCN) {
  601. data = (1 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
  602. | 1 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
  603. | 2 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
  604. | 2 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
  605. | 2 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
  606. | 2 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
  607. | 2 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
  608. | 2 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
  609. | 2 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
  610. | 2 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT
  611. | 2 << UVD_PGFSM_CONFIG__UVDW_PWR_CONFIG__SHIFT);
  612. WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
  613. SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, UVD_PGFSM_STATUS__UVDM_UVDU_PWR_ON, 0xFFFFFF, ret);
  614. } else {
  615. data = (1 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
  616. | 1 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
  617. | 1 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
  618. | 1 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
  619. | 1 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
  620. | 1 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
  621. | 1 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
  622. | 1 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
  623. | 1 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
  624. | 1 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT
  625. | 1 << UVD_PGFSM_CONFIG__UVDW_PWR_CONFIG__SHIFT);
  626. WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
  627. SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, 0, 0xFFFFFFFF, ret);
  628. }
  629. /* polling UVD_PGFSM_STATUS to confirm UVDM_PWR_STATUS , UVDU_PWR_STATUS are 0 (power on) */
  630. data = RREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS);
  631. data &= ~0x103;
  632. if (adev->pg_flags & AMD_PG_SUPPORT_VCN)
  633. data |= UVD_PGFSM_CONFIG__UVDM_UVDU_PWR_ON | UVD_POWER_STATUS__UVD_PG_EN_MASK;
  634. WREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS, data);
  635. }
  636. static void vcn_1_0_enable_static_power_gating(struct amdgpu_device *adev)
  637. {
  638. uint32_t data = 0;
  639. int ret;
  640. if (adev->pg_flags & AMD_PG_SUPPORT_VCN) {
  641. /* Before power off, this indicator has to be turned on */
  642. data = RREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS);
  643. data &= ~UVD_POWER_STATUS__UVD_POWER_STATUS_MASK;
  644. data |= UVD_POWER_STATUS__UVD_POWER_STATUS_TILES_OFF;
  645. WREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS, data);
  646. data = (2 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
  647. | 2 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
  648. | 2 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
  649. | 2 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
  650. | 2 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
  651. | 2 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
  652. | 2 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
  653. | 2 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
  654. | 2 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
  655. | 2 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT
  656. | 2 << UVD_PGFSM_CONFIG__UVDW_PWR_CONFIG__SHIFT);
  657. WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
  658. data = (2 << UVD_PGFSM_STATUS__UVDM_PWR_STATUS__SHIFT
  659. | 2 << UVD_PGFSM_STATUS__UVDU_PWR_STATUS__SHIFT
  660. | 2 << UVD_PGFSM_STATUS__UVDF_PWR_STATUS__SHIFT
  661. | 2 << UVD_PGFSM_STATUS__UVDC_PWR_STATUS__SHIFT
  662. | 2 << UVD_PGFSM_STATUS__UVDB_PWR_STATUS__SHIFT
  663. | 2 << UVD_PGFSM_STATUS__UVDIL_PWR_STATUS__SHIFT
  664. | 2 << UVD_PGFSM_STATUS__UVDIR_PWR_STATUS__SHIFT
  665. | 2 << UVD_PGFSM_STATUS__UVDTD_PWR_STATUS__SHIFT
  666. | 2 << UVD_PGFSM_STATUS__UVDTE_PWR_STATUS__SHIFT
  667. | 2 << UVD_PGFSM_STATUS__UVDE_PWR_STATUS__SHIFT
  668. | 2 << UVD_PGFSM_STATUS__UVDW_PWR_STATUS__SHIFT);
  669. SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, data, 0xFFFFFFFF, ret);
  670. }
  671. }
  672. /**
  673. * vcn_v1_0_start - start VCN block
  674. *
  675. * @adev: amdgpu_device pointer
  676. *
  677. * Setup and start the VCN block
  678. */
  679. static int vcn_v1_0_start_spg_mode(struct amdgpu_device *adev)
  680. {
  681. struct amdgpu_ring *ring = &adev->vcn.ring_dec;
  682. uint32_t rb_bufsz, tmp;
  683. uint32_t lmi_swap_cntl;
  684. int i, j, r;
  685. /* disable byte swapping */
  686. lmi_swap_cntl = 0;
  687. vcn_1_0_disable_static_power_gating(adev);
  688. tmp = RREG32_SOC15(UVD, 0, mmUVD_STATUS) | UVD_STATUS__UVD_BUSY;
  689. WREG32_SOC15(UVD, 0, mmUVD_STATUS, tmp);
  690. /* disable clock gating */
  691. vcn_v1_0_disable_clock_gating(adev);
  692. /* disable interupt */
  693. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN), 0,
  694. ~UVD_MASTINT_EN__VCPU_EN_MASK);
  695. /* initialize VCN memory controller */
  696. tmp = RREG32_SOC15(UVD, 0, mmUVD_LMI_CTRL);
  697. WREG32_SOC15(UVD, 0, mmUVD_LMI_CTRL, tmp |
  698. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  699. UVD_LMI_CTRL__MASK_MC_URGENT_MASK |
  700. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  701. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK);
  702. #ifdef __BIG_ENDIAN
  703. /* swap (8 in 32) RB and IB */
  704. lmi_swap_cntl = 0xa;
  705. #endif
  706. WREG32_SOC15(UVD, 0, mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
  707. tmp = RREG32_SOC15(UVD, 0, mmUVD_MPC_CNTL);
  708. tmp &= ~UVD_MPC_CNTL__REPLACEMENT_MODE_MASK;
  709. tmp |= 0x2 << UVD_MPC_CNTL__REPLACEMENT_MODE__SHIFT;
  710. WREG32_SOC15(UVD, 0, mmUVD_MPC_CNTL, tmp);
  711. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA0,
  712. ((0x1 << UVD_MPC_SET_MUXA0__VARA_1__SHIFT) |
  713. (0x2 << UVD_MPC_SET_MUXA0__VARA_2__SHIFT) |
  714. (0x3 << UVD_MPC_SET_MUXA0__VARA_3__SHIFT) |
  715. (0x4 << UVD_MPC_SET_MUXA0__VARA_4__SHIFT)));
  716. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB0,
  717. ((0x1 << UVD_MPC_SET_MUXB0__VARB_1__SHIFT) |
  718. (0x2 << UVD_MPC_SET_MUXB0__VARB_2__SHIFT) |
  719. (0x3 << UVD_MPC_SET_MUXB0__VARB_3__SHIFT) |
  720. (0x4 << UVD_MPC_SET_MUXB0__VARB_4__SHIFT)));
  721. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUX,
  722. ((0x0 << UVD_MPC_SET_MUX__SET_0__SHIFT) |
  723. (0x1 << UVD_MPC_SET_MUX__SET_1__SHIFT) |
  724. (0x2 << UVD_MPC_SET_MUX__SET_2__SHIFT)));
  725. vcn_v1_0_mc_resume_spg_mode(adev);
  726. WREG32_SOC15(UVD, 0, mmUVD_REG_XX_MASK, 0x10);
  727. WREG32_SOC15(UVD, 0, mmUVD_RBC_XX_IB_REG_CHECK,
  728. RREG32_SOC15(UVD, 0, mmUVD_RBC_XX_IB_REG_CHECK) | 0x3);
  729. /* enable VCPU clock */
  730. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CNTL, UVD_VCPU_CNTL__CLK_EN_MASK);
  731. /* boot up the VCPU */
  732. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0,
  733. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  734. /* enable UMC */
  735. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
  736. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  737. tmp = RREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET);
  738. tmp &= ~UVD_SOFT_RESET__LMI_SOFT_RESET_MASK;
  739. tmp &= ~UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK;
  740. WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET, tmp);
  741. for (i = 0; i < 10; ++i) {
  742. uint32_t status;
  743. for (j = 0; j < 100; ++j) {
  744. status = RREG32_SOC15(UVD, 0, mmUVD_STATUS);
  745. if (status & UVD_STATUS__IDLE)
  746. break;
  747. mdelay(10);
  748. }
  749. r = 0;
  750. if (status & UVD_STATUS__IDLE)
  751. break;
  752. DRM_ERROR("VCN decode not responding, trying to reset the VCPU!!!\n");
  753. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
  754. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
  755. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  756. mdelay(10);
  757. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0,
  758. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  759. mdelay(10);
  760. r = -1;
  761. }
  762. if (r) {
  763. DRM_ERROR("VCN decode not responding, giving up!!!\n");
  764. return r;
  765. }
  766. /* enable master interrupt */
  767. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
  768. UVD_MASTINT_EN__VCPU_EN_MASK, ~UVD_MASTINT_EN__VCPU_EN_MASK);
  769. /* enable system interrupt for JRBC, TODO: move to set interrupt*/
  770. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SYS_INT_EN),
  771. UVD_SYS_INT_EN__UVD_JRBC_EN_MASK,
  772. ~UVD_SYS_INT_EN__UVD_JRBC_EN_MASK);
  773. /* clear the busy bit of UVD_STATUS */
  774. tmp = RREG32_SOC15(UVD, 0, mmUVD_STATUS) & ~UVD_STATUS__UVD_BUSY;
  775. WREG32_SOC15(UVD, 0, mmUVD_STATUS, tmp);
  776. /* force RBC into idle state */
  777. rb_bufsz = order_base_2(ring->ring_size);
  778. tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
  779. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
  780. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  781. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
  782. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
  783. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, tmp);
  784. /* set the write pointer delay */
  785. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR_CNTL, 0);
  786. /* set the wb address */
  787. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR_ADDR,
  788. (upper_32_bits(ring->gpu_addr) >> 2));
  789. /* programm the RB_BASE for ring buffer */
  790. WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
  791. lower_32_bits(ring->gpu_addr));
  792. WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
  793. upper_32_bits(ring->gpu_addr));
  794. /* Initialize the ring buffer's read and write pointers */
  795. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR, 0);
  796. WREG32_SOC15(UVD, 0, mmUVD_SCRATCH2, 0);
  797. ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
  798. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR,
  799. lower_32_bits(ring->wptr));
  800. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_RB_CNTL), 0,
  801. ~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);
  802. ring = &adev->vcn.ring_enc[0];
  803. WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
  804. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
  805. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO, ring->gpu_addr);
  806. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
  807. WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE, ring->ring_size / 4);
  808. ring = &adev->vcn.ring_enc[1];
  809. WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
  810. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
  811. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO2, ring->gpu_addr);
  812. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
  813. WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE2, ring->ring_size / 4);
  814. ring = &adev->vcn.ring_jpeg;
  815. WREG32_SOC15(UVD, 0, mmUVD_LMI_JRBC_RB_VMID, 0);
  816. WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_CNTL, UVD_JRBC_RB_CNTL__RB_NO_FETCH_MASK |
  817. UVD_JRBC_RB_CNTL__RB_RPTR_WR_EN_MASK);
  818. WREG32_SOC15(UVD, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_LOW, lower_32_bits(ring->gpu_addr));
  819. WREG32_SOC15(UVD, 0, mmUVD_LMI_JRBC_RB_64BIT_BAR_HIGH, upper_32_bits(ring->gpu_addr));
  820. WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_RPTR, 0);
  821. WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR, 0);
  822. WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_CNTL, UVD_JRBC_RB_CNTL__RB_RPTR_WR_EN_MASK);
  823. /* initialize wptr */
  824. ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR);
  825. /* copy patch commands to the jpeg ring */
  826. vcn_v1_0_jpeg_ring_set_patch_ring(ring,
  827. (ring->wptr + ring->max_dw * amdgpu_sched_hw_submission));
  828. return 0;
  829. }
  830. static int vcn_v1_0_start_dpg_mode(struct amdgpu_device *adev)
  831. {
  832. struct amdgpu_ring *ring = &adev->vcn.ring_dec;
  833. uint32_t rb_bufsz, tmp;
  834. uint32_t lmi_swap_cntl;
  835. /* disable byte swapping */
  836. lmi_swap_cntl = 0;
  837. vcn_1_0_enable_static_power_gating(adev);
  838. /* enable dynamic power gating mode */
  839. tmp = RREG32_SOC15(UVD, 0, mmUVD_POWER_STATUS);
  840. tmp |= UVD_POWER_STATUS__UVD_PG_MODE_MASK;
  841. tmp |= UVD_POWER_STATUS__UVD_PG_EN_MASK;
  842. WREG32_SOC15(UVD, 0, mmUVD_POWER_STATUS, tmp);
  843. /* enable clock gating */
  844. vcn_v1_0_clock_gating_dpg_mode(adev, 0);
  845. /* enable VCPU clock */
  846. tmp = (0xFF << UVD_VCPU_CNTL__PRB_TIMEOUT_VAL__SHIFT);
  847. tmp |= UVD_VCPU_CNTL__CLK_EN_MASK;
  848. tmp |= UVD_VCPU_CNTL__MIF_WR_LOW_THRESHOLD_BP_MASK;
  849. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_VCPU_CNTL, tmp, 0xFFFFFFFF, 0);
  850. /* disable interupt */
  851. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MASTINT_EN,
  852. 0, UVD_MASTINT_EN__VCPU_EN_MASK, 0);
  853. /* initialize VCN memory controller */
  854. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_CTRL,
  855. (8 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  856. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  857. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  858. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  859. UVD_LMI_CTRL__REQ_MODE_MASK |
  860. UVD_LMI_CTRL__CRC_RESET_MASK |
  861. UVD_LMI_CTRL__MASK_MC_URGENT_MASK |
  862. 0x00100000L, 0xFFFFFFFF, 0);
  863. #ifdef __BIG_ENDIAN
  864. /* swap (8 in 32) RB and IB */
  865. lmi_swap_cntl = 0xa;
  866. #endif
  867. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl, 0xFFFFFFFF, 0);
  868. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MPC_CNTL,
  869. 0x2 << UVD_MPC_CNTL__REPLACEMENT_MODE__SHIFT, 0xFFFFFFFF, 0);
  870. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MPC_SET_MUXA0,
  871. ((0x1 << UVD_MPC_SET_MUXA0__VARA_1__SHIFT) |
  872. (0x2 << UVD_MPC_SET_MUXA0__VARA_2__SHIFT) |
  873. (0x3 << UVD_MPC_SET_MUXA0__VARA_3__SHIFT) |
  874. (0x4 << UVD_MPC_SET_MUXA0__VARA_4__SHIFT)), 0xFFFFFFFF, 0);
  875. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MPC_SET_MUXB0,
  876. ((0x1 << UVD_MPC_SET_MUXB0__VARB_1__SHIFT) |
  877. (0x2 << UVD_MPC_SET_MUXB0__VARB_2__SHIFT) |
  878. (0x3 << UVD_MPC_SET_MUXB0__VARB_3__SHIFT) |
  879. (0x4 << UVD_MPC_SET_MUXB0__VARB_4__SHIFT)), 0xFFFFFFFF, 0);
  880. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MPC_SET_MUX,
  881. ((0x0 << UVD_MPC_SET_MUX__SET_0__SHIFT) |
  882. (0x1 << UVD_MPC_SET_MUX__SET_1__SHIFT) |
  883. (0x2 << UVD_MPC_SET_MUX__SET_2__SHIFT)), 0xFFFFFFFF, 0);
  884. vcn_v1_0_mc_resume_dpg_mode(adev);
  885. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_REG_XX_MASK, 0x10, 0xFFFFFFFF, 0);
  886. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_RBC_XX_IB_REG_CHECK, 0x3, 0xFFFFFFFF, 0);
  887. /* boot up the VCPU */
  888. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_SOFT_RESET, 0, 0xFFFFFFFF, 0);
  889. /* enable UMC */
  890. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_CTRL2,
  891. 0x1F << UVD_LMI_CTRL2__RE_OFLD_MIF_WR_REQ_NUM__SHIFT,
  892. 0xFFFFFFFF, 0);
  893. /* enable master interrupt */
  894. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_MASTINT_EN,
  895. UVD_MASTINT_EN__VCPU_EN_MASK, UVD_MASTINT_EN__VCPU_EN_MASK, 0);
  896. vcn_v1_0_clock_gating_dpg_mode(adev, 1);
  897. /* setup mmUVD_LMI_CTRL */
  898. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_LMI_CTRL,
  899. (8 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  900. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  901. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  902. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  903. UVD_LMI_CTRL__REQ_MODE_MASK |
  904. UVD_LMI_CTRL__CRC_RESET_MASK |
  905. UVD_LMI_CTRL__MASK_MC_URGENT_MASK |
  906. 0x00100000L, 0xFFFFFFFF, 1);
  907. tmp = adev->gfx.config.gb_addr_config;
  908. /* setup VCN global tiling registers */
  909. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_JPEG_ADDR_CONFIG, tmp, 0xFFFFFFFF, 1);
  910. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_JPEG_UV_ADDR_CONFIG, tmp, 0xFFFFFFFF, 1);
  911. /* enable System Interrupt for JRBC */
  912. WREG32_SOC15_DPG_MODE(UVD, 0, mmUVD_SYS_INT_EN,
  913. UVD_SYS_INT_EN__UVD_JRBC_EN_MASK, 0xFFFFFFFF, 1);
  914. /* force RBC into idle state */
  915. rb_bufsz = order_base_2(ring->ring_size);
  916. tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
  917. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
  918. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  919. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
  920. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
  921. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, tmp);
  922. /* set the write pointer delay */
  923. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR_CNTL, 0);
  924. /* set the wb address */
  925. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR_ADDR,
  926. (upper_32_bits(ring->gpu_addr) >> 2));
  927. /* programm the RB_BASE for ring buffer */
  928. WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
  929. lower_32_bits(ring->gpu_addr));
  930. WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
  931. upper_32_bits(ring->gpu_addr));
  932. /* Initialize the ring buffer's read and write pointers */
  933. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR, 0);
  934. WREG32_SOC15(UVD, 0, mmUVD_SCRATCH2, 0);
  935. ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
  936. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR,
  937. lower_32_bits(ring->wptr));
  938. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_RB_CNTL), 0,
  939. ~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);
  940. /* initialize wptr */
  941. ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR);
  942. /* copy patch commands to the jpeg ring */
  943. vcn_v1_0_jpeg_ring_set_patch_ring(ring,
  944. (ring->wptr + ring->max_dw * amdgpu_sched_hw_submission));
  945. return 0;
  946. }
  947. static int vcn_v1_0_start(struct amdgpu_device *adev)
  948. {
  949. int r;
  950. if (adev->pg_flags & AMD_PG_SUPPORT_VCN_DPG)
  951. r = vcn_v1_0_start_dpg_mode(adev);
  952. else
  953. r = vcn_v1_0_start_spg_mode(adev);
  954. return r;
  955. }
  956. /**
  957. * vcn_v1_0_stop - stop VCN block
  958. *
  959. * @adev: amdgpu_device pointer
  960. *
  961. * stop the VCN block
  962. */
  963. static int vcn_v1_0_stop_spg_mode(struct amdgpu_device *adev)
  964. {
  965. int ret_code, tmp;
  966. SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_STATUS, UVD_STATUS__IDLE, 0x7, ret_code);
  967. tmp = UVD_LMI_STATUS__VCPU_LMI_WRITE_CLEAN_MASK |
  968. UVD_LMI_STATUS__READ_CLEAN_MASK |
  969. UVD_LMI_STATUS__WRITE_CLEAN_MASK |
  970. UVD_LMI_STATUS__WRITE_CLEAN_RAW_MASK;
  971. SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_LMI_STATUS, tmp, tmp, ret_code);
  972. /* put VCPU into reset */
  973. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
  974. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
  975. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  976. tmp = UVD_LMI_STATUS__UMC_READ_CLEAN_RAW_MASK |
  977. UVD_LMI_STATUS__UMC_WRITE_CLEAN_RAW_MASK;
  978. SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_LMI_STATUS, tmp, tmp, ret_code);
  979. /* disable VCPU clock */
  980. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_VCPU_CNTL), 0,
  981. ~UVD_VCPU_CNTL__CLK_EN_MASK);
  982. /* reset LMI UMC/LMI */
  983. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
  984. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK,
  985. ~UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
  986. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
  987. UVD_SOFT_RESET__LMI_SOFT_RESET_MASK,
  988. ~UVD_SOFT_RESET__LMI_SOFT_RESET_MASK);
  989. WREG32_SOC15(UVD, 0, mmUVD_STATUS, 0);
  990. vcn_v1_0_enable_clock_gating(adev);
  991. vcn_1_0_enable_static_power_gating(adev);
  992. return 0;
  993. }
  994. static int vcn_v1_0_stop_dpg_mode(struct amdgpu_device *adev)
  995. {
  996. int ret_code = 0;
  997. /* Wait for power status to be UVD_POWER_STATUS__UVD_POWER_STATUS_TILES_OFF */
  998. SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_POWER_STATUS,
  999. UVD_POWER_STATUS__UVD_POWER_STATUS_TILES_OFF,
  1000. UVD_POWER_STATUS__UVD_POWER_STATUS_MASK, ret_code);
  1001. if (!ret_code) {
  1002. int tmp = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR) & 0x7FFFFFFF;
  1003. /* wait for read ptr to be equal to write ptr */
  1004. SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_RBC_RB_RPTR, tmp, 0xFFFFFFFF, ret_code);
  1005. SOC15_WAIT_ON_RREG(UVD, 0, mmUVD_POWER_STATUS,
  1006. UVD_POWER_STATUS__UVD_POWER_STATUS_TILES_OFF,
  1007. UVD_POWER_STATUS__UVD_POWER_STATUS_MASK, ret_code);
  1008. }
  1009. /* disable dynamic power gating mode */
  1010. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_POWER_STATUS), 0,
  1011. ~UVD_POWER_STATUS__UVD_PG_MODE_MASK);
  1012. return 0;
  1013. }
  1014. static int vcn_v1_0_stop(struct amdgpu_device *adev)
  1015. {
  1016. int r;
  1017. if (adev->pg_flags & AMD_PG_SUPPORT_VCN_DPG)
  1018. r = vcn_v1_0_stop_dpg_mode(adev);
  1019. else
  1020. r = vcn_v1_0_stop_spg_mode(adev);
  1021. return r;
  1022. }
  1023. static bool vcn_v1_0_is_idle(void *handle)
  1024. {
  1025. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1026. return (RREG32_SOC15(VCN, 0, mmUVD_STATUS) == UVD_STATUS__IDLE);
  1027. }
  1028. static int vcn_v1_0_wait_for_idle(void *handle)
  1029. {
  1030. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1031. int ret = 0;
  1032. SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_STATUS, UVD_STATUS__IDLE,
  1033. UVD_STATUS__IDLE, ret);
  1034. return ret;
  1035. }
  1036. static int vcn_v1_0_set_clockgating_state(void *handle,
  1037. enum amd_clockgating_state state)
  1038. {
  1039. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1040. bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
  1041. if (enable) {
  1042. /* wait for STATUS to clear */
  1043. if (vcn_v1_0_is_idle(handle))
  1044. return -EBUSY;
  1045. vcn_v1_0_enable_clock_gating(adev);
  1046. } else {
  1047. /* disable HW gating and enable Sw gating */
  1048. vcn_v1_0_disable_clock_gating(adev);
  1049. }
  1050. return 0;
  1051. }
  1052. /**
  1053. * vcn_v1_0_dec_ring_get_rptr - get read pointer
  1054. *
  1055. * @ring: amdgpu_ring pointer
  1056. *
  1057. * Returns the current hardware read pointer
  1058. */
  1059. static uint64_t vcn_v1_0_dec_ring_get_rptr(struct amdgpu_ring *ring)
  1060. {
  1061. struct amdgpu_device *adev = ring->adev;
  1062. return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
  1063. }
  1064. /**
  1065. * vcn_v1_0_dec_ring_get_wptr - get write pointer
  1066. *
  1067. * @ring: amdgpu_ring pointer
  1068. *
  1069. * Returns the current hardware write pointer
  1070. */
  1071. static uint64_t vcn_v1_0_dec_ring_get_wptr(struct amdgpu_ring *ring)
  1072. {
  1073. struct amdgpu_device *adev = ring->adev;
  1074. return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR);
  1075. }
  1076. /**
  1077. * vcn_v1_0_dec_ring_set_wptr - set write pointer
  1078. *
  1079. * @ring: amdgpu_ring pointer
  1080. *
  1081. * Commits the write pointer to the hardware
  1082. */
  1083. static void vcn_v1_0_dec_ring_set_wptr(struct amdgpu_ring *ring)
  1084. {
  1085. struct amdgpu_device *adev = ring->adev;
  1086. if (adev->pg_flags & AMD_PG_SUPPORT_VCN_DPG)
  1087. WREG32_SOC15(UVD, 0, mmUVD_SCRATCH2,
  1088. lower_32_bits(ring->wptr) | 0x80000000);
  1089. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
  1090. }
  1091. /**
  1092. * vcn_v1_0_dec_ring_insert_start - insert a start command
  1093. *
  1094. * @ring: amdgpu_ring pointer
  1095. *
  1096. * Write a start command to the ring.
  1097. */
  1098. static void vcn_v1_0_dec_ring_insert_start(struct amdgpu_ring *ring)
  1099. {
  1100. struct amdgpu_device *adev = ring->adev;
  1101. amdgpu_ring_write(ring,
  1102. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  1103. amdgpu_ring_write(ring, 0);
  1104. amdgpu_ring_write(ring,
  1105. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  1106. amdgpu_ring_write(ring, VCN_DEC_CMD_PACKET_START << 1);
  1107. }
  1108. /**
  1109. * vcn_v1_0_dec_ring_insert_end - insert a end command
  1110. *
  1111. * @ring: amdgpu_ring pointer
  1112. *
  1113. * Write a end command to the ring.
  1114. */
  1115. static void vcn_v1_0_dec_ring_insert_end(struct amdgpu_ring *ring)
  1116. {
  1117. struct amdgpu_device *adev = ring->adev;
  1118. amdgpu_ring_write(ring,
  1119. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  1120. amdgpu_ring_write(ring, VCN_DEC_CMD_PACKET_END << 1);
  1121. }
  1122. /**
  1123. * vcn_v1_0_dec_ring_emit_fence - emit an fence & trap command
  1124. *
  1125. * @ring: amdgpu_ring pointer
  1126. * @fence: fence to emit
  1127. *
  1128. * Write a fence and a trap command to the ring.
  1129. */
  1130. static void vcn_v1_0_dec_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
  1131. unsigned flags)
  1132. {
  1133. struct amdgpu_device *adev = ring->adev;
  1134. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  1135. amdgpu_ring_write(ring,
  1136. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_CONTEXT_ID), 0));
  1137. amdgpu_ring_write(ring, seq);
  1138. amdgpu_ring_write(ring,
  1139. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  1140. amdgpu_ring_write(ring, addr & 0xffffffff);
  1141. amdgpu_ring_write(ring,
  1142. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  1143. amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
  1144. amdgpu_ring_write(ring,
  1145. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  1146. amdgpu_ring_write(ring, VCN_DEC_CMD_FENCE << 1);
  1147. amdgpu_ring_write(ring,
  1148. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  1149. amdgpu_ring_write(ring, 0);
  1150. amdgpu_ring_write(ring,
  1151. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  1152. amdgpu_ring_write(ring, 0);
  1153. amdgpu_ring_write(ring,
  1154. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  1155. amdgpu_ring_write(ring, VCN_DEC_CMD_TRAP << 1);
  1156. }
  1157. /**
  1158. * vcn_v1_0_dec_ring_emit_ib - execute indirect buffer
  1159. *
  1160. * @ring: amdgpu_ring pointer
  1161. * @ib: indirect buffer to execute
  1162. *
  1163. * Write ring commands to execute the indirect buffer
  1164. */
  1165. static void vcn_v1_0_dec_ring_emit_ib(struct amdgpu_ring *ring,
  1166. struct amdgpu_ib *ib,
  1167. unsigned vmid, bool ctx_switch)
  1168. {
  1169. struct amdgpu_device *adev = ring->adev;
  1170. amdgpu_ring_write(ring,
  1171. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_VMID), 0));
  1172. amdgpu_ring_write(ring, vmid);
  1173. amdgpu_ring_write(ring,
  1174. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_LOW), 0));
  1175. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  1176. amdgpu_ring_write(ring,
  1177. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH), 0));
  1178. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  1179. amdgpu_ring_write(ring,
  1180. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_IB_SIZE), 0));
  1181. amdgpu_ring_write(ring, ib->length_dw);
  1182. }
  1183. static void vcn_v1_0_dec_ring_emit_reg_wait(struct amdgpu_ring *ring,
  1184. uint32_t reg, uint32_t val,
  1185. uint32_t mask)
  1186. {
  1187. struct amdgpu_device *adev = ring->adev;
  1188. amdgpu_ring_write(ring,
  1189. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  1190. amdgpu_ring_write(ring, reg << 2);
  1191. amdgpu_ring_write(ring,
  1192. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  1193. amdgpu_ring_write(ring, val);
  1194. amdgpu_ring_write(ring,
  1195. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GP_SCRATCH8), 0));
  1196. amdgpu_ring_write(ring, mask);
  1197. amdgpu_ring_write(ring,
  1198. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  1199. amdgpu_ring_write(ring, VCN_DEC_CMD_REG_READ_COND_WAIT << 1);
  1200. }
  1201. static void vcn_v1_0_dec_ring_emit_vm_flush(struct amdgpu_ring *ring,
  1202. unsigned vmid, uint64_t pd_addr)
  1203. {
  1204. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  1205. uint32_t data0, data1, mask;
  1206. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  1207. /* wait for register write */
  1208. data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
  1209. data1 = lower_32_bits(pd_addr);
  1210. mask = 0xffffffff;
  1211. vcn_v1_0_dec_ring_emit_reg_wait(ring, data0, data1, mask);
  1212. }
  1213. static void vcn_v1_0_dec_ring_emit_wreg(struct amdgpu_ring *ring,
  1214. uint32_t reg, uint32_t val)
  1215. {
  1216. struct amdgpu_device *adev = ring->adev;
  1217. amdgpu_ring_write(ring,
  1218. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  1219. amdgpu_ring_write(ring, reg << 2);
  1220. amdgpu_ring_write(ring,
  1221. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  1222. amdgpu_ring_write(ring, val);
  1223. amdgpu_ring_write(ring,
  1224. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  1225. amdgpu_ring_write(ring, VCN_DEC_CMD_WRITE_REG << 1);
  1226. }
  1227. /**
  1228. * vcn_v1_0_enc_ring_get_rptr - get enc read pointer
  1229. *
  1230. * @ring: amdgpu_ring pointer
  1231. *
  1232. * Returns the current hardware enc read pointer
  1233. */
  1234. static uint64_t vcn_v1_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
  1235. {
  1236. struct amdgpu_device *adev = ring->adev;
  1237. if (ring == &adev->vcn.ring_enc[0])
  1238. return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR);
  1239. else
  1240. return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2);
  1241. }
  1242. /**
  1243. * vcn_v1_0_enc_ring_get_wptr - get enc write pointer
  1244. *
  1245. * @ring: amdgpu_ring pointer
  1246. *
  1247. * Returns the current hardware enc write pointer
  1248. */
  1249. static uint64_t vcn_v1_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
  1250. {
  1251. struct amdgpu_device *adev = ring->adev;
  1252. if (ring == &adev->vcn.ring_enc[0])
  1253. return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR);
  1254. else
  1255. return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2);
  1256. }
  1257. /**
  1258. * vcn_v1_0_enc_ring_set_wptr - set enc write pointer
  1259. *
  1260. * @ring: amdgpu_ring pointer
  1261. *
  1262. * Commits the enc write pointer to the hardware
  1263. */
  1264. static void vcn_v1_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
  1265. {
  1266. struct amdgpu_device *adev = ring->adev;
  1267. if (ring == &adev->vcn.ring_enc[0])
  1268. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR,
  1269. lower_32_bits(ring->wptr));
  1270. else
  1271. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2,
  1272. lower_32_bits(ring->wptr));
  1273. }
  1274. /**
  1275. * vcn_v1_0_enc_ring_emit_fence - emit an enc fence & trap command
  1276. *
  1277. * @ring: amdgpu_ring pointer
  1278. * @fence: fence to emit
  1279. *
  1280. * Write enc a fence and a trap command to the ring.
  1281. */
  1282. static void vcn_v1_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
  1283. u64 seq, unsigned flags)
  1284. {
  1285. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  1286. amdgpu_ring_write(ring, VCN_ENC_CMD_FENCE);
  1287. amdgpu_ring_write(ring, addr);
  1288. amdgpu_ring_write(ring, upper_32_bits(addr));
  1289. amdgpu_ring_write(ring, seq);
  1290. amdgpu_ring_write(ring, VCN_ENC_CMD_TRAP);
  1291. }
  1292. static void vcn_v1_0_enc_ring_insert_end(struct amdgpu_ring *ring)
  1293. {
  1294. amdgpu_ring_write(ring, VCN_ENC_CMD_END);
  1295. }
  1296. /**
  1297. * vcn_v1_0_enc_ring_emit_ib - enc execute indirect buffer
  1298. *
  1299. * @ring: amdgpu_ring pointer
  1300. * @ib: indirect buffer to execute
  1301. *
  1302. * Write enc ring commands to execute the indirect buffer
  1303. */
  1304. static void vcn_v1_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
  1305. struct amdgpu_ib *ib, unsigned int vmid, bool ctx_switch)
  1306. {
  1307. amdgpu_ring_write(ring, VCN_ENC_CMD_IB);
  1308. amdgpu_ring_write(ring, vmid);
  1309. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  1310. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  1311. amdgpu_ring_write(ring, ib->length_dw);
  1312. }
  1313. static void vcn_v1_0_enc_ring_emit_reg_wait(struct amdgpu_ring *ring,
  1314. uint32_t reg, uint32_t val,
  1315. uint32_t mask)
  1316. {
  1317. amdgpu_ring_write(ring, VCN_ENC_CMD_REG_WAIT);
  1318. amdgpu_ring_write(ring, reg << 2);
  1319. amdgpu_ring_write(ring, mask);
  1320. amdgpu_ring_write(ring, val);
  1321. }
  1322. static void vcn_v1_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
  1323. unsigned int vmid, uint64_t pd_addr)
  1324. {
  1325. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  1326. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  1327. /* wait for reg writes */
  1328. vcn_v1_0_enc_ring_emit_reg_wait(ring, hub->ctx0_ptb_addr_lo32 + vmid * 2,
  1329. lower_32_bits(pd_addr), 0xffffffff);
  1330. }
  1331. static void vcn_v1_0_enc_ring_emit_wreg(struct amdgpu_ring *ring,
  1332. uint32_t reg, uint32_t val)
  1333. {
  1334. amdgpu_ring_write(ring, VCN_ENC_CMD_REG_WRITE);
  1335. amdgpu_ring_write(ring, reg << 2);
  1336. amdgpu_ring_write(ring, val);
  1337. }
  1338. /**
  1339. * vcn_v1_0_jpeg_ring_get_rptr - get read pointer
  1340. *
  1341. * @ring: amdgpu_ring pointer
  1342. *
  1343. * Returns the current hardware read pointer
  1344. */
  1345. static uint64_t vcn_v1_0_jpeg_ring_get_rptr(struct amdgpu_ring *ring)
  1346. {
  1347. struct amdgpu_device *adev = ring->adev;
  1348. return RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_RPTR);
  1349. }
  1350. /**
  1351. * vcn_v1_0_jpeg_ring_get_wptr - get write pointer
  1352. *
  1353. * @ring: amdgpu_ring pointer
  1354. *
  1355. * Returns the current hardware write pointer
  1356. */
  1357. static uint64_t vcn_v1_0_jpeg_ring_get_wptr(struct amdgpu_ring *ring)
  1358. {
  1359. struct amdgpu_device *adev = ring->adev;
  1360. return RREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR);
  1361. }
  1362. /**
  1363. * vcn_v1_0_jpeg_ring_set_wptr - set write pointer
  1364. *
  1365. * @ring: amdgpu_ring pointer
  1366. *
  1367. * Commits the write pointer to the hardware
  1368. */
  1369. static void vcn_v1_0_jpeg_ring_set_wptr(struct amdgpu_ring *ring)
  1370. {
  1371. struct amdgpu_device *adev = ring->adev;
  1372. WREG32_SOC15(UVD, 0, mmUVD_JRBC_RB_WPTR, lower_32_bits(ring->wptr));
  1373. }
  1374. /**
  1375. * vcn_v1_0_jpeg_ring_insert_start - insert a start command
  1376. *
  1377. * @ring: amdgpu_ring pointer
  1378. *
  1379. * Write a start command to the ring.
  1380. */
  1381. static void vcn_v1_0_jpeg_ring_insert_start(struct amdgpu_ring *ring)
  1382. {
  1383. struct amdgpu_device *adev = ring->adev;
  1384. amdgpu_ring_write(ring,
  1385. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
  1386. amdgpu_ring_write(ring, 0x68e04);
  1387. amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE0));
  1388. amdgpu_ring_write(ring, 0x80010000);
  1389. }
  1390. /**
  1391. * vcn_v1_0_jpeg_ring_insert_end - insert a end command
  1392. *
  1393. * @ring: amdgpu_ring pointer
  1394. *
  1395. * Write a end command to the ring.
  1396. */
  1397. static void vcn_v1_0_jpeg_ring_insert_end(struct amdgpu_ring *ring)
  1398. {
  1399. struct amdgpu_device *adev = ring->adev;
  1400. amdgpu_ring_write(ring,
  1401. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
  1402. amdgpu_ring_write(ring, 0x68e04);
  1403. amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE0));
  1404. amdgpu_ring_write(ring, 0x00010000);
  1405. }
  1406. /**
  1407. * vcn_v1_0_jpeg_ring_emit_fence - emit an fence & trap command
  1408. *
  1409. * @ring: amdgpu_ring pointer
  1410. * @fence: fence to emit
  1411. *
  1412. * Write a fence and a trap command to the ring.
  1413. */
  1414. static void vcn_v1_0_jpeg_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
  1415. unsigned flags)
  1416. {
  1417. struct amdgpu_device *adev = ring->adev;
  1418. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  1419. amdgpu_ring_write(ring,
  1420. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_GPCOM_DATA0), 0, 0, PACKETJ_TYPE0));
  1421. amdgpu_ring_write(ring, seq);
  1422. amdgpu_ring_write(ring,
  1423. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_GPCOM_DATA1), 0, 0, PACKETJ_TYPE0));
  1424. amdgpu_ring_write(ring, seq);
  1425. amdgpu_ring_write(ring,
  1426. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_LOW), 0, 0, PACKETJ_TYPE0));
  1427. amdgpu_ring_write(ring, lower_32_bits(addr));
  1428. amdgpu_ring_write(ring,
  1429. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_WR_64BIT_BAR_HIGH), 0, 0, PACKETJ_TYPE0));
  1430. amdgpu_ring_write(ring, upper_32_bits(addr));
  1431. amdgpu_ring_write(ring,
  1432. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_GPCOM_CMD), 0, 0, PACKETJ_TYPE0));
  1433. amdgpu_ring_write(ring, 0x8);
  1434. amdgpu_ring_write(ring,
  1435. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JPEG_GPCOM_CMD), 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE4));
  1436. amdgpu_ring_write(ring, 0);
  1437. amdgpu_ring_write(ring,
  1438. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_COND_RD_TIMER), 0, 0, PACKETJ_TYPE0));
  1439. amdgpu_ring_write(ring, 0x01400200);
  1440. amdgpu_ring_write(ring,
  1441. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA), 0, 0, PACKETJ_TYPE0));
  1442. amdgpu_ring_write(ring, seq);
  1443. amdgpu_ring_write(ring,
  1444. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW), 0, 0, PACKETJ_TYPE0));
  1445. amdgpu_ring_write(ring, lower_32_bits(addr));
  1446. amdgpu_ring_write(ring,
  1447. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH), 0, 0, PACKETJ_TYPE0));
  1448. amdgpu_ring_write(ring, upper_32_bits(addr));
  1449. amdgpu_ring_write(ring,
  1450. PACKETJ(0, 0, PACKETJ_CONDITION_CHECK3, PACKETJ_TYPE2));
  1451. amdgpu_ring_write(ring, 0xffffffff);
  1452. amdgpu_ring_write(ring,
  1453. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
  1454. amdgpu_ring_write(ring, 0x3fbc);
  1455. amdgpu_ring_write(ring,
  1456. PACKETJ(0, 0, 0, PACKETJ_TYPE0));
  1457. amdgpu_ring_write(ring, 0x1);
  1458. /* emit trap */
  1459. amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE7));
  1460. amdgpu_ring_write(ring, 0);
  1461. }
  1462. /**
  1463. * vcn_v1_0_jpeg_ring_emit_ib - execute indirect buffer
  1464. *
  1465. * @ring: amdgpu_ring pointer
  1466. * @ib: indirect buffer to execute
  1467. *
  1468. * Write ring commands to execute the indirect buffer.
  1469. */
  1470. static void vcn_v1_0_jpeg_ring_emit_ib(struct amdgpu_ring *ring,
  1471. struct amdgpu_ib *ib,
  1472. unsigned vmid, bool ctx_switch)
  1473. {
  1474. struct amdgpu_device *adev = ring->adev;
  1475. amdgpu_ring_write(ring,
  1476. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_IB_VMID), 0, 0, PACKETJ_TYPE0));
  1477. amdgpu_ring_write(ring, (vmid | (vmid << 4)));
  1478. amdgpu_ring_write(ring,
  1479. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JPEG_VMID), 0, 0, PACKETJ_TYPE0));
  1480. amdgpu_ring_write(ring, (vmid | (vmid << 4)));
  1481. amdgpu_ring_write(ring,
  1482. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_IB_64BIT_BAR_LOW), 0, 0, PACKETJ_TYPE0));
  1483. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  1484. amdgpu_ring_write(ring,
  1485. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_IB_64BIT_BAR_HIGH), 0, 0, PACKETJ_TYPE0));
  1486. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  1487. amdgpu_ring_write(ring,
  1488. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_IB_SIZE), 0, 0, PACKETJ_TYPE0));
  1489. amdgpu_ring_write(ring, ib->length_dw);
  1490. amdgpu_ring_write(ring,
  1491. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW), 0, 0, PACKETJ_TYPE0));
  1492. amdgpu_ring_write(ring, lower_32_bits(ring->gpu_addr));
  1493. amdgpu_ring_write(ring,
  1494. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH), 0, 0, PACKETJ_TYPE0));
  1495. amdgpu_ring_write(ring, upper_32_bits(ring->gpu_addr));
  1496. amdgpu_ring_write(ring,
  1497. PACKETJ(0, 0, PACKETJ_CONDITION_CHECK0, PACKETJ_TYPE2));
  1498. amdgpu_ring_write(ring, 0);
  1499. amdgpu_ring_write(ring,
  1500. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_COND_RD_TIMER), 0, 0, PACKETJ_TYPE0));
  1501. amdgpu_ring_write(ring, 0x01400200);
  1502. amdgpu_ring_write(ring,
  1503. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA), 0, 0, PACKETJ_TYPE0));
  1504. amdgpu_ring_write(ring, 0x2);
  1505. amdgpu_ring_write(ring,
  1506. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_STATUS), 0, PACKETJ_CONDITION_CHECK3, PACKETJ_TYPE3));
  1507. amdgpu_ring_write(ring, 0x2);
  1508. }
  1509. static void vcn_v1_0_jpeg_ring_emit_reg_wait(struct amdgpu_ring *ring,
  1510. uint32_t reg, uint32_t val,
  1511. uint32_t mask)
  1512. {
  1513. struct amdgpu_device *adev = ring->adev;
  1514. uint32_t reg_offset = (reg << 2);
  1515. amdgpu_ring_write(ring,
  1516. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_COND_RD_TIMER), 0, 0, PACKETJ_TYPE0));
  1517. amdgpu_ring_write(ring, 0x01400200);
  1518. amdgpu_ring_write(ring,
  1519. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA), 0, 0, PACKETJ_TYPE0));
  1520. amdgpu_ring_write(ring, val);
  1521. amdgpu_ring_write(ring,
  1522. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
  1523. if (((reg_offset >= 0x1f800) && (reg_offset <= 0x21fff)) ||
  1524. ((reg_offset >= 0x1e000) && (reg_offset <= 0x1e1ff))) {
  1525. amdgpu_ring_write(ring, 0);
  1526. amdgpu_ring_write(ring,
  1527. PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE3));
  1528. } else {
  1529. amdgpu_ring_write(ring, reg_offset);
  1530. amdgpu_ring_write(ring,
  1531. PACKETJ(0, 0, 0, PACKETJ_TYPE3));
  1532. }
  1533. amdgpu_ring_write(ring, mask);
  1534. }
  1535. static void vcn_v1_0_jpeg_ring_emit_vm_flush(struct amdgpu_ring *ring,
  1536. unsigned vmid, uint64_t pd_addr)
  1537. {
  1538. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  1539. uint32_t data0, data1, mask;
  1540. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  1541. /* wait for register write */
  1542. data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
  1543. data1 = lower_32_bits(pd_addr);
  1544. mask = 0xffffffff;
  1545. vcn_v1_0_jpeg_ring_emit_reg_wait(ring, data0, data1, mask);
  1546. }
  1547. static void vcn_v1_0_jpeg_ring_emit_wreg(struct amdgpu_ring *ring,
  1548. uint32_t reg, uint32_t val)
  1549. {
  1550. struct amdgpu_device *adev = ring->adev;
  1551. uint32_t reg_offset = (reg << 2);
  1552. amdgpu_ring_write(ring,
  1553. PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0));
  1554. if (((reg_offset >= 0x1f800) && (reg_offset <= 0x21fff)) ||
  1555. ((reg_offset >= 0x1e000) && (reg_offset <= 0x1e1ff))) {
  1556. amdgpu_ring_write(ring, 0);
  1557. amdgpu_ring_write(ring,
  1558. PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE0));
  1559. } else {
  1560. amdgpu_ring_write(ring, reg_offset);
  1561. amdgpu_ring_write(ring,
  1562. PACKETJ(0, 0, 0, PACKETJ_TYPE0));
  1563. }
  1564. amdgpu_ring_write(ring, val);
  1565. }
  1566. static void vcn_v1_0_jpeg_ring_nop(struct amdgpu_ring *ring, uint32_t count)
  1567. {
  1568. int i;
  1569. WARN_ON(ring->wptr % 2 || count % 2);
  1570. for (i = 0; i < count / 2; i++) {
  1571. amdgpu_ring_write(ring, PACKETJ(0, 0, 0, PACKETJ_TYPE6));
  1572. amdgpu_ring_write(ring, 0);
  1573. }
  1574. }
  1575. static void vcn_v1_0_jpeg_ring_patch_wreg(struct amdgpu_ring *ring, uint32_t *ptr, uint32_t reg_offset, uint32_t val)
  1576. {
  1577. struct amdgpu_device *adev = ring->adev;
  1578. ring->ring[(*ptr)++] = PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0);
  1579. if (((reg_offset >= 0x1f800) && (reg_offset <= 0x21fff)) ||
  1580. ((reg_offset >= 0x1e000) && (reg_offset <= 0x1e1ff))) {
  1581. ring->ring[(*ptr)++] = 0;
  1582. ring->ring[(*ptr)++] = PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE0);
  1583. } else {
  1584. ring->ring[(*ptr)++] = reg_offset;
  1585. ring->ring[(*ptr)++] = PACKETJ(0, 0, 0, PACKETJ_TYPE0);
  1586. }
  1587. ring->ring[(*ptr)++] = val;
  1588. }
  1589. static void vcn_v1_0_jpeg_ring_set_patch_ring(struct amdgpu_ring *ring, uint32_t ptr)
  1590. {
  1591. struct amdgpu_device *adev = ring->adev;
  1592. uint32_t reg, reg_offset, val, mask, i;
  1593. // 1st: program mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW
  1594. reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_LOW);
  1595. reg_offset = (reg << 2);
  1596. val = lower_32_bits(ring->gpu_addr);
  1597. vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
  1598. // 2nd: program mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH
  1599. reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_JRBC_RB_MEM_RD_64BIT_BAR_HIGH);
  1600. reg_offset = (reg << 2);
  1601. val = upper_32_bits(ring->gpu_addr);
  1602. vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
  1603. // 3rd to 5th: issue MEM_READ commands
  1604. for (i = 0; i <= 2; i++) {
  1605. ring->ring[ptr++] = PACKETJ(0, 0, 0, PACKETJ_TYPE2);
  1606. ring->ring[ptr++] = 0;
  1607. }
  1608. // 6th: program mmUVD_JRBC_RB_CNTL register to enable NO_FETCH and RPTR write ability
  1609. reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_CNTL);
  1610. reg_offset = (reg << 2);
  1611. val = 0x13;
  1612. vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
  1613. // 7th: program mmUVD_JRBC_RB_REF_DATA
  1614. reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA);
  1615. reg_offset = (reg << 2);
  1616. val = 0x1;
  1617. vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
  1618. // 8th: issue conditional register read mmUVD_JRBC_RB_CNTL
  1619. reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_CNTL);
  1620. reg_offset = (reg << 2);
  1621. val = 0x1;
  1622. mask = 0x1;
  1623. ring->ring[ptr++] = PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_COND_RD_TIMER), 0, 0, PACKETJ_TYPE0);
  1624. ring->ring[ptr++] = 0x01400200;
  1625. ring->ring[ptr++] = PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_REF_DATA), 0, 0, PACKETJ_TYPE0);
  1626. ring->ring[ptr++] = val;
  1627. ring->ring[ptr++] = PACKETJ(SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_EXTERNAL_REG_BASE), 0, 0, PACKETJ_TYPE0);
  1628. if (((reg_offset >= 0x1f800) && (reg_offset <= 0x21fff)) ||
  1629. ((reg_offset >= 0x1e000) && (reg_offset <= 0x1e1ff))) {
  1630. ring->ring[ptr++] = 0;
  1631. ring->ring[ptr++] = PACKETJ((reg_offset >> 2), 0, 0, PACKETJ_TYPE3);
  1632. } else {
  1633. ring->ring[ptr++] = reg_offset;
  1634. ring->ring[ptr++] = PACKETJ(0, 0, 0, PACKETJ_TYPE3);
  1635. }
  1636. ring->ring[ptr++] = mask;
  1637. //9th to 21st: insert no-op
  1638. for (i = 0; i <= 12; i++) {
  1639. ring->ring[ptr++] = PACKETJ(0, 0, 0, PACKETJ_TYPE6);
  1640. ring->ring[ptr++] = 0;
  1641. }
  1642. //22nd: reset mmUVD_JRBC_RB_RPTR
  1643. reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_RPTR);
  1644. reg_offset = (reg << 2);
  1645. val = 0;
  1646. vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
  1647. //23rd: program mmUVD_JRBC_RB_CNTL to disable no_fetch
  1648. reg = SOC15_REG_OFFSET(UVD, 0, mmUVD_JRBC_RB_CNTL);
  1649. reg_offset = (reg << 2);
  1650. val = 0x12;
  1651. vcn_v1_0_jpeg_ring_patch_wreg(ring, &ptr, reg_offset, val);
  1652. }
  1653. static int vcn_v1_0_set_interrupt_state(struct amdgpu_device *adev,
  1654. struct amdgpu_irq_src *source,
  1655. unsigned type,
  1656. enum amdgpu_interrupt_state state)
  1657. {
  1658. return 0;
  1659. }
  1660. static int vcn_v1_0_process_interrupt(struct amdgpu_device *adev,
  1661. struct amdgpu_irq_src *source,
  1662. struct amdgpu_iv_entry *entry)
  1663. {
  1664. DRM_DEBUG("IH: VCN TRAP\n");
  1665. switch (entry->src_id) {
  1666. case 124:
  1667. amdgpu_fence_process(&adev->vcn.ring_dec);
  1668. break;
  1669. case 119:
  1670. amdgpu_fence_process(&adev->vcn.ring_enc[0]);
  1671. break;
  1672. case 120:
  1673. amdgpu_fence_process(&adev->vcn.ring_enc[1]);
  1674. break;
  1675. case 126:
  1676. amdgpu_fence_process(&adev->vcn.ring_jpeg);
  1677. break;
  1678. default:
  1679. DRM_ERROR("Unhandled interrupt: %d %d\n",
  1680. entry->src_id, entry->src_data[0]);
  1681. break;
  1682. }
  1683. return 0;
  1684. }
  1685. static void vcn_v1_0_dec_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
  1686. {
  1687. struct amdgpu_device *adev = ring->adev;
  1688. int i;
  1689. WARN_ON(ring->wptr % 2 || count % 2);
  1690. for (i = 0; i < count / 2; i++) {
  1691. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_NO_OP), 0));
  1692. amdgpu_ring_write(ring, 0);
  1693. }
  1694. }
  1695. static int vcn_v1_0_set_powergating_state(void *handle,
  1696. enum amd_powergating_state state)
  1697. {
  1698. /* This doesn't actually powergate the VCN block.
  1699. * That's done in the dpm code via the SMC. This
  1700. * just re-inits the block as necessary. The actual
  1701. * gating still happens in the dpm code. We should
  1702. * revisit this when there is a cleaner line between
  1703. * the smc and the hw blocks
  1704. */
  1705. int ret;
  1706. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1707. if(state == adev->vcn.cur_state)
  1708. return 0;
  1709. if (state == AMD_PG_STATE_GATE)
  1710. ret = vcn_v1_0_stop(adev);
  1711. else
  1712. ret = vcn_v1_0_start(adev);
  1713. if(!ret)
  1714. adev->vcn.cur_state = state;
  1715. return ret;
  1716. }
  1717. static const struct amd_ip_funcs vcn_v1_0_ip_funcs = {
  1718. .name = "vcn_v1_0",
  1719. .early_init = vcn_v1_0_early_init,
  1720. .late_init = NULL,
  1721. .sw_init = vcn_v1_0_sw_init,
  1722. .sw_fini = vcn_v1_0_sw_fini,
  1723. .hw_init = vcn_v1_0_hw_init,
  1724. .hw_fini = vcn_v1_0_hw_fini,
  1725. .suspend = vcn_v1_0_suspend,
  1726. .resume = vcn_v1_0_resume,
  1727. .is_idle = vcn_v1_0_is_idle,
  1728. .wait_for_idle = vcn_v1_0_wait_for_idle,
  1729. .check_soft_reset = NULL /* vcn_v1_0_check_soft_reset */,
  1730. .pre_soft_reset = NULL /* vcn_v1_0_pre_soft_reset */,
  1731. .soft_reset = NULL /* vcn_v1_0_soft_reset */,
  1732. .post_soft_reset = NULL /* vcn_v1_0_post_soft_reset */,
  1733. .set_clockgating_state = vcn_v1_0_set_clockgating_state,
  1734. .set_powergating_state = vcn_v1_0_set_powergating_state,
  1735. };
  1736. static const struct amdgpu_ring_funcs vcn_v1_0_dec_ring_vm_funcs = {
  1737. .type = AMDGPU_RING_TYPE_VCN_DEC,
  1738. .align_mask = 0xf,
  1739. .support_64bit_ptrs = false,
  1740. .vmhub = AMDGPU_MMHUB,
  1741. .get_rptr = vcn_v1_0_dec_ring_get_rptr,
  1742. .get_wptr = vcn_v1_0_dec_ring_get_wptr,
  1743. .set_wptr = vcn_v1_0_dec_ring_set_wptr,
  1744. .emit_frame_size =
  1745. 6 + 6 + /* hdp invalidate / flush */
  1746. SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
  1747. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
  1748. 8 + /* vcn_v1_0_dec_ring_emit_vm_flush */
  1749. 14 + 14 + /* vcn_v1_0_dec_ring_emit_fence x2 vm fence */
  1750. 6,
  1751. .emit_ib_size = 8, /* vcn_v1_0_dec_ring_emit_ib */
  1752. .emit_ib = vcn_v1_0_dec_ring_emit_ib,
  1753. .emit_fence = vcn_v1_0_dec_ring_emit_fence,
  1754. .emit_vm_flush = vcn_v1_0_dec_ring_emit_vm_flush,
  1755. .test_ring = amdgpu_vcn_dec_ring_test_ring,
  1756. .test_ib = amdgpu_vcn_dec_ring_test_ib,
  1757. .insert_nop = vcn_v1_0_dec_ring_insert_nop,
  1758. .insert_start = vcn_v1_0_dec_ring_insert_start,
  1759. .insert_end = vcn_v1_0_dec_ring_insert_end,
  1760. .pad_ib = amdgpu_ring_generic_pad_ib,
  1761. .begin_use = amdgpu_vcn_ring_begin_use,
  1762. .end_use = amdgpu_vcn_ring_end_use,
  1763. .emit_wreg = vcn_v1_0_dec_ring_emit_wreg,
  1764. .emit_reg_wait = vcn_v1_0_dec_ring_emit_reg_wait,
  1765. .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
  1766. };
  1767. static const struct amdgpu_ring_funcs vcn_v1_0_enc_ring_vm_funcs = {
  1768. .type = AMDGPU_RING_TYPE_VCN_ENC,
  1769. .align_mask = 0x3f,
  1770. .nop = VCN_ENC_CMD_NO_OP,
  1771. .support_64bit_ptrs = false,
  1772. .vmhub = AMDGPU_MMHUB,
  1773. .get_rptr = vcn_v1_0_enc_ring_get_rptr,
  1774. .get_wptr = vcn_v1_0_enc_ring_get_wptr,
  1775. .set_wptr = vcn_v1_0_enc_ring_set_wptr,
  1776. .emit_frame_size =
  1777. SOC15_FLUSH_GPU_TLB_NUM_WREG * 3 +
  1778. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 4 +
  1779. 4 + /* vcn_v1_0_enc_ring_emit_vm_flush */
  1780. 5 + 5 + /* vcn_v1_0_enc_ring_emit_fence x2 vm fence */
  1781. 1, /* vcn_v1_0_enc_ring_insert_end */
  1782. .emit_ib_size = 5, /* vcn_v1_0_enc_ring_emit_ib */
  1783. .emit_ib = vcn_v1_0_enc_ring_emit_ib,
  1784. .emit_fence = vcn_v1_0_enc_ring_emit_fence,
  1785. .emit_vm_flush = vcn_v1_0_enc_ring_emit_vm_flush,
  1786. .test_ring = amdgpu_vcn_enc_ring_test_ring,
  1787. .test_ib = amdgpu_vcn_enc_ring_test_ib,
  1788. .insert_nop = amdgpu_ring_insert_nop,
  1789. .insert_end = vcn_v1_0_enc_ring_insert_end,
  1790. .pad_ib = amdgpu_ring_generic_pad_ib,
  1791. .begin_use = amdgpu_vcn_ring_begin_use,
  1792. .end_use = amdgpu_vcn_ring_end_use,
  1793. .emit_wreg = vcn_v1_0_enc_ring_emit_wreg,
  1794. .emit_reg_wait = vcn_v1_0_enc_ring_emit_reg_wait,
  1795. .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
  1796. };
  1797. static const struct amdgpu_ring_funcs vcn_v1_0_jpeg_ring_vm_funcs = {
  1798. .type = AMDGPU_RING_TYPE_VCN_JPEG,
  1799. .align_mask = 0xf,
  1800. .nop = PACKET0(0x81ff, 0),
  1801. .support_64bit_ptrs = false,
  1802. .vmhub = AMDGPU_MMHUB,
  1803. .extra_dw = 64,
  1804. .get_rptr = vcn_v1_0_jpeg_ring_get_rptr,
  1805. .get_wptr = vcn_v1_0_jpeg_ring_get_wptr,
  1806. .set_wptr = vcn_v1_0_jpeg_ring_set_wptr,
  1807. .emit_frame_size =
  1808. 6 + 6 + /* hdp invalidate / flush */
  1809. SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
  1810. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
  1811. 8 + /* vcn_v1_0_jpeg_ring_emit_vm_flush */
  1812. 26 + 26 + /* vcn_v1_0_jpeg_ring_emit_fence x2 vm fence */
  1813. 6,
  1814. .emit_ib_size = 22, /* vcn_v1_0_jpeg_ring_emit_ib */
  1815. .emit_ib = vcn_v1_0_jpeg_ring_emit_ib,
  1816. .emit_fence = vcn_v1_0_jpeg_ring_emit_fence,
  1817. .emit_vm_flush = vcn_v1_0_jpeg_ring_emit_vm_flush,
  1818. .test_ring = amdgpu_vcn_jpeg_ring_test_ring,
  1819. .test_ib = amdgpu_vcn_jpeg_ring_test_ib,
  1820. .insert_nop = vcn_v1_0_jpeg_ring_nop,
  1821. .insert_start = vcn_v1_0_jpeg_ring_insert_start,
  1822. .insert_end = vcn_v1_0_jpeg_ring_insert_end,
  1823. .pad_ib = amdgpu_ring_generic_pad_ib,
  1824. .begin_use = amdgpu_vcn_ring_begin_use,
  1825. .end_use = amdgpu_vcn_ring_end_use,
  1826. .emit_wreg = vcn_v1_0_jpeg_ring_emit_wreg,
  1827. .emit_reg_wait = vcn_v1_0_jpeg_ring_emit_reg_wait,
  1828. .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
  1829. };
  1830. static void vcn_v1_0_set_dec_ring_funcs(struct amdgpu_device *adev)
  1831. {
  1832. adev->vcn.ring_dec.funcs = &vcn_v1_0_dec_ring_vm_funcs;
  1833. DRM_INFO("VCN decode is enabled in VM mode\n");
  1834. }
  1835. static void vcn_v1_0_set_enc_ring_funcs(struct amdgpu_device *adev)
  1836. {
  1837. int i;
  1838. for (i = 0; i < adev->vcn.num_enc_rings; ++i)
  1839. adev->vcn.ring_enc[i].funcs = &vcn_v1_0_enc_ring_vm_funcs;
  1840. DRM_INFO("VCN encode is enabled in VM mode\n");
  1841. }
  1842. static void vcn_v1_0_set_jpeg_ring_funcs(struct amdgpu_device *adev)
  1843. {
  1844. adev->vcn.ring_jpeg.funcs = &vcn_v1_0_jpeg_ring_vm_funcs;
  1845. DRM_INFO("VCN jpeg decode is enabled in VM mode\n");
  1846. }
  1847. static const struct amdgpu_irq_src_funcs vcn_v1_0_irq_funcs = {
  1848. .set = vcn_v1_0_set_interrupt_state,
  1849. .process = vcn_v1_0_process_interrupt,
  1850. };
  1851. static void vcn_v1_0_set_irq_funcs(struct amdgpu_device *adev)
  1852. {
  1853. adev->vcn.irq.num_types = adev->vcn.num_enc_rings + 2;
  1854. adev->vcn.irq.funcs = &vcn_v1_0_irq_funcs;
  1855. }
  1856. const struct amdgpu_ip_block_version vcn_v1_0_ip_block =
  1857. {
  1858. .type = AMD_IP_BLOCK_TYPE_VCN,
  1859. .major = 1,
  1860. .minor = 0,
  1861. .rev = 0,
  1862. .funcs = &vcn_v1_0_ip_funcs,
  1863. };