vcn_v1_0.c 38 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310
  1. /*
  2. * Copyright 2016 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include <linux/firmware.h>
  24. #include <drm/drmP.h>
  25. #include "amdgpu.h"
  26. #include "amdgpu_vcn.h"
  27. #include "soc15.h"
  28. #include "soc15d.h"
  29. #include "soc15_common.h"
  30. #include "vcn/vcn_1_0_offset.h"
  31. #include "vcn/vcn_1_0_sh_mask.h"
  32. #include "hdp/hdp_4_0_offset.h"
  33. #include "mmhub/mmhub_9_1_offset.h"
  34. #include "mmhub/mmhub_9_1_sh_mask.h"
  35. static int vcn_v1_0_stop(struct amdgpu_device *adev);
  36. static void vcn_v1_0_set_dec_ring_funcs(struct amdgpu_device *adev);
  37. static void vcn_v1_0_set_enc_ring_funcs(struct amdgpu_device *adev);
  38. static void vcn_v1_0_set_irq_funcs(struct amdgpu_device *adev);
  39. /**
  40. * vcn_v1_0_early_init - set function pointers
  41. *
  42. * @handle: amdgpu_device pointer
  43. *
  44. * Set ring and irq function pointers
  45. */
  46. static int vcn_v1_0_early_init(void *handle)
  47. {
  48. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  49. adev->vcn.num_enc_rings = 2;
  50. vcn_v1_0_set_dec_ring_funcs(adev);
  51. vcn_v1_0_set_enc_ring_funcs(adev);
  52. vcn_v1_0_set_irq_funcs(adev);
  53. return 0;
  54. }
  55. /**
  56. * vcn_v1_0_sw_init - sw init for VCN block
  57. *
  58. * @handle: amdgpu_device pointer
  59. *
  60. * Load firmware and sw initialization
  61. */
  62. static int vcn_v1_0_sw_init(void *handle)
  63. {
  64. struct amdgpu_ring *ring;
  65. int i, r;
  66. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  67. /* VCN DEC TRAP */
  68. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN, 124, &adev->vcn.irq);
  69. if (r)
  70. return r;
  71. /* VCN ENC TRAP */
  72. for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
  73. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN, i + 119,
  74. &adev->vcn.irq);
  75. if (r)
  76. return r;
  77. }
  78. r = amdgpu_vcn_sw_init(adev);
  79. if (r)
  80. return r;
  81. r = amdgpu_vcn_resume(adev);
  82. if (r)
  83. return r;
  84. ring = &adev->vcn.ring_dec;
  85. sprintf(ring->name, "vcn_dec");
  86. r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.irq, 0);
  87. if (r)
  88. return r;
  89. for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
  90. ring = &adev->vcn.ring_enc[i];
  91. sprintf(ring->name, "vcn_enc%d", i);
  92. r = amdgpu_ring_init(adev, ring, 512, &adev->vcn.irq, 0);
  93. if (r)
  94. return r;
  95. }
  96. return r;
  97. }
  98. /**
  99. * vcn_v1_0_sw_fini - sw fini for VCN block
  100. *
  101. * @handle: amdgpu_device pointer
  102. *
  103. * VCN suspend and free up sw allocation
  104. */
  105. static int vcn_v1_0_sw_fini(void *handle)
  106. {
  107. int r;
  108. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  109. r = amdgpu_vcn_suspend(adev);
  110. if (r)
  111. return r;
  112. r = amdgpu_vcn_sw_fini(adev);
  113. return r;
  114. }
  115. /**
  116. * vcn_v1_0_hw_init - start and test VCN block
  117. *
  118. * @handle: amdgpu_device pointer
  119. *
  120. * Initialize the hardware, boot up the VCPU and do some testing
  121. */
  122. static int vcn_v1_0_hw_init(void *handle)
  123. {
  124. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  125. struct amdgpu_ring *ring = &adev->vcn.ring_dec;
  126. int i, r;
  127. ring->ready = true;
  128. r = amdgpu_ring_test_ring(ring);
  129. if (r) {
  130. ring->ready = false;
  131. goto done;
  132. }
  133. for (i = 0; i < adev->vcn.num_enc_rings; ++i) {
  134. ring = &adev->vcn.ring_enc[i];
  135. ring->ready = true;
  136. r = amdgpu_ring_test_ring(ring);
  137. if (r) {
  138. ring->ready = false;
  139. goto done;
  140. }
  141. }
  142. done:
  143. if (!r)
  144. DRM_INFO("VCN decode and encode initialized successfully.\n");
  145. return r;
  146. }
  147. /**
  148. * vcn_v1_0_hw_fini - stop the hardware block
  149. *
  150. * @handle: amdgpu_device pointer
  151. *
  152. * Stop the VCN block, mark ring as not ready any more
  153. */
  154. static int vcn_v1_0_hw_fini(void *handle)
  155. {
  156. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  157. struct amdgpu_ring *ring = &adev->vcn.ring_dec;
  158. if (RREG32_SOC15(VCN, 0, mmUVD_STATUS))
  159. vcn_v1_0_stop(adev);
  160. ring->ready = false;
  161. return 0;
  162. }
  163. /**
  164. * vcn_v1_0_suspend - suspend VCN block
  165. *
  166. * @handle: amdgpu_device pointer
  167. *
  168. * HW fini and suspend VCN block
  169. */
  170. static int vcn_v1_0_suspend(void *handle)
  171. {
  172. int r;
  173. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  174. r = vcn_v1_0_hw_fini(adev);
  175. if (r)
  176. return r;
  177. r = amdgpu_vcn_suspend(adev);
  178. return r;
  179. }
  180. /**
  181. * vcn_v1_0_resume - resume VCN block
  182. *
  183. * @handle: amdgpu_device pointer
  184. *
  185. * Resume firmware and hw init VCN block
  186. */
  187. static int vcn_v1_0_resume(void *handle)
  188. {
  189. int r;
  190. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  191. r = amdgpu_vcn_resume(adev);
  192. if (r)
  193. return r;
  194. r = vcn_v1_0_hw_init(adev);
  195. return r;
  196. }
  197. /**
  198. * vcn_v1_0_mc_resume - memory controller programming
  199. *
  200. * @adev: amdgpu_device pointer
  201. *
  202. * Let the VCN memory controller know it's offsets
  203. */
  204. static void vcn_v1_0_mc_resume(struct amdgpu_device *adev)
  205. {
  206. uint32_t size = AMDGPU_GPU_PAGE_ALIGN(adev->vcn.fw->size + 4);
  207. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
  208. lower_32_bits(adev->vcn.gpu_addr));
  209. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
  210. upper_32_bits(adev->vcn.gpu_addr));
  211. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET0,
  212. AMDGPU_UVD_FIRMWARE_OFFSET >> 3);
  213. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE0, size);
  214. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_LOW,
  215. lower_32_bits(adev->vcn.gpu_addr + size));
  216. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE1_64BIT_BAR_HIGH,
  217. upper_32_bits(adev->vcn.gpu_addr + size));
  218. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET1, 0);
  219. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE1, AMDGPU_VCN_HEAP_SIZE);
  220. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_LOW,
  221. lower_32_bits(adev->vcn.gpu_addr + size + AMDGPU_VCN_HEAP_SIZE));
  222. WREG32_SOC15(UVD, 0, mmUVD_LMI_VCPU_CACHE2_64BIT_BAR_HIGH,
  223. upper_32_bits(adev->vcn.gpu_addr + size + AMDGPU_VCN_HEAP_SIZE));
  224. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_OFFSET2, 0);
  225. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CACHE_SIZE2,
  226. AMDGPU_VCN_STACK_SIZE + (AMDGPU_VCN_SESSION_SIZE * 40));
  227. WREG32_SOC15(UVD, 0, mmUVD_UDEC_ADDR_CONFIG,
  228. adev->gfx.config.gb_addr_config);
  229. WREG32_SOC15(UVD, 0, mmUVD_UDEC_DB_ADDR_CONFIG,
  230. adev->gfx.config.gb_addr_config);
  231. WREG32_SOC15(UVD, 0, mmUVD_UDEC_DBW_ADDR_CONFIG,
  232. adev->gfx.config.gb_addr_config);
  233. }
  234. /**
  235. * vcn_v1_0_disable_clock_gating - disable VCN clock gating
  236. *
  237. * @adev: amdgpu_device pointer
  238. * @sw: enable SW clock gating
  239. *
  240. * Disable clock gating for VCN block
  241. */
  242. static void vcn_v1_0_disable_clock_gating(struct amdgpu_device *adev)
  243. {
  244. uint32_t data;
  245. /* JPEG disable CGC */
  246. data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL);
  247. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  248. data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  249. else
  250. data &= ~JPEG_CGC_CTRL__DYN_CLOCK_MODE_MASK;
  251. data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  252. data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  253. WREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL, data);
  254. data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE);
  255. data &= ~(JPEG_CGC_GATE__JPEG_MASK | JPEG_CGC_GATE__JPEG2_MASK);
  256. WREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE, data);
  257. /* UVD disable CGC */
  258. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
  259. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  260. data |= 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  261. else
  262. data &= ~ UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
  263. data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  264. data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  265. WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
  266. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_GATE);
  267. data &= ~(UVD_CGC_GATE__SYS_MASK
  268. | UVD_CGC_GATE__UDEC_MASK
  269. | UVD_CGC_GATE__MPEG2_MASK
  270. | UVD_CGC_GATE__REGS_MASK
  271. | UVD_CGC_GATE__RBC_MASK
  272. | UVD_CGC_GATE__LMI_MC_MASK
  273. | UVD_CGC_GATE__LMI_UMC_MASK
  274. | UVD_CGC_GATE__IDCT_MASK
  275. | UVD_CGC_GATE__MPRD_MASK
  276. | UVD_CGC_GATE__MPC_MASK
  277. | UVD_CGC_GATE__LBSI_MASK
  278. | UVD_CGC_GATE__LRBBM_MASK
  279. | UVD_CGC_GATE__UDEC_RE_MASK
  280. | UVD_CGC_GATE__UDEC_CM_MASK
  281. | UVD_CGC_GATE__UDEC_IT_MASK
  282. | UVD_CGC_GATE__UDEC_DB_MASK
  283. | UVD_CGC_GATE__UDEC_MP_MASK
  284. | UVD_CGC_GATE__WCB_MASK
  285. | UVD_CGC_GATE__VCPU_MASK
  286. | UVD_CGC_GATE__SCPU_MASK);
  287. WREG32_SOC15(VCN, 0, mmUVD_CGC_GATE, data);
  288. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
  289. data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK
  290. | UVD_CGC_CTRL__UDEC_CM_MODE_MASK
  291. | UVD_CGC_CTRL__UDEC_IT_MODE_MASK
  292. | UVD_CGC_CTRL__UDEC_DB_MODE_MASK
  293. | UVD_CGC_CTRL__UDEC_MP_MODE_MASK
  294. | UVD_CGC_CTRL__SYS_MODE_MASK
  295. | UVD_CGC_CTRL__UDEC_MODE_MASK
  296. | UVD_CGC_CTRL__MPEG2_MODE_MASK
  297. | UVD_CGC_CTRL__REGS_MODE_MASK
  298. | UVD_CGC_CTRL__RBC_MODE_MASK
  299. | UVD_CGC_CTRL__LMI_MC_MODE_MASK
  300. | UVD_CGC_CTRL__LMI_UMC_MODE_MASK
  301. | UVD_CGC_CTRL__IDCT_MODE_MASK
  302. | UVD_CGC_CTRL__MPRD_MODE_MASK
  303. | UVD_CGC_CTRL__MPC_MODE_MASK
  304. | UVD_CGC_CTRL__LBSI_MODE_MASK
  305. | UVD_CGC_CTRL__LRBBM_MODE_MASK
  306. | UVD_CGC_CTRL__WCB_MODE_MASK
  307. | UVD_CGC_CTRL__VCPU_MODE_MASK
  308. | UVD_CGC_CTRL__SCPU_MODE_MASK);
  309. WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
  310. /* turn on */
  311. data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_GATE);
  312. data |= (UVD_SUVD_CGC_GATE__SRE_MASK
  313. | UVD_SUVD_CGC_GATE__SIT_MASK
  314. | UVD_SUVD_CGC_GATE__SMP_MASK
  315. | UVD_SUVD_CGC_GATE__SCM_MASK
  316. | UVD_SUVD_CGC_GATE__SDB_MASK
  317. | UVD_SUVD_CGC_GATE__SRE_H264_MASK
  318. | UVD_SUVD_CGC_GATE__SRE_HEVC_MASK
  319. | UVD_SUVD_CGC_GATE__SIT_H264_MASK
  320. | UVD_SUVD_CGC_GATE__SIT_HEVC_MASK
  321. | UVD_SUVD_CGC_GATE__SCM_H264_MASK
  322. | UVD_SUVD_CGC_GATE__SCM_HEVC_MASK
  323. | UVD_SUVD_CGC_GATE__SDB_H264_MASK
  324. | UVD_SUVD_CGC_GATE__SDB_HEVC_MASK
  325. | UVD_SUVD_CGC_GATE__SCLR_MASK
  326. | UVD_SUVD_CGC_GATE__UVD_SC_MASK
  327. | UVD_SUVD_CGC_GATE__ENT_MASK
  328. | UVD_SUVD_CGC_GATE__SIT_HEVC_DEC_MASK
  329. | UVD_SUVD_CGC_GATE__SIT_HEVC_ENC_MASK
  330. | UVD_SUVD_CGC_GATE__SITE_MASK
  331. | UVD_SUVD_CGC_GATE__SRE_VP9_MASK
  332. | UVD_SUVD_CGC_GATE__SCM_VP9_MASK
  333. | UVD_SUVD_CGC_GATE__SIT_VP9_DEC_MASK
  334. | UVD_SUVD_CGC_GATE__SDB_VP9_MASK
  335. | UVD_SUVD_CGC_GATE__IME_HEVC_MASK);
  336. WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_GATE, data);
  337. data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL);
  338. data &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK
  339. | UVD_SUVD_CGC_CTRL__SIT_MODE_MASK
  340. | UVD_SUVD_CGC_CTRL__SMP_MODE_MASK
  341. | UVD_SUVD_CGC_CTRL__SCM_MODE_MASK
  342. | UVD_SUVD_CGC_CTRL__SDB_MODE_MASK
  343. | UVD_SUVD_CGC_CTRL__SCLR_MODE_MASK
  344. | UVD_SUVD_CGC_CTRL__UVD_SC_MODE_MASK
  345. | UVD_SUVD_CGC_CTRL__ENT_MODE_MASK
  346. | UVD_SUVD_CGC_CTRL__IME_MODE_MASK
  347. | UVD_SUVD_CGC_CTRL__SITE_MODE_MASK);
  348. WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL, data);
  349. }
  350. /**
  351. * vcn_v1_0_enable_clock_gating - enable VCN clock gating
  352. *
  353. * @adev: amdgpu_device pointer
  354. * @sw: enable SW clock gating
  355. *
  356. * Enable clock gating for VCN block
  357. */
  358. static void vcn_v1_0_enable_clock_gating(struct amdgpu_device *adev)
  359. {
  360. uint32_t data = 0;
  361. /* enable JPEG CGC */
  362. data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL);
  363. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  364. data |= 1 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  365. else
  366. data |= 0 << JPEG_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  367. data |= 1 << JPEG_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  368. data |= 4 << JPEG_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  369. WREG32_SOC15(VCN, 0, mmJPEG_CGC_CTRL, data);
  370. data = RREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE);
  371. data |= (JPEG_CGC_GATE__JPEG_MASK | JPEG_CGC_GATE__JPEG2_MASK);
  372. WREG32_SOC15(VCN, 0, mmJPEG_CGC_GATE, data);
  373. /* enable UVD CGC */
  374. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
  375. if (adev->cg_flags & AMD_CG_SUPPORT_VCN_MGCG)
  376. data |= 1 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  377. else
  378. data |= 0 << UVD_CGC_CTRL__DYN_CLOCK_MODE__SHIFT;
  379. data |= 1 << UVD_CGC_CTRL__CLK_GATE_DLY_TIMER__SHIFT;
  380. data |= 4 << UVD_CGC_CTRL__CLK_OFF_DELAY__SHIFT;
  381. WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
  382. data = RREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL);
  383. data |= (UVD_CGC_CTRL__UDEC_RE_MODE_MASK
  384. | UVD_CGC_CTRL__UDEC_CM_MODE_MASK
  385. | UVD_CGC_CTRL__UDEC_IT_MODE_MASK
  386. | UVD_CGC_CTRL__UDEC_DB_MODE_MASK
  387. | UVD_CGC_CTRL__UDEC_MP_MODE_MASK
  388. | UVD_CGC_CTRL__SYS_MODE_MASK
  389. | UVD_CGC_CTRL__UDEC_MODE_MASK
  390. | UVD_CGC_CTRL__MPEG2_MODE_MASK
  391. | UVD_CGC_CTRL__REGS_MODE_MASK
  392. | UVD_CGC_CTRL__RBC_MODE_MASK
  393. | UVD_CGC_CTRL__LMI_MC_MODE_MASK
  394. | UVD_CGC_CTRL__LMI_UMC_MODE_MASK
  395. | UVD_CGC_CTRL__IDCT_MODE_MASK
  396. | UVD_CGC_CTRL__MPRD_MODE_MASK
  397. | UVD_CGC_CTRL__MPC_MODE_MASK
  398. | UVD_CGC_CTRL__LBSI_MODE_MASK
  399. | UVD_CGC_CTRL__LRBBM_MODE_MASK
  400. | UVD_CGC_CTRL__WCB_MODE_MASK
  401. | UVD_CGC_CTRL__VCPU_MODE_MASK
  402. | UVD_CGC_CTRL__SCPU_MODE_MASK);
  403. WREG32_SOC15(VCN, 0, mmUVD_CGC_CTRL, data);
  404. data = RREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL);
  405. data |= (UVD_SUVD_CGC_CTRL__SRE_MODE_MASK
  406. | UVD_SUVD_CGC_CTRL__SIT_MODE_MASK
  407. | UVD_SUVD_CGC_CTRL__SMP_MODE_MASK
  408. | UVD_SUVD_CGC_CTRL__SCM_MODE_MASK
  409. | UVD_SUVD_CGC_CTRL__SDB_MODE_MASK
  410. | UVD_SUVD_CGC_CTRL__SCLR_MODE_MASK
  411. | UVD_SUVD_CGC_CTRL__UVD_SC_MODE_MASK
  412. | UVD_SUVD_CGC_CTRL__ENT_MODE_MASK
  413. | UVD_SUVD_CGC_CTRL__IME_MODE_MASK
  414. | UVD_SUVD_CGC_CTRL__SITE_MODE_MASK);
  415. WREG32_SOC15(VCN, 0, mmUVD_SUVD_CGC_CTRL, data);
  416. }
  417. static void vcn_1_0_disable_static_power_gating(struct amdgpu_device *adev)
  418. {
  419. uint32_t data = 0;
  420. int ret;
  421. if (adev->pg_flags & AMD_PG_SUPPORT_VCN) {
  422. data = (1 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
  423. | 1 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
  424. | 2 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
  425. | 2 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
  426. | 2 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
  427. | 2 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
  428. | 2 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
  429. | 2 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
  430. | 2 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
  431. | 2 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT
  432. | 2 << UVD_PGFSM_CONFIG__UVDW_PWR_CONFIG__SHIFT);
  433. WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
  434. SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, UVD_PGFSM_STATUS__UVDM_UVDU_PWR_ON, 0xFFFFFF, ret);
  435. } else {
  436. data = (1 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
  437. | 1 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
  438. | 1 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
  439. | 1 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
  440. | 1 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
  441. | 1 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
  442. | 1 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
  443. | 1 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
  444. | 1 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
  445. | 1 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT
  446. | 1 << UVD_PGFSM_CONFIG__UVDW_PWR_CONFIG__SHIFT);
  447. WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
  448. SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, 0, 0xFFFFFFFF, ret);
  449. }
  450. /* polling UVD_PGFSM_STATUS to confirm UVDM_PWR_STATUS , UVDU_PWR_STATUS are 0 (power on) */
  451. data = RREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS);
  452. data &= ~0x103;
  453. if (adev->pg_flags & AMD_PG_SUPPORT_VCN)
  454. data |= UVD_PGFSM_CONFIG__UVDM_UVDU_PWR_ON | UVD_POWER_STATUS__UVD_PG_EN_MASK;
  455. WREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS, data);
  456. }
  457. static void vcn_1_0_enable_static_power_gating(struct amdgpu_device *adev)
  458. {
  459. uint32_t data = 0;
  460. int ret;
  461. if (adev->pg_flags & AMD_PG_SUPPORT_VCN) {
  462. /* Before power off, this indicator has to be turned on */
  463. data = RREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS);
  464. data &= ~UVD_POWER_STATUS__UVD_POWER_STATUS_MASK;
  465. data |= UVD_POWER_STATUS__UVD_POWER_STATUS_TILES_OFF;
  466. WREG32_SOC15(VCN, 0, mmUVD_POWER_STATUS, data);
  467. data = (2 << UVD_PGFSM_CONFIG__UVDM_PWR_CONFIG__SHIFT
  468. | 2 << UVD_PGFSM_CONFIG__UVDU_PWR_CONFIG__SHIFT
  469. | 2 << UVD_PGFSM_CONFIG__UVDF_PWR_CONFIG__SHIFT
  470. | 2 << UVD_PGFSM_CONFIG__UVDC_PWR_CONFIG__SHIFT
  471. | 2 << UVD_PGFSM_CONFIG__UVDB_PWR_CONFIG__SHIFT
  472. | 2 << UVD_PGFSM_CONFIG__UVDIL_PWR_CONFIG__SHIFT
  473. | 2 << UVD_PGFSM_CONFIG__UVDIR_PWR_CONFIG__SHIFT
  474. | 2 << UVD_PGFSM_CONFIG__UVDTD_PWR_CONFIG__SHIFT
  475. | 2 << UVD_PGFSM_CONFIG__UVDTE_PWR_CONFIG__SHIFT
  476. | 2 << UVD_PGFSM_CONFIG__UVDE_PWR_CONFIG__SHIFT
  477. | 2 << UVD_PGFSM_CONFIG__UVDW_PWR_CONFIG__SHIFT);
  478. WREG32_SOC15(VCN, 0, mmUVD_PGFSM_CONFIG, data);
  479. data = (2 << UVD_PGFSM_STATUS__UVDM_PWR_STATUS__SHIFT
  480. | 2 << UVD_PGFSM_STATUS__UVDU_PWR_STATUS__SHIFT
  481. | 2 << UVD_PGFSM_STATUS__UVDF_PWR_STATUS__SHIFT
  482. | 2 << UVD_PGFSM_STATUS__UVDC_PWR_STATUS__SHIFT
  483. | 2 << UVD_PGFSM_STATUS__UVDB_PWR_STATUS__SHIFT
  484. | 2 << UVD_PGFSM_STATUS__UVDIL_PWR_STATUS__SHIFT
  485. | 2 << UVD_PGFSM_STATUS__UVDIR_PWR_STATUS__SHIFT
  486. | 2 << UVD_PGFSM_STATUS__UVDTD_PWR_STATUS__SHIFT
  487. | 2 << UVD_PGFSM_STATUS__UVDTE_PWR_STATUS__SHIFT
  488. | 2 << UVD_PGFSM_STATUS__UVDE_PWR_STATUS__SHIFT
  489. | 2 << UVD_PGFSM_STATUS__UVDW_PWR_STATUS__SHIFT);
  490. SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_PGFSM_STATUS, data, 0xFFFFFFFF, ret);
  491. }
  492. }
  493. /**
  494. * vcn_v1_0_start - start VCN block
  495. *
  496. * @adev: amdgpu_device pointer
  497. *
  498. * Setup and start the VCN block
  499. */
  500. static int vcn_v1_0_start(struct amdgpu_device *adev)
  501. {
  502. struct amdgpu_ring *ring = &adev->vcn.ring_dec;
  503. uint32_t rb_bufsz, tmp;
  504. uint32_t lmi_swap_cntl;
  505. int i, j, r;
  506. /* disable byte swapping */
  507. lmi_swap_cntl = 0;
  508. vcn_v1_0_mc_resume(adev);
  509. vcn_1_0_disable_static_power_gating(adev);
  510. /* disable clock gating */
  511. vcn_v1_0_disable_clock_gating(adev);
  512. /* disable interupt */
  513. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN), 0,
  514. ~UVD_MASTINT_EN__VCPU_EN_MASK);
  515. /* stall UMC and register bus before resetting VCPU */
  516. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
  517. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  518. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  519. mdelay(1);
  520. /* put LMI, VCPU, RBC etc... into reset */
  521. WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
  522. UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
  523. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
  524. UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
  525. UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
  526. UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
  527. UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
  528. UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
  529. UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
  530. mdelay(5);
  531. /* initialize VCN memory controller */
  532. WREG32_SOC15(UVD, 0, mmUVD_LMI_CTRL,
  533. (0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
  534. UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
  535. UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
  536. UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
  537. UVD_LMI_CTRL__REQ_MODE_MASK |
  538. 0x00100000L);
  539. #ifdef __BIG_ENDIAN
  540. /* swap (8 in 32) RB and IB */
  541. lmi_swap_cntl = 0xa;
  542. #endif
  543. WREG32_SOC15(UVD, 0, mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
  544. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA0, 0x40c2040);
  545. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXA1, 0x0);
  546. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB0, 0x40c2040);
  547. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUXB1, 0x0);
  548. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_ALU, 0);
  549. WREG32_SOC15(UVD, 0, mmUVD_MPC_SET_MUX, 0x88);
  550. /* take all subblocks out of reset, except VCPU */
  551. WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
  552. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  553. mdelay(5);
  554. /* enable VCPU clock */
  555. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CNTL,
  556. UVD_VCPU_CNTL__CLK_EN_MASK);
  557. /* enable UMC */
  558. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
  559. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  560. /* boot up the VCPU */
  561. WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET, 0);
  562. mdelay(10);
  563. for (i = 0; i < 10; ++i) {
  564. uint32_t status;
  565. for (j = 0; j < 100; ++j) {
  566. status = RREG32_SOC15(UVD, 0, mmUVD_STATUS);
  567. if (status & 2)
  568. break;
  569. mdelay(10);
  570. }
  571. r = 0;
  572. if (status & 2)
  573. break;
  574. DRM_ERROR("VCN decode not responding, trying to reset the VCPU!!!\n");
  575. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET),
  576. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK,
  577. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  578. mdelay(10);
  579. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_SOFT_RESET), 0,
  580. ~UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  581. mdelay(10);
  582. r = -1;
  583. }
  584. if (r) {
  585. DRM_ERROR("VCN decode not responding, giving up!!!\n");
  586. return r;
  587. }
  588. /* enable master interrupt */
  589. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_MASTINT_EN),
  590. (UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
  591. ~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
  592. /* clear the bit 4 of VCN_STATUS */
  593. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_STATUS), 0,
  594. ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
  595. /* force RBC into idle state */
  596. rb_bufsz = order_base_2(ring->ring_size);
  597. tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
  598. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
  599. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
  600. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
  601. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
  602. tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
  603. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, tmp);
  604. /* set the write pointer delay */
  605. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR_CNTL, 0);
  606. /* set the wb address */
  607. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR_ADDR,
  608. (upper_32_bits(ring->gpu_addr) >> 2));
  609. /* programm the RB_BASE for ring buffer */
  610. WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
  611. lower_32_bits(ring->gpu_addr));
  612. WREG32_SOC15(UVD, 0, mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
  613. upper_32_bits(ring->gpu_addr));
  614. /* Initialize the ring buffer's read and write pointers */
  615. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR, 0);
  616. ring->wptr = RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
  617. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR,
  618. lower_32_bits(ring->wptr));
  619. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_RB_CNTL), 0,
  620. ~UVD_RBC_RB_CNTL__RB_NO_FETCH_MASK);
  621. ring = &adev->vcn.ring_enc[0];
  622. WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
  623. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
  624. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO, ring->gpu_addr);
  625. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
  626. WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE, ring->ring_size / 4);
  627. ring = &adev->vcn.ring_enc[1];
  628. WREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
  629. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
  630. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_LO2, ring->gpu_addr);
  631. WREG32_SOC15(UVD, 0, mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
  632. WREG32_SOC15(UVD, 0, mmUVD_RB_SIZE2, ring->ring_size / 4);
  633. return 0;
  634. }
  635. /**
  636. * vcn_v1_0_stop - stop VCN block
  637. *
  638. * @adev: amdgpu_device pointer
  639. *
  640. * stop the VCN block
  641. */
  642. static int vcn_v1_0_stop(struct amdgpu_device *adev)
  643. {
  644. /* force RBC into idle state */
  645. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_CNTL, 0x11010101);
  646. /* Stall UMC and register bus before resetting VCPU */
  647. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2),
  648. UVD_LMI_CTRL2__STALL_ARB_UMC_MASK,
  649. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  650. mdelay(1);
  651. /* put VCPU into reset */
  652. WREG32_SOC15(UVD, 0, mmUVD_SOFT_RESET,
  653. UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
  654. mdelay(5);
  655. /* disable VCPU clock */
  656. WREG32_SOC15(UVD, 0, mmUVD_VCPU_CNTL, 0x0);
  657. /* Unstall UMC and register bus */
  658. WREG32_P(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_CTRL2), 0,
  659. ~UVD_LMI_CTRL2__STALL_ARB_UMC_MASK);
  660. WREG32_SOC15(VCN, 0, mmUVD_STATUS, 0);
  661. vcn_v1_0_enable_clock_gating(adev);
  662. vcn_1_0_enable_static_power_gating(adev);
  663. return 0;
  664. }
  665. static bool vcn_v1_0_is_idle(void *handle)
  666. {
  667. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  668. return (RREG32_SOC15(VCN, 0, mmUVD_STATUS) == 0x2);
  669. }
  670. static int vcn_v1_0_wait_for_idle(void *handle)
  671. {
  672. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  673. int ret = 0;
  674. SOC15_WAIT_ON_RREG(VCN, 0, mmUVD_STATUS, 0x2, 0x2, ret);
  675. return ret;
  676. }
  677. static int vcn_v1_0_set_clockgating_state(void *handle,
  678. enum amd_clockgating_state state)
  679. {
  680. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  681. bool enable = (state == AMD_CG_STATE_GATE) ? true : false;
  682. if (enable) {
  683. /* wait for STATUS to clear */
  684. if (vcn_v1_0_is_idle(handle))
  685. return -EBUSY;
  686. vcn_v1_0_enable_clock_gating(adev);
  687. } else {
  688. /* disable HW gating and enable Sw gating */
  689. vcn_v1_0_disable_clock_gating(adev);
  690. }
  691. return 0;
  692. }
  693. /**
  694. * vcn_v1_0_dec_ring_get_rptr - get read pointer
  695. *
  696. * @ring: amdgpu_ring pointer
  697. *
  698. * Returns the current hardware read pointer
  699. */
  700. static uint64_t vcn_v1_0_dec_ring_get_rptr(struct amdgpu_ring *ring)
  701. {
  702. struct amdgpu_device *adev = ring->adev;
  703. return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_RPTR);
  704. }
  705. /**
  706. * vcn_v1_0_dec_ring_get_wptr - get write pointer
  707. *
  708. * @ring: amdgpu_ring pointer
  709. *
  710. * Returns the current hardware write pointer
  711. */
  712. static uint64_t vcn_v1_0_dec_ring_get_wptr(struct amdgpu_ring *ring)
  713. {
  714. struct amdgpu_device *adev = ring->adev;
  715. return RREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR);
  716. }
  717. /**
  718. * vcn_v1_0_dec_ring_set_wptr - set write pointer
  719. *
  720. * @ring: amdgpu_ring pointer
  721. *
  722. * Commits the write pointer to the hardware
  723. */
  724. static void vcn_v1_0_dec_ring_set_wptr(struct amdgpu_ring *ring)
  725. {
  726. struct amdgpu_device *adev = ring->adev;
  727. WREG32_SOC15(UVD, 0, mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
  728. }
  729. /**
  730. * vcn_v1_0_dec_ring_insert_start - insert a start command
  731. *
  732. * @ring: amdgpu_ring pointer
  733. *
  734. * Write a start command to the ring.
  735. */
  736. static void vcn_v1_0_dec_ring_insert_start(struct amdgpu_ring *ring)
  737. {
  738. struct amdgpu_device *adev = ring->adev;
  739. amdgpu_ring_write(ring,
  740. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  741. amdgpu_ring_write(ring, 0);
  742. amdgpu_ring_write(ring,
  743. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  744. amdgpu_ring_write(ring, VCN_DEC_CMD_PACKET_START << 1);
  745. }
  746. /**
  747. * vcn_v1_0_dec_ring_insert_end - insert a end command
  748. *
  749. * @ring: amdgpu_ring pointer
  750. *
  751. * Write a end command to the ring.
  752. */
  753. static void vcn_v1_0_dec_ring_insert_end(struct amdgpu_ring *ring)
  754. {
  755. struct amdgpu_device *adev = ring->adev;
  756. amdgpu_ring_write(ring,
  757. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  758. amdgpu_ring_write(ring, VCN_DEC_CMD_PACKET_END << 1);
  759. }
  760. /**
  761. * vcn_v1_0_dec_ring_emit_fence - emit an fence & trap command
  762. *
  763. * @ring: amdgpu_ring pointer
  764. * @fence: fence to emit
  765. *
  766. * Write a fence and a trap command to the ring.
  767. */
  768. static void vcn_v1_0_dec_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
  769. unsigned flags)
  770. {
  771. struct amdgpu_device *adev = ring->adev;
  772. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  773. amdgpu_ring_write(ring,
  774. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_CONTEXT_ID), 0));
  775. amdgpu_ring_write(ring, seq);
  776. amdgpu_ring_write(ring,
  777. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  778. amdgpu_ring_write(ring, addr & 0xffffffff);
  779. amdgpu_ring_write(ring,
  780. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  781. amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
  782. amdgpu_ring_write(ring,
  783. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  784. amdgpu_ring_write(ring, VCN_DEC_CMD_FENCE << 1);
  785. amdgpu_ring_write(ring,
  786. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  787. amdgpu_ring_write(ring, 0);
  788. amdgpu_ring_write(ring,
  789. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  790. amdgpu_ring_write(ring, 0);
  791. amdgpu_ring_write(ring,
  792. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  793. amdgpu_ring_write(ring, VCN_DEC_CMD_TRAP << 1);
  794. }
  795. /**
  796. * vcn_v1_0_dec_ring_emit_ib - execute indirect buffer
  797. *
  798. * @ring: amdgpu_ring pointer
  799. * @ib: indirect buffer to execute
  800. *
  801. * Write ring commands to execute the indirect buffer
  802. */
  803. static void vcn_v1_0_dec_ring_emit_ib(struct amdgpu_ring *ring,
  804. struct amdgpu_ib *ib,
  805. unsigned vmid, bool ctx_switch)
  806. {
  807. struct amdgpu_device *adev = ring->adev;
  808. amdgpu_ring_write(ring,
  809. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_VMID), 0));
  810. amdgpu_ring_write(ring, vmid);
  811. amdgpu_ring_write(ring,
  812. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_LOW), 0));
  813. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  814. amdgpu_ring_write(ring,
  815. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH), 0));
  816. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  817. amdgpu_ring_write(ring,
  818. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_RBC_IB_SIZE), 0));
  819. amdgpu_ring_write(ring, ib->length_dw);
  820. }
  821. static void vcn_v1_0_dec_ring_emit_reg_wait(struct amdgpu_ring *ring,
  822. uint32_t reg, uint32_t val,
  823. uint32_t mask)
  824. {
  825. struct amdgpu_device *adev = ring->adev;
  826. amdgpu_ring_write(ring,
  827. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  828. amdgpu_ring_write(ring, reg << 2);
  829. amdgpu_ring_write(ring,
  830. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  831. amdgpu_ring_write(ring, val);
  832. amdgpu_ring_write(ring,
  833. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GP_SCRATCH8), 0));
  834. amdgpu_ring_write(ring, mask);
  835. amdgpu_ring_write(ring,
  836. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  837. amdgpu_ring_write(ring, VCN_DEC_CMD_REG_READ_COND_WAIT << 1);
  838. }
  839. static void vcn_v1_0_dec_ring_emit_vm_flush(struct amdgpu_ring *ring,
  840. unsigned vmid, uint64_t pd_addr)
  841. {
  842. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  843. uint32_t data0, data1, mask;
  844. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  845. /* wait for register write */
  846. data0 = hub->ctx0_ptb_addr_lo32 + vmid * 2;
  847. data1 = lower_32_bits(pd_addr);
  848. mask = 0xffffffff;
  849. vcn_v1_0_dec_ring_emit_reg_wait(ring, data0, data1, mask);
  850. }
  851. static void vcn_v1_0_dec_ring_emit_wreg(struct amdgpu_ring *ring,
  852. uint32_t reg, uint32_t val)
  853. {
  854. struct amdgpu_device *adev = ring->adev;
  855. amdgpu_ring_write(ring,
  856. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA0), 0));
  857. amdgpu_ring_write(ring, reg << 2);
  858. amdgpu_ring_write(ring,
  859. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_DATA1), 0));
  860. amdgpu_ring_write(ring, val);
  861. amdgpu_ring_write(ring,
  862. PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_GPCOM_VCPU_CMD), 0));
  863. amdgpu_ring_write(ring, VCN_DEC_CMD_WRITE_REG << 1);
  864. }
  865. /**
  866. * vcn_v1_0_enc_ring_get_rptr - get enc read pointer
  867. *
  868. * @ring: amdgpu_ring pointer
  869. *
  870. * Returns the current hardware enc read pointer
  871. */
  872. static uint64_t vcn_v1_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
  873. {
  874. struct amdgpu_device *adev = ring->adev;
  875. if (ring == &adev->vcn.ring_enc[0])
  876. return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR);
  877. else
  878. return RREG32_SOC15(UVD, 0, mmUVD_RB_RPTR2);
  879. }
  880. /**
  881. * vcn_v1_0_enc_ring_get_wptr - get enc write pointer
  882. *
  883. * @ring: amdgpu_ring pointer
  884. *
  885. * Returns the current hardware enc write pointer
  886. */
  887. static uint64_t vcn_v1_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
  888. {
  889. struct amdgpu_device *adev = ring->adev;
  890. if (ring == &adev->vcn.ring_enc[0])
  891. return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR);
  892. else
  893. return RREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2);
  894. }
  895. /**
  896. * vcn_v1_0_enc_ring_set_wptr - set enc write pointer
  897. *
  898. * @ring: amdgpu_ring pointer
  899. *
  900. * Commits the enc write pointer to the hardware
  901. */
  902. static void vcn_v1_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
  903. {
  904. struct amdgpu_device *adev = ring->adev;
  905. if (ring == &adev->vcn.ring_enc[0])
  906. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR,
  907. lower_32_bits(ring->wptr));
  908. else
  909. WREG32_SOC15(UVD, 0, mmUVD_RB_WPTR2,
  910. lower_32_bits(ring->wptr));
  911. }
  912. /**
  913. * vcn_v1_0_enc_ring_emit_fence - emit an enc fence & trap command
  914. *
  915. * @ring: amdgpu_ring pointer
  916. * @fence: fence to emit
  917. *
  918. * Write enc a fence and a trap command to the ring.
  919. */
  920. static void vcn_v1_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
  921. u64 seq, unsigned flags)
  922. {
  923. WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
  924. amdgpu_ring_write(ring, VCN_ENC_CMD_FENCE);
  925. amdgpu_ring_write(ring, addr);
  926. amdgpu_ring_write(ring, upper_32_bits(addr));
  927. amdgpu_ring_write(ring, seq);
  928. amdgpu_ring_write(ring, VCN_ENC_CMD_TRAP);
  929. }
  930. static void vcn_v1_0_enc_ring_insert_end(struct amdgpu_ring *ring)
  931. {
  932. amdgpu_ring_write(ring, VCN_ENC_CMD_END);
  933. }
  934. /**
  935. * vcn_v1_0_enc_ring_emit_ib - enc execute indirect buffer
  936. *
  937. * @ring: amdgpu_ring pointer
  938. * @ib: indirect buffer to execute
  939. *
  940. * Write enc ring commands to execute the indirect buffer
  941. */
  942. static void vcn_v1_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
  943. struct amdgpu_ib *ib, unsigned int vmid, bool ctx_switch)
  944. {
  945. amdgpu_ring_write(ring, VCN_ENC_CMD_IB);
  946. amdgpu_ring_write(ring, vmid);
  947. amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
  948. amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
  949. amdgpu_ring_write(ring, ib->length_dw);
  950. }
  951. static void vcn_v1_0_enc_ring_emit_reg_wait(struct amdgpu_ring *ring,
  952. uint32_t reg, uint32_t val,
  953. uint32_t mask)
  954. {
  955. amdgpu_ring_write(ring, VCN_ENC_CMD_REG_WAIT);
  956. amdgpu_ring_write(ring, reg << 2);
  957. amdgpu_ring_write(ring, mask);
  958. amdgpu_ring_write(ring, val);
  959. }
  960. static void vcn_v1_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
  961. unsigned int vmid, uint64_t pd_addr)
  962. {
  963. struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
  964. pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
  965. /* wait for reg writes */
  966. vcn_v1_0_enc_ring_emit_reg_wait(ring, hub->ctx0_ptb_addr_lo32 + vmid * 2,
  967. lower_32_bits(pd_addr), 0xffffffff);
  968. }
  969. static void vcn_v1_0_enc_ring_emit_wreg(struct amdgpu_ring *ring,
  970. uint32_t reg, uint32_t val)
  971. {
  972. amdgpu_ring_write(ring, VCN_ENC_CMD_REG_WRITE);
  973. amdgpu_ring_write(ring, reg << 2);
  974. amdgpu_ring_write(ring, val);
  975. }
  976. static int vcn_v1_0_set_interrupt_state(struct amdgpu_device *adev,
  977. struct amdgpu_irq_src *source,
  978. unsigned type,
  979. enum amdgpu_interrupt_state state)
  980. {
  981. return 0;
  982. }
  983. static int vcn_v1_0_process_interrupt(struct amdgpu_device *adev,
  984. struct amdgpu_irq_src *source,
  985. struct amdgpu_iv_entry *entry)
  986. {
  987. DRM_DEBUG("IH: VCN TRAP\n");
  988. switch (entry->src_id) {
  989. case 124:
  990. amdgpu_fence_process(&adev->vcn.ring_dec);
  991. break;
  992. case 119:
  993. amdgpu_fence_process(&adev->vcn.ring_enc[0]);
  994. break;
  995. case 120:
  996. amdgpu_fence_process(&adev->vcn.ring_enc[1]);
  997. break;
  998. default:
  999. DRM_ERROR("Unhandled interrupt: %d %d\n",
  1000. entry->src_id, entry->src_data[0]);
  1001. break;
  1002. }
  1003. return 0;
  1004. }
  1005. static void vcn_v1_0_dec_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
  1006. {
  1007. struct amdgpu_device *adev = ring->adev;
  1008. int i;
  1009. WARN_ON(ring->wptr % 2 || count % 2);
  1010. for (i = 0; i < count / 2; i++) {
  1011. amdgpu_ring_write(ring, PACKET0(SOC15_REG_OFFSET(UVD, 0, mmUVD_NO_OP), 0));
  1012. amdgpu_ring_write(ring, 0);
  1013. }
  1014. }
  1015. static int vcn_v1_0_set_powergating_state(void *handle,
  1016. enum amd_powergating_state state)
  1017. {
  1018. /* This doesn't actually powergate the VCN block.
  1019. * That's done in the dpm code via the SMC. This
  1020. * just re-inits the block as necessary. The actual
  1021. * gating still happens in the dpm code. We should
  1022. * revisit this when there is a cleaner line between
  1023. * the smc and the hw blocks
  1024. */
  1025. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1026. if (state == AMD_PG_STATE_GATE)
  1027. return vcn_v1_0_stop(adev);
  1028. else
  1029. return vcn_v1_0_start(adev);
  1030. }
  1031. static const struct amd_ip_funcs vcn_v1_0_ip_funcs = {
  1032. .name = "vcn_v1_0",
  1033. .early_init = vcn_v1_0_early_init,
  1034. .late_init = NULL,
  1035. .sw_init = vcn_v1_0_sw_init,
  1036. .sw_fini = vcn_v1_0_sw_fini,
  1037. .hw_init = vcn_v1_0_hw_init,
  1038. .hw_fini = vcn_v1_0_hw_fini,
  1039. .suspend = vcn_v1_0_suspend,
  1040. .resume = vcn_v1_0_resume,
  1041. .is_idle = vcn_v1_0_is_idle,
  1042. .wait_for_idle = vcn_v1_0_wait_for_idle,
  1043. .check_soft_reset = NULL /* vcn_v1_0_check_soft_reset */,
  1044. .pre_soft_reset = NULL /* vcn_v1_0_pre_soft_reset */,
  1045. .soft_reset = NULL /* vcn_v1_0_soft_reset */,
  1046. .post_soft_reset = NULL /* vcn_v1_0_post_soft_reset */,
  1047. .set_clockgating_state = vcn_v1_0_set_clockgating_state,
  1048. .set_powergating_state = vcn_v1_0_set_powergating_state,
  1049. };
  1050. static const struct amdgpu_ring_funcs vcn_v1_0_dec_ring_vm_funcs = {
  1051. .type = AMDGPU_RING_TYPE_VCN_DEC,
  1052. .align_mask = 0xf,
  1053. .support_64bit_ptrs = false,
  1054. .vmhub = AMDGPU_MMHUB,
  1055. .get_rptr = vcn_v1_0_dec_ring_get_rptr,
  1056. .get_wptr = vcn_v1_0_dec_ring_get_wptr,
  1057. .set_wptr = vcn_v1_0_dec_ring_set_wptr,
  1058. .emit_frame_size =
  1059. 6 + 6 + /* hdp invalidate / flush */
  1060. SOC15_FLUSH_GPU_TLB_NUM_WREG * 6 +
  1061. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 8 +
  1062. 8 + /* vcn_v1_0_dec_ring_emit_vm_flush */
  1063. 14 + 14 + /* vcn_v1_0_dec_ring_emit_fence x2 vm fence */
  1064. 6,
  1065. .emit_ib_size = 8, /* vcn_v1_0_dec_ring_emit_ib */
  1066. .emit_ib = vcn_v1_0_dec_ring_emit_ib,
  1067. .emit_fence = vcn_v1_0_dec_ring_emit_fence,
  1068. .emit_vm_flush = vcn_v1_0_dec_ring_emit_vm_flush,
  1069. .test_ring = amdgpu_vcn_dec_ring_test_ring,
  1070. .test_ib = amdgpu_vcn_dec_ring_test_ib,
  1071. .insert_nop = vcn_v1_0_dec_ring_insert_nop,
  1072. .insert_start = vcn_v1_0_dec_ring_insert_start,
  1073. .insert_end = vcn_v1_0_dec_ring_insert_end,
  1074. .pad_ib = amdgpu_ring_generic_pad_ib,
  1075. .begin_use = amdgpu_vcn_ring_begin_use,
  1076. .end_use = amdgpu_vcn_ring_end_use,
  1077. .emit_wreg = vcn_v1_0_dec_ring_emit_wreg,
  1078. .emit_reg_wait = vcn_v1_0_dec_ring_emit_reg_wait,
  1079. .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
  1080. };
  1081. static const struct amdgpu_ring_funcs vcn_v1_0_enc_ring_vm_funcs = {
  1082. .type = AMDGPU_RING_TYPE_VCN_ENC,
  1083. .align_mask = 0x3f,
  1084. .nop = VCN_ENC_CMD_NO_OP,
  1085. .support_64bit_ptrs = false,
  1086. .vmhub = AMDGPU_MMHUB,
  1087. .get_rptr = vcn_v1_0_enc_ring_get_rptr,
  1088. .get_wptr = vcn_v1_0_enc_ring_get_wptr,
  1089. .set_wptr = vcn_v1_0_enc_ring_set_wptr,
  1090. .emit_frame_size =
  1091. SOC15_FLUSH_GPU_TLB_NUM_WREG * 3 +
  1092. SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 4 +
  1093. 4 + /* vcn_v1_0_enc_ring_emit_vm_flush */
  1094. 5 + 5 + /* vcn_v1_0_enc_ring_emit_fence x2 vm fence */
  1095. 1, /* vcn_v1_0_enc_ring_insert_end */
  1096. .emit_ib_size = 5, /* vcn_v1_0_enc_ring_emit_ib */
  1097. .emit_ib = vcn_v1_0_enc_ring_emit_ib,
  1098. .emit_fence = vcn_v1_0_enc_ring_emit_fence,
  1099. .emit_vm_flush = vcn_v1_0_enc_ring_emit_vm_flush,
  1100. .test_ring = amdgpu_vcn_enc_ring_test_ring,
  1101. .test_ib = amdgpu_vcn_enc_ring_test_ib,
  1102. .insert_nop = amdgpu_ring_insert_nop,
  1103. .insert_end = vcn_v1_0_enc_ring_insert_end,
  1104. .pad_ib = amdgpu_ring_generic_pad_ib,
  1105. .begin_use = amdgpu_vcn_ring_begin_use,
  1106. .end_use = amdgpu_vcn_ring_end_use,
  1107. .emit_wreg = vcn_v1_0_enc_ring_emit_wreg,
  1108. .emit_reg_wait = vcn_v1_0_enc_ring_emit_reg_wait,
  1109. .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
  1110. };
  1111. static void vcn_v1_0_set_dec_ring_funcs(struct amdgpu_device *adev)
  1112. {
  1113. adev->vcn.ring_dec.funcs = &vcn_v1_0_dec_ring_vm_funcs;
  1114. DRM_INFO("VCN decode is enabled in VM mode\n");
  1115. }
  1116. static void vcn_v1_0_set_enc_ring_funcs(struct amdgpu_device *adev)
  1117. {
  1118. int i;
  1119. for (i = 0; i < adev->vcn.num_enc_rings; ++i)
  1120. adev->vcn.ring_enc[i].funcs = &vcn_v1_0_enc_ring_vm_funcs;
  1121. DRM_INFO("VCN encode is enabled in VM mode\n");
  1122. }
  1123. static const struct amdgpu_irq_src_funcs vcn_v1_0_irq_funcs = {
  1124. .set = vcn_v1_0_set_interrupt_state,
  1125. .process = vcn_v1_0_process_interrupt,
  1126. };
  1127. static void vcn_v1_0_set_irq_funcs(struct amdgpu_device *adev)
  1128. {
  1129. adev->vcn.irq.num_types = adev->vcn.num_enc_rings + 1;
  1130. adev->vcn.irq.funcs = &vcn_v1_0_irq_funcs;
  1131. }
  1132. const struct amdgpu_ip_block_version vcn_v1_0_ip_block =
  1133. {
  1134. .type = AMD_IP_BLOCK_TYPE_VCN,
  1135. .major = 1,
  1136. .minor = 0,
  1137. .rev = 0,
  1138. .funcs = &vcn_v1_0_ip_funcs,
  1139. };