psp_v10_0.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457
  1. /*
  2. * Copyright 2016 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. * Author: Huang Rui
  23. *
  24. */
  25. #include <linux/firmware.h>
  26. #include "amdgpu.h"
  27. #include "amdgpu_psp.h"
  28. #include "amdgpu_ucode.h"
  29. #include "soc15_common.h"
  30. #include "psp_v10_0.h"
  31. #include "mp/mp_10_0_offset.h"
  32. #include "gc/gc_9_1_offset.h"
  33. #include "sdma0/sdma0_4_1_offset.h"
  34. MODULE_FIRMWARE("amdgpu/raven_asd.bin");
  35. static int
  36. psp_v10_0_get_fw_type(struct amdgpu_firmware_info *ucode, enum psp_gfx_fw_type *type)
  37. {
  38. switch(ucode->ucode_id) {
  39. case AMDGPU_UCODE_ID_SDMA0:
  40. *type = GFX_FW_TYPE_SDMA0;
  41. break;
  42. case AMDGPU_UCODE_ID_SDMA1:
  43. *type = GFX_FW_TYPE_SDMA1;
  44. break;
  45. case AMDGPU_UCODE_ID_CP_CE:
  46. *type = GFX_FW_TYPE_CP_CE;
  47. break;
  48. case AMDGPU_UCODE_ID_CP_PFP:
  49. *type = GFX_FW_TYPE_CP_PFP;
  50. break;
  51. case AMDGPU_UCODE_ID_CP_ME:
  52. *type = GFX_FW_TYPE_CP_ME;
  53. break;
  54. case AMDGPU_UCODE_ID_CP_MEC1:
  55. *type = GFX_FW_TYPE_CP_MEC;
  56. break;
  57. case AMDGPU_UCODE_ID_CP_MEC1_JT:
  58. *type = GFX_FW_TYPE_CP_MEC_ME1;
  59. break;
  60. case AMDGPU_UCODE_ID_CP_MEC2:
  61. *type = GFX_FW_TYPE_CP_MEC;
  62. break;
  63. case AMDGPU_UCODE_ID_CP_MEC2_JT:
  64. *type = GFX_FW_TYPE_CP_MEC_ME2;
  65. break;
  66. case AMDGPU_UCODE_ID_RLC_G:
  67. *type = GFX_FW_TYPE_RLC_G;
  68. break;
  69. case AMDGPU_UCODE_ID_RLC_RESTORE_LIST_CNTL:
  70. *type = GFX_FW_TYPE_RLC_RESTORE_LIST_CNTL;
  71. break;
  72. case AMDGPU_UCODE_ID_RLC_RESTORE_LIST_GPM_MEM:
  73. *type = GFX_FW_TYPE_RLC_RESTORE_LIST_GPM_MEM;
  74. break;
  75. case AMDGPU_UCODE_ID_RLC_RESTORE_LIST_SRM_MEM:
  76. *type = GFX_FW_TYPE_RLC_RESTORE_LIST_SRM_MEM;
  77. break;
  78. case AMDGPU_UCODE_ID_SMC:
  79. *type = GFX_FW_TYPE_SMU;
  80. break;
  81. case AMDGPU_UCODE_ID_UVD:
  82. *type = GFX_FW_TYPE_UVD;
  83. break;
  84. case AMDGPU_UCODE_ID_VCE:
  85. *type = GFX_FW_TYPE_VCE;
  86. break;
  87. case AMDGPU_UCODE_ID_MAXIMUM:
  88. default:
  89. return -EINVAL;
  90. }
  91. return 0;
  92. }
  93. static int psp_v10_0_init_microcode(struct psp_context *psp)
  94. {
  95. struct amdgpu_device *adev = psp->adev;
  96. const char *chip_name;
  97. char fw_name[30];
  98. int err = 0;
  99. const struct psp_firmware_header_v1_0 *hdr;
  100. DRM_DEBUG("\n");
  101. switch (adev->asic_type) {
  102. case CHIP_RAVEN:
  103. chip_name = "raven";
  104. break;
  105. default: BUG();
  106. }
  107. snprintf(fw_name, sizeof(fw_name), "amdgpu/%s_asd.bin", chip_name);
  108. err = request_firmware(&adev->psp.asd_fw, fw_name, adev->dev);
  109. if (err)
  110. goto out;
  111. err = amdgpu_ucode_validate(adev->psp.asd_fw);
  112. if (err)
  113. goto out;
  114. hdr = (const struct psp_firmware_header_v1_0 *)adev->psp.asd_fw->data;
  115. adev->psp.asd_fw_version = le32_to_cpu(hdr->header.ucode_version);
  116. adev->psp.asd_feature_version = le32_to_cpu(hdr->ucode_feature_version);
  117. adev->psp.asd_ucode_size = le32_to_cpu(hdr->header.ucode_size_bytes);
  118. adev->psp.asd_start_addr = (uint8_t *)hdr +
  119. le32_to_cpu(hdr->header.ucode_array_offset_bytes);
  120. return 0;
  121. out:
  122. if (err) {
  123. dev_err(adev->dev,
  124. "psp v10.0: Failed to load firmware \"%s\"\n",
  125. fw_name);
  126. release_firmware(adev->psp.asd_fw);
  127. adev->psp.asd_fw = NULL;
  128. }
  129. return err;
  130. }
  131. static int psp_v10_0_prep_cmd_buf(struct amdgpu_firmware_info *ucode,
  132. struct psp_gfx_cmd_resp *cmd)
  133. {
  134. int ret;
  135. uint64_t fw_mem_mc_addr = ucode->mc_addr;
  136. memset(cmd, 0, sizeof(struct psp_gfx_cmd_resp));
  137. cmd->cmd_id = GFX_CMD_ID_LOAD_IP_FW;
  138. cmd->cmd.cmd_load_ip_fw.fw_phy_addr_lo = lower_32_bits(fw_mem_mc_addr);
  139. cmd->cmd.cmd_load_ip_fw.fw_phy_addr_hi = upper_32_bits(fw_mem_mc_addr);
  140. cmd->cmd.cmd_load_ip_fw.fw_size = ucode->ucode_size;
  141. ret = psp_v10_0_get_fw_type(ucode, &cmd->cmd.cmd_load_ip_fw.fw_type);
  142. if (ret)
  143. DRM_ERROR("Unknown firmware type\n");
  144. return ret;
  145. }
  146. static int psp_v10_0_ring_init(struct psp_context *psp,
  147. enum psp_ring_type ring_type)
  148. {
  149. int ret = 0;
  150. struct psp_ring *ring;
  151. struct amdgpu_device *adev = psp->adev;
  152. ring = &psp->km_ring;
  153. ring->ring_type = ring_type;
  154. /* allocate 4k Page of Local Frame Buffer memory for ring */
  155. ring->ring_size = 0x1000;
  156. ret = amdgpu_bo_create_kernel(adev, ring->ring_size, PAGE_SIZE,
  157. AMDGPU_GEM_DOMAIN_VRAM,
  158. &adev->firmware.rbuf,
  159. &ring->ring_mem_mc_addr,
  160. (void **)&ring->ring_mem);
  161. if (ret) {
  162. ring->ring_size = 0;
  163. return ret;
  164. }
  165. return 0;
  166. }
  167. static int psp_v10_0_ring_create(struct psp_context *psp,
  168. enum psp_ring_type ring_type)
  169. {
  170. int ret = 0;
  171. unsigned int psp_ring_reg = 0;
  172. struct psp_ring *ring = &psp->km_ring;
  173. struct amdgpu_device *adev = psp->adev;
  174. /* Write low address of the ring to C2PMSG_69 */
  175. psp_ring_reg = lower_32_bits(ring->ring_mem_mc_addr);
  176. WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_69, psp_ring_reg);
  177. /* Write high address of the ring to C2PMSG_70 */
  178. psp_ring_reg = upper_32_bits(ring->ring_mem_mc_addr);
  179. WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_70, psp_ring_reg);
  180. /* Write size of ring to C2PMSG_71 */
  181. psp_ring_reg = ring->ring_size;
  182. WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_71, psp_ring_reg);
  183. /* Write the ring initialization command to C2PMSG_64 */
  184. psp_ring_reg = ring_type;
  185. psp_ring_reg = psp_ring_reg << 16;
  186. WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_64, psp_ring_reg);
  187. /* There might be handshake issue with hardware which needs delay */
  188. mdelay(20);
  189. /* Wait for response flag (bit 31) in C2PMSG_64 */
  190. ret = psp_wait_for(psp, SOC15_REG_OFFSET(MP0, 0, mmMP0_SMN_C2PMSG_64),
  191. 0x80000000, 0x8000FFFF, false);
  192. return ret;
  193. }
  194. static int psp_v10_0_ring_stop(struct psp_context *psp,
  195. enum psp_ring_type ring_type)
  196. {
  197. int ret = 0;
  198. struct psp_ring *ring;
  199. unsigned int psp_ring_reg = 0;
  200. struct amdgpu_device *adev = psp->adev;
  201. ring = &psp->km_ring;
  202. /* Write the ring destroy command to C2PMSG_64 */
  203. psp_ring_reg = 3 << 16;
  204. WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_64, psp_ring_reg);
  205. /* There might be handshake issue with hardware which needs delay */
  206. mdelay(20);
  207. /* Wait for response flag (bit 31) in C2PMSG_64 */
  208. ret = psp_wait_for(psp, SOC15_REG_OFFSET(MP0, 0, mmMP0_SMN_C2PMSG_64),
  209. 0x80000000, 0x80000000, false);
  210. return ret;
  211. }
  212. static int psp_v10_0_ring_destroy(struct psp_context *psp,
  213. enum psp_ring_type ring_type)
  214. {
  215. int ret = 0;
  216. struct psp_ring *ring = &psp->km_ring;
  217. struct amdgpu_device *adev = psp->adev;
  218. ret = psp_v10_0_ring_stop(psp, ring_type);
  219. if (ret)
  220. DRM_ERROR("Fail to stop psp ring\n");
  221. amdgpu_bo_free_kernel(&adev->firmware.rbuf,
  222. &ring->ring_mem_mc_addr,
  223. (void **)&ring->ring_mem);
  224. return ret;
  225. }
  226. static int psp_v10_0_cmd_submit(struct psp_context *psp,
  227. struct amdgpu_firmware_info *ucode,
  228. uint64_t cmd_buf_mc_addr, uint64_t fence_mc_addr,
  229. int index)
  230. {
  231. unsigned int psp_write_ptr_reg = 0;
  232. struct psp_gfx_rb_frame * write_frame = psp->km_ring.ring_mem;
  233. struct psp_ring *ring = &psp->km_ring;
  234. struct psp_gfx_rb_frame *ring_buffer_start = ring->ring_mem;
  235. struct psp_gfx_rb_frame *ring_buffer_end = ring_buffer_start +
  236. ring->ring_size / sizeof(struct psp_gfx_rb_frame) - 1;
  237. struct amdgpu_device *adev = psp->adev;
  238. uint32_t ring_size_dw = ring->ring_size / 4;
  239. uint32_t rb_frame_size_dw = sizeof(struct psp_gfx_rb_frame) / 4;
  240. /* KM (GPCOM) prepare write pointer */
  241. psp_write_ptr_reg = RREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_67);
  242. /* Update KM RB frame pointer to new frame */
  243. if ((psp_write_ptr_reg % ring_size_dw) == 0)
  244. write_frame = ring_buffer_start;
  245. else
  246. write_frame = ring_buffer_start + (psp_write_ptr_reg / rb_frame_size_dw);
  247. /* Check invalid write_frame ptr address */
  248. if ((write_frame < ring_buffer_start) || (ring_buffer_end < write_frame)) {
  249. DRM_ERROR("ring_buffer_start = %p; ring_buffer_end = %p; write_frame = %p\n",
  250. ring_buffer_start, ring_buffer_end, write_frame);
  251. DRM_ERROR("write_frame is pointing to address out of bounds\n");
  252. return -EINVAL;
  253. }
  254. /* Initialize KM RB frame */
  255. memset(write_frame, 0, sizeof(struct psp_gfx_rb_frame));
  256. /* Update KM RB frame */
  257. write_frame->cmd_buf_addr_hi = upper_32_bits(cmd_buf_mc_addr);
  258. write_frame->cmd_buf_addr_lo = lower_32_bits(cmd_buf_mc_addr);
  259. write_frame->fence_addr_hi = upper_32_bits(fence_mc_addr);
  260. write_frame->fence_addr_lo = lower_32_bits(fence_mc_addr);
  261. write_frame->fence_value = index;
  262. /* Update the write Pointer in DWORDs */
  263. psp_write_ptr_reg = (psp_write_ptr_reg + rb_frame_size_dw) % ring_size_dw;
  264. WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_67, psp_write_ptr_reg);
  265. return 0;
  266. }
  267. static int
  268. psp_v10_0_sram_map(struct amdgpu_device *adev,
  269. unsigned int *sram_offset, unsigned int *sram_addr_reg_offset,
  270. unsigned int *sram_data_reg_offset,
  271. enum AMDGPU_UCODE_ID ucode_id)
  272. {
  273. int ret = 0;
  274. switch(ucode_id) {
  275. /* TODO: needs to confirm */
  276. #if 0
  277. case AMDGPU_UCODE_ID_SMC:
  278. *sram_offset = 0;
  279. *sram_addr_reg_offset = 0;
  280. *sram_data_reg_offset = 0;
  281. break;
  282. #endif
  283. case AMDGPU_UCODE_ID_CP_CE:
  284. *sram_offset = 0x0;
  285. *sram_addr_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_CE_UCODE_ADDR);
  286. *sram_data_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_CE_UCODE_DATA);
  287. break;
  288. case AMDGPU_UCODE_ID_CP_PFP:
  289. *sram_offset = 0x0;
  290. *sram_addr_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_PFP_UCODE_ADDR);
  291. *sram_data_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_PFP_UCODE_DATA);
  292. break;
  293. case AMDGPU_UCODE_ID_CP_ME:
  294. *sram_offset = 0x0;
  295. *sram_addr_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_HYP_ME_UCODE_ADDR);
  296. *sram_data_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_HYP_ME_UCODE_DATA);
  297. break;
  298. case AMDGPU_UCODE_ID_CP_MEC1:
  299. *sram_offset = 0x10000;
  300. *sram_addr_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_MEC_ME1_UCODE_ADDR);
  301. *sram_data_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_MEC_ME1_UCODE_DATA);
  302. break;
  303. case AMDGPU_UCODE_ID_CP_MEC2:
  304. *sram_offset = 0x10000;
  305. *sram_addr_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_HYP_MEC2_UCODE_ADDR);
  306. *sram_data_reg_offset = SOC15_REG_OFFSET(GC, 0, mmCP_HYP_MEC2_UCODE_DATA);
  307. break;
  308. case AMDGPU_UCODE_ID_RLC_G:
  309. *sram_offset = 0x2000;
  310. *sram_addr_reg_offset = SOC15_REG_OFFSET(GC, 0, mmRLC_GPM_UCODE_ADDR);
  311. *sram_data_reg_offset = SOC15_REG_OFFSET(GC, 0, mmRLC_GPM_UCODE_DATA);
  312. break;
  313. case AMDGPU_UCODE_ID_SDMA0:
  314. *sram_offset = 0x0;
  315. *sram_addr_reg_offset = SOC15_REG_OFFSET(SDMA0, 0, mmSDMA0_UCODE_ADDR);
  316. *sram_data_reg_offset = SOC15_REG_OFFSET(SDMA0, 0, mmSDMA0_UCODE_DATA);
  317. break;
  318. /* TODO: needs to confirm */
  319. #if 0
  320. case AMDGPU_UCODE_ID_SDMA1:
  321. *sram_offset = ;
  322. *sram_addr_reg_offset = ;
  323. break;
  324. case AMDGPU_UCODE_ID_UVD:
  325. *sram_offset = ;
  326. *sram_addr_reg_offset = ;
  327. break;
  328. case AMDGPU_UCODE_ID_VCE:
  329. *sram_offset = ;
  330. *sram_addr_reg_offset = ;
  331. break;
  332. #endif
  333. case AMDGPU_UCODE_ID_MAXIMUM:
  334. default:
  335. ret = -EINVAL;
  336. break;
  337. }
  338. return ret;
  339. }
  340. static bool psp_v10_0_compare_sram_data(struct psp_context *psp,
  341. struct amdgpu_firmware_info *ucode,
  342. enum AMDGPU_UCODE_ID ucode_type)
  343. {
  344. int err = 0;
  345. unsigned int fw_sram_reg_val = 0;
  346. unsigned int fw_sram_addr_reg_offset = 0;
  347. unsigned int fw_sram_data_reg_offset = 0;
  348. unsigned int ucode_size;
  349. uint32_t *ucode_mem = NULL;
  350. struct amdgpu_device *adev = psp->adev;
  351. err = psp_v10_0_sram_map(adev, &fw_sram_reg_val, &fw_sram_addr_reg_offset,
  352. &fw_sram_data_reg_offset, ucode_type);
  353. if (err)
  354. return false;
  355. WREG32(fw_sram_addr_reg_offset, fw_sram_reg_val);
  356. ucode_size = ucode->ucode_size;
  357. ucode_mem = (uint32_t *)ucode->kaddr;
  358. while (!ucode_size) {
  359. fw_sram_reg_val = RREG32(fw_sram_data_reg_offset);
  360. if (*ucode_mem != fw_sram_reg_val)
  361. return false;
  362. ucode_mem++;
  363. /* 4 bytes */
  364. ucode_size -= 4;
  365. }
  366. return true;
  367. }
  368. static int psp_v10_0_mode1_reset(struct psp_context *psp)
  369. {
  370. DRM_INFO("psp mode 1 reset not supported now! \n");
  371. return -EINVAL;
  372. }
  373. static const struct psp_funcs psp_v10_0_funcs = {
  374. .init_microcode = psp_v10_0_init_microcode,
  375. .prep_cmd_buf = psp_v10_0_prep_cmd_buf,
  376. .ring_init = psp_v10_0_ring_init,
  377. .ring_create = psp_v10_0_ring_create,
  378. .ring_stop = psp_v10_0_ring_stop,
  379. .ring_destroy = psp_v10_0_ring_destroy,
  380. .cmd_submit = psp_v10_0_cmd_submit,
  381. .compare_sram_data = psp_v10_0_compare_sram_data,
  382. .mode1_reset = psp_v10_0_mode1_reset,
  383. };
  384. void psp_v10_0_set_psp_funcs(struct psp_context *psp)
  385. {
  386. psp->funcs = &psp_v10_0_funcs;
  387. }