amdgpu_ucode.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446
  1. /*
  2. * Copyright 2014 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include <linux/firmware.h>
  24. #include <linux/slab.h>
  25. #include <linux/module.h>
  26. #include <drm/drmP.h>
  27. #include "amdgpu.h"
  28. #include "amdgpu_ucode.h"
  29. static void amdgpu_ucode_print_common_hdr(const struct common_firmware_header *hdr)
  30. {
  31. DRM_DEBUG("size_bytes: %u\n", le32_to_cpu(hdr->size_bytes));
  32. DRM_DEBUG("header_size_bytes: %u\n", le32_to_cpu(hdr->header_size_bytes));
  33. DRM_DEBUG("header_version_major: %u\n", le16_to_cpu(hdr->header_version_major));
  34. DRM_DEBUG("header_version_minor: %u\n", le16_to_cpu(hdr->header_version_minor));
  35. DRM_DEBUG("ip_version_major: %u\n", le16_to_cpu(hdr->ip_version_major));
  36. DRM_DEBUG("ip_version_minor: %u\n", le16_to_cpu(hdr->ip_version_minor));
  37. DRM_DEBUG("ucode_version: 0x%08x\n", le32_to_cpu(hdr->ucode_version));
  38. DRM_DEBUG("ucode_size_bytes: %u\n", le32_to_cpu(hdr->ucode_size_bytes));
  39. DRM_DEBUG("ucode_array_offset_bytes: %u\n",
  40. le32_to_cpu(hdr->ucode_array_offset_bytes));
  41. DRM_DEBUG("crc32: 0x%08x\n", le32_to_cpu(hdr->crc32));
  42. }
  43. void amdgpu_ucode_print_mc_hdr(const struct common_firmware_header *hdr)
  44. {
  45. uint16_t version_major = le16_to_cpu(hdr->header_version_major);
  46. uint16_t version_minor = le16_to_cpu(hdr->header_version_minor);
  47. DRM_DEBUG("MC\n");
  48. amdgpu_ucode_print_common_hdr(hdr);
  49. if (version_major == 1) {
  50. const struct mc_firmware_header_v1_0 *mc_hdr =
  51. container_of(hdr, struct mc_firmware_header_v1_0, header);
  52. DRM_DEBUG("io_debug_size_bytes: %u\n",
  53. le32_to_cpu(mc_hdr->io_debug_size_bytes));
  54. DRM_DEBUG("io_debug_array_offset_bytes: %u\n",
  55. le32_to_cpu(mc_hdr->io_debug_array_offset_bytes));
  56. } else {
  57. DRM_ERROR("Unknown MC ucode version: %u.%u\n", version_major, version_minor);
  58. }
  59. }
  60. void amdgpu_ucode_print_smc_hdr(const struct common_firmware_header *hdr)
  61. {
  62. uint16_t version_major = le16_to_cpu(hdr->header_version_major);
  63. uint16_t version_minor = le16_to_cpu(hdr->header_version_minor);
  64. DRM_DEBUG("SMC\n");
  65. amdgpu_ucode_print_common_hdr(hdr);
  66. if (version_major == 1) {
  67. const struct smc_firmware_header_v1_0 *smc_hdr =
  68. container_of(hdr, struct smc_firmware_header_v1_0, header);
  69. DRM_DEBUG("ucode_start_addr: %u\n", le32_to_cpu(smc_hdr->ucode_start_addr));
  70. } else {
  71. DRM_ERROR("Unknown SMC ucode version: %u.%u\n", version_major, version_minor);
  72. }
  73. }
  74. void amdgpu_ucode_print_gfx_hdr(const struct common_firmware_header *hdr)
  75. {
  76. uint16_t version_major = le16_to_cpu(hdr->header_version_major);
  77. uint16_t version_minor = le16_to_cpu(hdr->header_version_minor);
  78. DRM_DEBUG("GFX\n");
  79. amdgpu_ucode_print_common_hdr(hdr);
  80. if (version_major == 1) {
  81. const struct gfx_firmware_header_v1_0 *gfx_hdr =
  82. container_of(hdr, struct gfx_firmware_header_v1_0, header);
  83. DRM_DEBUG("ucode_feature_version: %u\n",
  84. le32_to_cpu(gfx_hdr->ucode_feature_version));
  85. DRM_DEBUG("jt_offset: %u\n", le32_to_cpu(gfx_hdr->jt_offset));
  86. DRM_DEBUG("jt_size: %u\n", le32_to_cpu(gfx_hdr->jt_size));
  87. } else {
  88. DRM_ERROR("Unknown GFX ucode version: %u.%u\n", version_major, version_minor);
  89. }
  90. }
  91. void amdgpu_ucode_print_rlc_hdr(const struct common_firmware_header *hdr)
  92. {
  93. uint16_t version_major = le16_to_cpu(hdr->header_version_major);
  94. uint16_t version_minor = le16_to_cpu(hdr->header_version_minor);
  95. DRM_DEBUG("RLC\n");
  96. amdgpu_ucode_print_common_hdr(hdr);
  97. if (version_major == 1) {
  98. const struct rlc_firmware_header_v1_0 *rlc_hdr =
  99. container_of(hdr, struct rlc_firmware_header_v1_0, header);
  100. DRM_DEBUG("ucode_feature_version: %u\n",
  101. le32_to_cpu(rlc_hdr->ucode_feature_version));
  102. DRM_DEBUG("save_and_restore_offset: %u\n",
  103. le32_to_cpu(rlc_hdr->save_and_restore_offset));
  104. DRM_DEBUG("clear_state_descriptor_offset: %u\n",
  105. le32_to_cpu(rlc_hdr->clear_state_descriptor_offset));
  106. DRM_DEBUG("avail_scratch_ram_locations: %u\n",
  107. le32_to_cpu(rlc_hdr->avail_scratch_ram_locations));
  108. DRM_DEBUG("master_pkt_description_offset: %u\n",
  109. le32_to_cpu(rlc_hdr->master_pkt_description_offset));
  110. } else if (version_major == 2) {
  111. const struct rlc_firmware_header_v2_0 *rlc_hdr =
  112. container_of(hdr, struct rlc_firmware_header_v2_0, header);
  113. DRM_DEBUG("ucode_feature_version: %u\n",
  114. le32_to_cpu(rlc_hdr->ucode_feature_version));
  115. DRM_DEBUG("jt_offset: %u\n", le32_to_cpu(rlc_hdr->jt_offset));
  116. DRM_DEBUG("jt_size: %u\n", le32_to_cpu(rlc_hdr->jt_size));
  117. DRM_DEBUG("save_and_restore_offset: %u\n",
  118. le32_to_cpu(rlc_hdr->save_and_restore_offset));
  119. DRM_DEBUG("clear_state_descriptor_offset: %u\n",
  120. le32_to_cpu(rlc_hdr->clear_state_descriptor_offset));
  121. DRM_DEBUG("avail_scratch_ram_locations: %u\n",
  122. le32_to_cpu(rlc_hdr->avail_scratch_ram_locations));
  123. DRM_DEBUG("reg_restore_list_size: %u\n",
  124. le32_to_cpu(rlc_hdr->reg_restore_list_size));
  125. DRM_DEBUG("reg_list_format_start: %u\n",
  126. le32_to_cpu(rlc_hdr->reg_list_format_start));
  127. DRM_DEBUG("reg_list_format_separate_start: %u\n",
  128. le32_to_cpu(rlc_hdr->reg_list_format_separate_start));
  129. DRM_DEBUG("starting_offsets_start: %u\n",
  130. le32_to_cpu(rlc_hdr->starting_offsets_start));
  131. DRM_DEBUG("reg_list_format_size_bytes: %u\n",
  132. le32_to_cpu(rlc_hdr->reg_list_format_size_bytes));
  133. DRM_DEBUG("reg_list_format_array_offset_bytes: %u\n",
  134. le32_to_cpu(rlc_hdr->reg_list_format_array_offset_bytes));
  135. DRM_DEBUG("reg_list_size_bytes: %u\n",
  136. le32_to_cpu(rlc_hdr->reg_list_size_bytes));
  137. DRM_DEBUG("reg_list_array_offset_bytes: %u\n",
  138. le32_to_cpu(rlc_hdr->reg_list_array_offset_bytes));
  139. DRM_DEBUG("reg_list_format_separate_size_bytes: %u\n",
  140. le32_to_cpu(rlc_hdr->reg_list_format_separate_size_bytes));
  141. DRM_DEBUG("reg_list_format_separate_array_offset_bytes: %u\n",
  142. le32_to_cpu(rlc_hdr->reg_list_format_separate_array_offset_bytes));
  143. DRM_DEBUG("reg_list_separate_size_bytes: %u\n",
  144. le32_to_cpu(rlc_hdr->reg_list_separate_size_bytes));
  145. DRM_DEBUG("reg_list_separate_size_bytes: %u\n",
  146. le32_to_cpu(rlc_hdr->reg_list_separate_size_bytes));
  147. } else {
  148. DRM_ERROR("Unknown RLC ucode version: %u.%u\n", version_major, version_minor);
  149. }
  150. }
  151. void amdgpu_ucode_print_sdma_hdr(const struct common_firmware_header *hdr)
  152. {
  153. uint16_t version_major = le16_to_cpu(hdr->header_version_major);
  154. uint16_t version_minor = le16_to_cpu(hdr->header_version_minor);
  155. DRM_DEBUG("SDMA\n");
  156. amdgpu_ucode_print_common_hdr(hdr);
  157. if (version_major == 1) {
  158. const struct sdma_firmware_header_v1_0 *sdma_hdr =
  159. container_of(hdr, struct sdma_firmware_header_v1_0, header);
  160. DRM_DEBUG("ucode_feature_version: %u\n",
  161. le32_to_cpu(sdma_hdr->ucode_feature_version));
  162. DRM_DEBUG("ucode_change_version: %u\n",
  163. le32_to_cpu(sdma_hdr->ucode_change_version));
  164. DRM_DEBUG("jt_offset: %u\n", le32_to_cpu(sdma_hdr->jt_offset));
  165. DRM_DEBUG("jt_size: %u\n", le32_to_cpu(sdma_hdr->jt_size));
  166. if (version_minor >= 1) {
  167. const struct sdma_firmware_header_v1_1 *sdma_v1_1_hdr =
  168. container_of(sdma_hdr, struct sdma_firmware_header_v1_1, v1_0);
  169. DRM_DEBUG("digest_size: %u\n", le32_to_cpu(sdma_v1_1_hdr->digest_size));
  170. }
  171. } else {
  172. DRM_ERROR("Unknown SDMA ucode version: %u.%u\n",
  173. version_major, version_minor);
  174. }
  175. }
  176. void amdgpu_ucode_print_gpu_info_hdr(const struct common_firmware_header *hdr)
  177. {
  178. uint16_t version_major = le16_to_cpu(hdr->header_version_major);
  179. uint16_t version_minor = le16_to_cpu(hdr->header_version_minor);
  180. DRM_DEBUG("GPU_INFO\n");
  181. amdgpu_ucode_print_common_hdr(hdr);
  182. if (version_major == 1) {
  183. const struct gpu_info_firmware_header_v1_0 *gpu_info_hdr =
  184. container_of(hdr, struct gpu_info_firmware_header_v1_0, header);
  185. DRM_DEBUG("version_major: %u\n",
  186. le16_to_cpu(gpu_info_hdr->version_major));
  187. DRM_DEBUG("version_minor: %u\n",
  188. le16_to_cpu(gpu_info_hdr->version_minor));
  189. } else {
  190. DRM_ERROR("Unknown gpu_info ucode version: %u.%u\n", version_major, version_minor);
  191. }
  192. }
  193. int amdgpu_ucode_validate(const struct firmware *fw)
  194. {
  195. const struct common_firmware_header *hdr =
  196. (const struct common_firmware_header *)fw->data;
  197. if (fw->size == le32_to_cpu(hdr->size_bytes))
  198. return 0;
  199. return -EINVAL;
  200. }
  201. bool amdgpu_ucode_hdr_version(union amdgpu_firmware_header *hdr,
  202. uint16_t hdr_major, uint16_t hdr_minor)
  203. {
  204. if ((hdr->common.header_version_major == hdr_major) &&
  205. (hdr->common.header_version_minor == hdr_minor))
  206. return false;
  207. return true;
  208. }
  209. enum amdgpu_firmware_load_type
  210. amdgpu_ucode_get_load_type(struct amdgpu_device *adev, int load_type)
  211. {
  212. switch (adev->asic_type) {
  213. #ifdef CONFIG_DRM_AMDGPU_SI
  214. case CHIP_TAHITI:
  215. case CHIP_PITCAIRN:
  216. case CHIP_VERDE:
  217. case CHIP_OLAND:
  218. return AMDGPU_FW_LOAD_DIRECT;
  219. #endif
  220. #ifdef CONFIG_DRM_AMDGPU_CIK
  221. case CHIP_BONAIRE:
  222. case CHIP_KAVERI:
  223. case CHIP_KABINI:
  224. case CHIP_HAWAII:
  225. case CHIP_MULLINS:
  226. return AMDGPU_FW_LOAD_DIRECT;
  227. #endif
  228. case CHIP_TOPAZ:
  229. case CHIP_TONGA:
  230. case CHIP_FIJI:
  231. case CHIP_CARRIZO:
  232. case CHIP_STONEY:
  233. case CHIP_POLARIS10:
  234. case CHIP_POLARIS11:
  235. case CHIP_POLARIS12:
  236. if (!load_type)
  237. return AMDGPU_FW_LOAD_DIRECT;
  238. else
  239. return AMDGPU_FW_LOAD_SMU;
  240. case CHIP_VEGA10:
  241. case CHIP_RAVEN:
  242. if (!load_type)
  243. return AMDGPU_FW_LOAD_DIRECT;
  244. else
  245. return AMDGPU_FW_LOAD_PSP;
  246. default:
  247. DRM_ERROR("Unknown firmware load type\n");
  248. }
  249. return AMDGPU_FW_LOAD_DIRECT;
  250. }
  251. static int amdgpu_ucode_init_single_fw(struct amdgpu_device *adev,
  252. struct amdgpu_firmware_info *ucode,
  253. uint64_t mc_addr, void *kptr)
  254. {
  255. const struct common_firmware_header *header = NULL;
  256. const struct gfx_firmware_header_v1_0 *cp_hdr = NULL;
  257. if (NULL == ucode->fw)
  258. return 0;
  259. ucode->mc_addr = mc_addr;
  260. ucode->kaddr = kptr;
  261. if (ucode->ucode_id == AMDGPU_UCODE_ID_STORAGE)
  262. return 0;
  263. header = (const struct common_firmware_header *)ucode->fw->data;
  264. cp_hdr = (const struct gfx_firmware_header_v1_0 *)ucode->fw->data;
  265. if (adev->firmware.load_type != AMDGPU_FW_LOAD_PSP ||
  266. (ucode->ucode_id != AMDGPU_UCODE_ID_CP_MEC1 &&
  267. ucode->ucode_id != AMDGPU_UCODE_ID_CP_MEC2 &&
  268. ucode->ucode_id != AMDGPU_UCODE_ID_CP_MEC1_JT &&
  269. ucode->ucode_id != AMDGPU_UCODE_ID_CP_MEC2_JT)) {
  270. ucode->ucode_size = le32_to_cpu(header->ucode_size_bytes);
  271. memcpy(ucode->kaddr, (void *)((uint8_t *)ucode->fw->data +
  272. le32_to_cpu(header->ucode_array_offset_bytes)),
  273. ucode->ucode_size);
  274. } else if (ucode->ucode_id == AMDGPU_UCODE_ID_CP_MEC1 ||
  275. ucode->ucode_id == AMDGPU_UCODE_ID_CP_MEC2) {
  276. ucode->ucode_size = le32_to_cpu(header->ucode_size_bytes) -
  277. le32_to_cpu(cp_hdr->jt_size) * 4;
  278. memcpy(ucode->kaddr, (void *)((uint8_t *)ucode->fw->data +
  279. le32_to_cpu(header->ucode_array_offset_bytes)),
  280. ucode->ucode_size);
  281. } else if (ucode->ucode_id == AMDGPU_UCODE_ID_CP_MEC1_JT ||
  282. ucode->ucode_id == AMDGPU_UCODE_ID_CP_MEC2_JT) {
  283. ucode->ucode_size = le32_to_cpu(cp_hdr->jt_size) * 4;
  284. memcpy(ucode->kaddr, (void *)((uint8_t *)ucode->fw->data +
  285. le32_to_cpu(header->ucode_array_offset_bytes) +
  286. le32_to_cpu(cp_hdr->jt_offset) * 4),
  287. ucode->ucode_size);
  288. }
  289. return 0;
  290. }
  291. static int amdgpu_ucode_patch_jt(struct amdgpu_firmware_info *ucode,
  292. uint64_t mc_addr, void *kptr)
  293. {
  294. const struct gfx_firmware_header_v1_0 *header = NULL;
  295. const struct common_firmware_header *comm_hdr = NULL;
  296. uint8_t* src_addr = NULL;
  297. uint8_t* dst_addr = NULL;
  298. if (NULL == ucode->fw)
  299. return 0;
  300. comm_hdr = (const struct common_firmware_header *)ucode->fw->data;
  301. header = (const struct gfx_firmware_header_v1_0 *)ucode->fw->data;
  302. dst_addr = ucode->kaddr +
  303. ALIGN(le32_to_cpu(comm_hdr->ucode_size_bytes),
  304. PAGE_SIZE);
  305. src_addr = (uint8_t *)ucode->fw->data +
  306. le32_to_cpu(comm_hdr->ucode_array_offset_bytes) +
  307. (le32_to_cpu(header->jt_offset) * 4);
  308. memcpy(dst_addr, src_addr, le32_to_cpu(header->jt_size) * 4);
  309. return 0;
  310. }
  311. int amdgpu_ucode_init_bo(struct amdgpu_device *adev)
  312. {
  313. uint64_t fw_offset = 0;
  314. int i, err;
  315. struct amdgpu_firmware_info *ucode = NULL;
  316. const struct common_firmware_header *header = NULL;
  317. if (!adev->firmware.fw_size) {
  318. dev_warn(adev->dev, "No ip firmware need to load\n");
  319. return 0;
  320. }
  321. if (!adev->in_gpu_reset) {
  322. err = amdgpu_bo_create_kernel(adev, adev->firmware.fw_size, PAGE_SIZE,
  323. amdgpu_sriov_vf(adev) ? AMDGPU_GEM_DOMAIN_VRAM : AMDGPU_GEM_DOMAIN_GTT,
  324. &adev->firmware.fw_buf,
  325. &adev->firmware.fw_buf_mc,
  326. &adev->firmware.fw_buf_ptr);
  327. if (err) {
  328. dev_err(adev->dev, "failed to create kernel buffer for firmware.fw_buf\n");
  329. goto failed;
  330. }
  331. }
  332. memset(adev->firmware.fw_buf_ptr, 0, adev->firmware.fw_size);
  333. /*
  334. * if SMU loaded firmware, it needn't add SMC, UVD, and VCE
  335. * ucode info here
  336. */
  337. if (adev->firmware.load_type != AMDGPU_FW_LOAD_PSP) {
  338. if (amdgpu_sriov_vf(adev))
  339. adev->firmware.max_ucodes = AMDGPU_UCODE_ID_MAXIMUM - 3;
  340. else
  341. adev->firmware.max_ucodes = AMDGPU_UCODE_ID_MAXIMUM - 4;
  342. } else {
  343. adev->firmware.max_ucodes = AMDGPU_UCODE_ID_MAXIMUM;
  344. }
  345. for (i = 0; i < adev->firmware.max_ucodes; i++) {
  346. ucode = &adev->firmware.ucode[i];
  347. if (ucode->fw) {
  348. header = (const struct common_firmware_header *)ucode->fw->data;
  349. amdgpu_ucode_init_single_fw(adev, ucode, adev->firmware.fw_buf_mc + fw_offset,
  350. adev->firmware.fw_buf_ptr + fw_offset);
  351. if (i == AMDGPU_UCODE_ID_CP_MEC1 &&
  352. adev->firmware.load_type != AMDGPU_FW_LOAD_PSP) {
  353. const struct gfx_firmware_header_v1_0 *cp_hdr;
  354. cp_hdr = (const struct gfx_firmware_header_v1_0 *)ucode->fw->data;
  355. amdgpu_ucode_patch_jt(ucode, adev->firmware.fw_buf_mc + fw_offset,
  356. adev->firmware.fw_buf_ptr + fw_offset);
  357. fw_offset += ALIGN(le32_to_cpu(cp_hdr->jt_size) << 2, PAGE_SIZE);
  358. }
  359. fw_offset += ALIGN(ucode->ucode_size, PAGE_SIZE);
  360. }
  361. }
  362. return 0;
  363. failed:
  364. if (err)
  365. adev->firmware.load_type = AMDGPU_FW_LOAD_DIRECT;
  366. return err;
  367. }
  368. int amdgpu_ucode_fini_bo(struct amdgpu_device *adev)
  369. {
  370. int i;
  371. struct amdgpu_firmware_info *ucode = NULL;
  372. if (!adev->firmware.fw_size)
  373. return 0;
  374. for (i = 0; i < adev->firmware.max_ucodes; i++) {
  375. ucode = &adev->firmware.ucode[i];
  376. if (ucode->fw) {
  377. ucode->mc_addr = 0;
  378. ucode->kaddr = NULL;
  379. }
  380. }
  381. amdgpu_bo_free_kernel(&adev->firmware.fw_buf,
  382. &adev->firmware.fw_buf_mc,
  383. &adev->firmware.fw_buf_ptr);
  384. return 0;
  385. }