gmc_v6_0.c 31 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168
  1. /*
  2. * Copyright 2014 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include <linux/firmware.h>
  24. #include <drm/drmP.h>
  25. #include "amdgpu.h"
  26. #include "gmc_v6_0.h"
  27. #include "amdgpu_ucode.h"
  28. #include "bif/bif_3_0_d.h"
  29. #include "bif/bif_3_0_sh_mask.h"
  30. #include "oss/oss_1_0_d.h"
  31. #include "oss/oss_1_0_sh_mask.h"
  32. #include "gmc/gmc_6_0_d.h"
  33. #include "gmc/gmc_6_0_sh_mask.h"
  34. #include "dce/dce_6_0_d.h"
  35. #include "dce/dce_6_0_sh_mask.h"
  36. #include "si_enums.h"
  37. static void gmc_v6_0_set_gart_funcs(struct amdgpu_device *adev);
  38. static void gmc_v6_0_set_irq_funcs(struct amdgpu_device *adev);
  39. static int gmc_v6_0_wait_for_idle(void *handle);
  40. MODULE_FIRMWARE("radeon/tahiti_mc.bin");
  41. MODULE_FIRMWARE("radeon/pitcairn_mc.bin");
  42. MODULE_FIRMWARE("radeon/verde_mc.bin");
  43. MODULE_FIRMWARE("radeon/oland_mc.bin");
  44. MODULE_FIRMWARE("radeon/si58_mc.bin");
  45. #define MC_SEQ_MISC0__MT__MASK 0xf0000000
  46. #define MC_SEQ_MISC0__MT__GDDR1 0x10000000
  47. #define MC_SEQ_MISC0__MT__DDR2 0x20000000
  48. #define MC_SEQ_MISC0__MT__GDDR3 0x30000000
  49. #define MC_SEQ_MISC0__MT__GDDR4 0x40000000
  50. #define MC_SEQ_MISC0__MT__GDDR5 0x50000000
  51. #define MC_SEQ_MISC0__MT__HBM 0x60000000
  52. #define MC_SEQ_MISC0__MT__DDR3 0xB0000000
  53. static const u32 crtc_offsets[6] =
  54. {
  55. SI_CRTC0_REGISTER_OFFSET,
  56. SI_CRTC1_REGISTER_OFFSET,
  57. SI_CRTC2_REGISTER_OFFSET,
  58. SI_CRTC3_REGISTER_OFFSET,
  59. SI_CRTC4_REGISTER_OFFSET,
  60. SI_CRTC5_REGISTER_OFFSET
  61. };
  62. static void gmc_v6_0_mc_stop(struct amdgpu_device *adev)
  63. {
  64. u32 blackout;
  65. gmc_v6_0_wait_for_idle((void *)adev);
  66. blackout = RREG32(mmMC_SHARED_BLACKOUT_CNTL);
  67. if (REG_GET_FIELD(blackout, MC_SHARED_BLACKOUT_CNTL, BLACKOUT_MODE) != 1) {
  68. /* Block CPU access */
  69. WREG32(mmBIF_FB_EN, 0);
  70. /* blackout the MC */
  71. blackout = REG_SET_FIELD(blackout,
  72. MC_SHARED_BLACKOUT_CNTL, BLACKOUT_MODE, 0);
  73. WREG32(mmMC_SHARED_BLACKOUT_CNTL, blackout | 1);
  74. }
  75. /* wait for the MC to settle */
  76. udelay(100);
  77. }
  78. static void gmc_v6_0_mc_resume(struct amdgpu_device *adev)
  79. {
  80. u32 tmp;
  81. /* unblackout the MC */
  82. tmp = RREG32(mmMC_SHARED_BLACKOUT_CNTL);
  83. tmp = REG_SET_FIELD(tmp, MC_SHARED_BLACKOUT_CNTL, BLACKOUT_MODE, 0);
  84. WREG32(mmMC_SHARED_BLACKOUT_CNTL, tmp);
  85. /* allow CPU access */
  86. tmp = REG_SET_FIELD(0, BIF_FB_EN, FB_READ_EN, 1);
  87. tmp = REG_SET_FIELD(tmp, BIF_FB_EN, FB_WRITE_EN, 1);
  88. WREG32(mmBIF_FB_EN, tmp);
  89. }
  90. static int gmc_v6_0_init_microcode(struct amdgpu_device *adev)
  91. {
  92. const char *chip_name;
  93. char fw_name[30];
  94. int err;
  95. bool is_58_fw = false;
  96. DRM_DEBUG("\n");
  97. switch (adev->asic_type) {
  98. case CHIP_TAHITI:
  99. chip_name = "tahiti";
  100. break;
  101. case CHIP_PITCAIRN:
  102. chip_name = "pitcairn";
  103. break;
  104. case CHIP_VERDE:
  105. chip_name = "verde";
  106. break;
  107. case CHIP_OLAND:
  108. chip_name = "oland";
  109. break;
  110. case CHIP_HAINAN:
  111. chip_name = "hainan";
  112. break;
  113. default: BUG();
  114. }
  115. /* this memory configuration requires special firmware */
  116. if (((RREG32(mmMC_SEQ_MISC0) & 0xff000000) >> 24) == 0x58)
  117. is_58_fw = true;
  118. if (is_58_fw)
  119. snprintf(fw_name, sizeof(fw_name), "radeon/si58_mc.bin");
  120. else
  121. snprintf(fw_name, sizeof(fw_name), "radeon/%s_mc.bin", chip_name);
  122. err = request_firmware(&adev->mc.fw, fw_name, adev->dev);
  123. if (err)
  124. goto out;
  125. err = amdgpu_ucode_validate(adev->mc.fw);
  126. out:
  127. if (err) {
  128. dev_err(adev->dev,
  129. "si_mc: Failed to load firmware \"%s\"\n",
  130. fw_name);
  131. release_firmware(adev->mc.fw);
  132. adev->mc.fw = NULL;
  133. }
  134. return err;
  135. }
  136. static int gmc_v6_0_mc_load_microcode(struct amdgpu_device *adev)
  137. {
  138. const __le32 *new_fw_data = NULL;
  139. u32 running;
  140. const __le32 *new_io_mc_regs = NULL;
  141. int i, regs_size, ucode_size;
  142. const struct mc_firmware_header_v1_0 *hdr;
  143. if (!adev->mc.fw)
  144. return -EINVAL;
  145. hdr = (const struct mc_firmware_header_v1_0 *)adev->mc.fw->data;
  146. amdgpu_ucode_print_mc_hdr(&hdr->header);
  147. adev->mc.fw_version = le32_to_cpu(hdr->header.ucode_version);
  148. regs_size = le32_to_cpu(hdr->io_debug_size_bytes) / (4 * 2);
  149. new_io_mc_regs = (const __le32 *)
  150. (adev->mc.fw->data + le32_to_cpu(hdr->io_debug_array_offset_bytes));
  151. ucode_size = le32_to_cpu(hdr->header.ucode_size_bytes) / 4;
  152. new_fw_data = (const __le32 *)
  153. (adev->mc.fw->data + le32_to_cpu(hdr->header.ucode_array_offset_bytes));
  154. running = RREG32(mmMC_SEQ_SUP_CNTL) & MC_SEQ_SUP_CNTL__RUN_MASK;
  155. if (running == 0) {
  156. /* reset the engine and set to writable */
  157. WREG32(mmMC_SEQ_SUP_CNTL, 0x00000008);
  158. WREG32(mmMC_SEQ_SUP_CNTL, 0x00000010);
  159. /* load mc io regs */
  160. for (i = 0; i < regs_size; i++) {
  161. WREG32(mmMC_SEQ_IO_DEBUG_INDEX, le32_to_cpup(new_io_mc_regs++));
  162. WREG32(mmMC_SEQ_IO_DEBUG_DATA, le32_to_cpup(new_io_mc_regs++));
  163. }
  164. /* load the MC ucode */
  165. for (i = 0; i < ucode_size; i++) {
  166. WREG32(mmMC_SEQ_SUP_PGM, le32_to_cpup(new_fw_data++));
  167. }
  168. /* put the engine back into the active state */
  169. WREG32(mmMC_SEQ_SUP_CNTL, 0x00000008);
  170. WREG32(mmMC_SEQ_SUP_CNTL, 0x00000004);
  171. WREG32(mmMC_SEQ_SUP_CNTL, 0x00000001);
  172. /* wait for training to complete */
  173. for (i = 0; i < adev->usec_timeout; i++) {
  174. if (RREG32(mmMC_SEQ_TRAIN_WAKEUP_CNTL) & MC_SEQ_TRAIN_WAKEUP_CNTL__TRAIN_DONE_D0_MASK)
  175. break;
  176. udelay(1);
  177. }
  178. for (i = 0; i < adev->usec_timeout; i++) {
  179. if (RREG32(mmMC_SEQ_TRAIN_WAKEUP_CNTL) & MC_SEQ_TRAIN_WAKEUP_CNTL__TRAIN_DONE_D1_MASK)
  180. break;
  181. udelay(1);
  182. }
  183. }
  184. return 0;
  185. }
  186. static void gmc_v6_0_vram_gtt_location(struct amdgpu_device *adev,
  187. struct amdgpu_mc *mc)
  188. {
  189. u64 base = RREG32(mmMC_VM_FB_LOCATION) & 0xFFFF;
  190. base <<= 24;
  191. if (mc->mc_vram_size > 0xFFC0000000ULL) {
  192. dev_warn(adev->dev, "limiting VRAM\n");
  193. mc->real_vram_size = 0xFFC0000000ULL;
  194. mc->mc_vram_size = 0xFFC0000000ULL;
  195. }
  196. amdgpu_vram_location(adev, &adev->mc, base);
  197. amdgpu_gart_location(adev, mc);
  198. }
  199. static void gmc_v6_0_mc_program(struct amdgpu_device *adev)
  200. {
  201. int i, j;
  202. /* Initialize HDP */
  203. for (i = 0, j = 0; i < 32; i++, j += 0x6) {
  204. WREG32((0xb05 + j), 0x00000000);
  205. WREG32((0xb06 + j), 0x00000000);
  206. WREG32((0xb07 + j), 0x00000000);
  207. WREG32((0xb08 + j), 0x00000000);
  208. WREG32((0xb09 + j), 0x00000000);
  209. }
  210. WREG32(mmHDP_REG_COHERENCY_FLUSH_CNTL, 0);
  211. if (gmc_v6_0_wait_for_idle((void *)adev)) {
  212. dev_warn(adev->dev, "Wait for MC idle timedout !\n");
  213. }
  214. if (adev->mode_info.num_crtc) {
  215. u32 tmp;
  216. /* Lockout access through VGA aperture*/
  217. tmp = RREG32(mmVGA_HDP_CONTROL);
  218. tmp |= VGA_HDP_CONTROL__VGA_MEMORY_DISABLE_MASK;
  219. WREG32(mmVGA_HDP_CONTROL, tmp);
  220. /* disable VGA render */
  221. tmp = RREG32(mmVGA_RENDER_CONTROL);
  222. tmp &= ~VGA_VSTATUS_CNTL;
  223. WREG32(mmVGA_RENDER_CONTROL, tmp);
  224. }
  225. /* Update configuration */
  226. WREG32(mmMC_VM_SYSTEM_APERTURE_LOW_ADDR,
  227. adev->mc.vram_start >> 12);
  228. WREG32(mmMC_VM_SYSTEM_APERTURE_HIGH_ADDR,
  229. adev->mc.vram_end >> 12);
  230. WREG32(mmMC_VM_SYSTEM_APERTURE_DEFAULT_ADDR,
  231. adev->vram_scratch.gpu_addr >> 12);
  232. WREG32(mmMC_VM_AGP_BASE, 0);
  233. WREG32(mmMC_VM_AGP_TOP, 0x0FFFFFFF);
  234. WREG32(mmMC_VM_AGP_BOT, 0x0FFFFFFF);
  235. if (gmc_v6_0_wait_for_idle((void *)adev)) {
  236. dev_warn(adev->dev, "Wait for MC idle timedout !\n");
  237. }
  238. }
  239. static int gmc_v6_0_mc_init(struct amdgpu_device *adev)
  240. {
  241. u32 tmp;
  242. int chansize, numchan;
  243. int r;
  244. tmp = RREG32(mmMC_ARB_RAMCFG);
  245. if (tmp & (1 << 11)) {
  246. chansize = 16;
  247. } else if (tmp & MC_ARB_RAMCFG__CHANSIZE_MASK) {
  248. chansize = 64;
  249. } else {
  250. chansize = 32;
  251. }
  252. tmp = RREG32(mmMC_SHARED_CHMAP);
  253. switch ((tmp & MC_SHARED_CHMAP__NOOFCHAN_MASK) >> MC_SHARED_CHMAP__NOOFCHAN__SHIFT) {
  254. case 0:
  255. default:
  256. numchan = 1;
  257. break;
  258. case 1:
  259. numchan = 2;
  260. break;
  261. case 2:
  262. numchan = 4;
  263. break;
  264. case 3:
  265. numchan = 8;
  266. break;
  267. case 4:
  268. numchan = 3;
  269. break;
  270. case 5:
  271. numchan = 6;
  272. break;
  273. case 6:
  274. numchan = 10;
  275. break;
  276. case 7:
  277. numchan = 12;
  278. break;
  279. case 8:
  280. numchan = 16;
  281. break;
  282. }
  283. adev->mc.vram_width = numchan * chansize;
  284. /* size in MB on si */
  285. adev->mc.mc_vram_size = RREG32(mmCONFIG_MEMSIZE) * 1024ULL * 1024ULL;
  286. adev->mc.real_vram_size = RREG32(mmCONFIG_MEMSIZE) * 1024ULL * 1024ULL;
  287. if (!(adev->flags & AMD_IS_APU)) {
  288. r = amdgpu_device_resize_fb_bar(adev);
  289. if (r)
  290. return r;
  291. }
  292. adev->mc.aper_base = pci_resource_start(adev->pdev, 0);
  293. adev->mc.aper_size = pci_resource_len(adev->pdev, 0);
  294. adev->mc.visible_vram_size = adev->mc.aper_size;
  295. /* set the gart size */
  296. if (amdgpu_gart_size == -1) {
  297. switch (adev->asic_type) {
  298. case CHIP_HAINAN: /* no MM engines */
  299. default:
  300. adev->mc.gart_size = 256ULL << 20;
  301. break;
  302. case CHIP_VERDE: /* UVD, VCE do not support GPUVM */
  303. case CHIP_TAHITI: /* UVD, VCE do not support GPUVM */
  304. case CHIP_PITCAIRN: /* UVD, VCE do not support GPUVM */
  305. case CHIP_OLAND: /* UVD, VCE do not support GPUVM */
  306. adev->mc.gart_size = 1024ULL << 20;
  307. break;
  308. }
  309. } else {
  310. adev->mc.gart_size = (u64)amdgpu_gart_size << 20;
  311. }
  312. gmc_v6_0_vram_gtt_location(adev, &adev->mc);
  313. return 0;
  314. }
  315. static void gmc_v6_0_gart_flush_gpu_tlb(struct amdgpu_device *adev,
  316. uint32_t vmid)
  317. {
  318. WREG32(mmHDP_MEM_COHERENCY_FLUSH_CNTL, 0);
  319. WREG32(mmVM_INVALIDATE_REQUEST, 1 << vmid);
  320. }
  321. static int gmc_v6_0_gart_set_pte_pde(struct amdgpu_device *adev,
  322. void *cpu_pt_addr,
  323. uint32_t gpu_page_idx,
  324. uint64_t addr,
  325. uint64_t flags)
  326. {
  327. void __iomem *ptr = (void *)cpu_pt_addr;
  328. uint64_t value;
  329. value = addr & 0xFFFFFFFFFFFFF000ULL;
  330. value |= flags;
  331. writeq(value, ptr + (gpu_page_idx * 8));
  332. return 0;
  333. }
  334. static uint64_t gmc_v6_0_get_vm_pte_flags(struct amdgpu_device *adev,
  335. uint32_t flags)
  336. {
  337. uint64_t pte_flag = 0;
  338. if (flags & AMDGPU_VM_PAGE_READABLE)
  339. pte_flag |= AMDGPU_PTE_READABLE;
  340. if (flags & AMDGPU_VM_PAGE_WRITEABLE)
  341. pte_flag |= AMDGPU_PTE_WRITEABLE;
  342. if (flags & AMDGPU_VM_PAGE_PRT)
  343. pte_flag |= AMDGPU_PTE_PRT;
  344. return pte_flag;
  345. }
  346. static uint64_t gmc_v6_0_get_vm_pde(struct amdgpu_device *adev, uint64_t addr)
  347. {
  348. BUG_ON(addr & 0xFFFFFF0000000FFFULL);
  349. return addr;
  350. }
  351. static void gmc_v6_0_set_fault_enable_default(struct amdgpu_device *adev,
  352. bool value)
  353. {
  354. u32 tmp;
  355. tmp = RREG32(mmVM_CONTEXT1_CNTL);
  356. tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
  357. RANGE_PROTECTION_FAULT_ENABLE_DEFAULT, value);
  358. tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
  359. DUMMY_PAGE_PROTECTION_FAULT_ENABLE_DEFAULT, value);
  360. tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
  361. PDE0_PROTECTION_FAULT_ENABLE_DEFAULT, value);
  362. tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
  363. VALID_PROTECTION_FAULT_ENABLE_DEFAULT, value);
  364. tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
  365. READ_PROTECTION_FAULT_ENABLE_DEFAULT, value);
  366. tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
  367. WRITE_PROTECTION_FAULT_ENABLE_DEFAULT, value);
  368. WREG32(mmVM_CONTEXT1_CNTL, tmp);
  369. }
  370. /**
  371. + * gmc_v8_0_set_prt - set PRT VM fault
  372. + *
  373. + * @adev: amdgpu_device pointer
  374. + * @enable: enable/disable VM fault handling for PRT
  375. +*/
  376. static void gmc_v6_0_set_prt(struct amdgpu_device *adev, bool enable)
  377. {
  378. u32 tmp;
  379. if (enable && !adev->mc.prt_warning) {
  380. dev_warn(adev->dev, "Disabling VM faults because of PRT request!\n");
  381. adev->mc.prt_warning = true;
  382. }
  383. tmp = RREG32(mmVM_PRT_CNTL);
  384. tmp = REG_SET_FIELD(tmp, VM_PRT_CNTL,
  385. CB_DISABLE_FAULT_ON_UNMAPPED_ACCESS,
  386. enable);
  387. tmp = REG_SET_FIELD(tmp, VM_PRT_CNTL,
  388. TC_DISABLE_FAULT_ON_UNMAPPED_ACCESS,
  389. enable);
  390. tmp = REG_SET_FIELD(tmp, VM_PRT_CNTL,
  391. L2_CACHE_STORE_INVALID_ENTRIES,
  392. enable);
  393. tmp = REG_SET_FIELD(tmp, VM_PRT_CNTL,
  394. L1_TLB_STORE_INVALID_ENTRIES,
  395. enable);
  396. WREG32(mmVM_PRT_CNTL, tmp);
  397. if (enable) {
  398. uint32_t low = AMDGPU_VA_RESERVED_SIZE >> AMDGPU_GPU_PAGE_SHIFT;
  399. uint32_t high = adev->vm_manager.max_pfn;
  400. WREG32(mmVM_PRT_APERTURE0_LOW_ADDR, low);
  401. WREG32(mmVM_PRT_APERTURE1_LOW_ADDR, low);
  402. WREG32(mmVM_PRT_APERTURE2_LOW_ADDR, low);
  403. WREG32(mmVM_PRT_APERTURE3_LOW_ADDR, low);
  404. WREG32(mmVM_PRT_APERTURE0_HIGH_ADDR, high);
  405. WREG32(mmVM_PRT_APERTURE1_HIGH_ADDR, high);
  406. WREG32(mmVM_PRT_APERTURE2_HIGH_ADDR, high);
  407. WREG32(mmVM_PRT_APERTURE3_HIGH_ADDR, high);
  408. } else {
  409. WREG32(mmVM_PRT_APERTURE0_LOW_ADDR, 0xfffffff);
  410. WREG32(mmVM_PRT_APERTURE1_LOW_ADDR, 0xfffffff);
  411. WREG32(mmVM_PRT_APERTURE2_LOW_ADDR, 0xfffffff);
  412. WREG32(mmVM_PRT_APERTURE3_LOW_ADDR, 0xfffffff);
  413. WREG32(mmVM_PRT_APERTURE0_HIGH_ADDR, 0x0);
  414. WREG32(mmVM_PRT_APERTURE1_HIGH_ADDR, 0x0);
  415. WREG32(mmVM_PRT_APERTURE2_HIGH_ADDR, 0x0);
  416. WREG32(mmVM_PRT_APERTURE3_HIGH_ADDR, 0x0);
  417. }
  418. }
  419. static int gmc_v6_0_gart_enable(struct amdgpu_device *adev)
  420. {
  421. int r, i;
  422. u32 field;
  423. if (adev->gart.robj == NULL) {
  424. dev_err(adev->dev, "No VRAM object for PCIE GART.\n");
  425. return -EINVAL;
  426. }
  427. r = amdgpu_gart_table_vram_pin(adev);
  428. if (r)
  429. return r;
  430. /* Setup TLB control */
  431. WREG32(mmMC_VM_MX_L1_TLB_CNTL,
  432. (0xA << 7) |
  433. MC_VM_MX_L1_TLB_CNTL__ENABLE_L1_TLB_MASK |
  434. MC_VM_MX_L1_TLB_CNTL__ENABLE_L1_FRAGMENT_PROCESSING_MASK |
  435. MC_VM_MX_L1_TLB_CNTL__SYSTEM_ACCESS_MODE_MASK |
  436. MC_VM_MX_L1_TLB_CNTL__ENABLE_ADVANCED_DRIVER_MODEL_MASK |
  437. (0UL << MC_VM_MX_L1_TLB_CNTL__SYSTEM_APERTURE_UNMAPPED_ACCESS__SHIFT));
  438. /* Setup L2 cache */
  439. WREG32(mmVM_L2_CNTL,
  440. VM_L2_CNTL__ENABLE_L2_CACHE_MASK |
  441. VM_L2_CNTL__ENABLE_L2_FRAGMENT_PROCESSING_MASK |
  442. VM_L2_CNTL__ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE_MASK |
  443. VM_L2_CNTL__ENABLE_L2_PDE0_CACHE_LRU_UPDATE_BY_WRITE_MASK |
  444. (7UL << VM_L2_CNTL__EFFECTIVE_L2_QUEUE_SIZE__SHIFT) |
  445. (1UL << VM_L2_CNTL__CONTEXT1_IDENTITY_ACCESS_MODE__SHIFT));
  446. WREG32(mmVM_L2_CNTL2,
  447. VM_L2_CNTL2__INVALIDATE_ALL_L1_TLBS_MASK |
  448. VM_L2_CNTL2__INVALIDATE_L2_CACHE_MASK);
  449. field = adev->vm_manager.fragment_size;
  450. WREG32(mmVM_L2_CNTL3,
  451. VM_L2_CNTL3__L2_CACHE_BIGK_ASSOCIATIVITY_MASK |
  452. (field << VM_L2_CNTL3__BANK_SELECT__SHIFT) |
  453. (field << VM_L2_CNTL3__L2_CACHE_BIGK_FRAGMENT_SIZE__SHIFT));
  454. /* setup context0 */
  455. WREG32(mmVM_CONTEXT0_PAGE_TABLE_START_ADDR, adev->mc.gart_start >> 12);
  456. WREG32(mmVM_CONTEXT0_PAGE_TABLE_END_ADDR, adev->mc.gart_end >> 12);
  457. WREG32(mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR, adev->gart.table_addr >> 12);
  458. WREG32(mmVM_CONTEXT0_PROTECTION_FAULT_DEFAULT_ADDR,
  459. (u32)(adev->dummy_page.addr >> 12));
  460. WREG32(mmVM_CONTEXT0_CNTL2, 0);
  461. WREG32(mmVM_CONTEXT0_CNTL,
  462. VM_CONTEXT0_CNTL__ENABLE_CONTEXT_MASK |
  463. (0UL << VM_CONTEXT0_CNTL__PAGE_TABLE_DEPTH__SHIFT) |
  464. VM_CONTEXT0_CNTL__RANGE_PROTECTION_FAULT_ENABLE_DEFAULT_MASK);
  465. WREG32(0x575, 0);
  466. WREG32(0x576, 0);
  467. WREG32(0x577, 0);
  468. /* empty context1-15 */
  469. /* set vm size, must be a multiple of 4 */
  470. WREG32(mmVM_CONTEXT1_PAGE_TABLE_START_ADDR, 0);
  471. WREG32(mmVM_CONTEXT1_PAGE_TABLE_END_ADDR, adev->vm_manager.max_pfn - 1);
  472. /* Assign the pt base to something valid for now; the pts used for
  473. * the VMs are determined by the application and setup and assigned
  474. * on the fly in the vm part of radeon_gart.c
  475. */
  476. for (i = 1; i < 16; i++) {
  477. if (i < 8)
  478. WREG32(mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR + i,
  479. adev->gart.table_addr >> 12);
  480. else
  481. WREG32(mmVM_CONTEXT8_PAGE_TABLE_BASE_ADDR + i - 8,
  482. adev->gart.table_addr >> 12);
  483. }
  484. /* enable context1-15 */
  485. WREG32(mmVM_CONTEXT1_PROTECTION_FAULT_DEFAULT_ADDR,
  486. (u32)(adev->dummy_page.addr >> 12));
  487. WREG32(mmVM_CONTEXT1_CNTL2, 4);
  488. WREG32(mmVM_CONTEXT1_CNTL,
  489. VM_CONTEXT1_CNTL__ENABLE_CONTEXT_MASK |
  490. (1UL << VM_CONTEXT1_CNTL__PAGE_TABLE_DEPTH__SHIFT) |
  491. ((adev->vm_manager.block_size - 9)
  492. << VM_CONTEXT1_CNTL__PAGE_TABLE_BLOCK_SIZE__SHIFT));
  493. if (amdgpu_vm_fault_stop == AMDGPU_VM_FAULT_STOP_ALWAYS)
  494. gmc_v6_0_set_fault_enable_default(adev, false);
  495. else
  496. gmc_v6_0_set_fault_enable_default(adev, true);
  497. gmc_v6_0_gart_flush_gpu_tlb(adev, 0);
  498. dev_info(adev->dev, "PCIE GART of %uM enabled (table at 0x%016llX).\n",
  499. (unsigned)(adev->mc.gart_size >> 20),
  500. (unsigned long long)adev->gart.table_addr);
  501. adev->gart.ready = true;
  502. return 0;
  503. }
  504. static int gmc_v6_0_gart_init(struct amdgpu_device *adev)
  505. {
  506. int r;
  507. if (adev->gart.robj) {
  508. dev_warn(adev->dev, "gmc_v6_0 PCIE GART already initialized\n");
  509. return 0;
  510. }
  511. r = amdgpu_gart_init(adev);
  512. if (r)
  513. return r;
  514. adev->gart.table_size = adev->gart.num_gpu_pages * 8;
  515. adev->gart.gart_pte_flags = 0;
  516. return amdgpu_gart_table_vram_alloc(adev);
  517. }
  518. static void gmc_v6_0_gart_disable(struct amdgpu_device *adev)
  519. {
  520. /*unsigned i;
  521. for (i = 1; i < 16; ++i) {
  522. uint32_t reg;
  523. if (i < 8)
  524. reg = VM_CONTEXT0_PAGE_TABLE_BASE_ADDR + i ;
  525. else
  526. reg = VM_CONTEXT8_PAGE_TABLE_BASE_ADDR + (i - 8);
  527. adev->vm_manager.saved_table_addr[i] = RREG32(reg);
  528. }*/
  529. /* Disable all tables */
  530. WREG32(mmVM_CONTEXT0_CNTL, 0);
  531. WREG32(mmVM_CONTEXT1_CNTL, 0);
  532. /* Setup TLB control */
  533. WREG32(mmMC_VM_MX_L1_TLB_CNTL,
  534. MC_VM_MX_L1_TLB_CNTL__SYSTEM_ACCESS_MODE_MASK |
  535. (0UL << MC_VM_MX_L1_TLB_CNTL__SYSTEM_APERTURE_UNMAPPED_ACCESS__SHIFT));
  536. /* Setup L2 cache */
  537. WREG32(mmVM_L2_CNTL,
  538. VM_L2_CNTL__ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE_MASK |
  539. VM_L2_CNTL__ENABLE_L2_PDE0_CACHE_LRU_UPDATE_BY_WRITE_MASK |
  540. (7UL << VM_L2_CNTL__EFFECTIVE_L2_QUEUE_SIZE__SHIFT) |
  541. (1UL << VM_L2_CNTL__CONTEXT1_IDENTITY_ACCESS_MODE__SHIFT));
  542. WREG32(mmVM_L2_CNTL2, 0);
  543. WREG32(mmVM_L2_CNTL3,
  544. VM_L2_CNTL3__L2_CACHE_BIGK_ASSOCIATIVITY_MASK |
  545. (0UL << VM_L2_CNTL3__L2_CACHE_BIGK_FRAGMENT_SIZE__SHIFT));
  546. amdgpu_gart_table_vram_unpin(adev);
  547. }
  548. static void gmc_v6_0_gart_fini(struct amdgpu_device *adev)
  549. {
  550. amdgpu_gart_table_vram_free(adev);
  551. amdgpu_gart_fini(adev);
  552. }
  553. static void gmc_v6_0_vm_decode_fault(struct amdgpu_device *adev,
  554. u32 status, u32 addr, u32 mc_client)
  555. {
  556. u32 mc_id;
  557. u32 vmid = REG_GET_FIELD(status, VM_CONTEXT1_PROTECTION_FAULT_STATUS, VMID);
  558. u32 protections = REG_GET_FIELD(status, VM_CONTEXT1_PROTECTION_FAULT_STATUS,
  559. PROTECTIONS);
  560. char block[5] = { mc_client >> 24, (mc_client >> 16) & 0xff,
  561. (mc_client >> 8) & 0xff, mc_client & 0xff, 0 };
  562. mc_id = REG_GET_FIELD(status, VM_CONTEXT1_PROTECTION_FAULT_STATUS,
  563. MEMORY_CLIENT_ID);
  564. dev_err(adev->dev, "VM fault (0x%02x, vmid %d) at page %u, %s from '%s' (0x%08x) (%d)\n",
  565. protections, vmid, addr,
  566. REG_GET_FIELD(status, VM_CONTEXT1_PROTECTION_FAULT_STATUS,
  567. MEMORY_CLIENT_RW) ?
  568. "write" : "read", block, mc_client, mc_id);
  569. }
  570. /*
  571. static const u32 mc_cg_registers[] = {
  572. MC_HUB_MISC_HUB_CG,
  573. MC_HUB_MISC_SIP_CG,
  574. MC_HUB_MISC_VM_CG,
  575. MC_XPB_CLK_GAT,
  576. ATC_MISC_CG,
  577. MC_CITF_MISC_WR_CG,
  578. MC_CITF_MISC_RD_CG,
  579. MC_CITF_MISC_VM_CG,
  580. VM_L2_CG,
  581. };
  582. static const u32 mc_cg_ls_en[] = {
  583. MC_HUB_MISC_HUB_CG__MEM_LS_ENABLE_MASK,
  584. MC_HUB_MISC_SIP_CG__MEM_LS_ENABLE_MASK,
  585. MC_HUB_MISC_VM_CG__MEM_LS_ENABLE_MASK,
  586. MC_XPB_CLK_GAT__MEM_LS_ENABLE_MASK,
  587. ATC_MISC_CG__MEM_LS_ENABLE_MASK,
  588. MC_CITF_MISC_WR_CG__MEM_LS_ENABLE_MASK,
  589. MC_CITF_MISC_RD_CG__MEM_LS_ENABLE_MASK,
  590. MC_CITF_MISC_VM_CG__MEM_LS_ENABLE_MASK,
  591. VM_L2_CG__MEM_LS_ENABLE_MASK,
  592. };
  593. static const u32 mc_cg_en[] = {
  594. MC_HUB_MISC_HUB_CG__ENABLE_MASK,
  595. MC_HUB_MISC_SIP_CG__ENABLE_MASK,
  596. MC_HUB_MISC_VM_CG__ENABLE_MASK,
  597. MC_XPB_CLK_GAT__ENABLE_MASK,
  598. ATC_MISC_CG__ENABLE_MASK,
  599. MC_CITF_MISC_WR_CG__ENABLE_MASK,
  600. MC_CITF_MISC_RD_CG__ENABLE_MASK,
  601. MC_CITF_MISC_VM_CG__ENABLE_MASK,
  602. VM_L2_CG__ENABLE_MASK,
  603. };
  604. static void gmc_v6_0_enable_mc_ls(struct amdgpu_device *adev,
  605. bool enable)
  606. {
  607. int i;
  608. u32 orig, data;
  609. for (i = 0; i < ARRAY_SIZE(mc_cg_registers); i++) {
  610. orig = data = RREG32(mc_cg_registers[i]);
  611. if (enable && (adev->cg_flags & AMDGPU_CG_SUPPORT_MC_LS))
  612. data |= mc_cg_ls_en[i];
  613. else
  614. data &= ~mc_cg_ls_en[i];
  615. if (data != orig)
  616. WREG32(mc_cg_registers[i], data);
  617. }
  618. }
  619. static void gmc_v6_0_enable_mc_mgcg(struct amdgpu_device *adev,
  620. bool enable)
  621. {
  622. int i;
  623. u32 orig, data;
  624. for (i = 0; i < ARRAY_SIZE(mc_cg_registers); i++) {
  625. orig = data = RREG32(mc_cg_registers[i]);
  626. if (enable && (adev->cg_flags & AMDGPU_CG_SUPPORT_MC_MGCG))
  627. data |= mc_cg_en[i];
  628. else
  629. data &= ~mc_cg_en[i];
  630. if (data != orig)
  631. WREG32(mc_cg_registers[i], data);
  632. }
  633. }
  634. static void gmc_v6_0_enable_bif_mgls(struct amdgpu_device *adev,
  635. bool enable)
  636. {
  637. u32 orig, data;
  638. orig = data = RREG32_PCIE(ixPCIE_CNTL2);
  639. if (enable && (adev->cg_flags & AMDGPU_CG_SUPPORT_BIF_LS)) {
  640. data = REG_SET_FIELD(data, PCIE_CNTL2, SLV_MEM_LS_EN, 1);
  641. data = REG_SET_FIELD(data, PCIE_CNTL2, MST_MEM_LS_EN, 1);
  642. data = REG_SET_FIELD(data, PCIE_CNTL2, REPLAY_MEM_LS_EN, 1);
  643. data = REG_SET_FIELD(data, PCIE_CNTL2, SLV_MEM_AGGRESSIVE_LS_EN, 1);
  644. } else {
  645. data = REG_SET_FIELD(data, PCIE_CNTL2, SLV_MEM_LS_EN, 0);
  646. data = REG_SET_FIELD(data, PCIE_CNTL2, MST_MEM_LS_EN, 0);
  647. data = REG_SET_FIELD(data, PCIE_CNTL2, REPLAY_MEM_LS_EN, 0);
  648. data = REG_SET_FIELD(data, PCIE_CNTL2, SLV_MEM_AGGRESSIVE_LS_EN, 0);
  649. }
  650. if (orig != data)
  651. WREG32_PCIE(ixPCIE_CNTL2, data);
  652. }
  653. static void gmc_v6_0_enable_hdp_mgcg(struct amdgpu_device *adev,
  654. bool enable)
  655. {
  656. u32 orig, data;
  657. orig = data = RREG32(mmHDP_HOST_PATH_CNTL);
  658. if (enable && (adev->cg_flags & AMDGPU_CG_SUPPORT_HDP_MGCG))
  659. data = REG_SET_FIELD(data, HDP_HOST_PATH_CNTL, CLOCK_GATING_DIS, 0);
  660. else
  661. data = REG_SET_FIELD(data, HDP_HOST_PATH_CNTL, CLOCK_GATING_DIS, 1);
  662. if (orig != data)
  663. WREG32(mmHDP_HOST_PATH_CNTL, data);
  664. }
  665. static void gmc_v6_0_enable_hdp_ls(struct amdgpu_device *adev,
  666. bool enable)
  667. {
  668. u32 orig, data;
  669. orig = data = RREG32(mmHDP_MEM_POWER_LS);
  670. if (enable && (adev->cg_flags & AMDGPU_CG_SUPPORT_HDP_LS))
  671. data = REG_SET_FIELD(data, HDP_MEM_POWER_LS, LS_ENABLE, 1);
  672. else
  673. data = REG_SET_FIELD(data, HDP_MEM_POWER_LS, LS_ENABLE, 0);
  674. if (orig != data)
  675. WREG32(mmHDP_MEM_POWER_LS, data);
  676. }
  677. */
  678. static int gmc_v6_0_convert_vram_type(int mc_seq_vram_type)
  679. {
  680. switch (mc_seq_vram_type) {
  681. case MC_SEQ_MISC0__MT__GDDR1:
  682. return AMDGPU_VRAM_TYPE_GDDR1;
  683. case MC_SEQ_MISC0__MT__DDR2:
  684. return AMDGPU_VRAM_TYPE_DDR2;
  685. case MC_SEQ_MISC0__MT__GDDR3:
  686. return AMDGPU_VRAM_TYPE_GDDR3;
  687. case MC_SEQ_MISC0__MT__GDDR4:
  688. return AMDGPU_VRAM_TYPE_GDDR4;
  689. case MC_SEQ_MISC0__MT__GDDR5:
  690. return AMDGPU_VRAM_TYPE_GDDR5;
  691. case MC_SEQ_MISC0__MT__DDR3:
  692. return AMDGPU_VRAM_TYPE_DDR3;
  693. default:
  694. return AMDGPU_VRAM_TYPE_UNKNOWN;
  695. }
  696. }
  697. static int gmc_v6_0_early_init(void *handle)
  698. {
  699. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  700. gmc_v6_0_set_gart_funcs(adev);
  701. gmc_v6_0_set_irq_funcs(adev);
  702. return 0;
  703. }
  704. static int gmc_v6_0_late_init(void *handle)
  705. {
  706. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  707. if (amdgpu_vm_fault_stop != AMDGPU_VM_FAULT_STOP_ALWAYS)
  708. return amdgpu_irq_get(adev, &adev->mc.vm_fault, 0);
  709. else
  710. return 0;
  711. }
  712. static int gmc_v6_0_sw_init(void *handle)
  713. {
  714. int r;
  715. int dma_bits;
  716. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  717. if (adev->flags & AMD_IS_APU) {
  718. adev->mc.vram_type = AMDGPU_VRAM_TYPE_UNKNOWN;
  719. } else {
  720. u32 tmp = RREG32(mmMC_SEQ_MISC0);
  721. tmp &= MC_SEQ_MISC0__MT__MASK;
  722. adev->mc.vram_type = gmc_v6_0_convert_vram_type(tmp);
  723. }
  724. r = amdgpu_irq_add_id(adev, AMDGPU_IH_CLIENTID_LEGACY, 146, &adev->mc.vm_fault);
  725. if (r)
  726. return r;
  727. r = amdgpu_irq_add_id(adev, AMDGPU_IH_CLIENTID_LEGACY, 147, &adev->mc.vm_fault);
  728. if (r)
  729. return r;
  730. amdgpu_vm_adjust_size(adev, 64, 9);
  731. adev->mc.mc_mask = 0xffffffffffULL;
  732. adev->mc.stolen_size = 256 * 1024;
  733. adev->need_dma32 = false;
  734. dma_bits = adev->need_dma32 ? 32 : 40;
  735. r = pci_set_dma_mask(adev->pdev, DMA_BIT_MASK(dma_bits));
  736. if (r) {
  737. adev->need_dma32 = true;
  738. dma_bits = 32;
  739. dev_warn(adev->dev, "amdgpu: No suitable DMA available.\n");
  740. }
  741. r = pci_set_consistent_dma_mask(adev->pdev, DMA_BIT_MASK(dma_bits));
  742. if (r) {
  743. pci_set_consistent_dma_mask(adev->pdev, DMA_BIT_MASK(32));
  744. dev_warn(adev->dev, "amdgpu: No coherent DMA available.\n");
  745. }
  746. r = gmc_v6_0_init_microcode(adev);
  747. if (r) {
  748. dev_err(adev->dev, "Failed to load mc firmware!\n");
  749. return r;
  750. }
  751. r = gmc_v6_0_mc_init(adev);
  752. if (r)
  753. return r;
  754. r = amdgpu_bo_init(adev);
  755. if (r)
  756. return r;
  757. r = gmc_v6_0_gart_init(adev);
  758. if (r)
  759. return r;
  760. /*
  761. * number of VMs
  762. * VMID 0 is reserved for System
  763. * amdgpu graphics/compute will use VMIDs 1-7
  764. * amdkfd will use VMIDs 8-15
  765. */
  766. adev->vm_manager.id_mgr[0].num_ids = AMDGPU_NUM_OF_VMIDS;
  767. adev->vm_manager.num_level = 1;
  768. amdgpu_vm_manager_init(adev);
  769. /* base offset of vram pages */
  770. if (adev->flags & AMD_IS_APU) {
  771. u64 tmp = RREG32(mmMC_VM_FB_OFFSET);
  772. tmp <<= 22;
  773. adev->vm_manager.vram_base_offset = tmp;
  774. } else {
  775. adev->vm_manager.vram_base_offset = 0;
  776. }
  777. return 0;
  778. }
  779. static int gmc_v6_0_sw_fini(void *handle)
  780. {
  781. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  782. amdgpu_vm_manager_fini(adev);
  783. gmc_v6_0_gart_fini(adev);
  784. amdgpu_gem_force_release(adev);
  785. amdgpu_bo_fini(adev);
  786. release_firmware(adev->mc.fw);
  787. adev->mc.fw = NULL;
  788. return 0;
  789. }
  790. static int gmc_v6_0_hw_init(void *handle)
  791. {
  792. int r;
  793. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  794. gmc_v6_0_mc_program(adev);
  795. if (!(adev->flags & AMD_IS_APU)) {
  796. r = gmc_v6_0_mc_load_microcode(adev);
  797. if (r) {
  798. dev_err(adev->dev, "Failed to load MC firmware!\n");
  799. return r;
  800. }
  801. }
  802. r = gmc_v6_0_gart_enable(adev);
  803. if (r)
  804. return r;
  805. return r;
  806. }
  807. static int gmc_v6_0_hw_fini(void *handle)
  808. {
  809. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  810. amdgpu_irq_put(adev, &adev->mc.vm_fault, 0);
  811. gmc_v6_0_gart_disable(adev);
  812. return 0;
  813. }
  814. static int gmc_v6_0_suspend(void *handle)
  815. {
  816. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  817. gmc_v6_0_hw_fini(adev);
  818. return 0;
  819. }
  820. static int gmc_v6_0_resume(void *handle)
  821. {
  822. int r;
  823. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  824. r = gmc_v6_0_hw_init(adev);
  825. if (r)
  826. return r;
  827. amdgpu_vm_reset_all_ids(adev);
  828. return 0;
  829. }
  830. static bool gmc_v6_0_is_idle(void *handle)
  831. {
  832. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  833. u32 tmp = RREG32(mmSRBM_STATUS);
  834. if (tmp & (SRBM_STATUS__MCB_BUSY_MASK | SRBM_STATUS__MCB_NON_DISPLAY_BUSY_MASK |
  835. SRBM_STATUS__MCC_BUSY_MASK | SRBM_STATUS__MCD_BUSY_MASK | SRBM_STATUS__VMC_BUSY_MASK))
  836. return false;
  837. return true;
  838. }
  839. static int gmc_v6_0_wait_for_idle(void *handle)
  840. {
  841. unsigned i;
  842. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  843. for (i = 0; i < adev->usec_timeout; i++) {
  844. if (gmc_v6_0_is_idle(handle))
  845. return 0;
  846. udelay(1);
  847. }
  848. return -ETIMEDOUT;
  849. }
  850. static int gmc_v6_0_soft_reset(void *handle)
  851. {
  852. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  853. u32 srbm_soft_reset = 0;
  854. u32 tmp = RREG32(mmSRBM_STATUS);
  855. if (tmp & SRBM_STATUS__VMC_BUSY_MASK)
  856. srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset,
  857. SRBM_SOFT_RESET, SOFT_RESET_VMC, 1);
  858. if (tmp & (SRBM_STATUS__MCB_BUSY_MASK | SRBM_STATUS__MCB_NON_DISPLAY_BUSY_MASK |
  859. SRBM_STATUS__MCC_BUSY_MASK | SRBM_STATUS__MCD_BUSY_MASK)) {
  860. if (!(adev->flags & AMD_IS_APU))
  861. srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset,
  862. SRBM_SOFT_RESET, SOFT_RESET_MC, 1);
  863. }
  864. if (srbm_soft_reset) {
  865. gmc_v6_0_mc_stop(adev);
  866. if (gmc_v6_0_wait_for_idle(adev)) {
  867. dev_warn(adev->dev, "Wait for GMC idle timed out !\n");
  868. }
  869. tmp = RREG32(mmSRBM_SOFT_RESET);
  870. tmp |= srbm_soft_reset;
  871. dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
  872. WREG32(mmSRBM_SOFT_RESET, tmp);
  873. tmp = RREG32(mmSRBM_SOFT_RESET);
  874. udelay(50);
  875. tmp &= ~srbm_soft_reset;
  876. WREG32(mmSRBM_SOFT_RESET, tmp);
  877. tmp = RREG32(mmSRBM_SOFT_RESET);
  878. udelay(50);
  879. gmc_v6_0_mc_resume(adev);
  880. udelay(50);
  881. }
  882. return 0;
  883. }
  884. static int gmc_v6_0_vm_fault_interrupt_state(struct amdgpu_device *adev,
  885. struct amdgpu_irq_src *src,
  886. unsigned type,
  887. enum amdgpu_interrupt_state state)
  888. {
  889. u32 tmp;
  890. u32 bits = (VM_CONTEXT1_CNTL__RANGE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  891. VM_CONTEXT1_CNTL__DUMMY_PAGE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  892. VM_CONTEXT1_CNTL__PDE0_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  893. VM_CONTEXT1_CNTL__VALID_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  894. VM_CONTEXT1_CNTL__READ_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  895. VM_CONTEXT1_CNTL__WRITE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK);
  896. switch (state) {
  897. case AMDGPU_IRQ_STATE_DISABLE:
  898. tmp = RREG32(mmVM_CONTEXT0_CNTL);
  899. tmp &= ~bits;
  900. WREG32(mmVM_CONTEXT0_CNTL, tmp);
  901. tmp = RREG32(mmVM_CONTEXT1_CNTL);
  902. tmp &= ~bits;
  903. WREG32(mmVM_CONTEXT1_CNTL, tmp);
  904. break;
  905. case AMDGPU_IRQ_STATE_ENABLE:
  906. tmp = RREG32(mmVM_CONTEXT0_CNTL);
  907. tmp |= bits;
  908. WREG32(mmVM_CONTEXT0_CNTL, tmp);
  909. tmp = RREG32(mmVM_CONTEXT1_CNTL);
  910. tmp |= bits;
  911. WREG32(mmVM_CONTEXT1_CNTL, tmp);
  912. break;
  913. default:
  914. break;
  915. }
  916. return 0;
  917. }
  918. static int gmc_v6_0_process_interrupt(struct amdgpu_device *adev,
  919. struct amdgpu_irq_src *source,
  920. struct amdgpu_iv_entry *entry)
  921. {
  922. u32 addr, status;
  923. addr = RREG32(mmVM_CONTEXT1_PROTECTION_FAULT_ADDR);
  924. status = RREG32(mmVM_CONTEXT1_PROTECTION_FAULT_STATUS);
  925. WREG32_P(mmVM_CONTEXT1_CNTL2, 1, ~1);
  926. if (!addr && !status)
  927. return 0;
  928. if (amdgpu_vm_fault_stop == AMDGPU_VM_FAULT_STOP_FIRST)
  929. gmc_v6_0_set_fault_enable_default(adev, false);
  930. if (printk_ratelimit()) {
  931. dev_err(adev->dev, "GPU fault detected: %d 0x%08x\n",
  932. entry->src_id, entry->src_data[0]);
  933. dev_err(adev->dev, " VM_CONTEXT1_PROTECTION_FAULT_ADDR 0x%08X\n",
  934. addr);
  935. dev_err(adev->dev, " VM_CONTEXT1_PROTECTION_FAULT_STATUS 0x%08X\n",
  936. status);
  937. gmc_v6_0_vm_decode_fault(adev, status, addr, 0);
  938. }
  939. return 0;
  940. }
  941. static int gmc_v6_0_set_clockgating_state(void *handle,
  942. enum amd_clockgating_state state)
  943. {
  944. return 0;
  945. }
  946. static int gmc_v6_0_set_powergating_state(void *handle,
  947. enum amd_powergating_state state)
  948. {
  949. return 0;
  950. }
  951. static const struct amd_ip_funcs gmc_v6_0_ip_funcs = {
  952. .name = "gmc_v6_0",
  953. .early_init = gmc_v6_0_early_init,
  954. .late_init = gmc_v6_0_late_init,
  955. .sw_init = gmc_v6_0_sw_init,
  956. .sw_fini = gmc_v6_0_sw_fini,
  957. .hw_init = gmc_v6_0_hw_init,
  958. .hw_fini = gmc_v6_0_hw_fini,
  959. .suspend = gmc_v6_0_suspend,
  960. .resume = gmc_v6_0_resume,
  961. .is_idle = gmc_v6_0_is_idle,
  962. .wait_for_idle = gmc_v6_0_wait_for_idle,
  963. .soft_reset = gmc_v6_0_soft_reset,
  964. .set_clockgating_state = gmc_v6_0_set_clockgating_state,
  965. .set_powergating_state = gmc_v6_0_set_powergating_state,
  966. };
  967. static const struct amdgpu_gart_funcs gmc_v6_0_gart_funcs = {
  968. .flush_gpu_tlb = gmc_v6_0_gart_flush_gpu_tlb,
  969. .set_pte_pde = gmc_v6_0_gart_set_pte_pde,
  970. .set_prt = gmc_v6_0_set_prt,
  971. .get_vm_pde = gmc_v6_0_get_vm_pde,
  972. .get_vm_pte_flags = gmc_v6_0_get_vm_pte_flags
  973. };
  974. static const struct amdgpu_irq_src_funcs gmc_v6_0_irq_funcs = {
  975. .set = gmc_v6_0_vm_fault_interrupt_state,
  976. .process = gmc_v6_0_process_interrupt,
  977. };
  978. static void gmc_v6_0_set_gart_funcs(struct amdgpu_device *adev)
  979. {
  980. if (adev->gart.gart_funcs == NULL)
  981. adev->gart.gart_funcs = &gmc_v6_0_gart_funcs;
  982. }
  983. static void gmc_v6_0_set_irq_funcs(struct amdgpu_device *adev)
  984. {
  985. adev->mc.vm_fault.num_types = 1;
  986. adev->mc.vm_fault.funcs = &gmc_v6_0_irq_funcs;
  987. }
  988. const struct amdgpu_ip_block_version gmc_v6_0_ip_block =
  989. {
  990. .type = AMD_IP_BLOCK_TYPE_GMC,
  991. .major = 6,
  992. .minor = 0,
  993. .rev = 0,
  994. .funcs = &gmc_v6_0_ip_funcs,
  995. };