gmc_v9_0.c 32 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200
  1. /*
  2. * Copyright 2016 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include <linux/firmware.h>
  24. #include <drm/drm_cache.h>
  25. #include "amdgpu.h"
  26. #include "gmc_v9_0.h"
  27. #include "amdgpu_atomfirmware.h"
  28. #include "hdp/hdp_4_0_offset.h"
  29. #include "hdp/hdp_4_0_sh_mask.h"
  30. #include "gc/gc_9_0_sh_mask.h"
  31. #include "dce/dce_12_0_offset.h"
  32. #include "dce/dce_12_0_sh_mask.h"
  33. #include "vega10_enum.h"
  34. #include "mmhub/mmhub_1_0_offset.h"
  35. #include "athub/athub_1_0_offset.h"
  36. #include "oss/osssys_4_0_offset.h"
  37. #include "soc15.h"
  38. #include "soc15_common.h"
  39. #include "umc/umc_6_0_sh_mask.h"
  40. #include "gfxhub_v1_0.h"
  41. #include "mmhub_v1_0.h"
  42. /* add these here since we already include dce12 headers and these are for DCN */
  43. #define mmHUBP0_DCSURF_PRI_VIEWPORT_DIMENSION 0x055d
  44. #define mmHUBP0_DCSURF_PRI_VIEWPORT_DIMENSION_BASE_IDX 2
  45. #define HUBP0_DCSURF_PRI_VIEWPORT_DIMENSION__PRI_VIEWPORT_WIDTH__SHIFT 0x0
  46. #define HUBP0_DCSURF_PRI_VIEWPORT_DIMENSION__PRI_VIEWPORT_HEIGHT__SHIFT 0x10
  47. #define HUBP0_DCSURF_PRI_VIEWPORT_DIMENSION__PRI_VIEWPORT_WIDTH_MASK 0x00003FFFL
  48. #define HUBP0_DCSURF_PRI_VIEWPORT_DIMENSION__PRI_VIEWPORT_HEIGHT_MASK 0x3FFF0000L
  49. /* XXX Move this macro to VEGA10 header file, which is like vid.h for VI.*/
  50. #define AMDGPU_NUM_OF_VMIDS 8
  51. static const u32 golden_settings_vega10_hdp[] =
  52. {
  53. 0xf64, 0x0fffffff, 0x00000000,
  54. 0xf65, 0x0fffffff, 0x00000000,
  55. 0xf66, 0x0fffffff, 0x00000000,
  56. 0xf67, 0x0fffffff, 0x00000000,
  57. 0xf68, 0x0fffffff, 0x00000000,
  58. 0xf6a, 0x0fffffff, 0x00000000,
  59. 0xf6b, 0x0fffffff, 0x00000000,
  60. 0xf6c, 0x0fffffff, 0x00000000,
  61. 0xf6d, 0x0fffffff, 0x00000000,
  62. 0xf6e, 0x0fffffff, 0x00000000,
  63. };
  64. static const struct soc15_reg_golden golden_settings_mmhub_1_0_0[] =
  65. {
  66. SOC15_REG_GOLDEN_VALUE(MMHUB, 0, mmDAGB1_WRCLI2, 0x00000007, 0xfe5fe0fa),
  67. SOC15_REG_GOLDEN_VALUE(MMHUB, 0, mmMMEA1_DRAM_WR_CLI2GRP_MAP0, 0x00000030, 0x55555565)
  68. };
  69. static const struct soc15_reg_golden golden_settings_athub_1_0_0[] =
  70. {
  71. SOC15_REG_GOLDEN_VALUE(ATHUB, 0, mmRPB_ARB_CNTL, 0x0000ff00, 0x00000800),
  72. SOC15_REG_GOLDEN_VALUE(ATHUB, 0, mmRPB_ARB_CNTL2, 0x00ff00ff, 0x00080008)
  73. };
  74. /* Ecc related register addresses, (BASE + reg offset) */
  75. /* Universal Memory Controller caps (may be fused). */
  76. /* UMCCH:UmcLocalCap */
  77. #define UMCLOCALCAPS_ADDR0 (0x00014306 + 0x00000000)
  78. #define UMCLOCALCAPS_ADDR1 (0x00014306 + 0x00000800)
  79. #define UMCLOCALCAPS_ADDR2 (0x00014306 + 0x00001000)
  80. #define UMCLOCALCAPS_ADDR3 (0x00014306 + 0x00001800)
  81. #define UMCLOCALCAPS_ADDR4 (0x00054306 + 0x00000000)
  82. #define UMCLOCALCAPS_ADDR5 (0x00054306 + 0x00000800)
  83. #define UMCLOCALCAPS_ADDR6 (0x00054306 + 0x00001000)
  84. #define UMCLOCALCAPS_ADDR7 (0x00054306 + 0x00001800)
  85. #define UMCLOCALCAPS_ADDR8 (0x00094306 + 0x00000000)
  86. #define UMCLOCALCAPS_ADDR9 (0x00094306 + 0x00000800)
  87. #define UMCLOCALCAPS_ADDR10 (0x00094306 + 0x00001000)
  88. #define UMCLOCALCAPS_ADDR11 (0x00094306 + 0x00001800)
  89. #define UMCLOCALCAPS_ADDR12 (0x000d4306 + 0x00000000)
  90. #define UMCLOCALCAPS_ADDR13 (0x000d4306 + 0x00000800)
  91. #define UMCLOCALCAPS_ADDR14 (0x000d4306 + 0x00001000)
  92. #define UMCLOCALCAPS_ADDR15 (0x000d4306 + 0x00001800)
  93. /* Universal Memory Controller Channel config. */
  94. /* UMCCH:UMC_CONFIG */
  95. #define UMCCH_UMC_CONFIG_ADDR0 (0x00014040 + 0x00000000)
  96. #define UMCCH_UMC_CONFIG_ADDR1 (0x00014040 + 0x00000800)
  97. #define UMCCH_UMC_CONFIG_ADDR2 (0x00014040 + 0x00001000)
  98. #define UMCCH_UMC_CONFIG_ADDR3 (0x00014040 + 0x00001800)
  99. #define UMCCH_UMC_CONFIG_ADDR4 (0x00054040 + 0x00000000)
  100. #define UMCCH_UMC_CONFIG_ADDR5 (0x00054040 + 0x00000800)
  101. #define UMCCH_UMC_CONFIG_ADDR6 (0x00054040 + 0x00001000)
  102. #define UMCCH_UMC_CONFIG_ADDR7 (0x00054040 + 0x00001800)
  103. #define UMCCH_UMC_CONFIG_ADDR8 (0x00094040 + 0x00000000)
  104. #define UMCCH_UMC_CONFIG_ADDR9 (0x00094040 + 0x00000800)
  105. #define UMCCH_UMC_CONFIG_ADDR10 (0x00094040 + 0x00001000)
  106. #define UMCCH_UMC_CONFIG_ADDR11 (0x00094040 + 0x00001800)
  107. #define UMCCH_UMC_CONFIG_ADDR12 (0x000d4040 + 0x00000000)
  108. #define UMCCH_UMC_CONFIG_ADDR13 (0x000d4040 + 0x00000800)
  109. #define UMCCH_UMC_CONFIG_ADDR14 (0x000d4040 + 0x00001000)
  110. #define UMCCH_UMC_CONFIG_ADDR15 (0x000d4040 + 0x00001800)
  111. /* Universal Memory Controller Channel Ecc config. */
  112. /* UMCCH:EccCtrl */
  113. #define UMCCH_ECCCTRL_ADDR0 (0x00014053 + 0x00000000)
  114. #define UMCCH_ECCCTRL_ADDR1 (0x00014053 + 0x00000800)
  115. #define UMCCH_ECCCTRL_ADDR2 (0x00014053 + 0x00001000)
  116. #define UMCCH_ECCCTRL_ADDR3 (0x00014053 + 0x00001800)
  117. #define UMCCH_ECCCTRL_ADDR4 (0x00054053 + 0x00000000)
  118. #define UMCCH_ECCCTRL_ADDR5 (0x00054053 + 0x00000800)
  119. #define UMCCH_ECCCTRL_ADDR6 (0x00054053 + 0x00001000)
  120. #define UMCCH_ECCCTRL_ADDR7 (0x00054053 + 0x00001800)
  121. #define UMCCH_ECCCTRL_ADDR8 (0x00094053 + 0x00000000)
  122. #define UMCCH_ECCCTRL_ADDR9 (0x00094053 + 0x00000800)
  123. #define UMCCH_ECCCTRL_ADDR10 (0x00094053 + 0x00001000)
  124. #define UMCCH_ECCCTRL_ADDR11 (0x00094053 + 0x00001800)
  125. #define UMCCH_ECCCTRL_ADDR12 (0x000d4053 + 0x00000000)
  126. #define UMCCH_ECCCTRL_ADDR13 (0x000d4053 + 0x00000800)
  127. #define UMCCH_ECCCTRL_ADDR14 (0x000d4053 + 0x00001000)
  128. #define UMCCH_ECCCTRL_ADDR15 (0x000d4053 + 0x00001800)
  129. static const uint32_t ecc_umclocalcap_addrs[] = {
  130. UMCLOCALCAPS_ADDR0,
  131. UMCLOCALCAPS_ADDR1,
  132. UMCLOCALCAPS_ADDR2,
  133. UMCLOCALCAPS_ADDR3,
  134. UMCLOCALCAPS_ADDR4,
  135. UMCLOCALCAPS_ADDR5,
  136. UMCLOCALCAPS_ADDR6,
  137. UMCLOCALCAPS_ADDR7,
  138. UMCLOCALCAPS_ADDR8,
  139. UMCLOCALCAPS_ADDR9,
  140. UMCLOCALCAPS_ADDR10,
  141. UMCLOCALCAPS_ADDR11,
  142. UMCLOCALCAPS_ADDR12,
  143. UMCLOCALCAPS_ADDR13,
  144. UMCLOCALCAPS_ADDR14,
  145. UMCLOCALCAPS_ADDR15,
  146. };
  147. static const uint32_t ecc_umcch_umc_config_addrs[] = {
  148. UMCCH_UMC_CONFIG_ADDR0,
  149. UMCCH_UMC_CONFIG_ADDR1,
  150. UMCCH_UMC_CONFIG_ADDR2,
  151. UMCCH_UMC_CONFIG_ADDR3,
  152. UMCCH_UMC_CONFIG_ADDR4,
  153. UMCCH_UMC_CONFIG_ADDR5,
  154. UMCCH_UMC_CONFIG_ADDR6,
  155. UMCCH_UMC_CONFIG_ADDR7,
  156. UMCCH_UMC_CONFIG_ADDR8,
  157. UMCCH_UMC_CONFIG_ADDR9,
  158. UMCCH_UMC_CONFIG_ADDR10,
  159. UMCCH_UMC_CONFIG_ADDR11,
  160. UMCCH_UMC_CONFIG_ADDR12,
  161. UMCCH_UMC_CONFIG_ADDR13,
  162. UMCCH_UMC_CONFIG_ADDR14,
  163. UMCCH_UMC_CONFIG_ADDR15,
  164. };
  165. static const uint32_t ecc_umcch_eccctrl_addrs[] = {
  166. UMCCH_ECCCTRL_ADDR0,
  167. UMCCH_ECCCTRL_ADDR1,
  168. UMCCH_ECCCTRL_ADDR2,
  169. UMCCH_ECCCTRL_ADDR3,
  170. UMCCH_ECCCTRL_ADDR4,
  171. UMCCH_ECCCTRL_ADDR5,
  172. UMCCH_ECCCTRL_ADDR6,
  173. UMCCH_ECCCTRL_ADDR7,
  174. UMCCH_ECCCTRL_ADDR8,
  175. UMCCH_ECCCTRL_ADDR9,
  176. UMCCH_ECCCTRL_ADDR10,
  177. UMCCH_ECCCTRL_ADDR11,
  178. UMCCH_ECCCTRL_ADDR12,
  179. UMCCH_ECCCTRL_ADDR13,
  180. UMCCH_ECCCTRL_ADDR14,
  181. UMCCH_ECCCTRL_ADDR15,
  182. };
  183. static int gmc_v9_0_vm_fault_interrupt_state(struct amdgpu_device *adev,
  184. struct amdgpu_irq_src *src,
  185. unsigned type,
  186. enum amdgpu_interrupt_state state)
  187. {
  188. struct amdgpu_vmhub *hub;
  189. u32 tmp, reg, bits, i, j;
  190. bits = VM_CONTEXT1_CNTL__RANGE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  191. VM_CONTEXT1_CNTL__DUMMY_PAGE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  192. VM_CONTEXT1_CNTL__PDE0_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  193. VM_CONTEXT1_CNTL__VALID_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  194. VM_CONTEXT1_CNTL__READ_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  195. VM_CONTEXT1_CNTL__WRITE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK |
  196. VM_CONTEXT1_CNTL__EXECUTE_PROTECTION_FAULT_ENABLE_INTERRUPT_MASK;
  197. switch (state) {
  198. case AMDGPU_IRQ_STATE_DISABLE:
  199. for (j = 0; j < AMDGPU_MAX_VMHUBS; j++) {
  200. hub = &adev->vmhub[j];
  201. for (i = 0; i < 16; i++) {
  202. reg = hub->vm_context0_cntl + i;
  203. tmp = RREG32(reg);
  204. tmp &= ~bits;
  205. WREG32(reg, tmp);
  206. }
  207. }
  208. break;
  209. case AMDGPU_IRQ_STATE_ENABLE:
  210. for (j = 0; j < AMDGPU_MAX_VMHUBS; j++) {
  211. hub = &adev->vmhub[j];
  212. for (i = 0; i < 16; i++) {
  213. reg = hub->vm_context0_cntl + i;
  214. tmp = RREG32(reg);
  215. tmp |= bits;
  216. WREG32(reg, tmp);
  217. }
  218. }
  219. default:
  220. break;
  221. }
  222. return 0;
  223. }
  224. static int gmc_v9_0_process_interrupt(struct amdgpu_device *adev,
  225. struct amdgpu_irq_src *source,
  226. struct amdgpu_iv_entry *entry)
  227. {
  228. struct amdgpu_vmhub *hub = &adev->vmhub[entry->vmid_src];
  229. uint32_t status = 0;
  230. u64 addr;
  231. addr = (u64)entry->src_data[0] << 12;
  232. addr |= ((u64)entry->src_data[1] & 0xf) << 44;
  233. if (!amdgpu_sriov_vf(adev)) {
  234. status = RREG32(hub->vm_l2_pro_fault_status);
  235. WREG32_P(hub->vm_l2_pro_fault_cntl, 1, ~1);
  236. }
  237. if (printk_ratelimit()) {
  238. dev_err(adev->dev,
  239. "[%s] VMC page fault (src_id:%u ring:%u vmid:%u pasid:%u)\n",
  240. entry->vmid_src ? "mmhub" : "gfxhub",
  241. entry->src_id, entry->ring_id, entry->vmid,
  242. entry->pasid);
  243. dev_err(adev->dev, " at page 0x%016llx from %d\n",
  244. addr, entry->client_id);
  245. if (!amdgpu_sriov_vf(adev))
  246. dev_err(adev->dev,
  247. "VM_L2_PROTECTION_FAULT_STATUS:0x%08X\n",
  248. status);
  249. }
  250. return 0;
  251. }
  252. static const struct amdgpu_irq_src_funcs gmc_v9_0_irq_funcs = {
  253. .set = gmc_v9_0_vm_fault_interrupt_state,
  254. .process = gmc_v9_0_process_interrupt,
  255. };
  256. static void gmc_v9_0_set_irq_funcs(struct amdgpu_device *adev)
  257. {
  258. adev->gmc.vm_fault.num_types = 1;
  259. adev->gmc.vm_fault.funcs = &gmc_v9_0_irq_funcs;
  260. }
  261. static uint32_t gmc_v9_0_get_invalidate_req(unsigned int vmid)
  262. {
  263. u32 req = 0;
  264. /* invalidate using legacy mode on vmid*/
  265. req = REG_SET_FIELD(req, VM_INVALIDATE_ENG0_REQ,
  266. PER_VMID_INVALIDATE_REQ, 1 << vmid);
  267. req = REG_SET_FIELD(req, VM_INVALIDATE_ENG0_REQ, FLUSH_TYPE, 0);
  268. req = REG_SET_FIELD(req, VM_INVALIDATE_ENG0_REQ, INVALIDATE_L2_PTES, 1);
  269. req = REG_SET_FIELD(req, VM_INVALIDATE_ENG0_REQ, INVALIDATE_L2_PDE0, 1);
  270. req = REG_SET_FIELD(req, VM_INVALIDATE_ENG0_REQ, INVALIDATE_L2_PDE1, 1);
  271. req = REG_SET_FIELD(req, VM_INVALIDATE_ENG0_REQ, INVALIDATE_L2_PDE2, 1);
  272. req = REG_SET_FIELD(req, VM_INVALIDATE_ENG0_REQ, INVALIDATE_L1_PTES, 1);
  273. req = REG_SET_FIELD(req, VM_INVALIDATE_ENG0_REQ,
  274. CLEAR_PROTECTION_FAULT_STATUS_ADDR, 0);
  275. return req;
  276. }
  277. /*
  278. * GART
  279. * VMID 0 is the physical GPU addresses as used by the kernel.
  280. * VMIDs 1-15 are used for userspace clients and are handled
  281. * by the amdgpu vm/hsa code.
  282. */
  283. /**
  284. * gmc_v9_0_flush_gpu_tlb - gart tlb flush callback
  285. *
  286. * @adev: amdgpu_device pointer
  287. * @vmid: vm instance to flush
  288. *
  289. * Flush the TLB for the requested page table.
  290. */
  291. static void gmc_v9_0_flush_gpu_tlb(struct amdgpu_device *adev,
  292. uint32_t vmid)
  293. {
  294. /* Use register 17 for GART */
  295. const unsigned eng = 17;
  296. unsigned i, j;
  297. spin_lock(&adev->gmc.invalidate_lock);
  298. for (i = 0; i < AMDGPU_MAX_VMHUBS; ++i) {
  299. struct amdgpu_vmhub *hub = &adev->vmhub[i];
  300. u32 tmp = gmc_v9_0_get_invalidate_req(vmid);
  301. WREG32_NO_KIQ(hub->vm_inv_eng0_req + eng, tmp);
  302. /* Busy wait for ACK.*/
  303. for (j = 0; j < 100; j++) {
  304. tmp = RREG32_NO_KIQ(hub->vm_inv_eng0_ack + eng);
  305. tmp &= 1 << vmid;
  306. if (tmp)
  307. break;
  308. cpu_relax();
  309. }
  310. if (j < 100)
  311. continue;
  312. /* Wait for ACK with a delay.*/
  313. for (j = 0; j < adev->usec_timeout; j++) {
  314. tmp = RREG32_NO_KIQ(hub->vm_inv_eng0_ack + eng);
  315. tmp &= 1 << vmid;
  316. if (tmp)
  317. break;
  318. udelay(1);
  319. }
  320. if (j < adev->usec_timeout)
  321. continue;
  322. DRM_ERROR("Timeout waiting for VM flush ACK!\n");
  323. }
  324. spin_unlock(&adev->gmc.invalidate_lock);
  325. }
  326. static uint64_t gmc_v9_0_emit_flush_gpu_tlb(struct amdgpu_ring *ring,
  327. unsigned vmid, uint64_t pd_addr)
  328. {
  329. struct amdgpu_device *adev = ring->adev;
  330. struct amdgpu_vmhub *hub = &adev->vmhub[ring->funcs->vmhub];
  331. uint32_t req = gmc_v9_0_get_invalidate_req(vmid);
  332. uint64_t flags = AMDGPU_PTE_VALID;
  333. unsigned eng = ring->vm_inv_eng;
  334. amdgpu_gmc_get_vm_pde(adev, -1, &pd_addr, &flags);
  335. pd_addr |= flags;
  336. amdgpu_ring_emit_wreg(ring, hub->ctx0_ptb_addr_lo32 + (2 * vmid),
  337. lower_32_bits(pd_addr));
  338. amdgpu_ring_emit_wreg(ring, hub->ctx0_ptb_addr_hi32 + (2 * vmid),
  339. upper_32_bits(pd_addr));
  340. amdgpu_ring_emit_reg_write_reg_wait(ring, hub->vm_inv_eng0_req + eng,
  341. hub->vm_inv_eng0_ack + eng,
  342. req, 1 << vmid);
  343. return pd_addr;
  344. }
  345. static void gmc_v9_0_emit_pasid_mapping(struct amdgpu_ring *ring, unsigned vmid,
  346. unsigned pasid)
  347. {
  348. struct amdgpu_device *adev = ring->adev;
  349. uint32_t reg;
  350. if (ring->funcs->vmhub == AMDGPU_GFXHUB)
  351. reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_VMID_0_LUT) + vmid;
  352. else
  353. reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_VMID_0_LUT_MM) + vmid;
  354. amdgpu_ring_emit_wreg(ring, reg, pasid);
  355. }
  356. /**
  357. * gmc_v9_0_set_pte_pde - update the page tables using MMIO
  358. *
  359. * @adev: amdgpu_device pointer
  360. * @cpu_pt_addr: cpu address of the page table
  361. * @gpu_page_idx: entry in the page table to update
  362. * @addr: dst addr to write into pte/pde
  363. * @flags: access flags
  364. *
  365. * Update the page tables using the CPU.
  366. */
  367. static int gmc_v9_0_set_pte_pde(struct amdgpu_device *adev, void *cpu_pt_addr,
  368. uint32_t gpu_page_idx, uint64_t addr,
  369. uint64_t flags)
  370. {
  371. void __iomem *ptr = (void *)cpu_pt_addr;
  372. uint64_t value;
  373. /*
  374. * PTE format on VEGA 10:
  375. * 63:59 reserved
  376. * 58:57 mtype
  377. * 56 F
  378. * 55 L
  379. * 54 P
  380. * 53 SW
  381. * 52 T
  382. * 50:48 reserved
  383. * 47:12 4k physical page base address
  384. * 11:7 fragment
  385. * 6 write
  386. * 5 read
  387. * 4 exe
  388. * 3 Z
  389. * 2 snooped
  390. * 1 system
  391. * 0 valid
  392. *
  393. * PDE format on VEGA 10:
  394. * 63:59 block fragment size
  395. * 58:55 reserved
  396. * 54 P
  397. * 53:48 reserved
  398. * 47:6 physical base address of PD or PTE
  399. * 5:3 reserved
  400. * 2 C
  401. * 1 system
  402. * 0 valid
  403. */
  404. /*
  405. * The following is for PTE only. GART does not have PDEs.
  406. */
  407. value = addr & 0x0000FFFFFFFFF000ULL;
  408. value |= flags;
  409. writeq(value, ptr + (gpu_page_idx * 8));
  410. return 0;
  411. }
  412. static uint64_t gmc_v9_0_get_vm_pte_flags(struct amdgpu_device *adev,
  413. uint32_t flags)
  414. {
  415. uint64_t pte_flag = 0;
  416. if (flags & AMDGPU_VM_PAGE_EXECUTABLE)
  417. pte_flag |= AMDGPU_PTE_EXECUTABLE;
  418. if (flags & AMDGPU_VM_PAGE_READABLE)
  419. pte_flag |= AMDGPU_PTE_READABLE;
  420. if (flags & AMDGPU_VM_PAGE_WRITEABLE)
  421. pte_flag |= AMDGPU_PTE_WRITEABLE;
  422. switch (flags & AMDGPU_VM_MTYPE_MASK) {
  423. case AMDGPU_VM_MTYPE_DEFAULT:
  424. pte_flag |= AMDGPU_PTE_MTYPE(MTYPE_NC);
  425. break;
  426. case AMDGPU_VM_MTYPE_NC:
  427. pte_flag |= AMDGPU_PTE_MTYPE(MTYPE_NC);
  428. break;
  429. case AMDGPU_VM_MTYPE_WC:
  430. pte_flag |= AMDGPU_PTE_MTYPE(MTYPE_WC);
  431. break;
  432. case AMDGPU_VM_MTYPE_CC:
  433. pte_flag |= AMDGPU_PTE_MTYPE(MTYPE_CC);
  434. break;
  435. case AMDGPU_VM_MTYPE_UC:
  436. pte_flag |= AMDGPU_PTE_MTYPE(MTYPE_UC);
  437. break;
  438. default:
  439. pte_flag |= AMDGPU_PTE_MTYPE(MTYPE_NC);
  440. break;
  441. }
  442. if (flags & AMDGPU_VM_PAGE_PRT)
  443. pte_flag |= AMDGPU_PTE_PRT;
  444. return pte_flag;
  445. }
  446. static void gmc_v9_0_get_vm_pde(struct amdgpu_device *adev, int level,
  447. uint64_t *addr, uint64_t *flags)
  448. {
  449. if (!(*flags & AMDGPU_PDE_PTE))
  450. *addr = adev->vm_manager.vram_base_offset + *addr -
  451. adev->gmc.vram_start;
  452. BUG_ON(*addr & 0xFFFF00000000003FULL);
  453. if (!adev->gmc.translate_further)
  454. return;
  455. if (level == AMDGPU_VM_PDB1) {
  456. /* Set the block fragment size */
  457. if (!(*flags & AMDGPU_PDE_PTE))
  458. *flags |= AMDGPU_PDE_BFS(0x9);
  459. } else if (level == AMDGPU_VM_PDB0) {
  460. if (*flags & AMDGPU_PDE_PTE)
  461. *flags &= ~AMDGPU_PDE_PTE;
  462. else
  463. *flags |= AMDGPU_PTE_TF;
  464. }
  465. }
  466. static const struct amdgpu_gmc_funcs gmc_v9_0_gmc_funcs = {
  467. .flush_gpu_tlb = gmc_v9_0_flush_gpu_tlb,
  468. .emit_flush_gpu_tlb = gmc_v9_0_emit_flush_gpu_tlb,
  469. .emit_pasid_mapping = gmc_v9_0_emit_pasid_mapping,
  470. .set_pte_pde = gmc_v9_0_set_pte_pde,
  471. .get_vm_pte_flags = gmc_v9_0_get_vm_pte_flags,
  472. .get_vm_pde = gmc_v9_0_get_vm_pde
  473. };
  474. static void gmc_v9_0_set_gmc_funcs(struct amdgpu_device *adev)
  475. {
  476. if (adev->gmc.gmc_funcs == NULL)
  477. adev->gmc.gmc_funcs = &gmc_v9_0_gmc_funcs;
  478. }
  479. static int gmc_v9_0_early_init(void *handle)
  480. {
  481. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  482. gmc_v9_0_set_gmc_funcs(adev);
  483. gmc_v9_0_set_irq_funcs(adev);
  484. adev->gmc.shared_aperture_start = 0x2000000000000000ULL;
  485. adev->gmc.shared_aperture_end =
  486. adev->gmc.shared_aperture_start + (4ULL << 30) - 1;
  487. adev->gmc.private_aperture_start = 0x1000000000000000ULL;
  488. adev->gmc.private_aperture_end =
  489. adev->gmc.private_aperture_start + (4ULL << 30) - 1;
  490. return 0;
  491. }
  492. static int gmc_v9_0_ecc_available(struct amdgpu_device *adev)
  493. {
  494. uint32_t reg_val;
  495. uint32_t reg_addr;
  496. uint32_t field_val;
  497. size_t i;
  498. uint32_t fv2;
  499. size_t lost_sheep;
  500. DRM_DEBUG("ecc: gmc_v9_0_ecc_available()\n");
  501. lost_sheep = 0;
  502. for (i = 0; i < ARRAY_SIZE(ecc_umclocalcap_addrs); ++i) {
  503. reg_addr = ecc_umclocalcap_addrs[i];
  504. DRM_DEBUG("ecc: "
  505. "UMCCH_UmcLocalCap[%zu]: reg_addr: 0x%08x\n",
  506. i, reg_addr);
  507. reg_val = RREG32(reg_addr);
  508. field_val = REG_GET_FIELD(reg_val, UMCCH0_0_UmcLocalCap,
  509. EccDis);
  510. DRM_DEBUG("ecc: "
  511. "reg_val: 0x%08x, "
  512. "EccDis: 0x%08x, ",
  513. reg_val, field_val);
  514. if (field_val) {
  515. DRM_ERROR("ecc: UmcLocalCap:EccDis is set.\n");
  516. ++lost_sheep;
  517. }
  518. }
  519. for (i = 0; i < ARRAY_SIZE(ecc_umcch_umc_config_addrs); ++i) {
  520. reg_addr = ecc_umcch_umc_config_addrs[i];
  521. DRM_DEBUG("ecc: "
  522. "UMCCH0_0_UMC_CONFIG[%zu]: reg_addr: 0x%08x",
  523. i, reg_addr);
  524. reg_val = RREG32(reg_addr);
  525. field_val = REG_GET_FIELD(reg_val, UMCCH0_0_UMC_CONFIG,
  526. DramReady);
  527. DRM_DEBUG("ecc: "
  528. "reg_val: 0x%08x, "
  529. "DramReady: 0x%08x\n",
  530. reg_val, field_val);
  531. if (!field_val) {
  532. DRM_ERROR("ecc: UMC_CONFIG:DramReady is not set.\n");
  533. ++lost_sheep;
  534. }
  535. }
  536. for (i = 0; i < ARRAY_SIZE(ecc_umcch_eccctrl_addrs); ++i) {
  537. reg_addr = ecc_umcch_eccctrl_addrs[i];
  538. DRM_DEBUG("ecc: "
  539. "UMCCH_EccCtrl[%zu]: reg_addr: 0x%08x, ",
  540. i, reg_addr);
  541. reg_val = RREG32(reg_addr);
  542. field_val = REG_GET_FIELD(reg_val, UMCCH0_0_EccCtrl,
  543. WrEccEn);
  544. fv2 = REG_GET_FIELD(reg_val, UMCCH0_0_EccCtrl,
  545. RdEccEn);
  546. DRM_DEBUG("ecc: "
  547. "reg_val: 0x%08x, "
  548. "WrEccEn: 0x%08x, "
  549. "RdEccEn: 0x%08x\n",
  550. reg_val, field_val, fv2);
  551. if (!field_val) {
  552. DRM_DEBUG("ecc: WrEccEn is not set\n");
  553. ++lost_sheep;
  554. }
  555. if (!fv2) {
  556. DRM_DEBUG("ecc: RdEccEn is not set\n");
  557. ++lost_sheep;
  558. }
  559. }
  560. DRM_DEBUG("ecc: lost_sheep: %zu\n", lost_sheep);
  561. return lost_sheep == 0;
  562. }
  563. static int gmc_v9_0_late_init(void *handle)
  564. {
  565. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  566. /*
  567. * The latest engine allocation on gfx9 is:
  568. * Engine 0, 1: idle
  569. * Engine 2, 3: firmware
  570. * Engine 4~13: amdgpu ring, subject to change when ring number changes
  571. * Engine 14~15: idle
  572. * Engine 16: kfd tlb invalidation
  573. * Engine 17: Gart flushes
  574. */
  575. unsigned vm_inv_eng[AMDGPU_MAX_VMHUBS] = { 4, 4 };
  576. unsigned i;
  577. int r;
  578. /*
  579. * TODO - Uncomment once GART corruption issue is fixed.
  580. */
  581. /* amdgpu_bo_late_init(adev); */
  582. for(i = 0; i < adev->num_rings; ++i) {
  583. struct amdgpu_ring *ring = adev->rings[i];
  584. unsigned vmhub = ring->funcs->vmhub;
  585. ring->vm_inv_eng = vm_inv_eng[vmhub]++;
  586. dev_info(adev->dev, "ring %u(%s) uses VM inv eng %u on hub %u\n",
  587. ring->idx, ring->name, ring->vm_inv_eng,
  588. ring->funcs->vmhub);
  589. }
  590. /* Engine 16 is used for KFD and 17 for GART flushes */
  591. for(i = 0; i < AMDGPU_MAX_VMHUBS; ++i)
  592. BUG_ON(vm_inv_eng[i] > 16);
  593. if (adev->asic_type == CHIP_VEGA10 && !amdgpu_sriov_vf(adev)) {
  594. r = gmc_v9_0_ecc_available(adev);
  595. if (r == 1) {
  596. DRM_INFO("ECC is active.\n");
  597. } else if (r == 0) {
  598. DRM_INFO("ECC is not present.\n");
  599. adev->df_funcs->enable_ecc_force_par_wr_rmw(adev, false);
  600. } else {
  601. DRM_ERROR("gmc_v9_0_ecc_available() failed. r: %d\n", r);
  602. return r;
  603. }
  604. }
  605. return amdgpu_irq_get(adev, &adev->gmc.vm_fault, 0);
  606. }
  607. static void gmc_v9_0_vram_gtt_location(struct amdgpu_device *adev,
  608. struct amdgpu_gmc *mc)
  609. {
  610. u64 base = 0;
  611. if (!amdgpu_sriov_vf(adev))
  612. base = mmhub_v1_0_get_fb_location(adev);
  613. amdgpu_device_vram_location(adev, &adev->gmc, base);
  614. amdgpu_device_gart_location(adev, mc);
  615. /* base offset of vram pages */
  616. adev->vm_manager.vram_base_offset = gfxhub_v1_0_get_mc_fb_offset(adev);
  617. }
  618. /**
  619. * gmc_v9_0_mc_init - initialize the memory controller driver params
  620. *
  621. * @adev: amdgpu_device pointer
  622. *
  623. * Look up the amount of vram, vram width, and decide how to place
  624. * vram and gart within the GPU's physical address space.
  625. * Returns 0 for success.
  626. */
  627. static int gmc_v9_0_mc_init(struct amdgpu_device *adev)
  628. {
  629. int chansize, numchan;
  630. int r;
  631. if (amdgpu_emu_mode != 1)
  632. adev->gmc.vram_width = amdgpu_atomfirmware_get_vram_width(adev);
  633. if (!adev->gmc.vram_width) {
  634. /* hbm memory channel size */
  635. if (adev->flags & AMD_IS_APU)
  636. chansize = 64;
  637. else
  638. chansize = 128;
  639. numchan = adev->df_funcs->get_hbm_channel_number(adev);
  640. adev->gmc.vram_width = numchan * chansize;
  641. }
  642. /* size in MB on si */
  643. adev->gmc.mc_vram_size =
  644. adev->nbio_funcs->get_memsize(adev) * 1024ULL * 1024ULL;
  645. adev->gmc.real_vram_size = adev->gmc.mc_vram_size;
  646. if (!(adev->flags & AMD_IS_APU)) {
  647. r = amdgpu_device_resize_fb_bar(adev);
  648. if (r)
  649. return r;
  650. }
  651. adev->gmc.aper_base = pci_resource_start(adev->pdev, 0);
  652. adev->gmc.aper_size = pci_resource_len(adev->pdev, 0);
  653. #ifdef CONFIG_X86_64
  654. if (adev->flags & AMD_IS_APU) {
  655. adev->gmc.aper_base = gfxhub_v1_0_get_mc_fb_offset(adev);
  656. adev->gmc.aper_size = adev->gmc.real_vram_size;
  657. }
  658. #endif
  659. /* In case the PCI BAR is larger than the actual amount of vram */
  660. adev->gmc.visible_vram_size = adev->gmc.aper_size;
  661. if (adev->gmc.visible_vram_size > adev->gmc.real_vram_size)
  662. adev->gmc.visible_vram_size = adev->gmc.real_vram_size;
  663. /* set the gart size */
  664. if (amdgpu_gart_size == -1) {
  665. switch (adev->asic_type) {
  666. case CHIP_VEGA10: /* all engines support GPUVM */
  667. case CHIP_VEGA12: /* all engines support GPUVM */
  668. case CHIP_VEGA20:
  669. default:
  670. adev->gmc.gart_size = 512ULL << 20;
  671. break;
  672. case CHIP_RAVEN: /* DCE SG support */
  673. adev->gmc.gart_size = 1024ULL << 20;
  674. break;
  675. }
  676. } else {
  677. adev->gmc.gart_size = (u64)amdgpu_gart_size << 20;
  678. }
  679. gmc_v9_0_vram_gtt_location(adev, &adev->gmc);
  680. return 0;
  681. }
  682. static int gmc_v9_0_gart_init(struct amdgpu_device *adev)
  683. {
  684. int r;
  685. if (adev->gart.robj) {
  686. WARN(1, "VEGA10 PCIE GART already initialized\n");
  687. return 0;
  688. }
  689. /* Initialize common gart structure */
  690. r = amdgpu_gart_init(adev);
  691. if (r)
  692. return r;
  693. adev->gart.table_size = adev->gart.num_gpu_pages * 8;
  694. adev->gart.gart_pte_flags = AMDGPU_PTE_MTYPE(MTYPE_UC) |
  695. AMDGPU_PTE_EXECUTABLE;
  696. return amdgpu_gart_table_vram_alloc(adev);
  697. }
  698. static unsigned gmc_v9_0_get_vbios_fb_size(struct amdgpu_device *adev)
  699. {
  700. #if 0
  701. u32 d1vga_control = RREG32_SOC15(DCE, 0, mmD1VGA_CONTROL);
  702. #endif
  703. unsigned size;
  704. /*
  705. * TODO Remove once GART corruption is resolved
  706. * Check related code in gmc_v9_0_sw_fini
  707. * */
  708. size = 9 * 1024 * 1024;
  709. #if 0
  710. if (REG_GET_FIELD(d1vga_control, D1VGA_CONTROL, D1VGA_MODE_ENABLE)) {
  711. size = 9 * 1024 * 1024; /* reserve 8MB for vga emulator and 1 MB for FB */
  712. } else {
  713. u32 viewport;
  714. switch (adev->asic_type) {
  715. case CHIP_RAVEN:
  716. viewport = RREG32_SOC15(DCE, 0, mmHUBP0_DCSURF_PRI_VIEWPORT_DIMENSION);
  717. size = (REG_GET_FIELD(viewport,
  718. HUBP0_DCSURF_PRI_VIEWPORT_DIMENSION, PRI_VIEWPORT_HEIGHT) *
  719. REG_GET_FIELD(viewport,
  720. HUBP0_DCSURF_PRI_VIEWPORT_DIMENSION, PRI_VIEWPORT_WIDTH) *
  721. 4);
  722. break;
  723. case CHIP_VEGA10:
  724. case CHIP_VEGA12:
  725. default:
  726. viewport = RREG32_SOC15(DCE, 0, mmSCL0_VIEWPORT_SIZE);
  727. size = (REG_GET_FIELD(viewport, SCL0_VIEWPORT_SIZE, VIEWPORT_HEIGHT) *
  728. REG_GET_FIELD(viewport, SCL0_VIEWPORT_SIZE, VIEWPORT_WIDTH) *
  729. 4);
  730. break;
  731. }
  732. }
  733. /* return 0 if the pre-OS buffer uses up most of vram */
  734. if ((adev->gmc.real_vram_size - size) < (8 * 1024 * 1024))
  735. return 0;
  736. #endif
  737. return size;
  738. }
  739. static int gmc_v9_0_sw_init(void *handle)
  740. {
  741. int r;
  742. int dma_bits;
  743. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  744. gfxhub_v1_0_init(adev);
  745. mmhub_v1_0_init(adev);
  746. spin_lock_init(&adev->gmc.invalidate_lock);
  747. adev->gmc.vram_type = amdgpu_atomfirmware_get_vram_type(adev);
  748. switch (adev->asic_type) {
  749. case CHIP_RAVEN:
  750. if (adev->rev_id == 0x0 || adev->rev_id == 0x1) {
  751. amdgpu_vm_adjust_size(adev, 256 * 1024, 9, 3, 48);
  752. } else {
  753. /* vm_size is 128TB + 512GB for legacy 3-level page support */
  754. amdgpu_vm_adjust_size(adev, 128 * 1024 + 512, 9, 2, 48);
  755. adev->gmc.translate_further =
  756. adev->vm_manager.num_level > 1;
  757. }
  758. break;
  759. case CHIP_VEGA10:
  760. case CHIP_VEGA12:
  761. case CHIP_VEGA20:
  762. /*
  763. * To fulfill 4-level page support,
  764. * vm size is 256TB (48bit), maximum size of Vega10,
  765. * block size 512 (9bit)
  766. */
  767. amdgpu_vm_adjust_size(adev, 256 * 1024, 9, 3, 48);
  768. break;
  769. default:
  770. break;
  771. }
  772. /* This interrupt is VMC page fault.*/
  773. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VMC, 0,
  774. &adev->gmc.vm_fault);
  775. r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_UTCL2, 0,
  776. &adev->gmc.vm_fault);
  777. if (r)
  778. return r;
  779. /* Set the internal MC address mask
  780. * This is the max address of the GPU's
  781. * internal address space.
  782. */
  783. adev->gmc.mc_mask = 0xffffffffffffULL; /* 48 bit MC */
  784. /* set DMA mask + need_dma32 flags.
  785. * PCIE - can handle 44-bits.
  786. * IGP - can handle 44-bits
  787. * PCI - dma32 for legacy pci gart, 44 bits on vega10
  788. */
  789. adev->need_dma32 = false;
  790. dma_bits = adev->need_dma32 ? 32 : 44;
  791. r = pci_set_dma_mask(adev->pdev, DMA_BIT_MASK(dma_bits));
  792. if (r) {
  793. adev->need_dma32 = true;
  794. dma_bits = 32;
  795. printk(KERN_WARNING "amdgpu: No suitable DMA available.\n");
  796. }
  797. r = pci_set_consistent_dma_mask(adev->pdev, DMA_BIT_MASK(dma_bits));
  798. if (r) {
  799. pci_set_consistent_dma_mask(adev->pdev, DMA_BIT_MASK(32));
  800. printk(KERN_WARNING "amdgpu: No coherent DMA available.\n");
  801. }
  802. adev->need_swiotlb = drm_get_max_iomem() > ((u64)1 << dma_bits);
  803. r = gmc_v9_0_mc_init(adev);
  804. if (r)
  805. return r;
  806. adev->gmc.stolen_size = gmc_v9_0_get_vbios_fb_size(adev);
  807. /* Memory manager */
  808. r = amdgpu_bo_init(adev);
  809. if (r)
  810. return r;
  811. r = gmc_v9_0_gart_init(adev);
  812. if (r)
  813. return r;
  814. /*
  815. * number of VMs
  816. * VMID 0 is reserved for System
  817. * amdgpu graphics/compute will use VMIDs 1-7
  818. * amdkfd will use VMIDs 8-15
  819. */
  820. adev->vm_manager.id_mgr[AMDGPU_GFXHUB].num_ids = AMDGPU_NUM_OF_VMIDS;
  821. adev->vm_manager.id_mgr[AMDGPU_MMHUB].num_ids = AMDGPU_NUM_OF_VMIDS;
  822. amdgpu_vm_manager_init(adev);
  823. return 0;
  824. }
  825. /**
  826. * gmc_v9_0_gart_fini - vm fini callback
  827. *
  828. * @adev: amdgpu_device pointer
  829. *
  830. * Tears down the driver GART/VM setup (CIK).
  831. */
  832. static void gmc_v9_0_gart_fini(struct amdgpu_device *adev)
  833. {
  834. amdgpu_gart_table_vram_free(adev);
  835. amdgpu_gart_fini(adev);
  836. }
  837. static int gmc_v9_0_sw_fini(void *handle)
  838. {
  839. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  840. amdgpu_gem_force_release(adev);
  841. amdgpu_vm_manager_fini(adev);
  842. gmc_v9_0_gart_fini(adev);
  843. /*
  844. * TODO:
  845. * Currently there is a bug where some memory client outside
  846. * of the driver writes to first 8M of VRAM on S3 resume,
  847. * this overrides GART which by default gets placed in first 8M and
  848. * causes VM_FAULTS once GTT is accessed.
  849. * Keep the stolen memory reservation until the while this is not solved.
  850. * Also check code in gmc_v9_0_get_vbios_fb_size and gmc_v9_0_late_init
  851. */
  852. amdgpu_bo_free_kernel(&adev->stolen_vga_memory, NULL, NULL);
  853. amdgpu_bo_fini(adev);
  854. return 0;
  855. }
  856. static void gmc_v9_0_init_golden_registers(struct amdgpu_device *adev)
  857. {
  858. switch (adev->asic_type) {
  859. case CHIP_VEGA10:
  860. case CHIP_VEGA20:
  861. soc15_program_register_sequence(adev,
  862. golden_settings_mmhub_1_0_0,
  863. ARRAY_SIZE(golden_settings_mmhub_1_0_0));
  864. soc15_program_register_sequence(adev,
  865. golden_settings_athub_1_0_0,
  866. ARRAY_SIZE(golden_settings_athub_1_0_0));
  867. break;
  868. case CHIP_VEGA12:
  869. break;
  870. case CHIP_RAVEN:
  871. soc15_program_register_sequence(adev,
  872. golden_settings_athub_1_0_0,
  873. ARRAY_SIZE(golden_settings_athub_1_0_0));
  874. break;
  875. default:
  876. break;
  877. }
  878. }
  879. /**
  880. * gmc_v9_0_gart_enable - gart enable
  881. *
  882. * @adev: amdgpu_device pointer
  883. */
  884. static int gmc_v9_0_gart_enable(struct amdgpu_device *adev)
  885. {
  886. int r;
  887. bool value;
  888. u32 tmp;
  889. amdgpu_device_program_register_sequence(adev,
  890. golden_settings_vega10_hdp,
  891. ARRAY_SIZE(golden_settings_vega10_hdp));
  892. if (adev->gart.robj == NULL) {
  893. dev_err(adev->dev, "No VRAM object for PCIE GART.\n");
  894. return -EINVAL;
  895. }
  896. r = amdgpu_gart_table_vram_pin(adev);
  897. if (r)
  898. return r;
  899. switch (adev->asic_type) {
  900. case CHIP_RAVEN:
  901. mmhub_v1_0_initialize_power_gating(adev);
  902. mmhub_v1_0_update_power_gating(adev, true);
  903. break;
  904. default:
  905. break;
  906. }
  907. r = gfxhub_v1_0_gart_enable(adev);
  908. if (r)
  909. return r;
  910. r = mmhub_v1_0_gart_enable(adev);
  911. if (r)
  912. return r;
  913. WREG32_FIELD15(HDP, 0, HDP_MISC_CNTL, FLUSH_INVALIDATE_CACHE, 1);
  914. tmp = RREG32_SOC15(HDP, 0, mmHDP_HOST_PATH_CNTL);
  915. WREG32_SOC15(HDP, 0, mmHDP_HOST_PATH_CNTL, tmp);
  916. /* After HDP is initialized, flush HDP.*/
  917. adev->nbio_funcs->hdp_flush(adev, NULL);
  918. if (amdgpu_vm_fault_stop == AMDGPU_VM_FAULT_STOP_ALWAYS)
  919. value = false;
  920. else
  921. value = true;
  922. gfxhub_v1_0_set_fault_enable_default(adev, value);
  923. mmhub_v1_0_set_fault_enable_default(adev, value);
  924. gmc_v9_0_flush_gpu_tlb(adev, 0);
  925. DRM_INFO("PCIE GART of %uM enabled (table at 0x%016llX).\n",
  926. (unsigned)(adev->gmc.gart_size >> 20),
  927. (unsigned long long)adev->gart.table_addr);
  928. adev->gart.ready = true;
  929. return 0;
  930. }
  931. static int gmc_v9_0_hw_init(void *handle)
  932. {
  933. int r;
  934. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  935. /* The sequence of these two function calls matters.*/
  936. gmc_v9_0_init_golden_registers(adev);
  937. if (adev->mode_info.num_crtc) {
  938. /* Lockout access through VGA aperture*/
  939. WREG32_FIELD15(DCE, 0, VGA_HDP_CONTROL, VGA_MEMORY_DISABLE, 1);
  940. /* disable VGA render */
  941. WREG32_FIELD15(DCE, 0, VGA_RENDER_CONTROL, VGA_VSTATUS_CNTL, 0);
  942. }
  943. r = gmc_v9_0_gart_enable(adev);
  944. return r;
  945. }
  946. /**
  947. * gmc_v9_0_gart_disable - gart disable
  948. *
  949. * @adev: amdgpu_device pointer
  950. *
  951. * This disables all VM page table.
  952. */
  953. static void gmc_v9_0_gart_disable(struct amdgpu_device *adev)
  954. {
  955. gfxhub_v1_0_gart_disable(adev);
  956. mmhub_v1_0_gart_disable(adev);
  957. amdgpu_gart_table_vram_unpin(adev);
  958. }
  959. static int gmc_v9_0_hw_fini(void *handle)
  960. {
  961. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  962. if (amdgpu_sriov_vf(adev)) {
  963. /* full access mode, so don't touch any GMC register */
  964. DRM_DEBUG("For SRIOV client, shouldn't do anything.\n");
  965. return 0;
  966. }
  967. amdgpu_irq_put(adev, &adev->gmc.vm_fault, 0);
  968. gmc_v9_0_gart_disable(adev);
  969. return 0;
  970. }
  971. static int gmc_v9_0_suspend(void *handle)
  972. {
  973. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  974. return gmc_v9_0_hw_fini(adev);
  975. }
  976. static int gmc_v9_0_resume(void *handle)
  977. {
  978. int r;
  979. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  980. r = gmc_v9_0_hw_init(adev);
  981. if (r)
  982. return r;
  983. amdgpu_vmid_reset_all(adev);
  984. return 0;
  985. }
  986. static bool gmc_v9_0_is_idle(void *handle)
  987. {
  988. /* MC is always ready in GMC v9.*/
  989. return true;
  990. }
  991. static int gmc_v9_0_wait_for_idle(void *handle)
  992. {
  993. /* There is no need to wait for MC idle in GMC v9.*/
  994. return 0;
  995. }
  996. static int gmc_v9_0_soft_reset(void *handle)
  997. {
  998. /* XXX for emulation.*/
  999. return 0;
  1000. }
  1001. static int gmc_v9_0_set_clockgating_state(void *handle,
  1002. enum amd_clockgating_state state)
  1003. {
  1004. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1005. return mmhub_v1_0_set_clockgating(adev, state);
  1006. }
  1007. static void gmc_v9_0_get_clockgating_state(void *handle, u32 *flags)
  1008. {
  1009. struct amdgpu_device *adev = (struct amdgpu_device *)handle;
  1010. mmhub_v1_0_get_clockgating(adev, flags);
  1011. }
  1012. static int gmc_v9_0_set_powergating_state(void *handle,
  1013. enum amd_powergating_state state)
  1014. {
  1015. return 0;
  1016. }
  1017. const struct amd_ip_funcs gmc_v9_0_ip_funcs = {
  1018. .name = "gmc_v9_0",
  1019. .early_init = gmc_v9_0_early_init,
  1020. .late_init = gmc_v9_0_late_init,
  1021. .sw_init = gmc_v9_0_sw_init,
  1022. .sw_fini = gmc_v9_0_sw_fini,
  1023. .hw_init = gmc_v9_0_hw_init,
  1024. .hw_fini = gmc_v9_0_hw_fini,
  1025. .suspend = gmc_v9_0_suspend,
  1026. .resume = gmc_v9_0_resume,
  1027. .is_idle = gmc_v9_0_is_idle,
  1028. .wait_for_idle = gmc_v9_0_wait_for_idle,
  1029. .soft_reset = gmc_v9_0_soft_reset,
  1030. .set_clockgating_state = gmc_v9_0_set_clockgating_state,
  1031. .set_powergating_state = gmc_v9_0_set_powergating_state,
  1032. .get_clockgating_state = gmc_v9_0_get_clockgating_state,
  1033. };
  1034. const struct amdgpu_ip_block_version gmc_v9_0_ip_block =
  1035. {
  1036. .type = AMD_IP_BLOCK_TYPE_GMC,
  1037. .major = 9,
  1038. .minor = 0,
  1039. .rev = 0,
  1040. .funcs = &gmc_v9_0_ip_funcs,
  1041. };