amdgpu.h 58 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890
  1. /*
  2. * Copyright 2008 Advanced Micro Devices, Inc.
  3. * Copyright 2008 Red Hat Inc.
  4. * Copyright 2009 Jerome Glisse.
  5. *
  6. * Permission is hereby granted, free of charge, to any person obtaining a
  7. * copy of this software and associated documentation files (the "Software"),
  8. * to deal in the Software without restriction, including without limitation
  9. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  10. * and/or sell copies of the Software, and to permit persons to whom the
  11. * Software is furnished to do so, subject to the following conditions:
  12. *
  13. * The above copyright notice and this permission notice shall be included in
  14. * all copies or substantial portions of the Software.
  15. *
  16. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  17. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  18. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  19. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  20. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  21. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  22. * OTHER DEALINGS IN THE SOFTWARE.
  23. *
  24. * Authors: Dave Airlie
  25. * Alex Deucher
  26. * Jerome Glisse
  27. */
  28. #ifndef __AMDGPU_H__
  29. #define __AMDGPU_H__
  30. #include <linux/atomic.h>
  31. #include <linux/wait.h>
  32. #include <linux/list.h>
  33. #include <linux/kref.h>
  34. #include <linux/rbtree.h>
  35. #include <linux/hashtable.h>
  36. #include <linux/dma-fence.h>
  37. #include <drm/ttm/ttm_bo_api.h>
  38. #include <drm/ttm/ttm_bo_driver.h>
  39. #include <drm/ttm/ttm_placement.h>
  40. #include <drm/ttm/ttm_module.h>
  41. #include <drm/ttm/ttm_execbuf_util.h>
  42. #include <drm/drmP.h>
  43. #include <drm/drm_gem.h>
  44. #include <drm/amdgpu_drm.h>
  45. #include <kgd_kfd_interface.h>
  46. #include "amd_shared.h"
  47. #include "amdgpu_mode.h"
  48. #include "amdgpu_ih.h"
  49. #include "amdgpu_irq.h"
  50. #include "amdgpu_ucode.h"
  51. #include "amdgpu_ttm.h"
  52. #include "amdgpu_psp.h"
  53. #include "amdgpu_gds.h"
  54. #include "amdgpu_sync.h"
  55. #include "amdgpu_ring.h"
  56. #include "amdgpu_vm.h"
  57. #include "amd_powerplay.h"
  58. #include "amdgpu_dpm.h"
  59. #include "amdgpu_acp.h"
  60. #include "amdgpu_uvd.h"
  61. #include "amdgpu_vce.h"
  62. #include "amdgpu_vcn.h"
  63. #include "amdgpu_mn.h"
  64. #include "gpu_scheduler.h"
  65. #include "amdgpu_virt.h"
  66. #include "amdgpu_gart.h"
  67. /*
  68. * Modules parameters.
  69. */
  70. extern int amdgpu_modeset;
  71. extern int amdgpu_vram_limit;
  72. extern int amdgpu_vis_vram_limit;
  73. extern int amdgpu_gart_size;
  74. extern int amdgpu_gtt_size;
  75. extern int amdgpu_moverate;
  76. extern int amdgpu_benchmarking;
  77. extern int amdgpu_testing;
  78. extern int amdgpu_audio;
  79. extern int amdgpu_disp_priority;
  80. extern int amdgpu_hw_i2c;
  81. extern int amdgpu_pcie_gen2;
  82. extern int amdgpu_msi;
  83. extern int amdgpu_lockup_timeout;
  84. extern int amdgpu_dpm;
  85. extern int amdgpu_fw_load_type;
  86. extern int amdgpu_aspm;
  87. extern int amdgpu_runtime_pm;
  88. extern uint amdgpu_ip_block_mask;
  89. extern int amdgpu_bapm;
  90. extern int amdgpu_deep_color;
  91. extern int amdgpu_vm_size;
  92. extern int amdgpu_vm_block_size;
  93. extern int amdgpu_vm_fragment_size;
  94. extern int amdgpu_vm_fault_stop;
  95. extern int amdgpu_vm_debug;
  96. extern int amdgpu_vm_update_mode;
  97. extern int amdgpu_sched_jobs;
  98. extern int amdgpu_sched_hw_submission;
  99. extern int amdgpu_no_evict;
  100. extern int amdgpu_direct_gma_size;
  101. extern uint amdgpu_pcie_gen_cap;
  102. extern uint amdgpu_pcie_lane_cap;
  103. extern uint amdgpu_cg_mask;
  104. extern uint amdgpu_pg_mask;
  105. extern uint amdgpu_sdma_phase_quantum;
  106. extern char *amdgpu_disable_cu;
  107. extern char *amdgpu_virtual_display;
  108. extern uint amdgpu_pp_feature_mask;
  109. extern int amdgpu_vram_page_split;
  110. extern int amdgpu_ngg;
  111. extern int amdgpu_prim_buf_per_se;
  112. extern int amdgpu_pos_buf_per_se;
  113. extern int amdgpu_cntl_sb_buf_per_se;
  114. extern int amdgpu_param_buf_per_se;
  115. extern int amdgpu_job_hang_limit;
  116. extern int amdgpu_lbpw;
  117. extern int amdgpu_compute_multipipe;
  118. #ifdef CONFIG_DRM_AMDGPU_SI
  119. extern int amdgpu_si_support;
  120. #endif
  121. #ifdef CONFIG_DRM_AMDGPU_CIK
  122. extern int amdgpu_cik_support;
  123. #endif
  124. #define AMDGPU_DEFAULT_GTT_SIZE_MB 3072ULL /* 3GB by default */
  125. #define AMDGPU_WAIT_IDLE_TIMEOUT_IN_MS 3000
  126. #define AMDGPU_MAX_USEC_TIMEOUT 100000 /* 100 ms */
  127. #define AMDGPU_FENCE_JIFFIES_TIMEOUT (HZ / 2)
  128. /* AMDGPU_IB_POOL_SIZE must be a power of 2 */
  129. #define AMDGPU_IB_POOL_SIZE 16
  130. #define AMDGPU_DEBUGFS_MAX_COMPONENTS 32
  131. #define AMDGPUFB_CONN_LIMIT 4
  132. #define AMDGPU_BIOS_NUM_SCRATCH 16
  133. /* max number of IP instances */
  134. #define AMDGPU_MAX_SDMA_INSTANCES 2
  135. /* hard reset data */
  136. #define AMDGPU_ASIC_RESET_DATA 0x39d5e86b
  137. /* reset flags */
  138. #define AMDGPU_RESET_GFX (1 << 0)
  139. #define AMDGPU_RESET_COMPUTE (1 << 1)
  140. #define AMDGPU_RESET_DMA (1 << 2)
  141. #define AMDGPU_RESET_CP (1 << 3)
  142. #define AMDGPU_RESET_GRBM (1 << 4)
  143. #define AMDGPU_RESET_DMA1 (1 << 5)
  144. #define AMDGPU_RESET_RLC (1 << 6)
  145. #define AMDGPU_RESET_SEM (1 << 7)
  146. #define AMDGPU_RESET_IH (1 << 8)
  147. #define AMDGPU_RESET_VMC (1 << 9)
  148. #define AMDGPU_RESET_MC (1 << 10)
  149. #define AMDGPU_RESET_DISPLAY (1 << 11)
  150. #define AMDGPU_RESET_UVD (1 << 12)
  151. #define AMDGPU_RESET_VCE (1 << 13)
  152. #define AMDGPU_RESET_VCE1 (1 << 14)
  153. /* GFX current status */
  154. #define AMDGPU_GFX_NORMAL_MODE 0x00000000L
  155. #define AMDGPU_GFX_SAFE_MODE 0x00000001L
  156. #define AMDGPU_GFX_PG_DISABLED_MODE 0x00000002L
  157. #define AMDGPU_GFX_CG_DISABLED_MODE 0x00000004L
  158. #define AMDGPU_GFX_LBPW_DISABLED_MODE 0x00000008L
  159. /* max cursor sizes (in pixels) */
  160. #define CIK_CURSOR_WIDTH 128
  161. #define CIK_CURSOR_HEIGHT 128
  162. struct amdgpu_device;
  163. struct amdgpu_ib;
  164. struct amdgpu_cs_parser;
  165. struct amdgpu_job;
  166. struct amdgpu_irq_src;
  167. struct amdgpu_fpriv;
  168. struct amdgpu_bo_va_mapping;
  169. enum amdgpu_cp_irq {
  170. AMDGPU_CP_IRQ_GFX_EOP = 0,
  171. AMDGPU_CP_IRQ_COMPUTE_MEC1_PIPE0_EOP,
  172. AMDGPU_CP_IRQ_COMPUTE_MEC1_PIPE1_EOP,
  173. AMDGPU_CP_IRQ_COMPUTE_MEC1_PIPE2_EOP,
  174. AMDGPU_CP_IRQ_COMPUTE_MEC1_PIPE3_EOP,
  175. AMDGPU_CP_IRQ_COMPUTE_MEC2_PIPE0_EOP,
  176. AMDGPU_CP_IRQ_COMPUTE_MEC2_PIPE1_EOP,
  177. AMDGPU_CP_IRQ_COMPUTE_MEC2_PIPE2_EOP,
  178. AMDGPU_CP_IRQ_COMPUTE_MEC2_PIPE3_EOP,
  179. AMDGPU_CP_IRQ_LAST
  180. };
  181. enum amdgpu_sdma_irq {
  182. AMDGPU_SDMA_IRQ_TRAP0 = 0,
  183. AMDGPU_SDMA_IRQ_TRAP1,
  184. AMDGPU_SDMA_IRQ_LAST
  185. };
  186. enum amdgpu_thermal_irq {
  187. AMDGPU_THERMAL_IRQ_LOW_TO_HIGH = 0,
  188. AMDGPU_THERMAL_IRQ_HIGH_TO_LOW,
  189. AMDGPU_THERMAL_IRQ_LAST
  190. };
  191. enum amdgpu_kiq_irq {
  192. AMDGPU_CP_KIQ_IRQ_DRIVER0 = 0,
  193. AMDGPU_CP_KIQ_IRQ_LAST
  194. };
  195. int amdgpu_set_clockgating_state(struct amdgpu_device *adev,
  196. enum amd_ip_block_type block_type,
  197. enum amd_clockgating_state state);
  198. int amdgpu_set_powergating_state(struct amdgpu_device *adev,
  199. enum amd_ip_block_type block_type,
  200. enum amd_powergating_state state);
  201. void amdgpu_get_clockgating_state(struct amdgpu_device *adev, u32 *flags);
  202. int amdgpu_wait_for_idle(struct amdgpu_device *adev,
  203. enum amd_ip_block_type block_type);
  204. bool amdgpu_is_idle(struct amdgpu_device *adev,
  205. enum amd_ip_block_type block_type);
  206. #define AMDGPU_MAX_IP_NUM 16
  207. struct amdgpu_ip_block_status {
  208. bool valid;
  209. bool sw;
  210. bool hw;
  211. bool late_initialized;
  212. bool hang;
  213. };
  214. struct amdgpu_ip_block_version {
  215. const enum amd_ip_block_type type;
  216. const u32 major;
  217. const u32 minor;
  218. const u32 rev;
  219. const struct amd_ip_funcs *funcs;
  220. };
  221. struct amdgpu_ip_block {
  222. struct amdgpu_ip_block_status status;
  223. const struct amdgpu_ip_block_version *version;
  224. };
  225. int amdgpu_ip_block_version_cmp(struct amdgpu_device *adev,
  226. enum amd_ip_block_type type,
  227. u32 major, u32 minor);
  228. struct amdgpu_ip_block * amdgpu_get_ip_block(struct amdgpu_device *adev,
  229. enum amd_ip_block_type type);
  230. int amdgpu_ip_block_add(struct amdgpu_device *adev,
  231. const struct amdgpu_ip_block_version *ip_block_version);
  232. /* provided by hw blocks that can move/clear data. e.g., gfx or sdma */
  233. struct amdgpu_buffer_funcs {
  234. /* maximum bytes in a single operation */
  235. uint32_t copy_max_bytes;
  236. /* number of dw to reserve per operation */
  237. unsigned copy_num_dw;
  238. /* used for buffer migration */
  239. void (*emit_copy_buffer)(struct amdgpu_ib *ib,
  240. /* src addr in bytes */
  241. uint64_t src_offset,
  242. /* dst addr in bytes */
  243. uint64_t dst_offset,
  244. /* number of byte to transfer */
  245. uint32_t byte_count);
  246. /* maximum bytes in a single operation */
  247. uint32_t fill_max_bytes;
  248. /* number of dw to reserve per operation */
  249. unsigned fill_num_dw;
  250. /* used for buffer clearing */
  251. void (*emit_fill_buffer)(struct amdgpu_ib *ib,
  252. /* value to write to memory */
  253. uint32_t src_data,
  254. /* dst addr in bytes */
  255. uint64_t dst_offset,
  256. /* number of byte to fill */
  257. uint32_t byte_count);
  258. };
  259. /* provided by hw blocks that can write ptes, e.g., sdma */
  260. struct amdgpu_vm_pte_funcs {
  261. /* number of dw to reserve per operation */
  262. unsigned copy_pte_num_dw;
  263. /* copy pte entries from GART */
  264. void (*copy_pte)(struct amdgpu_ib *ib,
  265. uint64_t pe, uint64_t src,
  266. unsigned count);
  267. /* write pte one entry at a time with addr mapping */
  268. void (*write_pte)(struct amdgpu_ib *ib, uint64_t pe,
  269. uint64_t value, unsigned count,
  270. uint32_t incr);
  271. /* maximum nums of PTEs/PDEs in a single operation */
  272. uint32_t set_max_nums_pte_pde;
  273. /* number of dw to reserve per operation */
  274. unsigned set_pte_pde_num_dw;
  275. /* for linear pte/pde updates without addr mapping */
  276. void (*set_pte_pde)(struct amdgpu_ib *ib,
  277. uint64_t pe,
  278. uint64_t addr, unsigned count,
  279. uint32_t incr, uint64_t flags);
  280. };
  281. /* provided by the gmc block */
  282. struct amdgpu_gart_funcs {
  283. /* flush the vm tlb via mmio */
  284. void (*flush_gpu_tlb)(struct amdgpu_device *adev,
  285. uint32_t vmid);
  286. /* write pte/pde updates using the cpu */
  287. int (*set_pte_pde)(struct amdgpu_device *adev,
  288. void *cpu_pt_addr, /* cpu addr of page table */
  289. uint32_t gpu_page_idx, /* pte/pde to update */
  290. uint64_t addr, /* addr to write into pte/pde */
  291. uint64_t flags); /* access flags */
  292. /* enable/disable PRT support */
  293. void (*set_prt)(struct amdgpu_device *adev, bool enable);
  294. /* set pte flags based per asic */
  295. uint64_t (*get_vm_pte_flags)(struct amdgpu_device *adev,
  296. uint32_t flags);
  297. /* get the pde for a given mc addr */
  298. u64 (*get_vm_pde)(struct amdgpu_device *adev, u64 addr);
  299. uint32_t (*get_invalidate_req)(unsigned int vm_id);
  300. };
  301. /* provided by the ih block */
  302. struct amdgpu_ih_funcs {
  303. /* ring read/write ptr handling, called from interrupt context */
  304. u32 (*get_wptr)(struct amdgpu_device *adev);
  305. bool (*prescreen_iv)(struct amdgpu_device *adev);
  306. void (*decode_iv)(struct amdgpu_device *adev,
  307. struct amdgpu_iv_entry *entry);
  308. void (*set_rptr)(struct amdgpu_device *adev);
  309. };
  310. /*
  311. * BIOS.
  312. */
  313. bool amdgpu_get_bios(struct amdgpu_device *adev);
  314. bool amdgpu_read_bios(struct amdgpu_device *adev);
  315. /*
  316. * Dummy page
  317. */
  318. struct amdgpu_dummy_page {
  319. struct page *page;
  320. dma_addr_t addr;
  321. };
  322. int amdgpu_dummy_page_init(struct amdgpu_device *adev);
  323. void amdgpu_dummy_page_fini(struct amdgpu_device *adev);
  324. /*
  325. * Clocks
  326. */
  327. #define AMDGPU_MAX_PPLL 3
  328. struct amdgpu_clock {
  329. struct amdgpu_pll ppll[AMDGPU_MAX_PPLL];
  330. struct amdgpu_pll spll;
  331. struct amdgpu_pll mpll;
  332. /* 10 Khz units */
  333. uint32_t default_mclk;
  334. uint32_t default_sclk;
  335. uint32_t default_dispclk;
  336. uint32_t current_dispclk;
  337. uint32_t dp_extclk;
  338. uint32_t max_pixel_clock;
  339. };
  340. /*
  341. * GEM.
  342. */
  343. #define AMDGPU_GEM_DOMAIN_MAX 0x3
  344. #define gem_to_amdgpu_bo(gobj) container_of((gobj), struct amdgpu_bo, gem_base)
  345. void amdgpu_gem_object_free(struct drm_gem_object *obj);
  346. int amdgpu_gem_object_open(struct drm_gem_object *obj,
  347. struct drm_file *file_priv);
  348. void amdgpu_gem_object_close(struct drm_gem_object *obj,
  349. struct drm_file *file_priv);
  350. unsigned long amdgpu_gem_timeout(uint64_t timeout_ns);
  351. struct sg_table *amdgpu_gem_prime_get_sg_table(struct drm_gem_object *obj);
  352. struct drm_gem_object *
  353. amdgpu_gem_prime_import_sg_table(struct drm_device *dev,
  354. struct dma_buf_attachment *attach,
  355. struct sg_table *sg);
  356. struct dma_buf *amdgpu_gem_prime_export(struct drm_device *dev,
  357. struct drm_gem_object *gobj,
  358. int flags);
  359. int amdgpu_gem_prime_pin(struct drm_gem_object *obj);
  360. void amdgpu_gem_prime_unpin(struct drm_gem_object *obj);
  361. struct reservation_object *amdgpu_gem_prime_res_obj(struct drm_gem_object *);
  362. void *amdgpu_gem_prime_vmap(struct drm_gem_object *obj);
  363. void amdgpu_gem_prime_vunmap(struct drm_gem_object *obj, void *vaddr);
  364. int amdgpu_gem_prime_mmap(struct drm_gem_object *obj, struct vm_area_struct *vma);
  365. int amdgpu_gem_debugfs_init(struct amdgpu_device *adev);
  366. /* sub-allocation manager, it has to be protected by another lock.
  367. * By conception this is an helper for other part of the driver
  368. * like the indirect buffer or semaphore, which both have their
  369. * locking.
  370. *
  371. * Principe is simple, we keep a list of sub allocation in offset
  372. * order (first entry has offset == 0, last entry has the highest
  373. * offset).
  374. *
  375. * When allocating new object we first check if there is room at
  376. * the end total_size - (last_object_offset + last_object_size) >=
  377. * alloc_size. If so we allocate new object there.
  378. *
  379. * When there is not enough room at the end, we start waiting for
  380. * each sub object until we reach object_offset+object_size >=
  381. * alloc_size, this object then become the sub object we return.
  382. *
  383. * Alignment can't be bigger than page size.
  384. *
  385. * Hole are not considered for allocation to keep things simple.
  386. * Assumption is that there won't be hole (all object on same
  387. * alignment).
  388. */
  389. #define AMDGPU_SA_NUM_FENCE_LISTS 32
  390. struct amdgpu_sa_manager {
  391. wait_queue_head_t wq;
  392. struct amdgpu_bo *bo;
  393. struct list_head *hole;
  394. struct list_head flist[AMDGPU_SA_NUM_FENCE_LISTS];
  395. struct list_head olist;
  396. unsigned size;
  397. uint64_t gpu_addr;
  398. void *cpu_ptr;
  399. uint32_t domain;
  400. uint32_t align;
  401. };
  402. /* sub-allocation buffer */
  403. struct amdgpu_sa_bo {
  404. struct list_head olist;
  405. struct list_head flist;
  406. struct amdgpu_sa_manager *manager;
  407. unsigned soffset;
  408. unsigned eoffset;
  409. struct dma_fence *fence;
  410. };
  411. /*
  412. * GEM objects.
  413. */
  414. void amdgpu_gem_force_release(struct amdgpu_device *adev);
  415. int amdgpu_gem_object_create(struct amdgpu_device *adev, unsigned long size,
  416. int alignment, u32 initial_domain,
  417. u64 flags, bool kernel,
  418. struct reservation_object *resv,
  419. struct drm_gem_object **obj);
  420. int amdgpu_mode_dumb_create(struct drm_file *file_priv,
  421. struct drm_device *dev,
  422. struct drm_mode_create_dumb *args);
  423. int amdgpu_mode_dumb_mmap(struct drm_file *filp,
  424. struct drm_device *dev,
  425. uint32_t handle, uint64_t *offset_p);
  426. int amdgpu_fence_slab_init(void);
  427. void amdgpu_fence_slab_fini(void);
  428. /*
  429. * VMHUB structures, functions & helpers
  430. */
  431. struct amdgpu_vmhub {
  432. uint32_t ctx0_ptb_addr_lo32;
  433. uint32_t ctx0_ptb_addr_hi32;
  434. uint32_t vm_inv_eng0_req;
  435. uint32_t vm_inv_eng0_ack;
  436. uint32_t vm_context0_cntl;
  437. uint32_t vm_l2_pro_fault_status;
  438. uint32_t vm_l2_pro_fault_cntl;
  439. };
  440. /*
  441. * GPU MC structures, functions & helpers
  442. */
  443. struct amdgpu_mc {
  444. resource_size_t aper_size;
  445. resource_size_t aper_base;
  446. resource_size_t agp_base;
  447. /* for some chips with <= 32MB we need to lie
  448. * about vram size near mc fb location */
  449. u64 mc_vram_size;
  450. u64 visible_vram_size;
  451. u64 gart_size;
  452. u64 gart_start;
  453. u64 gart_end;
  454. u64 vram_start;
  455. u64 vram_end;
  456. unsigned vram_width;
  457. u64 real_vram_size;
  458. int vram_mtrr;
  459. u64 mc_mask;
  460. const struct firmware *fw; /* MC firmware */
  461. uint32_t fw_version;
  462. struct amdgpu_irq_src vm_fault;
  463. uint32_t vram_type;
  464. uint32_t srbm_soft_reset;
  465. bool prt_warning;
  466. uint64_t stolen_size;
  467. /* apertures */
  468. u64 shared_aperture_start;
  469. u64 shared_aperture_end;
  470. u64 private_aperture_start;
  471. u64 private_aperture_end;
  472. /* protects concurrent invalidation */
  473. spinlock_t invalidate_lock;
  474. };
  475. /*
  476. * GPU doorbell structures, functions & helpers
  477. */
  478. typedef enum _AMDGPU_DOORBELL_ASSIGNMENT
  479. {
  480. AMDGPU_DOORBELL_KIQ = 0x000,
  481. AMDGPU_DOORBELL_HIQ = 0x001,
  482. AMDGPU_DOORBELL_DIQ = 0x002,
  483. AMDGPU_DOORBELL_MEC_RING0 = 0x010,
  484. AMDGPU_DOORBELL_MEC_RING1 = 0x011,
  485. AMDGPU_DOORBELL_MEC_RING2 = 0x012,
  486. AMDGPU_DOORBELL_MEC_RING3 = 0x013,
  487. AMDGPU_DOORBELL_MEC_RING4 = 0x014,
  488. AMDGPU_DOORBELL_MEC_RING5 = 0x015,
  489. AMDGPU_DOORBELL_MEC_RING6 = 0x016,
  490. AMDGPU_DOORBELL_MEC_RING7 = 0x017,
  491. AMDGPU_DOORBELL_GFX_RING0 = 0x020,
  492. AMDGPU_DOORBELL_sDMA_ENGINE0 = 0x1E0,
  493. AMDGPU_DOORBELL_sDMA_ENGINE1 = 0x1E1,
  494. AMDGPU_DOORBELL_IH = 0x1E8,
  495. AMDGPU_DOORBELL_MAX_ASSIGNMENT = 0x3FF,
  496. AMDGPU_DOORBELL_INVALID = 0xFFFF
  497. } AMDGPU_DOORBELL_ASSIGNMENT;
  498. struct amdgpu_doorbell {
  499. /* doorbell mmio */
  500. resource_size_t base;
  501. resource_size_t size;
  502. u32 __iomem *ptr;
  503. u32 num_doorbells; /* Number of doorbells actually reserved for amdgpu. */
  504. };
  505. /*
  506. * 64bit doorbell, offset are in QWORD, occupy 2KB doorbell space
  507. */
  508. typedef enum _AMDGPU_DOORBELL64_ASSIGNMENT
  509. {
  510. /*
  511. * All compute related doorbells: kiq, hiq, diq, traditional compute queue, user queue, should locate in
  512. * a continues range so that programming CP_MEC_DOORBELL_RANGE_LOWER/UPPER can cover this range.
  513. * Compute related doorbells are allocated from 0x00 to 0x8a
  514. */
  515. /* kernel scheduling */
  516. AMDGPU_DOORBELL64_KIQ = 0x00,
  517. /* HSA interface queue and debug queue */
  518. AMDGPU_DOORBELL64_HIQ = 0x01,
  519. AMDGPU_DOORBELL64_DIQ = 0x02,
  520. /* Compute engines */
  521. AMDGPU_DOORBELL64_MEC_RING0 = 0x03,
  522. AMDGPU_DOORBELL64_MEC_RING1 = 0x04,
  523. AMDGPU_DOORBELL64_MEC_RING2 = 0x05,
  524. AMDGPU_DOORBELL64_MEC_RING3 = 0x06,
  525. AMDGPU_DOORBELL64_MEC_RING4 = 0x07,
  526. AMDGPU_DOORBELL64_MEC_RING5 = 0x08,
  527. AMDGPU_DOORBELL64_MEC_RING6 = 0x09,
  528. AMDGPU_DOORBELL64_MEC_RING7 = 0x0a,
  529. /* User queue doorbell range (128 doorbells) */
  530. AMDGPU_DOORBELL64_USERQUEUE_START = 0x0b,
  531. AMDGPU_DOORBELL64_USERQUEUE_END = 0x8a,
  532. /* Graphics engine */
  533. AMDGPU_DOORBELL64_GFX_RING0 = 0x8b,
  534. /*
  535. * Other graphics doorbells can be allocated here: from 0x8c to 0xef
  536. * Graphics voltage island aperture 1
  537. * default non-graphics QWORD index is 0xF0 - 0xFF inclusive
  538. */
  539. /* sDMA engines */
  540. AMDGPU_DOORBELL64_sDMA_ENGINE0 = 0xF0,
  541. AMDGPU_DOORBELL64_sDMA_HI_PRI_ENGINE0 = 0xF1,
  542. AMDGPU_DOORBELL64_sDMA_ENGINE1 = 0xF2,
  543. AMDGPU_DOORBELL64_sDMA_HI_PRI_ENGINE1 = 0xF3,
  544. /* Interrupt handler */
  545. AMDGPU_DOORBELL64_IH = 0xF4, /* For legacy interrupt ring buffer */
  546. AMDGPU_DOORBELL64_IH_RING1 = 0xF5, /* For page migration request log */
  547. AMDGPU_DOORBELL64_IH_RING2 = 0xF6, /* For page migration translation/invalidation log */
  548. /* VCN engine use 32 bits doorbell */
  549. AMDGPU_DOORBELL64_VCN0_1 = 0xF8, /* lower 32 bits for VNC0 and upper 32 bits for VNC1 */
  550. AMDGPU_DOORBELL64_VCN2_3 = 0xF9,
  551. AMDGPU_DOORBELL64_VCN4_5 = 0xFA,
  552. AMDGPU_DOORBELL64_VCN6_7 = 0xFB,
  553. /* overlap the doorbell assignment with VCN as they are mutually exclusive
  554. * VCE engine's doorbell is 32 bit and two VCE ring share one QWORD
  555. */
  556. AMDGPU_DOORBELL64_UVD_RING0_1 = 0xF8,
  557. AMDGPU_DOORBELL64_UVD_RING2_3 = 0xF9,
  558. AMDGPU_DOORBELL64_UVD_RING4_5 = 0xFA,
  559. AMDGPU_DOORBELL64_UVD_RING6_7 = 0xFB,
  560. AMDGPU_DOORBELL64_VCE_RING0_1 = 0xFC,
  561. AMDGPU_DOORBELL64_VCE_RING2_3 = 0xFD,
  562. AMDGPU_DOORBELL64_VCE_RING4_5 = 0xFE,
  563. AMDGPU_DOORBELL64_VCE_RING6_7 = 0xFF,
  564. AMDGPU_DOORBELL64_MAX_ASSIGNMENT = 0xFF,
  565. AMDGPU_DOORBELL64_INVALID = 0xFFFF
  566. } AMDGPU_DOORBELL64_ASSIGNMENT;
  567. void amdgpu_doorbell_get_kfd_info(struct amdgpu_device *adev,
  568. phys_addr_t *aperture_base,
  569. size_t *aperture_size,
  570. size_t *start_offset);
  571. /*
  572. * IRQS.
  573. */
  574. struct amdgpu_flip_work {
  575. struct delayed_work flip_work;
  576. struct work_struct unpin_work;
  577. struct amdgpu_device *adev;
  578. int crtc_id;
  579. u32 target_vblank;
  580. uint64_t base;
  581. struct drm_pending_vblank_event *event;
  582. struct amdgpu_bo *old_abo;
  583. struct dma_fence *excl;
  584. unsigned shared_count;
  585. struct dma_fence **shared;
  586. struct dma_fence_cb cb;
  587. bool async;
  588. };
  589. /*
  590. * CP & rings.
  591. */
  592. struct amdgpu_ib {
  593. struct amdgpu_sa_bo *sa_bo;
  594. uint32_t length_dw;
  595. uint64_t gpu_addr;
  596. uint32_t *ptr;
  597. uint32_t flags;
  598. };
  599. extern const struct amd_sched_backend_ops amdgpu_sched_ops;
  600. int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs,
  601. struct amdgpu_job **job, struct amdgpu_vm *vm);
  602. int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size,
  603. struct amdgpu_job **job);
  604. void amdgpu_job_free_resources(struct amdgpu_job *job);
  605. void amdgpu_job_free(struct amdgpu_job *job);
  606. int amdgpu_job_submit(struct amdgpu_job *job, struct amdgpu_ring *ring,
  607. struct amd_sched_entity *entity, void *owner,
  608. struct dma_fence **f);
  609. /*
  610. * Queue manager
  611. */
  612. struct amdgpu_queue_mapper {
  613. int hw_ip;
  614. struct mutex lock;
  615. /* protected by lock */
  616. struct amdgpu_ring *queue_map[AMDGPU_MAX_RINGS];
  617. };
  618. struct amdgpu_queue_mgr {
  619. struct amdgpu_queue_mapper mapper[AMDGPU_MAX_IP_NUM];
  620. };
  621. int amdgpu_queue_mgr_init(struct amdgpu_device *adev,
  622. struct amdgpu_queue_mgr *mgr);
  623. int amdgpu_queue_mgr_fini(struct amdgpu_device *adev,
  624. struct amdgpu_queue_mgr *mgr);
  625. int amdgpu_queue_mgr_map(struct amdgpu_device *adev,
  626. struct amdgpu_queue_mgr *mgr,
  627. int hw_ip, int instance, int ring,
  628. struct amdgpu_ring **out_ring);
  629. /*
  630. * context related structures
  631. */
  632. struct amdgpu_ctx_ring {
  633. uint64_t sequence;
  634. struct dma_fence **fences;
  635. struct amd_sched_entity entity;
  636. };
  637. struct amdgpu_ctx {
  638. struct kref refcount;
  639. struct amdgpu_device *adev;
  640. struct amdgpu_queue_mgr queue_mgr;
  641. unsigned reset_counter;
  642. spinlock_t ring_lock;
  643. struct dma_fence **fences;
  644. struct amdgpu_ctx_ring rings[AMDGPU_MAX_RINGS];
  645. bool preamble_presented;
  646. };
  647. struct amdgpu_ctx_mgr {
  648. struct amdgpu_device *adev;
  649. struct mutex lock;
  650. /* protected by lock */
  651. struct idr ctx_handles;
  652. };
  653. struct amdgpu_ctx *amdgpu_ctx_get(struct amdgpu_fpriv *fpriv, uint32_t id);
  654. int amdgpu_ctx_put(struct amdgpu_ctx *ctx);
  655. int amdgpu_ctx_add_fence(struct amdgpu_ctx *ctx, struct amdgpu_ring *ring,
  656. struct dma_fence *fence, uint64_t *seq);
  657. struct dma_fence *amdgpu_ctx_get_fence(struct amdgpu_ctx *ctx,
  658. struct amdgpu_ring *ring, uint64_t seq);
  659. int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
  660. struct drm_file *filp);
  661. void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr);
  662. void amdgpu_ctx_mgr_fini(struct amdgpu_ctx_mgr *mgr);
  663. /*
  664. * file private structure
  665. */
  666. struct amdgpu_fpriv {
  667. struct amdgpu_vm vm;
  668. struct amdgpu_bo_va *prt_va;
  669. struct amdgpu_bo_va *csa_va;
  670. struct mutex bo_list_lock;
  671. struct idr bo_list_handles;
  672. struct amdgpu_ctx_mgr ctx_mgr;
  673. u32 vram_lost_counter;
  674. };
  675. /*
  676. * residency list
  677. */
  678. struct amdgpu_bo_list_entry {
  679. struct amdgpu_bo *robj;
  680. struct ttm_validate_buffer tv;
  681. struct amdgpu_bo_va *bo_va;
  682. uint32_t priority;
  683. struct page **user_pages;
  684. int user_invalidated;
  685. };
  686. struct amdgpu_bo_list {
  687. struct mutex lock;
  688. struct rcu_head rhead;
  689. struct kref refcount;
  690. struct amdgpu_bo *gds_obj;
  691. struct amdgpu_bo *gws_obj;
  692. struct amdgpu_bo *oa_obj;
  693. unsigned first_userptr;
  694. unsigned num_entries;
  695. struct amdgpu_bo_list_entry *array;
  696. };
  697. struct amdgpu_bo_list *
  698. amdgpu_bo_list_get(struct amdgpu_fpriv *fpriv, int id);
  699. void amdgpu_bo_list_get_list(struct amdgpu_bo_list *list,
  700. struct list_head *validated);
  701. void amdgpu_bo_list_put(struct amdgpu_bo_list *list);
  702. void amdgpu_bo_list_free(struct amdgpu_bo_list *list);
  703. /*
  704. * GFX stuff
  705. */
  706. #include "clearstate_defs.h"
  707. struct amdgpu_rlc_funcs {
  708. void (*enter_safe_mode)(struct amdgpu_device *adev);
  709. void (*exit_safe_mode)(struct amdgpu_device *adev);
  710. };
  711. struct amdgpu_rlc {
  712. /* for power gating */
  713. struct amdgpu_bo *save_restore_obj;
  714. uint64_t save_restore_gpu_addr;
  715. volatile uint32_t *sr_ptr;
  716. const u32 *reg_list;
  717. u32 reg_list_size;
  718. /* for clear state */
  719. struct amdgpu_bo *clear_state_obj;
  720. uint64_t clear_state_gpu_addr;
  721. volatile uint32_t *cs_ptr;
  722. const struct cs_section_def *cs_data;
  723. u32 clear_state_size;
  724. /* for cp tables */
  725. struct amdgpu_bo *cp_table_obj;
  726. uint64_t cp_table_gpu_addr;
  727. volatile uint32_t *cp_table_ptr;
  728. u32 cp_table_size;
  729. /* safe mode for updating CG/PG state */
  730. bool in_safe_mode;
  731. const struct amdgpu_rlc_funcs *funcs;
  732. /* for firmware data */
  733. u32 save_and_restore_offset;
  734. u32 clear_state_descriptor_offset;
  735. u32 avail_scratch_ram_locations;
  736. u32 reg_restore_list_size;
  737. u32 reg_list_format_start;
  738. u32 reg_list_format_separate_start;
  739. u32 starting_offsets_start;
  740. u32 reg_list_format_size_bytes;
  741. u32 reg_list_size_bytes;
  742. u32 *register_list_format;
  743. u32 *register_restore;
  744. };
  745. #define AMDGPU_MAX_COMPUTE_QUEUES KGD_MAX_QUEUES
  746. struct amdgpu_mec {
  747. struct amdgpu_bo *hpd_eop_obj;
  748. u64 hpd_eop_gpu_addr;
  749. struct amdgpu_bo *mec_fw_obj;
  750. u64 mec_fw_gpu_addr;
  751. u32 num_mec;
  752. u32 num_pipe_per_mec;
  753. u32 num_queue_per_pipe;
  754. void *mqd_backup[AMDGPU_MAX_COMPUTE_RINGS + 1];
  755. /* These are the resources for which amdgpu takes ownership */
  756. DECLARE_BITMAP(queue_bitmap, AMDGPU_MAX_COMPUTE_QUEUES);
  757. };
  758. struct amdgpu_kiq {
  759. u64 eop_gpu_addr;
  760. struct amdgpu_bo *eop_obj;
  761. struct mutex ring_mutex;
  762. struct amdgpu_ring ring;
  763. struct amdgpu_irq_src irq;
  764. };
  765. /*
  766. * GPU scratch registers structures, functions & helpers
  767. */
  768. struct amdgpu_scratch {
  769. unsigned num_reg;
  770. uint32_t reg_base;
  771. uint32_t free_mask;
  772. };
  773. /*
  774. * GFX configurations
  775. */
  776. #define AMDGPU_GFX_MAX_SE 4
  777. #define AMDGPU_GFX_MAX_SH_PER_SE 2
  778. struct amdgpu_rb_config {
  779. uint32_t rb_backend_disable;
  780. uint32_t user_rb_backend_disable;
  781. uint32_t raster_config;
  782. uint32_t raster_config_1;
  783. };
  784. struct gb_addr_config {
  785. uint16_t pipe_interleave_size;
  786. uint8_t num_pipes;
  787. uint8_t max_compress_frags;
  788. uint8_t num_banks;
  789. uint8_t num_se;
  790. uint8_t num_rb_per_se;
  791. };
  792. struct amdgpu_gfx_config {
  793. unsigned max_shader_engines;
  794. unsigned max_tile_pipes;
  795. unsigned max_cu_per_sh;
  796. unsigned max_sh_per_se;
  797. unsigned max_backends_per_se;
  798. unsigned max_texture_channel_caches;
  799. unsigned max_gprs;
  800. unsigned max_gs_threads;
  801. unsigned max_hw_contexts;
  802. unsigned sc_prim_fifo_size_frontend;
  803. unsigned sc_prim_fifo_size_backend;
  804. unsigned sc_hiz_tile_fifo_size;
  805. unsigned sc_earlyz_tile_fifo_size;
  806. unsigned num_tile_pipes;
  807. unsigned backend_enable_mask;
  808. unsigned mem_max_burst_length_bytes;
  809. unsigned mem_row_size_in_kb;
  810. unsigned shader_engine_tile_size;
  811. unsigned num_gpus;
  812. unsigned multi_gpu_tile_size;
  813. unsigned mc_arb_ramcfg;
  814. unsigned gb_addr_config;
  815. unsigned num_rbs;
  816. unsigned gs_vgt_table_depth;
  817. unsigned gs_prim_buffer_depth;
  818. uint32_t tile_mode_array[32];
  819. uint32_t macrotile_mode_array[16];
  820. struct gb_addr_config gb_addr_config_fields;
  821. struct amdgpu_rb_config rb_config[AMDGPU_GFX_MAX_SE][AMDGPU_GFX_MAX_SH_PER_SE];
  822. /* gfx configure feature */
  823. uint32_t double_offchip_lds_buf;
  824. };
  825. struct amdgpu_cu_info {
  826. uint32_t max_waves_per_simd;
  827. uint32_t wave_front_size;
  828. uint32_t max_scratch_slots_per_cu;
  829. uint32_t lds_size;
  830. /* total active CU number */
  831. uint32_t number;
  832. uint32_t ao_cu_mask;
  833. uint32_t ao_cu_bitmap[4][4];
  834. uint32_t bitmap[4][4];
  835. };
  836. struct amdgpu_gfx_funcs {
  837. /* get the gpu clock counter */
  838. uint64_t (*get_gpu_clock_counter)(struct amdgpu_device *adev);
  839. void (*select_se_sh)(struct amdgpu_device *adev, u32 se_num, u32 sh_num, u32 instance);
  840. void (*read_wave_data)(struct amdgpu_device *adev, uint32_t simd, uint32_t wave, uint32_t *dst, int *no_fields);
  841. void (*read_wave_vgprs)(struct amdgpu_device *adev, uint32_t simd, uint32_t wave, uint32_t thread, uint32_t start, uint32_t size, uint32_t *dst);
  842. void (*read_wave_sgprs)(struct amdgpu_device *adev, uint32_t simd, uint32_t wave, uint32_t start, uint32_t size, uint32_t *dst);
  843. };
  844. struct amdgpu_ngg_buf {
  845. struct amdgpu_bo *bo;
  846. uint64_t gpu_addr;
  847. uint32_t size;
  848. uint32_t bo_size;
  849. };
  850. enum {
  851. NGG_PRIM = 0,
  852. NGG_POS,
  853. NGG_CNTL,
  854. NGG_PARAM,
  855. NGG_BUF_MAX
  856. };
  857. struct amdgpu_ngg {
  858. struct amdgpu_ngg_buf buf[NGG_BUF_MAX];
  859. uint32_t gds_reserve_addr;
  860. uint32_t gds_reserve_size;
  861. bool init;
  862. };
  863. struct amdgpu_gfx {
  864. struct mutex gpu_clock_mutex;
  865. struct amdgpu_gfx_config config;
  866. struct amdgpu_rlc rlc;
  867. struct amdgpu_mec mec;
  868. struct amdgpu_kiq kiq;
  869. struct amdgpu_scratch scratch;
  870. const struct firmware *me_fw; /* ME firmware */
  871. uint32_t me_fw_version;
  872. const struct firmware *pfp_fw; /* PFP firmware */
  873. uint32_t pfp_fw_version;
  874. const struct firmware *ce_fw; /* CE firmware */
  875. uint32_t ce_fw_version;
  876. const struct firmware *rlc_fw; /* RLC firmware */
  877. uint32_t rlc_fw_version;
  878. const struct firmware *mec_fw; /* MEC firmware */
  879. uint32_t mec_fw_version;
  880. const struct firmware *mec2_fw; /* MEC2 firmware */
  881. uint32_t mec2_fw_version;
  882. uint32_t me_feature_version;
  883. uint32_t ce_feature_version;
  884. uint32_t pfp_feature_version;
  885. uint32_t rlc_feature_version;
  886. uint32_t mec_feature_version;
  887. uint32_t mec2_feature_version;
  888. struct amdgpu_ring gfx_ring[AMDGPU_MAX_GFX_RINGS];
  889. unsigned num_gfx_rings;
  890. struct amdgpu_ring compute_ring[AMDGPU_MAX_COMPUTE_RINGS];
  891. unsigned num_compute_rings;
  892. struct amdgpu_irq_src eop_irq;
  893. struct amdgpu_irq_src priv_reg_irq;
  894. struct amdgpu_irq_src priv_inst_irq;
  895. /* gfx status */
  896. uint32_t gfx_current_status;
  897. /* ce ram size*/
  898. unsigned ce_ram_size;
  899. struct amdgpu_cu_info cu_info;
  900. const struct amdgpu_gfx_funcs *funcs;
  901. /* reset mask */
  902. uint32_t grbm_soft_reset;
  903. uint32_t srbm_soft_reset;
  904. /* s3/s4 mask */
  905. bool in_suspend;
  906. /* NGG */
  907. struct amdgpu_ngg ngg;
  908. };
  909. int amdgpu_ib_get(struct amdgpu_device *adev, struct amdgpu_vm *vm,
  910. unsigned size, struct amdgpu_ib *ib);
  911. void amdgpu_ib_free(struct amdgpu_device *adev, struct amdgpu_ib *ib,
  912. struct dma_fence *f);
  913. int amdgpu_ib_schedule(struct amdgpu_ring *ring, unsigned num_ibs,
  914. struct amdgpu_ib *ibs, struct amdgpu_job *job,
  915. struct dma_fence **f);
  916. int amdgpu_ib_pool_init(struct amdgpu_device *adev);
  917. void amdgpu_ib_pool_fini(struct amdgpu_device *adev);
  918. int amdgpu_ib_ring_tests(struct amdgpu_device *adev);
  919. /*
  920. * CS.
  921. */
  922. struct amdgpu_cs_chunk {
  923. uint32_t chunk_id;
  924. uint32_t length_dw;
  925. void *kdata;
  926. };
  927. struct amdgpu_cs_parser {
  928. struct amdgpu_device *adev;
  929. struct drm_file *filp;
  930. struct amdgpu_ctx *ctx;
  931. /* chunks */
  932. unsigned nchunks;
  933. struct amdgpu_cs_chunk *chunks;
  934. /* scheduler job object */
  935. struct amdgpu_job *job;
  936. /* buffer objects */
  937. struct ww_acquire_ctx ticket;
  938. struct amdgpu_bo_list *bo_list;
  939. struct amdgpu_mn *mn;
  940. struct amdgpu_bo_list_entry vm_pd;
  941. struct list_head validated;
  942. struct dma_fence *fence;
  943. uint64_t bytes_moved_threshold;
  944. uint64_t bytes_moved_vis_threshold;
  945. uint64_t bytes_moved;
  946. uint64_t bytes_moved_vis;
  947. struct amdgpu_bo_list_entry *evictable;
  948. /* user fence */
  949. struct amdgpu_bo_list_entry uf_entry;
  950. unsigned num_post_dep_syncobjs;
  951. struct drm_syncobj **post_dep_syncobjs;
  952. };
  953. #define AMDGPU_PREAMBLE_IB_PRESENT (1 << 0) /* bit set means command submit involves a preamble IB */
  954. #define AMDGPU_PREAMBLE_IB_PRESENT_FIRST (1 << 1) /* bit set means preamble IB is first presented in belonging context */
  955. #define AMDGPU_HAVE_CTX_SWITCH (1 << 2) /* bit set means context switch occured */
  956. struct amdgpu_job {
  957. struct amd_sched_job base;
  958. struct amdgpu_device *adev;
  959. struct amdgpu_vm *vm;
  960. struct amdgpu_ring *ring;
  961. struct amdgpu_sync sync;
  962. struct amdgpu_sync dep_sync;
  963. struct amdgpu_sync sched_sync;
  964. struct amdgpu_ib *ibs;
  965. struct dma_fence *fence; /* the hw fence */
  966. uint32_t preamble_status;
  967. uint32_t num_ibs;
  968. void *owner;
  969. uint64_t fence_ctx; /* the fence_context this job uses */
  970. bool vm_needs_flush;
  971. unsigned vm_id;
  972. uint64_t vm_pd_addr;
  973. uint32_t gds_base, gds_size;
  974. uint32_t gws_base, gws_size;
  975. uint32_t oa_base, oa_size;
  976. /* user fence handling */
  977. uint64_t uf_addr;
  978. uint64_t uf_sequence;
  979. };
  980. #define to_amdgpu_job(sched_job) \
  981. container_of((sched_job), struct amdgpu_job, base)
  982. static inline u32 amdgpu_get_ib_value(struct amdgpu_cs_parser *p,
  983. uint32_t ib_idx, int idx)
  984. {
  985. return p->job->ibs[ib_idx].ptr[idx];
  986. }
  987. static inline void amdgpu_set_ib_value(struct amdgpu_cs_parser *p,
  988. uint32_t ib_idx, int idx,
  989. uint32_t value)
  990. {
  991. p->job->ibs[ib_idx].ptr[idx] = value;
  992. }
  993. /*
  994. * Writeback
  995. */
  996. #define AMDGPU_MAX_WB 1024 /* Reserve at most 1024 WB slots for amdgpu-owned rings. */
  997. struct amdgpu_wb {
  998. struct amdgpu_bo *wb_obj;
  999. volatile uint32_t *wb;
  1000. uint64_t gpu_addr;
  1001. u32 num_wb; /* Number of wb slots actually reserved for amdgpu. */
  1002. unsigned long used[DIV_ROUND_UP(AMDGPU_MAX_WB, BITS_PER_LONG)];
  1003. };
  1004. int amdgpu_wb_get(struct amdgpu_device *adev, u32 *wb);
  1005. void amdgpu_wb_free(struct amdgpu_device *adev, u32 wb);
  1006. void amdgpu_get_pcie_info(struct amdgpu_device *adev);
  1007. /*
  1008. * SDMA
  1009. */
  1010. struct amdgpu_sdma_instance {
  1011. /* SDMA firmware */
  1012. const struct firmware *fw;
  1013. uint32_t fw_version;
  1014. uint32_t feature_version;
  1015. struct amdgpu_ring ring;
  1016. bool burst_nop;
  1017. };
  1018. struct amdgpu_sdma {
  1019. struct amdgpu_sdma_instance instance[AMDGPU_MAX_SDMA_INSTANCES];
  1020. #ifdef CONFIG_DRM_AMDGPU_SI
  1021. //SI DMA has a difference trap irq number for the second engine
  1022. struct amdgpu_irq_src trap_irq_1;
  1023. #endif
  1024. struct amdgpu_irq_src trap_irq;
  1025. struct amdgpu_irq_src illegal_inst_irq;
  1026. int num_instances;
  1027. uint32_t srbm_soft_reset;
  1028. };
  1029. /*
  1030. * Firmware
  1031. */
  1032. enum amdgpu_firmware_load_type {
  1033. AMDGPU_FW_LOAD_DIRECT = 0,
  1034. AMDGPU_FW_LOAD_SMU,
  1035. AMDGPU_FW_LOAD_PSP,
  1036. };
  1037. struct amdgpu_firmware {
  1038. struct amdgpu_firmware_info ucode[AMDGPU_UCODE_ID_MAXIMUM];
  1039. enum amdgpu_firmware_load_type load_type;
  1040. struct amdgpu_bo *fw_buf;
  1041. unsigned int fw_size;
  1042. unsigned int max_ucodes;
  1043. /* firmwares are loaded by psp instead of smu from vega10 */
  1044. const struct amdgpu_psp_funcs *funcs;
  1045. struct amdgpu_bo *rbuf;
  1046. struct mutex mutex;
  1047. /* gpu info firmware data pointer */
  1048. const struct firmware *gpu_info_fw;
  1049. void *fw_buf_ptr;
  1050. uint64_t fw_buf_mc;
  1051. };
  1052. /*
  1053. * Benchmarking
  1054. */
  1055. void amdgpu_benchmark(struct amdgpu_device *adev, int test_number);
  1056. /*
  1057. * Testing
  1058. */
  1059. void amdgpu_test_moves(struct amdgpu_device *adev);
  1060. /*
  1061. * Debugfs
  1062. */
  1063. struct amdgpu_debugfs {
  1064. const struct drm_info_list *files;
  1065. unsigned num_files;
  1066. };
  1067. int amdgpu_debugfs_add_files(struct amdgpu_device *adev,
  1068. const struct drm_info_list *files,
  1069. unsigned nfiles);
  1070. int amdgpu_debugfs_fence_init(struct amdgpu_device *adev);
  1071. #if defined(CONFIG_DEBUG_FS)
  1072. int amdgpu_debugfs_init(struct drm_minor *minor);
  1073. #endif
  1074. int amdgpu_debugfs_firmware_init(struct amdgpu_device *adev);
  1075. /*
  1076. * amdgpu smumgr functions
  1077. */
  1078. struct amdgpu_smumgr_funcs {
  1079. int (*check_fw_load_finish)(struct amdgpu_device *adev, uint32_t fwtype);
  1080. int (*request_smu_load_fw)(struct amdgpu_device *adev);
  1081. int (*request_smu_specific_fw)(struct amdgpu_device *adev, uint32_t fwtype);
  1082. };
  1083. /*
  1084. * amdgpu smumgr
  1085. */
  1086. struct amdgpu_smumgr {
  1087. struct amdgpu_bo *toc_buf;
  1088. struct amdgpu_bo *smu_buf;
  1089. /* asic priv smu data */
  1090. void *priv;
  1091. spinlock_t smu_lock;
  1092. /* smumgr functions */
  1093. const struct amdgpu_smumgr_funcs *smumgr_funcs;
  1094. /* ucode loading complete flag */
  1095. uint32_t fw_flags;
  1096. };
  1097. /*
  1098. * ASIC specific register table accessible by UMD
  1099. */
  1100. struct amdgpu_allowed_register_entry {
  1101. uint32_t reg_offset;
  1102. bool grbm_indexed;
  1103. };
  1104. /*
  1105. * ASIC specific functions.
  1106. */
  1107. struct amdgpu_asic_funcs {
  1108. bool (*read_disabled_bios)(struct amdgpu_device *adev);
  1109. bool (*read_bios_from_rom)(struct amdgpu_device *adev,
  1110. u8 *bios, u32 length_bytes);
  1111. int (*read_register)(struct amdgpu_device *adev, u32 se_num,
  1112. u32 sh_num, u32 reg_offset, u32 *value);
  1113. void (*set_vga_state)(struct amdgpu_device *adev, bool state);
  1114. int (*reset)(struct amdgpu_device *adev);
  1115. /* get the reference clock */
  1116. u32 (*get_xclk)(struct amdgpu_device *adev);
  1117. /* MM block clocks */
  1118. int (*set_uvd_clocks)(struct amdgpu_device *adev, u32 vclk, u32 dclk);
  1119. int (*set_vce_clocks)(struct amdgpu_device *adev, u32 evclk, u32 ecclk);
  1120. /* static power management */
  1121. int (*get_pcie_lanes)(struct amdgpu_device *adev);
  1122. void (*set_pcie_lanes)(struct amdgpu_device *adev, int lanes);
  1123. /* get config memsize register */
  1124. u32 (*get_config_memsize)(struct amdgpu_device *adev);
  1125. };
  1126. /*
  1127. * IOCTL.
  1128. */
  1129. int amdgpu_gem_create_ioctl(struct drm_device *dev, void *data,
  1130. struct drm_file *filp);
  1131. int amdgpu_bo_list_ioctl(struct drm_device *dev, void *data,
  1132. struct drm_file *filp);
  1133. int amdgpu_gem_info_ioctl(struct drm_device *dev, void *data,
  1134. struct drm_file *filp);
  1135. int amdgpu_gem_userptr_ioctl(struct drm_device *dev, void *data,
  1136. struct drm_file *filp);
  1137. int amdgpu_gem_mmap_ioctl(struct drm_device *dev, void *data,
  1138. struct drm_file *filp);
  1139. int amdgpu_gem_wait_idle_ioctl(struct drm_device *dev, void *data,
  1140. struct drm_file *filp);
  1141. int amdgpu_gem_va_ioctl(struct drm_device *dev, void *data,
  1142. struct drm_file *filp);
  1143. int amdgpu_gem_op_ioctl(struct drm_device *dev, void *data,
  1144. struct drm_file *filp);
  1145. int amdgpu_cs_ioctl(struct drm_device *dev, void *data, struct drm_file *filp);
  1146. int amdgpu_cs_fence_to_handle_ioctl(struct drm_device *dev, void *data,
  1147. struct drm_file *filp);
  1148. int amdgpu_cs_wait_ioctl(struct drm_device *dev, void *data, struct drm_file *filp);
  1149. int amdgpu_cs_wait_fences_ioctl(struct drm_device *dev, void *data,
  1150. struct drm_file *filp);
  1151. int amdgpu_gem_metadata_ioctl(struct drm_device *dev, void *data,
  1152. struct drm_file *filp);
  1153. /* VRAM scratch page for HDP bug, default vram page */
  1154. struct amdgpu_vram_scratch {
  1155. struct amdgpu_bo *robj;
  1156. volatile uint32_t *ptr;
  1157. u64 gpu_addr;
  1158. };
  1159. /*
  1160. * ACPI
  1161. */
  1162. struct amdgpu_atif_notification_cfg {
  1163. bool enabled;
  1164. int command_code;
  1165. };
  1166. struct amdgpu_atif_notifications {
  1167. bool display_switch;
  1168. bool expansion_mode_change;
  1169. bool thermal_state;
  1170. bool forced_power_state;
  1171. bool system_power_state;
  1172. bool display_conf_change;
  1173. bool px_gfx_switch;
  1174. bool brightness_change;
  1175. bool dgpu_display_event;
  1176. };
  1177. struct amdgpu_atif_functions {
  1178. bool system_params;
  1179. bool sbios_requests;
  1180. bool select_active_disp;
  1181. bool lid_state;
  1182. bool get_tv_standard;
  1183. bool set_tv_standard;
  1184. bool get_panel_expansion_mode;
  1185. bool set_panel_expansion_mode;
  1186. bool temperature_change;
  1187. bool graphics_device_types;
  1188. };
  1189. struct amdgpu_atif {
  1190. struct amdgpu_atif_notifications notifications;
  1191. struct amdgpu_atif_functions functions;
  1192. struct amdgpu_atif_notification_cfg notification_cfg;
  1193. struct amdgpu_encoder *encoder_for_bl;
  1194. };
  1195. struct amdgpu_atcs_functions {
  1196. bool get_ext_state;
  1197. bool pcie_perf_req;
  1198. bool pcie_dev_rdy;
  1199. bool pcie_bus_width;
  1200. };
  1201. struct amdgpu_atcs {
  1202. struct amdgpu_atcs_functions functions;
  1203. };
  1204. /*
  1205. * CGS
  1206. */
  1207. struct cgs_device *amdgpu_cgs_create_device(struct amdgpu_device *adev);
  1208. void amdgpu_cgs_destroy_device(struct cgs_device *cgs_device);
  1209. /*
  1210. * Core structure, functions and helpers.
  1211. */
  1212. typedef uint32_t (*amdgpu_rreg_t)(struct amdgpu_device*, uint32_t);
  1213. typedef void (*amdgpu_wreg_t)(struct amdgpu_device*, uint32_t, uint32_t);
  1214. typedef uint32_t (*amdgpu_block_rreg_t)(struct amdgpu_device*, uint32_t, uint32_t);
  1215. typedef void (*amdgpu_block_wreg_t)(struct amdgpu_device*, uint32_t, uint32_t, uint32_t);
  1216. #define AMDGPU_RESET_MAGIC_NUM 64
  1217. struct amdgpu_device {
  1218. struct device *dev;
  1219. struct drm_device *ddev;
  1220. struct pci_dev *pdev;
  1221. #ifdef CONFIG_DRM_AMD_ACP
  1222. struct amdgpu_acp acp;
  1223. #endif
  1224. /* ASIC */
  1225. enum amd_asic_type asic_type;
  1226. uint32_t family;
  1227. uint32_t rev_id;
  1228. uint32_t external_rev_id;
  1229. unsigned long flags;
  1230. int usec_timeout;
  1231. const struct amdgpu_asic_funcs *asic_funcs;
  1232. bool shutdown;
  1233. bool need_dma32;
  1234. bool accel_working;
  1235. struct work_struct reset_work;
  1236. struct notifier_block acpi_nb;
  1237. struct amdgpu_i2c_chan *i2c_bus[AMDGPU_MAX_I2C_BUS];
  1238. struct amdgpu_debugfs debugfs[AMDGPU_DEBUGFS_MAX_COMPONENTS];
  1239. unsigned debugfs_count;
  1240. #if defined(CONFIG_DEBUG_FS)
  1241. struct dentry *debugfs_regs[AMDGPU_DEBUGFS_MAX_COMPONENTS];
  1242. #endif
  1243. struct amdgpu_atif atif;
  1244. struct amdgpu_atcs atcs;
  1245. struct mutex srbm_mutex;
  1246. /* GRBM index mutex. Protects concurrent access to GRBM index */
  1247. struct mutex grbm_idx_mutex;
  1248. struct dev_pm_domain vga_pm_domain;
  1249. bool have_disp_power_ref;
  1250. /* BIOS */
  1251. bool is_atom_fw;
  1252. uint8_t *bios;
  1253. uint32_t bios_size;
  1254. struct amdgpu_bo *stolen_vga_memory;
  1255. uint32_t bios_scratch_reg_offset;
  1256. uint32_t bios_scratch[AMDGPU_BIOS_NUM_SCRATCH];
  1257. /* Register/doorbell mmio */
  1258. resource_size_t rmmio_base;
  1259. resource_size_t rmmio_size;
  1260. void __iomem *rmmio;
  1261. /* protects concurrent MM_INDEX/DATA based register access */
  1262. spinlock_t mmio_idx_lock;
  1263. /* protects concurrent SMC based register access */
  1264. spinlock_t smc_idx_lock;
  1265. amdgpu_rreg_t smc_rreg;
  1266. amdgpu_wreg_t smc_wreg;
  1267. /* protects concurrent PCIE register access */
  1268. spinlock_t pcie_idx_lock;
  1269. amdgpu_rreg_t pcie_rreg;
  1270. amdgpu_wreg_t pcie_wreg;
  1271. amdgpu_rreg_t pciep_rreg;
  1272. amdgpu_wreg_t pciep_wreg;
  1273. /* protects concurrent UVD register access */
  1274. spinlock_t uvd_ctx_idx_lock;
  1275. amdgpu_rreg_t uvd_ctx_rreg;
  1276. amdgpu_wreg_t uvd_ctx_wreg;
  1277. /* protects concurrent DIDT register access */
  1278. spinlock_t didt_idx_lock;
  1279. amdgpu_rreg_t didt_rreg;
  1280. amdgpu_wreg_t didt_wreg;
  1281. /* protects concurrent gc_cac register access */
  1282. spinlock_t gc_cac_idx_lock;
  1283. amdgpu_rreg_t gc_cac_rreg;
  1284. amdgpu_wreg_t gc_cac_wreg;
  1285. /* protects concurrent se_cac register access */
  1286. spinlock_t se_cac_idx_lock;
  1287. amdgpu_rreg_t se_cac_rreg;
  1288. amdgpu_wreg_t se_cac_wreg;
  1289. /* protects concurrent ENDPOINT (audio) register access */
  1290. spinlock_t audio_endpt_idx_lock;
  1291. amdgpu_block_rreg_t audio_endpt_rreg;
  1292. amdgpu_block_wreg_t audio_endpt_wreg;
  1293. void __iomem *rio_mem;
  1294. resource_size_t rio_mem_size;
  1295. struct amdgpu_doorbell doorbell;
  1296. /* clock/pll info */
  1297. struct amdgpu_clock clock;
  1298. /* MC */
  1299. struct amdgpu_mc mc;
  1300. struct amdgpu_gart gart;
  1301. struct amdgpu_dummy_page dummy_page;
  1302. struct amdgpu_vm_manager vm_manager;
  1303. struct amdgpu_vmhub vmhub[AMDGPU_MAX_VMHUBS];
  1304. /* memory management */
  1305. struct amdgpu_mman mman;
  1306. struct amdgpu_vram_scratch vram_scratch;
  1307. struct amdgpu_wb wb;
  1308. atomic64_t num_bytes_moved;
  1309. atomic64_t num_evictions;
  1310. atomic64_t num_vram_cpu_page_faults;
  1311. atomic_t gpu_reset_counter;
  1312. atomic_t vram_lost_counter;
  1313. /* data for buffer migration throttling */
  1314. struct {
  1315. spinlock_t lock;
  1316. s64 last_update_us;
  1317. s64 accum_us; /* accumulated microseconds */
  1318. s64 accum_us_vis; /* for visible VRAM */
  1319. u32 log2_max_MBps;
  1320. } mm_stats;
  1321. /* display */
  1322. bool enable_virtual_display;
  1323. struct amdgpu_mode_info mode_info;
  1324. struct work_struct hotplug_work;
  1325. struct amdgpu_irq_src crtc_irq;
  1326. struct amdgpu_irq_src pageflip_irq;
  1327. struct amdgpu_irq_src hpd_irq;
  1328. /* rings */
  1329. u64 fence_context;
  1330. unsigned num_rings;
  1331. struct amdgpu_ring *rings[AMDGPU_MAX_RINGS];
  1332. bool ib_pool_ready;
  1333. struct amdgpu_sa_manager ring_tmp_bo;
  1334. /* interrupts */
  1335. struct amdgpu_irq irq;
  1336. /* powerplay */
  1337. struct amd_powerplay powerplay;
  1338. bool pp_force_state_enabled;
  1339. /* dpm */
  1340. struct amdgpu_pm pm;
  1341. u32 cg_flags;
  1342. u32 pg_flags;
  1343. /* amdgpu smumgr */
  1344. struct amdgpu_smumgr smu;
  1345. /* gfx */
  1346. struct amdgpu_gfx gfx;
  1347. /* sdma */
  1348. struct amdgpu_sdma sdma;
  1349. union {
  1350. struct {
  1351. /* uvd */
  1352. struct amdgpu_uvd uvd;
  1353. /* vce */
  1354. struct amdgpu_vce vce;
  1355. };
  1356. /* vcn */
  1357. struct amdgpu_vcn vcn;
  1358. };
  1359. /* firmwares */
  1360. struct amdgpu_firmware firmware;
  1361. /* PSP */
  1362. struct psp_context psp;
  1363. /* GDS */
  1364. struct amdgpu_gds gds;
  1365. struct amdgpu_ip_block ip_blocks[AMDGPU_MAX_IP_NUM];
  1366. int num_ip_blocks;
  1367. struct mutex mn_lock;
  1368. DECLARE_HASHTABLE(mn_hash, 7);
  1369. /* tracking pinned memory */
  1370. u64 vram_pin_size;
  1371. u64 invisible_pin_size;
  1372. u64 gart_pin_size;
  1373. /* amdkfd interface */
  1374. struct kfd_dev *kfd;
  1375. /* delayed work_func for deferring clockgating during resume */
  1376. struct delayed_work late_init_work;
  1377. struct amdgpu_virt virt;
  1378. /* link all shadow bo */
  1379. struct list_head shadow_list;
  1380. struct mutex shadow_list_lock;
  1381. /* link all gtt */
  1382. spinlock_t gtt_list_lock;
  1383. struct list_head gtt_list;
  1384. /* keep an lru list of rings by HW IP */
  1385. struct list_head ring_lru_list;
  1386. spinlock_t ring_lru_list_lock;
  1387. /* record hw reset is performed */
  1388. bool has_hw_reset;
  1389. u8 reset_magic[AMDGPU_RESET_MAGIC_NUM];
  1390. /* record last mm index being written through WREG32*/
  1391. unsigned long last_mm_index;
  1392. bool in_sriov_reset;
  1393. };
  1394. static inline struct amdgpu_device *amdgpu_ttm_adev(struct ttm_bo_device *bdev)
  1395. {
  1396. return container_of(bdev, struct amdgpu_device, mman.bdev);
  1397. }
  1398. int amdgpu_device_init(struct amdgpu_device *adev,
  1399. struct drm_device *ddev,
  1400. struct pci_dev *pdev,
  1401. uint32_t flags);
  1402. void amdgpu_device_fini(struct amdgpu_device *adev);
  1403. int amdgpu_gpu_wait_for_idle(struct amdgpu_device *adev);
  1404. uint32_t amdgpu_mm_rreg(struct amdgpu_device *adev, uint32_t reg,
  1405. uint32_t acc_flags);
  1406. void amdgpu_mm_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v,
  1407. uint32_t acc_flags);
  1408. u32 amdgpu_io_rreg(struct amdgpu_device *adev, u32 reg);
  1409. void amdgpu_io_wreg(struct amdgpu_device *adev, u32 reg, u32 v);
  1410. u32 amdgpu_mm_rdoorbell(struct amdgpu_device *adev, u32 index);
  1411. void amdgpu_mm_wdoorbell(struct amdgpu_device *adev, u32 index, u32 v);
  1412. u64 amdgpu_mm_rdoorbell64(struct amdgpu_device *adev, u32 index);
  1413. void amdgpu_mm_wdoorbell64(struct amdgpu_device *adev, u32 index, u64 v);
  1414. /*
  1415. * Registers read & write functions.
  1416. */
  1417. #define AMDGPU_REGS_IDX (1<<0)
  1418. #define AMDGPU_REGS_NO_KIQ (1<<1)
  1419. #define RREG32_NO_KIQ(reg) amdgpu_mm_rreg(adev, (reg), AMDGPU_REGS_NO_KIQ)
  1420. #define WREG32_NO_KIQ(reg, v) amdgpu_mm_wreg(adev, (reg), (v), AMDGPU_REGS_NO_KIQ)
  1421. #define RREG32(reg) amdgpu_mm_rreg(adev, (reg), 0)
  1422. #define RREG32_IDX(reg) amdgpu_mm_rreg(adev, (reg), AMDGPU_REGS_IDX)
  1423. #define DREG32(reg) printk(KERN_INFO "REGISTER: " #reg " : 0x%08X\n", amdgpu_mm_rreg(adev, (reg), 0))
  1424. #define WREG32(reg, v) amdgpu_mm_wreg(adev, (reg), (v), 0)
  1425. #define WREG32_IDX(reg, v) amdgpu_mm_wreg(adev, (reg), (v), AMDGPU_REGS_IDX)
  1426. #define REG_SET(FIELD, v) (((v) << FIELD##_SHIFT) & FIELD##_MASK)
  1427. #define REG_GET(FIELD, v) (((v) << FIELD##_SHIFT) & FIELD##_MASK)
  1428. #define RREG32_PCIE(reg) adev->pcie_rreg(adev, (reg))
  1429. #define WREG32_PCIE(reg, v) adev->pcie_wreg(adev, (reg), (v))
  1430. #define RREG32_PCIE_PORT(reg) adev->pciep_rreg(adev, (reg))
  1431. #define WREG32_PCIE_PORT(reg, v) adev->pciep_wreg(adev, (reg), (v))
  1432. #define RREG32_SMC(reg) adev->smc_rreg(adev, (reg))
  1433. #define WREG32_SMC(reg, v) adev->smc_wreg(adev, (reg), (v))
  1434. #define RREG32_UVD_CTX(reg) adev->uvd_ctx_rreg(adev, (reg))
  1435. #define WREG32_UVD_CTX(reg, v) adev->uvd_ctx_wreg(adev, (reg), (v))
  1436. #define RREG32_DIDT(reg) adev->didt_rreg(adev, (reg))
  1437. #define WREG32_DIDT(reg, v) adev->didt_wreg(adev, (reg), (v))
  1438. #define RREG32_GC_CAC(reg) adev->gc_cac_rreg(adev, (reg))
  1439. #define WREG32_GC_CAC(reg, v) adev->gc_cac_wreg(adev, (reg), (v))
  1440. #define RREG32_SE_CAC(reg) adev->se_cac_rreg(adev, (reg))
  1441. #define WREG32_SE_CAC(reg, v) adev->se_cac_wreg(adev, (reg), (v))
  1442. #define RREG32_AUDIO_ENDPT(block, reg) adev->audio_endpt_rreg(adev, (block), (reg))
  1443. #define WREG32_AUDIO_ENDPT(block, reg, v) adev->audio_endpt_wreg(adev, (block), (reg), (v))
  1444. #define WREG32_P(reg, val, mask) \
  1445. do { \
  1446. uint32_t tmp_ = RREG32(reg); \
  1447. tmp_ &= (mask); \
  1448. tmp_ |= ((val) & ~(mask)); \
  1449. WREG32(reg, tmp_); \
  1450. } while (0)
  1451. #define WREG32_AND(reg, and) WREG32_P(reg, 0, and)
  1452. #define WREG32_OR(reg, or) WREG32_P(reg, or, ~(or))
  1453. #define WREG32_PLL_P(reg, val, mask) \
  1454. do { \
  1455. uint32_t tmp_ = RREG32_PLL(reg); \
  1456. tmp_ &= (mask); \
  1457. tmp_ |= ((val) & ~(mask)); \
  1458. WREG32_PLL(reg, tmp_); \
  1459. } while (0)
  1460. #define DREG32_SYS(sqf, adev, reg) seq_printf((sqf), #reg " : 0x%08X\n", amdgpu_mm_rreg((adev), (reg), false))
  1461. #define RREG32_IO(reg) amdgpu_io_rreg(adev, (reg))
  1462. #define WREG32_IO(reg, v) amdgpu_io_wreg(adev, (reg), (v))
  1463. #define RDOORBELL32(index) amdgpu_mm_rdoorbell(adev, (index))
  1464. #define WDOORBELL32(index, v) amdgpu_mm_wdoorbell(adev, (index), (v))
  1465. #define RDOORBELL64(index) amdgpu_mm_rdoorbell64(adev, (index))
  1466. #define WDOORBELL64(index, v) amdgpu_mm_wdoorbell64(adev, (index), (v))
  1467. #define REG_FIELD_SHIFT(reg, field) reg##__##field##__SHIFT
  1468. #define REG_FIELD_MASK(reg, field) reg##__##field##_MASK
  1469. #define REG_SET_FIELD(orig_val, reg, field, field_val) \
  1470. (((orig_val) & ~REG_FIELD_MASK(reg, field)) | \
  1471. (REG_FIELD_MASK(reg, field) & ((field_val) << REG_FIELD_SHIFT(reg, field))))
  1472. #define REG_GET_FIELD(value, reg, field) \
  1473. (((value) & REG_FIELD_MASK(reg, field)) >> REG_FIELD_SHIFT(reg, field))
  1474. #define WREG32_FIELD(reg, field, val) \
  1475. WREG32(mm##reg, (RREG32(mm##reg) & ~REG_FIELD_MASK(reg, field)) | (val) << REG_FIELD_SHIFT(reg, field))
  1476. #define WREG32_FIELD_OFFSET(reg, offset, field, val) \
  1477. WREG32(mm##reg + offset, (RREG32(mm##reg + offset) & ~REG_FIELD_MASK(reg, field)) | (val) << REG_FIELD_SHIFT(reg, field))
  1478. /*
  1479. * BIOS helpers.
  1480. */
  1481. #define RBIOS8(i) (adev->bios[i])
  1482. #define RBIOS16(i) (RBIOS8(i) | (RBIOS8((i)+1) << 8))
  1483. #define RBIOS32(i) ((RBIOS16(i)) | (RBIOS16((i)+2) << 16))
  1484. static inline struct amdgpu_sdma_instance *
  1485. amdgpu_get_sdma_instance(struct amdgpu_ring *ring)
  1486. {
  1487. struct amdgpu_device *adev = ring->adev;
  1488. int i;
  1489. for (i = 0; i < adev->sdma.num_instances; i++)
  1490. if (&adev->sdma.instance[i].ring == ring)
  1491. break;
  1492. if (i < AMDGPU_MAX_SDMA_INSTANCES)
  1493. return &adev->sdma.instance[i];
  1494. else
  1495. return NULL;
  1496. }
  1497. /*
  1498. * ASICs macro.
  1499. */
  1500. #define amdgpu_asic_set_vga_state(adev, state) (adev)->asic_funcs->set_vga_state((adev), (state))
  1501. #define amdgpu_asic_reset(adev) (adev)->asic_funcs->reset((adev))
  1502. #define amdgpu_asic_get_xclk(adev) (adev)->asic_funcs->get_xclk((adev))
  1503. #define amdgpu_asic_set_uvd_clocks(adev, v, d) (adev)->asic_funcs->set_uvd_clocks((adev), (v), (d))
  1504. #define amdgpu_asic_set_vce_clocks(adev, ev, ec) (adev)->asic_funcs->set_vce_clocks((adev), (ev), (ec))
  1505. #define amdgpu_get_pcie_lanes(adev) (adev)->asic_funcs->get_pcie_lanes((adev))
  1506. #define amdgpu_set_pcie_lanes(adev, l) (adev)->asic_funcs->set_pcie_lanes((adev), (l))
  1507. #define amdgpu_asic_get_gpu_clock_counter(adev) (adev)->asic_funcs->get_gpu_clock_counter((adev))
  1508. #define amdgpu_asic_read_disabled_bios(adev) (adev)->asic_funcs->read_disabled_bios((adev))
  1509. #define amdgpu_asic_read_bios_from_rom(adev, b, l) (adev)->asic_funcs->read_bios_from_rom((adev), (b), (l))
  1510. #define amdgpu_asic_read_register(adev, se, sh, offset, v)((adev)->asic_funcs->read_register((adev), (se), (sh), (offset), (v)))
  1511. #define amdgpu_asic_get_config_memsize(adev) (adev)->asic_funcs->get_config_memsize((adev))
  1512. #define amdgpu_gart_flush_gpu_tlb(adev, vmid) (adev)->gart.gart_funcs->flush_gpu_tlb((adev), (vmid))
  1513. #define amdgpu_gart_set_pte_pde(adev, pt, idx, addr, flags) (adev)->gart.gart_funcs->set_pte_pde((adev), (pt), (idx), (addr), (flags))
  1514. #define amdgpu_gart_get_vm_pde(adev, addr) (adev)->gart.gart_funcs->get_vm_pde((adev), (addr))
  1515. #define amdgpu_vm_copy_pte(adev, ib, pe, src, count) ((adev)->vm_manager.vm_pte_funcs->copy_pte((ib), (pe), (src), (count)))
  1516. #define amdgpu_vm_write_pte(adev, ib, pe, value, count, incr) ((adev)->vm_manager.vm_pte_funcs->write_pte((ib), (pe), (value), (count), (incr)))
  1517. #define amdgpu_vm_set_pte_pde(adev, ib, pe, addr, count, incr, flags) ((adev)->vm_manager.vm_pte_funcs->set_pte_pde((ib), (pe), (addr), (count), (incr), (flags)))
  1518. #define amdgpu_vm_get_pte_flags(adev, flags) (adev)->gart.gart_funcs->get_vm_pte_flags((adev),(flags))
  1519. #define amdgpu_ring_parse_cs(r, p, ib) ((r)->funcs->parse_cs((p), (ib)))
  1520. #define amdgpu_ring_test_ring(r) (r)->funcs->test_ring((r))
  1521. #define amdgpu_ring_test_ib(r, t) (r)->funcs->test_ib((r), (t))
  1522. #define amdgpu_ring_get_rptr(r) (r)->funcs->get_rptr((r))
  1523. #define amdgpu_ring_get_wptr(r) (r)->funcs->get_wptr((r))
  1524. #define amdgpu_ring_set_wptr(r) (r)->funcs->set_wptr((r))
  1525. #define amdgpu_ring_emit_ib(r, ib, vm_id, c) (r)->funcs->emit_ib((r), (ib), (vm_id), (c))
  1526. #define amdgpu_ring_emit_pipeline_sync(r) (r)->funcs->emit_pipeline_sync((r))
  1527. #define amdgpu_ring_emit_vm_flush(r, vmid, addr) (r)->funcs->emit_vm_flush((r), (vmid), (addr))
  1528. #define amdgpu_ring_emit_fence(r, addr, seq, flags) (r)->funcs->emit_fence((r), (addr), (seq), (flags))
  1529. #define amdgpu_ring_emit_gds_switch(r, v, db, ds, wb, ws, ab, as) (r)->funcs->emit_gds_switch((r), (v), (db), (ds), (wb), (ws), (ab), (as))
  1530. #define amdgpu_ring_emit_hdp_flush(r) (r)->funcs->emit_hdp_flush((r))
  1531. #define amdgpu_ring_emit_hdp_invalidate(r) (r)->funcs->emit_hdp_invalidate((r))
  1532. #define amdgpu_ring_emit_switch_buffer(r) (r)->funcs->emit_switch_buffer((r))
  1533. #define amdgpu_ring_emit_cntxcntl(r, d) (r)->funcs->emit_cntxcntl((r), (d))
  1534. #define amdgpu_ring_emit_rreg(r, d) (r)->funcs->emit_rreg((r), (d))
  1535. #define amdgpu_ring_emit_wreg(r, d, v) (r)->funcs->emit_wreg((r), (d), (v))
  1536. #define amdgpu_ring_emit_tmz(r, b) (r)->funcs->emit_tmz((r), (b))
  1537. #define amdgpu_ring_pad_ib(r, ib) ((r)->funcs->pad_ib((r), (ib)))
  1538. #define amdgpu_ring_init_cond_exec(r) (r)->funcs->init_cond_exec((r))
  1539. #define amdgpu_ring_patch_cond_exec(r,o) (r)->funcs->patch_cond_exec((r),(o))
  1540. #define amdgpu_ih_get_wptr(adev) (adev)->irq.ih_funcs->get_wptr((adev))
  1541. #define amdgpu_ih_prescreen_iv(adev) (adev)->irq.ih_funcs->prescreen_iv((adev))
  1542. #define amdgpu_ih_decode_iv(adev, iv) (adev)->irq.ih_funcs->decode_iv((adev), (iv))
  1543. #define amdgpu_ih_set_rptr(adev) (adev)->irq.ih_funcs->set_rptr((adev))
  1544. #define amdgpu_display_vblank_get_counter(adev, crtc) (adev)->mode_info.funcs->vblank_get_counter((adev), (crtc))
  1545. #define amdgpu_display_vblank_wait(adev, crtc) (adev)->mode_info.funcs->vblank_wait((adev), (crtc))
  1546. #define amdgpu_display_backlight_set_level(adev, e, l) (adev)->mode_info.funcs->backlight_set_level((e), (l))
  1547. #define amdgpu_display_backlight_get_level(adev, e) (adev)->mode_info.funcs->backlight_get_level((e))
  1548. #define amdgpu_display_hpd_sense(adev, h) (adev)->mode_info.funcs->hpd_sense((adev), (h))
  1549. #define amdgpu_display_hpd_set_polarity(adev, h) (adev)->mode_info.funcs->hpd_set_polarity((adev), (h))
  1550. #define amdgpu_display_hpd_get_gpio_reg(adev) (adev)->mode_info.funcs->hpd_get_gpio_reg((adev))
  1551. #define amdgpu_display_bandwidth_update(adev) (adev)->mode_info.funcs->bandwidth_update((adev))
  1552. #define amdgpu_display_page_flip(adev, crtc, base, async) (adev)->mode_info.funcs->page_flip((adev), (crtc), (base), (async))
  1553. #define amdgpu_display_page_flip_get_scanoutpos(adev, crtc, vbl, pos) (adev)->mode_info.funcs->page_flip_get_scanoutpos((adev), (crtc), (vbl), (pos))
  1554. #define amdgpu_display_add_encoder(adev, e, s, c) (adev)->mode_info.funcs->add_encoder((adev), (e), (s), (c))
  1555. #define amdgpu_display_add_connector(adev, ci, sd, ct, ib, coi, h, r) (adev)->mode_info.funcs->add_connector((adev), (ci), (sd), (ct), (ib), (coi), (h), (r))
  1556. #define amdgpu_emit_copy_buffer(adev, ib, s, d, b) (adev)->mman.buffer_funcs->emit_copy_buffer((ib), (s), (d), (b))
  1557. #define amdgpu_emit_fill_buffer(adev, ib, s, d, b) (adev)->mman.buffer_funcs->emit_fill_buffer((ib), (s), (d), (b))
  1558. #define amdgpu_gfx_get_gpu_clock_counter(adev) (adev)->gfx.funcs->get_gpu_clock_counter((adev))
  1559. #define amdgpu_gfx_select_se_sh(adev, se, sh, instance) (adev)->gfx.funcs->select_se_sh((adev), (se), (sh), (instance))
  1560. #define amdgpu_gds_switch(adev, r, v, d, w, a) (adev)->gds.funcs->patch_gds_switch((r), (v), (d), (w), (a))
  1561. #define amdgpu_psp_check_fw_loading_status(adev, i) (adev)->firmware.funcs->check_fw_loading_status((adev), (i))
  1562. /* Common functions */
  1563. int amdgpu_gpu_reset(struct amdgpu_device *adev);
  1564. bool amdgpu_need_backup(struct amdgpu_device *adev);
  1565. void amdgpu_pci_config_reset(struct amdgpu_device *adev);
  1566. bool amdgpu_need_post(struct amdgpu_device *adev);
  1567. void amdgpu_update_display_priority(struct amdgpu_device *adev);
  1568. void amdgpu_cs_report_moved_bytes(struct amdgpu_device *adev, u64 num_bytes,
  1569. u64 num_vis_bytes);
  1570. void amdgpu_ttm_placement_from_domain(struct amdgpu_bo *abo, u32 domain);
  1571. bool amdgpu_ttm_bo_is_amdgpu_bo(struct ttm_buffer_object *bo);
  1572. void amdgpu_vram_location(struct amdgpu_device *adev, struct amdgpu_mc *mc, u64 base);
  1573. void amdgpu_gart_location(struct amdgpu_device *adev, struct amdgpu_mc *mc);
  1574. void amdgpu_ttm_set_active_vram_size(struct amdgpu_device *adev, u64 size);
  1575. int amdgpu_ttm_init(struct amdgpu_device *adev);
  1576. void amdgpu_ttm_fini(struct amdgpu_device *adev);
  1577. void amdgpu_program_register_sequence(struct amdgpu_device *adev,
  1578. const u32 *registers,
  1579. const u32 array_size);
  1580. bool amdgpu_device_is_px(struct drm_device *dev);
  1581. /* atpx handler */
  1582. #if defined(CONFIG_VGA_SWITCHEROO)
  1583. void amdgpu_register_atpx_handler(void);
  1584. void amdgpu_unregister_atpx_handler(void);
  1585. bool amdgpu_has_atpx_dgpu_power_cntl(void);
  1586. bool amdgpu_is_atpx_hybrid(void);
  1587. bool amdgpu_atpx_dgpu_req_power_for_displays(void);
  1588. bool amdgpu_has_atpx(void);
  1589. #else
  1590. static inline void amdgpu_register_atpx_handler(void) {}
  1591. static inline void amdgpu_unregister_atpx_handler(void) {}
  1592. static inline bool amdgpu_has_atpx_dgpu_power_cntl(void) { return false; }
  1593. static inline bool amdgpu_is_atpx_hybrid(void) { return false; }
  1594. static inline bool amdgpu_atpx_dgpu_req_power_for_displays(void) { return false; }
  1595. static inline bool amdgpu_has_atpx(void) { return false; }
  1596. #endif
  1597. /*
  1598. * KMS
  1599. */
  1600. extern const struct drm_ioctl_desc amdgpu_ioctls_kms[];
  1601. extern const int amdgpu_max_kms_ioctl;
  1602. bool amdgpu_kms_vram_lost(struct amdgpu_device *adev,
  1603. struct amdgpu_fpriv *fpriv);
  1604. int amdgpu_driver_load_kms(struct drm_device *dev, unsigned long flags);
  1605. void amdgpu_driver_unload_kms(struct drm_device *dev);
  1606. void amdgpu_driver_lastclose_kms(struct drm_device *dev);
  1607. int amdgpu_driver_open_kms(struct drm_device *dev, struct drm_file *file_priv);
  1608. void amdgpu_driver_postclose_kms(struct drm_device *dev,
  1609. struct drm_file *file_priv);
  1610. int amdgpu_suspend(struct amdgpu_device *adev);
  1611. int amdgpu_device_suspend(struct drm_device *dev, bool suspend, bool fbcon);
  1612. int amdgpu_device_resume(struct drm_device *dev, bool resume, bool fbcon);
  1613. u32 amdgpu_get_vblank_counter_kms(struct drm_device *dev, unsigned int pipe);
  1614. int amdgpu_enable_vblank_kms(struct drm_device *dev, unsigned int pipe);
  1615. void amdgpu_disable_vblank_kms(struct drm_device *dev, unsigned int pipe);
  1616. long amdgpu_kms_compat_ioctl(struct file *filp, unsigned int cmd,
  1617. unsigned long arg);
  1618. /*
  1619. * functions used by amdgpu_encoder.c
  1620. */
  1621. struct amdgpu_afmt_acr {
  1622. u32 clock;
  1623. int n_32khz;
  1624. int cts_32khz;
  1625. int n_44_1khz;
  1626. int cts_44_1khz;
  1627. int n_48khz;
  1628. int cts_48khz;
  1629. };
  1630. struct amdgpu_afmt_acr amdgpu_afmt_acr(uint32_t clock);
  1631. /* amdgpu_acpi.c */
  1632. #if defined(CONFIG_ACPI)
  1633. int amdgpu_acpi_init(struct amdgpu_device *adev);
  1634. void amdgpu_acpi_fini(struct amdgpu_device *adev);
  1635. bool amdgpu_acpi_is_pcie_performance_request_supported(struct amdgpu_device *adev);
  1636. int amdgpu_acpi_pcie_performance_request(struct amdgpu_device *adev,
  1637. u8 perf_req, bool advertise);
  1638. int amdgpu_acpi_pcie_notify_device_ready(struct amdgpu_device *adev);
  1639. #else
  1640. static inline int amdgpu_acpi_init(struct amdgpu_device *adev) { return 0; }
  1641. static inline void amdgpu_acpi_fini(struct amdgpu_device *adev) { }
  1642. #endif
  1643. int amdgpu_cs_find_mapping(struct amdgpu_cs_parser *parser,
  1644. uint64_t addr, struct amdgpu_bo **bo,
  1645. struct amdgpu_bo_va_mapping **mapping);
  1646. #include "amdgpu_object.h"
  1647. #endif