mxgpu_ai.c 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340
  1. /*
  2. * Copyright 2014 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include "amdgpu.h"
  24. #include "vega10/soc15ip.h"
  25. #include "vega10/NBIO/nbio_6_1_offset.h"
  26. #include "vega10/NBIO/nbio_6_1_sh_mask.h"
  27. #include "vega10/GC/gc_9_0_offset.h"
  28. #include "vega10/GC/gc_9_0_sh_mask.h"
  29. #include "soc15.h"
  30. #include "vega10_ih.h"
  31. #include "soc15_common.h"
  32. #include "mxgpu_ai.h"
  33. static void xgpu_ai_mailbox_send_ack(struct amdgpu_device *adev)
  34. {
  35. u32 reg;
  36. int timeout = AI_MAILBOX_TIMEDOUT;
  37. u32 mask = REG_FIELD_MASK(BIF_BX_PF0_MAILBOX_CONTROL, RCV_MSG_VALID);
  38. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  39. mmBIF_BX_PF0_MAILBOX_CONTROL));
  40. reg = REG_SET_FIELD(reg, BIF_BX_PF0_MAILBOX_CONTROL, RCV_MSG_ACK, 1);
  41. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  42. mmBIF_BX_PF0_MAILBOX_CONTROL), reg);
  43. /*Wait for RCV_MSG_VALID to be 0*/
  44. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  45. mmBIF_BX_PF0_MAILBOX_CONTROL));
  46. while (reg & mask) {
  47. if (timeout <= 0) {
  48. pr_err("RCV_MSG_VALID is not cleared\n");
  49. break;
  50. }
  51. mdelay(1);
  52. timeout -=1;
  53. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  54. mmBIF_BX_PF0_MAILBOX_CONTROL));
  55. }
  56. }
  57. static void xgpu_ai_mailbox_set_valid(struct amdgpu_device *adev, bool val)
  58. {
  59. u32 reg;
  60. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  61. mmBIF_BX_PF0_MAILBOX_CONTROL));
  62. reg = REG_SET_FIELD(reg, BIF_BX_PF0_MAILBOX_CONTROL,
  63. TRN_MSG_VALID, val ? 1 : 0);
  64. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_CONTROL),
  65. reg);
  66. }
  67. static void xgpu_ai_mailbox_trans_msg(struct amdgpu_device *adev,
  68. enum idh_request req)
  69. {
  70. u32 reg;
  71. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  72. mmBIF_BX_PF0_MAILBOX_MSGBUF_TRN_DW0));
  73. reg = REG_SET_FIELD(reg, BIF_BX_PF0_MAILBOX_MSGBUF_TRN_DW0,
  74. MSGBUF_DATA, req);
  75. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_MSGBUF_TRN_DW0),
  76. reg);
  77. xgpu_ai_mailbox_set_valid(adev, true);
  78. }
  79. static int xgpu_ai_mailbox_rcv_msg(struct amdgpu_device *adev,
  80. enum idh_event event)
  81. {
  82. u32 reg;
  83. u32 mask = REG_FIELD_MASK(BIF_BX_PF0_MAILBOX_CONTROL, RCV_MSG_VALID);
  84. if (event != IDH_FLR_NOTIFICATION_CMPL) {
  85. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  86. mmBIF_BX_PF0_MAILBOX_CONTROL));
  87. if (!(reg & mask))
  88. return -ENOENT;
  89. }
  90. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  91. mmBIF_BX_PF0_MAILBOX_MSGBUF_RCV_DW0));
  92. if (reg != event)
  93. return -ENOENT;
  94. xgpu_ai_mailbox_send_ack(adev);
  95. return 0;
  96. }
  97. static int xgpu_ai_poll_ack(struct amdgpu_device *adev)
  98. {
  99. int r = 0, timeout = AI_MAILBOX_TIMEDOUT;
  100. u32 mask = REG_FIELD_MASK(BIF_BX_PF0_MAILBOX_CONTROL, TRN_MSG_ACK);
  101. u32 reg;
  102. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  103. mmBIF_BX_PF0_MAILBOX_CONTROL));
  104. while (!(reg & mask)) {
  105. if (timeout <= 0) {
  106. pr_err("Doesn't get ack from pf.\n");
  107. r = -ETIME;
  108. break;
  109. }
  110. msleep(1);
  111. timeout -= 1;
  112. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  113. mmBIF_BX_PF0_MAILBOX_CONTROL));
  114. }
  115. return r;
  116. }
  117. static int xgpu_ai_poll_msg(struct amdgpu_device *adev, enum idh_event event)
  118. {
  119. int r = 0, timeout = AI_MAILBOX_TIMEDOUT;
  120. r = xgpu_ai_mailbox_rcv_msg(adev, event);
  121. while (r) {
  122. if (timeout <= 0) {
  123. pr_err("Doesn't get ack from pf.\n");
  124. r = -ETIME;
  125. break;
  126. }
  127. msleep(1);
  128. timeout -= 1;
  129. r = xgpu_ai_mailbox_rcv_msg(adev, event);
  130. }
  131. return r;
  132. }
  133. static int xgpu_ai_send_access_requests(struct amdgpu_device *adev,
  134. enum idh_request req)
  135. {
  136. int r;
  137. xgpu_ai_mailbox_trans_msg(adev, req);
  138. /* start to poll ack */
  139. r = xgpu_ai_poll_ack(adev);
  140. if (r)
  141. return r;
  142. xgpu_ai_mailbox_set_valid(adev, false);
  143. /* start to check msg if request is idh_req_gpu_init_access */
  144. if (req == IDH_REQ_GPU_INIT_ACCESS ||
  145. req == IDH_REQ_GPU_FINI_ACCESS ||
  146. req == IDH_REQ_GPU_RESET_ACCESS) {
  147. r = xgpu_ai_poll_msg(adev, IDH_READY_TO_ACCESS_GPU);
  148. if (r)
  149. return r;
  150. }
  151. return 0;
  152. }
  153. static int xgpu_ai_request_reset(struct amdgpu_device *adev)
  154. {
  155. return xgpu_ai_send_access_requests(adev, IDH_REQ_GPU_RESET_ACCESS);
  156. }
  157. static int xgpu_ai_request_full_gpu_access(struct amdgpu_device *adev,
  158. bool init)
  159. {
  160. enum idh_request req;
  161. req = init ? IDH_REQ_GPU_INIT_ACCESS : IDH_REQ_GPU_FINI_ACCESS;
  162. return xgpu_ai_send_access_requests(adev, req);
  163. }
  164. static int xgpu_ai_release_full_gpu_access(struct amdgpu_device *adev,
  165. bool init)
  166. {
  167. enum idh_request req;
  168. int r = 0;
  169. req = init ? IDH_REL_GPU_INIT_ACCESS : IDH_REL_GPU_FINI_ACCESS;
  170. r = xgpu_ai_send_access_requests(adev, req);
  171. return r;
  172. }
  /*
   * .process callback for the mailbox ack interrupt source.
   *
   * Nothing is done with the interrupt beyond a debug trace; the function
   * always returns 0.
   */
  static int xgpu_ai_mailbox_ack_irq(struct amdgpu_device *adev,
                                     struct amdgpu_irq_src *source,
                                     struct amdgpu_iv_entry *entry)
  {
      DRM_DEBUG("get ack intr and do nothing.\n");

      return 0;
  }
  180. static int xgpu_ai_set_mailbox_ack_irq(struct amdgpu_device *adev,
  181. struct amdgpu_irq_src *source,
  182. unsigned type,
  183. enum amdgpu_interrupt_state state)
  184. {
  185. u32 tmp = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_INT_CNTL));
  186. tmp = REG_SET_FIELD(tmp, BIF_BX_PF0_MAILBOX_INT_CNTL, ACK_INT_EN,
  187. (state == AMDGPU_IRQ_STATE_ENABLE) ? 1 : 0);
  188. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_INT_CNTL), tmp);
  189. return 0;
  190. }
  191. static void xgpu_ai_mailbox_flr_work(struct work_struct *work)
  192. {
  193. struct amdgpu_virt *virt = container_of(work, struct amdgpu_virt, flr_work);
  194. struct amdgpu_device *adev = container_of(virt, struct amdgpu_device, virt);
  195. /* wait until RCV_MSG become 3 */
  196. if (xgpu_ai_poll_msg(adev, IDH_FLR_NOTIFICATION_CMPL)) {
  197. pr_err("failed to recieve FLR_CMPL\n");
  198. return;
  199. }
  200. /* Trigger recovery due to world switch failure */
  201. amdgpu_sriov_gpu_reset(adev, false);
  202. }
  203. static int xgpu_ai_set_mailbox_rcv_irq(struct amdgpu_device *adev,
  204. struct amdgpu_irq_src *src,
  205. unsigned type,
  206. enum amdgpu_interrupt_state state)
  207. {
  208. u32 tmp = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_INT_CNTL));
  209. tmp = REG_SET_FIELD(tmp, BIF_BX_PF0_MAILBOX_INT_CNTL, VALID_INT_EN,
  210. (state == AMDGPU_IRQ_STATE_ENABLE) ? 1 : 0);
  211. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_INT_CNTL), tmp);
  212. return 0;
  213. }
  214. static int xgpu_ai_mailbox_rcv_irq(struct amdgpu_device *adev,
  215. struct amdgpu_irq_src *source,
  216. struct amdgpu_iv_entry *entry)
  217. {
  218. int r;
  219. /* see what event we get */
  220. r = xgpu_ai_mailbox_rcv_msg(adev, IDH_FLR_NOTIFICATION);
  221. /* only handle FLR_NOTIFY now */
  222. if (!r)
  223. schedule_work(&adev->virt.flr_work);
  224. return 0;
  225. }
  226. static const struct amdgpu_irq_src_funcs xgpu_ai_mailbox_ack_irq_funcs = {
  227. .set = xgpu_ai_set_mailbox_ack_irq,
  228. .process = xgpu_ai_mailbox_ack_irq,
  229. };
  230. static const struct amdgpu_irq_src_funcs xgpu_ai_mailbox_rcv_irq_funcs = {
  231. .set = xgpu_ai_set_mailbox_rcv_irq,
  232. .process = xgpu_ai_mailbox_rcv_irq,
  233. };
  234. void xgpu_ai_mailbox_set_irq_funcs(struct amdgpu_device *adev)
  235. {
  236. adev->virt.ack_irq.num_types = 1;
  237. adev->virt.ack_irq.funcs = &xgpu_ai_mailbox_ack_irq_funcs;
  238. adev->virt.rcv_irq.num_types = 1;
  239. adev->virt.rcv_irq.funcs = &xgpu_ai_mailbox_rcv_irq_funcs;
  240. }
  241. int xgpu_ai_mailbox_add_irq_id(struct amdgpu_device *adev)
  242. {
  243. int r;
  244. r = amdgpu_irq_add_id(adev, AMDGPU_IH_CLIENTID_LEGACY, 135, &adev->virt.rcv_irq);
  245. if (r)
  246. return r;
  247. r = amdgpu_irq_add_id(adev, AMDGPU_IH_CLIENTID_LEGACY, 138, &adev->virt.ack_irq);
  248. if (r) {
  249. amdgpu_irq_put(adev, &adev->virt.rcv_irq, 0);
  250. return r;
  251. }
  252. return 0;
  253. }
  254. int xgpu_ai_mailbox_get_irq(struct amdgpu_device *adev)
  255. {
  256. int r;
  257. r = amdgpu_irq_get(adev, &adev->virt.rcv_irq, 0);
  258. if (r)
  259. return r;
  260. r = amdgpu_irq_get(adev, &adev->virt.ack_irq, 0);
  261. if (r) {
  262. amdgpu_irq_put(adev, &adev->virt.rcv_irq, 0);
  263. return r;
  264. }
  265. INIT_WORK(&adev->virt.flr_work, xgpu_ai_mailbox_flr_work);
  266. return 0;
  267. }
  268. void xgpu_ai_mailbox_put_irq(struct amdgpu_device *adev)
  269. {
  270. amdgpu_irq_put(adev, &adev->virt.ack_irq, 0);
  271. amdgpu_irq_put(adev, &adev->virt.rcv_irq, 0);
  272. }
  273. const struct amdgpu_virt_ops xgpu_ai_virt_ops = {
  274. .req_full_gpu = xgpu_ai_request_full_gpu_access,
  275. .rel_full_gpu = xgpu_ai_release_full_gpu_access,
  276. .reset_gpu = xgpu_ai_request_reset,
  277. };