mxgpu_ai.c 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342
  1. /*
  2. * Copyright 2014 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include "amdgpu.h"
  24. #include "vega10/soc15ip.h"
  25. #include "vega10/NBIO/nbio_6_1_offset.h"
  26. #include "vega10/NBIO/nbio_6_1_sh_mask.h"
  27. #include "vega10/GC/gc_9_0_offset.h"
  28. #include "vega10/GC/gc_9_0_sh_mask.h"
  29. #include "soc15.h"
  30. #include "vega10_ih.h"
  31. #include "soc15_common.h"
  32. #include "mxgpu_ai.h"
  33. static void xgpu_ai_mailbox_send_ack(struct amdgpu_device *adev)
  34. {
  35. u32 reg;
  36. int timeout = AI_MAILBOX_TIMEDOUT;
  37. u32 mask = REG_FIELD_MASK(BIF_BX_PF0_MAILBOX_CONTROL, RCV_MSG_VALID);
  38. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  39. mmBIF_BX_PF0_MAILBOX_CONTROL));
  40. reg = REG_SET_FIELD(reg, BIF_BX_PF0_MAILBOX_CONTROL, RCV_MSG_ACK, 1);
  41. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  42. mmBIF_BX_PF0_MAILBOX_CONTROL), reg);
  43. /*Wait for RCV_MSG_VALID to be 0*/
  44. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  45. mmBIF_BX_PF0_MAILBOX_CONTROL));
  46. while (reg & mask) {
  47. if (timeout <= 0) {
  48. pr_err("RCV_MSG_VALID is not cleared\n");
  49. break;
  50. }
  51. mdelay(1);
  52. timeout -=1;
  53. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  54. mmBIF_BX_PF0_MAILBOX_CONTROL));
  55. }
  56. }
  57. static void xgpu_ai_mailbox_set_valid(struct amdgpu_device *adev, bool val)
  58. {
  59. u32 reg;
  60. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  61. mmBIF_BX_PF0_MAILBOX_CONTROL));
  62. reg = REG_SET_FIELD(reg, BIF_BX_PF0_MAILBOX_CONTROL,
  63. TRN_MSG_VALID, val ? 1 : 0);
  64. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_CONTROL),
  65. reg);
  66. }
  67. static void xgpu_ai_mailbox_trans_msg(struct amdgpu_device *adev,
  68. enum idh_request req)
  69. {
  70. u32 reg;
  71. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  72. mmBIF_BX_PF0_MAILBOX_MSGBUF_TRN_DW0));
  73. reg = REG_SET_FIELD(reg, BIF_BX_PF0_MAILBOX_MSGBUF_TRN_DW0,
  74. MSGBUF_DATA, req);
  75. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_MSGBUF_TRN_DW0),
  76. reg);
  77. xgpu_ai_mailbox_set_valid(adev, true);
  78. }
  79. static int xgpu_ai_mailbox_rcv_msg(struct amdgpu_device *adev,
  80. enum idh_event event)
  81. {
  82. u32 reg;
  83. u32 mask = REG_FIELD_MASK(BIF_BX_PF0_MAILBOX_CONTROL, RCV_MSG_VALID);
  84. if (event != IDH_FLR_NOTIFICATION_CMPL) {
  85. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  86. mmBIF_BX_PF0_MAILBOX_CONTROL));
  87. if (!(reg & mask))
  88. return -ENOENT;
  89. }
  90. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  91. mmBIF_BX_PF0_MAILBOX_MSGBUF_RCV_DW0));
  92. if (reg != event)
  93. return -ENOENT;
  94. xgpu_ai_mailbox_send_ack(adev);
  95. return 0;
  96. }
  97. static int xgpu_ai_poll_ack(struct amdgpu_device *adev)
  98. {
  99. int r = 0, timeout = AI_MAILBOX_TIMEDOUT;
  100. u32 mask = REG_FIELD_MASK(BIF_BX_PF0_MAILBOX_CONTROL, TRN_MSG_ACK);
  101. u32 reg;
  102. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  103. mmBIF_BX_PF0_MAILBOX_CONTROL));
  104. while (!(reg & mask)) {
  105. if (timeout <= 0) {
  106. pr_err("Doesn't get ack from pf.\n");
  107. r = -ETIME;
  108. break;
  109. }
  110. mdelay(5);
  111. timeout -= 5;
  112. reg = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0,
  113. mmBIF_BX_PF0_MAILBOX_CONTROL));
  114. }
  115. return r;
  116. }
  117. static int xgpu_ai_poll_msg(struct amdgpu_device *adev, enum idh_event event)
  118. {
  119. int r = 0, timeout = AI_MAILBOX_TIMEDOUT;
  120. r = xgpu_ai_mailbox_rcv_msg(adev, event);
  121. while (r) {
  122. if (timeout <= 0) {
  123. pr_err("Doesn't get msg:%d from pf.\n", event);
  124. r = -ETIME;
  125. break;
  126. }
  127. mdelay(5);
  128. timeout -= 5;
  129. r = xgpu_ai_mailbox_rcv_msg(adev, event);
  130. }
  131. return r;
  132. }
  133. static int xgpu_ai_send_access_requests(struct amdgpu_device *adev,
  134. enum idh_request req)
  135. {
  136. int r;
  137. xgpu_ai_mailbox_trans_msg(adev, req);
  138. /* start to poll ack */
  139. r = xgpu_ai_poll_ack(adev);
  140. if (r)
  141. pr_err("Doesn't get ack from pf, continue\n");
  142. xgpu_ai_mailbox_set_valid(adev, false);
  143. /* start to check msg if request is idh_req_gpu_init_access */
  144. if (req == IDH_REQ_GPU_INIT_ACCESS ||
  145. req == IDH_REQ_GPU_FINI_ACCESS ||
  146. req == IDH_REQ_GPU_RESET_ACCESS) {
  147. r = xgpu_ai_poll_msg(adev, IDH_READY_TO_ACCESS_GPU);
  148. if (r) {
  149. pr_err("Doesn't get READY_TO_ACCESS_GPU from pf, give up\n");
  150. return r;
  151. }
  152. }
  153. return 0;
  154. }
  155. static int xgpu_ai_request_reset(struct amdgpu_device *adev)
  156. {
  157. return xgpu_ai_send_access_requests(adev, IDH_REQ_GPU_RESET_ACCESS);
  158. }
  159. static int xgpu_ai_request_full_gpu_access(struct amdgpu_device *adev,
  160. bool init)
  161. {
  162. enum idh_request req;
  163. req = init ? IDH_REQ_GPU_INIT_ACCESS : IDH_REQ_GPU_FINI_ACCESS;
  164. return xgpu_ai_send_access_requests(adev, req);
  165. }
  166. static int xgpu_ai_release_full_gpu_access(struct amdgpu_device *adev,
  167. bool init)
  168. {
  169. enum idh_request req;
  170. int r = 0;
  171. req = init ? IDH_REL_GPU_INIT_ACCESS : IDH_REL_GPU_FINI_ACCESS;
  172. r = xgpu_ai_send_access_requests(adev, req);
  173. return r;
  174. }
  175. static int xgpu_ai_mailbox_ack_irq(struct amdgpu_device *adev,
  176. struct amdgpu_irq_src *source,
  177. struct amdgpu_iv_entry *entry)
  178. {
  179. DRM_DEBUG("get ack intr and do nothing.\n");
  180. return 0;
  181. }
  182. static int xgpu_ai_set_mailbox_ack_irq(struct amdgpu_device *adev,
  183. struct amdgpu_irq_src *source,
  184. unsigned type,
  185. enum amdgpu_interrupt_state state)
  186. {
  187. u32 tmp = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_INT_CNTL));
  188. tmp = REG_SET_FIELD(tmp, BIF_BX_PF0_MAILBOX_INT_CNTL, ACK_INT_EN,
  189. (state == AMDGPU_IRQ_STATE_ENABLE) ? 1 : 0);
  190. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_INT_CNTL), tmp);
  191. return 0;
  192. }
  193. static void xgpu_ai_mailbox_flr_work(struct work_struct *work)
  194. {
  195. struct amdgpu_virt *virt = container_of(work, struct amdgpu_virt, flr_work);
  196. struct amdgpu_device *adev = container_of(virt, struct amdgpu_device, virt);
  197. /* wait until RCV_MSG become 3 */
  198. if (xgpu_ai_poll_msg(adev, IDH_FLR_NOTIFICATION_CMPL)) {
  199. pr_err("failed to recieve FLR_CMPL\n");
  200. return;
  201. }
  202. /* Trigger recovery due to world switch failure */
  203. amdgpu_sriov_gpu_reset(adev, NULL);
  204. }
  205. static int xgpu_ai_set_mailbox_rcv_irq(struct amdgpu_device *adev,
  206. struct amdgpu_irq_src *src,
  207. unsigned type,
  208. enum amdgpu_interrupt_state state)
  209. {
  210. u32 tmp = RREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_INT_CNTL));
  211. tmp = REG_SET_FIELD(tmp, BIF_BX_PF0_MAILBOX_INT_CNTL, VALID_INT_EN,
  212. (state == AMDGPU_IRQ_STATE_ENABLE) ? 1 : 0);
  213. WREG32_NO_KIQ(SOC15_REG_OFFSET(NBIO, 0, mmBIF_BX_PF0_MAILBOX_INT_CNTL), tmp);
  214. return 0;
  215. }
  216. static int xgpu_ai_mailbox_rcv_irq(struct amdgpu_device *adev,
  217. struct amdgpu_irq_src *source,
  218. struct amdgpu_iv_entry *entry)
  219. {
  220. int r;
  221. /* see what event we get */
  222. r = xgpu_ai_mailbox_rcv_msg(adev, IDH_FLR_NOTIFICATION);
  223. /* only handle FLR_NOTIFY now */
  224. if (!r)
  225. schedule_work(&adev->virt.flr_work);
  226. return 0;
  227. }
  228. static const struct amdgpu_irq_src_funcs xgpu_ai_mailbox_ack_irq_funcs = {
  229. .set = xgpu_ai_set_mailbox_ack_irq,
  230. .process = xgpu_ai_mailbox_ack_irq,
  231. };
  232. static const struct amdgpu_irq_src_funcs xgpu_ai_mailbox_rcv_irq_funcs = {
  233. .set = xgpu_ai_set_mailbox_rcv_irq,
  234. .process = xgpu_ai_mailbox_rcv_irq,
  235. };
  236. void xgpu_ai_mailbox_set_irq_funcs(struct amdgpu_device *adev)
  237. {
  238. adev->virt.ack_irq.num_types = 1;
  239. adev->virt.ack_irq.funcs = &xgpu_ai_mailbox_ack_irq_funcs;
  240. adev->virt.rcv_irq.num_types = 1;
  241. adev->virt.rcv_irq.funcs = &xgpu_ai_mailbox_rcv_irq_funcs;
  242. }
  243. int xgpu_ai_mailbox_add_irq_id(struct amdgpu_device *adev)
  244. {
  245. int r;
  246. r = amdgpu_irq_add_id(adev, AMDGPU_IH_CLIENTID_BIF, 135, &adev->virt.rcv_irq);
  247. if (r)
  248. return r;
  249. r = amdgpu_irq_add_id(adev, AMDGPU_IH_CLIENTID_BIF, 138, &adev->virt.ack_irq);
  250. if (r) {
  251. amdgpu_irq_put(adev, &adev->virt.rcv_irq, 0);
  252. return r;
  253. }
  254. return 0;
  255. }
  256. int xgpu_ai_mailbox_get_irq(struct amdgpu_device *adev)
  257. {
  258. int r;
  259. r = amdgpu_irq_get(adev, &adev->virt.rcv_irq, 0);
  260. if (r)
  261. return r;
  262. r = amdgpu_irq_get(adev, &adev->virt.ack_irq, 0);
  263. if (r) {
  264. amdgpu_irq_put(adev, &adev->virt.rcv_irq, 0);
  265. return r;
  266. }
  267. INIT_WORK(&adev->virt.flr_work, xgpu_ai_mailbox_flr_work);
  268. return 0;
  269. }
  270. void xgpu_ai_mailbox_put_irq(struct amdgpu_device *adev)
  271. {
  272. amdgpu_irq_put(adev, &adev->virt.ack_irq, 0);
  273. amdgpu_irq_put(adev, &adev->virt.rcv_irq, 0);
  274. }
  275. const struct amdgpu_virt_ops xgpu_ai_virt_ops = {
  276. .req_full_gpu = xgpu_ai_request_full_gpu_access,
  277. .rel_full_gpu = xgpu_ai_release_full_gpu_access,
  278. .reset_gpu = xgpu_ai_request_reset,
  279. };