main.c 39 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543
  1. /*
  2. * Copyright (c) 2013, Mellanox Technologies inc. All rights reserved.
  3. *
  4. * This software is available to you under a choice of one of two
  5. * licenses. You may choose to be licensed under the terms of the GNU
  6. * General Public License (GPL) Version 2, available from the file
  7. * COPYING in the main directory of this source tree, or the
  8. * OpenIB.org BSD license below:
  9. *
  10. * Redistribution and use in source and binary forms, with or
  11. * without modification, are permitted provided that the following
  12. * conditions are met:
  13. *
  14. * - Redistributions of source code must retain the above
  15. * copyright notice, this list of conditions and the following
  16. * disclaimer.
  17. *
  18. * - Redistributions in binary form must reproduce the above
  19. * copyright notice, this list of conditions and the following
  20. * disclaimer in the documentation and/or other materials
  21. * provided with the distribution.
  22. *
  23. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  24. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  25. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  26. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  27. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  28. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  29. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  30. * SOFTWARE.
  31. */
  32. #include <asm-generic/kmap_types.h>
  33. #include <linux/module.h>
  34. #include <linux/init.h>
  35. #include <linux/errno.h>
  36. #include <linux/pci.h>
  37. #include <linux/dma-mapping.h>
  38. #include <linux/slab.h>
  39. #include <linux/io-mapping.h>
  40. #include <linux/sched.h>
  41. #include <rdma/ib_user_verbs.h>
  42. #include <rdma/ib_smi.h>
  43. #include <rdma/ib_umem.h>
  44. #include "user.h"
  45. #include "mlx5_ib.h"
  46. #define DRIVER_NAME "mlx5_ib"
  47. #define DRIVER_VERSION "2.2-1"
  48. #define DRIVER_RELDATE "Feb 2014"
  49. MODULE_AUTHOR("Eli Cohen <eli@mellanox.com>");
  50. MODULE_DESCRIPTION("Mellanox Connect-IB HCA IB driver");
  51. MODULE_LICENSE("Dual BSD/GPL");
  52. MODULE_VERSION(DRIVER_VERSION);
  53. static int prof_sel = 2;
  54. module_param_named(prof_sel, prof_sel, int, 0444);
  55. MODULE_PARM_DESC(prof_sel, "profile selector. Valid range 0 - 2");
  56. static char mlx5_version[] =
  57. DRIVER_NAME ": Mellanox Connect-IB Infiniband driver v"
  58. DRIVER_VERSION " (" DRIVER_RELDATE ")\n";
  59. static struct mlx5_profile profile[] = {
  60. [0] = {
  61. .mask = 0,
  62. },
  63. [1] = {
  64. .mask = MLX5_PROF_MASK_QP_SIZE,
  65. .log_max_qp = 12,
  66. },
  67. [2] = {
  68. .mask = MLX5_PROF_MASK_QP_SIZE |
  69. MLX5_PROF_MASK_MR_CACHE,
  70. .log_max_qp = 17,
  71. .mr_cache[0] = {
  72. .size = 500,
  73. .limit = 250
  74. },
  75. .mr_cache[1] = {
  76. .size = 500,
  77. .limit = 250
  78. },
  79. .mr_cache[2] = {
  80. .size = 500,
  81. .limit = 250
  82. },
  83. .mr_cache[3] = {
  84. .size = 500,
  85. .limit = 250
  86. },
  87. .mr_cache[4] = {
  88. .size = 500,
  89. .limit = 250
  90. },
  91. .mr_cache[5] = {
  92. .size = 500,
  93. .limit = 250
  94. },
  95. .mr_cache[6] = {
  96. .size = 500,
  97. .limit = 250
  98. },
  99. .mr_cache[7] = {
  100. .size = 500,
  101. .limit = 250
  102. },
  103. .mr_cache[8] = {
  104. .size = 500,
  105. .limit = 250
  106. },
  107. .mr_cache[9] = {
  108. .size = 500,
  109. .limit = 250
  110. },
  111. .mr_cache[10] = {
  112. .size = 500,
  113. .limit = 250
  114. },
  115. .mr_cache[11] = {
  116. .size = 500,
  117. .limit = 250
  118. },
  119. .mr_cache[12] = {
  120. .size = 64,
  121. .limit = 32
  122. },
  123. .mr_cache[13] = {
  124. .size = 32,
  125. .limit = 16
  126. },
  127. .mr_cache[14] = {
  128. .size = 16,
  129. .limit = 8
  130. },
  131. .mr_cache[15] = {
  132. .size = 8,
  133. .limit = 4
  134. },
  135. },
  136. };
  137. int mlx5_vector2eqn(struct mlx5_ib_dev *dev, int vector, int *eqn, int *irqn)
  138. {
  139. struct mlx5_eq_table *table = &dev->mdev.priv.eq_table;
  140. struct mlx5_eq *eq, *n;
  141. int err = -ENOENT;
  142. spin_lock(&table->lock);
  143. list_for_each_entry_safe(eq, n, &dev->eqs_list, list) {
  144. if (eq->index == vector) {
  145. *eqn = eq->eqn;
  146. *irqn = eq->irqn;
  147. err = 0;
  148. break;
  149. }
  150. }
  151. spin_unlock(&table->lock);
  152. return err;
  153. }
  154. static int alloc_comp_eqs(struct mlx5_ib_dev *dev)
  155. {
  156. struct mlx5_eq_table *table = &dev->mdev.priv.eq_table;
  157. char name[MLX5_MAX_EQ_NAME];
  158. struct mlx5_eq *eq, *n;
  159. int ncomp_vec;
  160. int nent;
  161. int err;
  162. int i;
  163. INIT_LIST_HEAD(&dev->eqs_list);
  164. ncomp_vec = table->num_comp_vectors;
  165. nent = MLX5_COMP_EQ_SIZE;
  166. for (i = 0; i < ncomp_vec; i++) {
  167. eq = kzalloc(sizeof(*eq), GFP_KERNEL);
  168. if (!eq) {
  169. err = -ENOMEM;
  170. goto clean;
  171. }
  172. snprintf(name, MLX5_MAX_EQ_NAME, "mlx5_comp%d", i);
  173. err = mlx5_create_map_eq(&dev->mdev, eq,
  174. i + MLX5_EQ_VEC_COMP_BASE, nent, 0,
  175. name, &dev->mdev.priv.uuari.uars[0]);
  176. if (err) {
  177. kfree(eq);
  178. goto clean;
  179. }
  180. mlx5_ib_dbg(dev, "allocated completion EQN %d\n", eq->eqn);
  181. eq->index = i;
  182. spin_lock(&table->lock);
  183. list_add_tail(&eq->list, &dev->eqs_list);
  184. spin_unlock(&table->lock);
  185. }
  186. dev->num_comp_vectors = ncomp_vec;
  187. return 0;
  188. clean:
  189. spin_lock(&table->lock);
  190. list_for_each_entry_safe(eq, n, &dev->eqs_list, list) {
  191. list_del(&eq->list);
  192. spin_unlock(&table->lock);
  193. if (mlx5_destroy_unmap_eq(&dev->mdev, eq))
  194. mlx5_ib_warn(dev, "failed to destroy EQ 0x%x\n", eq->eqn);
  195. kfree(eq);
  196. spin_lock(&table->lock);
  197. }
  198. spin_unlock(&table->lock);
  199. return err;
  200. }
  201. static void free_comp_eqs(struct mlx5_ib_dev *dev)
  202. {
  203. struct mlx5_eq_table *table = &dev->mdev.priv.eq_table;
  204. struct mlx5_eq *eq, *n;
  205. spin_lock(&table->lock);
  206. list_for_each_entry_safe(eq, n, &dev->eqs_list, list) {
  207. list_del(&eq->list);
  208. spin_unlock(&table->lock);
  209. if (mlx5_destroy_unmap_eq(&dev->mdev, eq))
  210. mlx5_ib_warn(dev, "failed to destroy EQ 0x%x\n", eq->eqn);
  211. kfree(eq);
  212. spin_lock(&table->lock);
  213. }
  214. spin_unlock(&table->lock);
  215. }
  216. static int mlx5_ib_query_device(struct ib_device *ibdev,
  217. struct ib_device_attr *props)
  218. {
  219. struct mlx5_ib_dev *dev = to_mdev(ibdev);
  220. struct ib_smp *in_mad = NULL;
  221. struct ib_smp *out_mad = NULL;
  222. int err = -ENOMEM;
  223. int max_rq_sg;
  224. int max_sq_sg;
  225. u64 flags;
  226. in_mad = kzalloc(sizeof(*in_mad), GFP_KERNEL);
  227. out_mad = kmalloc(sizeof(*out_mad), GFP_KERNEL);
  228. if (!in_mad || !out_mad)
  229. goto out;
  230. init_query_mad(in_mad);
  231. in_mad->attr_id = IB_SMP_ATTR_NODE_INFO;
  232. err = mlx5_MAD_IFC(to_mdev(ibdev), 1, 1, 1, NULL, NULL, in_mad, out_mad);
  233. if (err)
  234. goto out;
  235. memset(props, 0, sizeof(*props));
  236. props->fw_ver = ((u64)fw_rev_maj(&dev->mdev) << 32) |
  237. (fw_rev_min(&dev->mdev) << 16) |
  238. fw_rev_sub(&dev->mdev);
  239. props->device_cap_flags = IB_DEVICE_CHANGE_PHY_PORT |
  240. IB_DEVICE_PORT_ACTIVE_EVENT |
  241. IB_DEVICE_SYS_IMAGE_GUID |
  242. IB_DEVICE_RC_RNR_NAK_GEN;
  243. flags = dev->mdev.caps.flags;
  244. if (flags & MLX5_DEV_CAP_FLAG_BAD_PKEY_CNTR)
  245. props->device_cap_flags |= IB_DEVICE_BAD_PKEY_CNTR;
  246. if (flags & MLX5_DEV_CAP_FLAG_BAD_QKEY_CNTR)
  247. props->device_cap_flags |= IB_DEVICE_BAD_QKEY_CNTR;
  248. if (flags & MLX5_DEV_CAP_FLAG_APM)
  249. props->device_cap_flags |= IB_DEVICE_AUTO_PATH_MIG;
  250. props->device_cap_flags |= IB_DEVICE_LOCAL_DMA_LKEY;
  251. if (flags & MLX5_DEV_CAP_FLAG_XRC)
  252. props->device_cap_flags |= IB_DEVICE_XRC;
  253. props->device_cap_flags |= IB_DEVICE_MEM_MGT_EXTENSIONS;
  254. if (flags & MLX5_DEV_CAP_FLAG_SIG_HAND_OVER) {
  255. props->device_cap_flags |= IB_DEVICE_SIGNATURE_HANDOVER;
  256. /* At this stage no support for signature handover */
  257. props->sig_prot_cap = IB_PROT_T10DIF_TYPE_1 |
  258. IB_PROT_T10DIF_TYPE_2 |
  259. IB_PROT_T10DIF_TYPE_3;
  260. props->sig_guard_cap = IB_GUARD_T10DIF_CRC |
  261. IB_GUARD_T10DIF_CSUM;
  262. }
  263. if (flags & MLX5_DEV_CAP_FLAG_BLOCK_MCAST)
  264. props->device_cap_flags |= IB_DEVICE_BLOCK_MULTICAST_LOOPBACK;
  265. props->vendor_id = be32_to_cpup((__be32 *)(out_mad->data + 36)) &
  266. 0xffffff;
  267. props->vendor_part_id = be16_to_cpup((__be16 *)(out_mad->data + 30));
  268. props->hw_ver = be32_to_cpup((__be32 *)(out_mad->data + 32));
  269. memcpy(&props->sys_image_guid, out_mad->data + 4, 8);
  270. props->max_mr_size = ~0ull;
  271. props->page_size_cap = dev->mdev.caps.min_page_sz;
  272. props->max_qp = 1 << dev->mdev.caps.log_max_qp;
  273. props->max_qp_wr = dev->mdev.caps.max_wqes;
  274. max_rq_sg = dev->mdev.caps.max_rq_desc_sz / sizeof(struct mlx5_wqe_data_seg);
  275. max_sq_sg = (dev->mdev.caps.max_sq_desc_sz - sizeof(struct mlx5_wqe_ctrl_seg)) /
  276. sizeof(struct mlx5_wqe_data_seg);
  277. props->max_sge = min(max_rq_sg, max_sq_sg);
  278. props->max_cq = 1 << dev->mdev.caps.log_max_cq;
  279. props->max_cqe = dev->mdev.caps.max_cqes - 1;
  280. props->max_mr = 1 << dev->mdev.caps.log_max_mkey;
  281. props->max_pd = 1 << dev->mdev.caps.log_max_pd;
  282. props->max_qp_rd_atom = dev->mdev.caps.max_ra_req_qp;
  283. props->max_qp_init_rd_atom = dev->mdev.caps.max_ra_res_qp;
  284. props->max_res_rd_atom = props->max_qp_rd_atom * props->max_qp;
  285. props->max_srq = 1 << dev->mdev.caps.log_max_srq;
  286. props->max_srq_wr = dev->mdev.caps.max_srq_wqes - 1;
  287. props->max_srq_sge = max_rq_sg - 1;
  288. props->max_fast_reg_page_list_len = (unsigned int)-1;
  289. props->local_ca_ack_delay = dev->mdev.caps.local_ca_ack_delay;
  290. props->atomic_cap = IB_ATOMIC_NONE;
  291. props->masked_atomic_cap = IB_ATOMIC_NONE;
  292. props->max_pkeys = be16_to_cpup((__be16 *)(out_mad->data + 28));
  293. props->max_mcast_grp = 1 << dev->mdev.caps.log_max_mcg;
  294. props->max_mcast_qp_attach = dev->mdev.caps.max_qp_mcg;
  295. props->max_total_mcast_qp_attach = props->max_mcast_qp_attach *
  296. props->max_mcast_grp;
  297. props->max_map_per_fmr = INT_MAX; /* no limit in ConnectIB */
  298. out:
  299. kfree(in_mad);
  300. kfree(out_mad);
  301. return err;
  302. }
  303. int mlx5_ib_query_port(struct ib_device *ibdev, u8 port,
  304. struct ib_port_attr *props)
  305. {
  306. struct mlx5_ib_dev *dev = to_mdev(ibdev);
  307. struct ib_smp *in_mad = NULL;
  308. struct ib_smp *out_mad = NULL;
  309. int ext_active_speed;
  310. int err = -ENOMEM;
  311. if (port < 1 || port > dev->mdev.caps.num_ports) {
  312. mlx5_ib_warn(dev, "invalid port number %d\n", port);
  313. return -EINVAL;
  314. }
  315. in_mad = kzalloc(sizeof(*in_mad), GFP_KERNEL);
  316. out_mad = kmalloc(sizeof(*out_mad), GFP_KERNEL);
  317. if (!in_mad || !out_mad)
  318. goto out;
  319. memset(props, 0, sizeof(*props));
  320. init_query_mad(in_mad);
  321. in_mad->attr_id = IB_SMP_ATTR_PORT_INFO;
  322. in_mad->attr_mod = cpu_to_be32(port);
  323. err = mlx5_MAD_IFC(dev, 1, 1, port, NULL, NULL, in_mad, out_mad);
  324. if (err) {
  325. mlx5_ib_warn(dev, "err %d\n", err);
  326. goto out;
  327. }
  328. props->lid = be16_to_cpup((__be16 *)(out_mad->data + 16));
  329. props->lmc = out_mad->data[34] & 0x7;
  330. props->sm_lid = be16_to_cpup((__be16 *)(out_mad->data + 18));
  331. props->sm_sl = out_mad->data[36] & 0xf;
  332. props->state = out_mad->data[32] & 0xf;
  333. props->phys_state = out_mad->data[33] >> 4;
  334. props->port_cap_flags = be32_to_cpup((__be32 *)(out_mad->data + 20));
  335. props->gid_tbl_len = out_mad->data[50];
  336. props->max_msg_sz = 1 << to_mdev(ibdev)->mdev.caps.log_max_msg;
  337. props->pkey_tbl_len = to_mdev(ibdev)->mdev.caps.port[port - 1].pkey_table_len;
  338. props->bad_pkey_cntr = be16_to_cpup((__be16 *)(out_mad->data + 46));
  339. props->qkey_viol_cntr = be16_to_cpup((__be16 *)(out_mad->data + 48));
  340. props->active_width = out_mad->data[31] & 0xf;
  341. props->active_speed = out_mad->data[35] >> 4;
  342. props->max_mtu = out_mad->data[41] & 0xf;
  343. props->active_mtu = out_mad->data[36] >> 4;
  344. props->subnet_timeout = out_mad->data[51] & 0x1f;
  345. props->max_vl_num = out_mad->data[37] >> 4;
  346. props->init_type_reply = out_mad->data[41] >> 4;
  347. /* Check if extended speeds (EDR/FDR/...) are supported */
  348. if (props->port_cap_flags & IB_PORT_EXTENDED_SPEEDS_SUP) {
  349. ext_active_speed = out_mad->data[62] >> 4;
  350. switch (ext_active_speed) {
  351. case 1:
  352. props->active_speed = 16; /* FDR */
  353. break;
  354. case 2:
  355. props->active_speed = 32; /* EDR */
  356. break;
  357. }
  358. }
  359. /* If reported active speed is QDR, check if is FDR-10 */
  360. if (props->active_speed == 4) {
  361. if (dev->mdev.caps.ext_port_cap[port - 1] &
  362. MLX_EXT_PORT_CAP_FLAG_EXTENDED_PORT_INFO) {
  363. init_query_mad(in_mad);
  364. in_mad->attr_id = MLX5_ATTR_EXTENDED_PORT_INFO;
  365. in_mad->attr_mod = cpu_to_be32(port);
  366. err = mlx5_MAD_IFC(dev, 1, 1, port,
  367. NULL, NULL, in_mad, out_mad);
  368. if (err)
  369. goto out;
  370. /* Checking LinkSpeedActive for FDR-10 */
  371. if (out_mad->data[15] & 0x1)
  372. props->active_speed = 8;
  373. }
  374. }
  375. out:
  376. kfree(in_mad);
  377. kfree(out_mad);
  378. return err;
  379. }
  380. static int mlx5_ib_query_gid(struct ib_device *ibdev, u8 port, int index,
  381. union ib_gid *gid)
  382. {
  383. struct ib_smp *in_mad = NULL;
  384. struct ib_smp *out_mad = NULL;
  385. int err = -ENOMEM;
  386. in_mad = kzalloc(sizeof(*in_mad), GFP_KERNEL);
  387. out_mad = kmalloc(sizeof(*out_mad), GFP_KERNEL);
  388. if (!in_mad || !out_mad)
  389. goto out;
  390. init_query_mad(in_mad);
  391. in_mad->attr_id = IB_SMP_ATTR_PORT_INFO;
  392. in_mad->attr_mod = cpu_to_be32(port);
  393. err = mlx5_MAD_IFC(to_mdev(ibdev), 1, 1, port, NULL, NULL, in_mad, out_mad);
  394. if (err)
  395. goto out;
  396. memcpy(gid->raw, out_mad->data + 8, 8);
  397. init_query_mad(in_mad);
  398. in_mad->attr_id = IB_SMP_ATTR_GUID_INFO;
  399. in_mad->attr_mod = cpu_to_be32(index / 8);
  400. err = mlx5_MAD_IFC(to_mdev(ibdev), 1, 1, port, NULL, NULL, in_mad, out_mad);
  401. if (err)
  402. goto out;
  403. memcpy(gid->raw + 8, out_mad->data + (index % 8) * 8, 8);
  404. out:
  405. kfree(in_mad);
  406. kfree(out_mad);
  407. return err;
  408. }
  409. static int mlx5_ib_query_pkey(struct ib_device *ibdev, u8 port, u16 index,
  410. u16 *pkey)
  411. {
  412. struct ib_smp *in_mad = NULL;
  413. struct ib_smp *out_mad = NULL;
  414. int err = -ENOMEM;
  415. in_mad = kzalloc(sizeof(*in_mad), GFP_KERNEL);
  416. out_mad = kmalloc(sizeof(*out_mad), GFP_KERNEL);
  417. if (!in_mad || !out_mad)
  418. goto out;
  419. init_query_mad(in_mad);
  420. in_mad->attr_id = IB_SMP_ATTR_PKEY_TABLE;
  421. in_mad->attr_mod = cpu_to_be32(index / 32);
  422. err = mlx5_MAD_IFC(to_mdev(ibdev), 1, 1, port, NULL, NULL, in_mad, out_mad);
  423. if (err)
  424. goto out;
  425. *pkey = be16_to_cpu(((__be16 *)out_mad->data)[index % 32]);
  426. out:
  427. kfree(in_mad);
  428. kfree(out_mad);
  429. return err;
  430. }
  431. struct mlx5_reg_node_desc {
  432. u8 desc[64];
  433. };
  434. static int mlx5_ib_modify_device(struct ib_device *ibdev, int mask,
  435. struct ib_device_modify *props)
  436. {
  437. struct mlx5_ib_dev *dev = to_mdev(ibdev);
  438. struct mlx5_reg_node_desc in;
  439. struct mlx5_reg_node_desc out;
  440. int err;
  441. if (mask & ~IB_DEVICE_MODIFY_NODE_DESC)
  442. return -EOPNOTSUPP;
  443. if (!(mask & IB_DEVICE_MODIFY_NODE_DESC))
  444. return 0;
  445. /*
  446. * If possible, pass node desc to FW, so it can generate
  447. * a 144 trap. If cmd fails, just ignore.
  448. */
  449. memcpy(&in, props->node_desc, 64);
  450. err = mlx5_core_access_reg(&dev->mdev, &in, sizeof(in), &out,
  451. sizeof(out), MLX5_REG_NODE_DESC, 0, 1);
  452. if (err)
  453. return err;
  454. memcpy(ibdev->node_desc, props->node_desc, 64);
  455. return err;
  456. }
  457. static int mlx5_ib_modify_port(struct ib_device *ibdev, u8 port, int mask,
  458. struct ib_port_modify *props)
  459. {
  460. struct mlx5_ib_dev *dev = to_mdev(ibdev);
  461. struct ib_port_attr attr;
  462. u32 tmp;
  463. int err;
  464. mutex_lock(&dev->cap_mask_mutex);
  465. err = mlx5_ib_query_port(ibdev, port, &attr);
  466. if (err)
  467. goto out;
  468. tmp = (attr.port_cap_flags | props->set_port_cap_mask) &
  469. ~props->clr_port_cap_mask;
  470. err = mlx5_set_port_caps(&dev->mdev, port, tmp);
  471. out:
  472. mutex_unlock(&dev->cap_mask_mutex);
  473. return err;
  474. }
  475. static struct ib_ucontext *mlx5_ib_alloc_ucontext(struct ib_device *ibdev,
  476. struct ib_udata *udata)
  477. {
  478. struct mlx5_ib_dev *dev = to_mdev(ibdev);
  479. struct mlx5_ib_alloc_ucontext_req_v2 req;
  480. struct mlx5_ib_alloc_ucontext_resp resp;
  481. struct mlx5_ib_ucontext *context;
  482. struct mlx5_uuar_info *uuari;
  483. struct mlx5_uar *uars;
  484. int gross_uuars;
  485. int num_uars;
  486. int ver;
  487. int uuarn;
  488. int err;
  489. int i;
  490. int reqlen;
  491. if (!dev->ib_active)
  492. return ERR_PTR(-EAGAIN);
  493. memset(&req, 0, sizeof(req));
  494. reqlen = udata->inlen - sizeof(struct ib_uverbs_cmd_hdr);
  495. if (reqlen == sizeof(struct mlx5_ib_alloc_ucontext_req))
  496. ver = 0;
  497. else if (reqlen == sizeof(struct mlx5_ib_alloc_ucontext_req_v2))
  498. ver = 2;
  499. else
  500. return ERR_PTR(-EINVAL);
  501. err = ib_copy_from_udata(&req, udata, reqlen);
  502. if (err)
  503. return ERR_PTR(err);
  504. if (req.flags || req.reserved)
  505. return ERR_PTR(-EINVAL);
  506. if (req.total_num_uuars > MLX5_MAX_UUARS)
  507. return ERR_PTR(-ENOMEM);
  508. if (req.total_num_uuars == 0)
  509. return ERR_PTR(-EINVAL);
  510. req.total_num_uuars = ALIGN(req.total_num_uuars,
  511. MLX5_NON_FP_BF_REGS_PER_PAGE);
  512. if (req.num_low_latency_uuars > req.total_num_uuars - 1)
  513. return ERR_PTR(-EINVAL);
  514. num_uars = req.total_num_uuars / MLX5_NON_FP_BF_REGS_PER_PAGE;
  515. gross_uuars = num_uars * MLX5_BF_REGS_PER_PAGE;
  516. resp.qp_tab_size = 1 << dev->mdev.caps.log_max_qp;
  517. resp.bf_reg_size = dev->mdev.caps.bf_reg_size;
  518. resp.cache_line_size = L1_CACHE_BYTES;
  519. resp.max_sq_desc_sz = dev->mdev.caps.max_sq_desc_sz;
  520. resp.max_rq_desc_sz = dev->mdev.caps.max_rq_desc_sz;
  521. resp.max_send_wqebb = dev->mdev.caps.max_wqes;
  522. resp.max_recv_wr = dev->mdev.caps.max_wqes;
  523. resp.max_srq_recv_wr = dev->mdev.caps.max_srq_wqes;
  524. context = kzalloc(sizeof(*context), GFP_KERNEL);
  525. if (!context)
  526. return ERR_PTR(-ENOMEM);
  527. uuari = &context->uuari;
  528. mutex_init(&uuari->lock);
  529. uars = kcalloc(num_uars, sizeof(*uars), GFP_KERNEL);
  530. if (!uars) {
  531. err = -ENOMEM;
  532. goto out_ctx;
  533. }
  534. uuari->bitmap = kcalloc(BITS_TO_LONGS(gross_uuars),
  535. sizeof(*uuari->bitmap),
  536. GFP_KERNEL);
  537. if (!uuari->bitmap) {
  538. err = -ENOMEM;
  539. goto out_uar_ctx;
  540. }
  541. /*
  542. * clear all fast path uuars
  543. */
  544. for (i = 0; i < gross_uuars; i++) {
  545. uuarn = i & 3;
  546. if (uuarn == 2 || uuarn == 3)
  547. set_bit(i, uuari->bitmap);
  548. }
  549. uuari->count = kcalloc(gross_uuars, sizeof(*uuari->count), GFP_KERNEL);
  550. if (!uuari->count) {
  551. err = -ENOMEM;
  552. goto out_bitmap;
  553. }
  554. for (i = 0; i < num_uars; i++) {
  555. err = mlx5_cmd_alloc_uar(&dev->mdev, &uars[i].index);
  556. if (err)
  557. goto out_count;
  558. }
  559. INIT_LIST_HEAD(&context->db_page_list);
  560. mutex_init(&context->db_page_mutex);
  561. resp.tot_uuars = req.total_num_uuars;
  562. resp.num_ports = dev->mdev.caps.num_ports;
  563. err = ib_copy_to_udata(udata, &resp,
  564. sizeof(resp) - sizeof(resp.reserved));
  565. if (err)
  566. goto out_uars;
  567. uuari->ver = ver;
  568. uuari->num_low_latency_uuars = req.num_low_latency_uuars;
  569. uuari->uars = uars;
  570. uuari->num_uars = num_uars;
  571. return &context->ibucontext;
  572. out_uars:
  573. for (i--; i >= 0; i--)
  574. mlx5_cmd_free_uar(&dev->mdev, uars[i].index);
  575. out_count:
  576. kfree(uuari->count);
  577. out_bitmap:
  578. kfree(uuari->bitmap);
  579. out_uar_ctx:
  580. kfree(uars);
  581. out_ctx:
  582. kfree(context);
  583. return ERR_PTR(err);
  584. }
  585. static int mlx5_ib_dealloc_ucontext(struct ib_ucontext *ibcontext)
  586. {
  587. struct mlx5_ib_ucontext *context = to_mucontext(ibcontext);
  588. struct mlx5_ib_dev *dev = to_mdev(ibcontext->device);
  589. struct mlx5_uuar_info *uuari = &context->uuari;
  590. int i;
  591. for (i = 0; i < uuari->num_uars; i++) {
  592. if (mlx5_cmd_free_uar(&dev->mdev, uuari->uars[i].index))
  593. mlx5_ib_warn(dev, "failed to free UAR 0x%x\n", uuari->uars[i].index);
  594. }
  595. kfree(uuari->count);
  596. kfree(uuari->bitmap);
  597. kfree(uuari->uars);
  598. kfree(context);
  599. return 0;
  600. }
  601. static phys_addr_t uar_index2pfn(struct mlx5_ib_dev *dev, int index)
  602. {
  603. return (pci_resource_start(dev->mdev.pdev, 0) >> PAGE_SHIFT) + index;
  604. }
  605. static int get_command(unsigned long offset)
  606. {
  607. return (offset >> MLX5_IB_MMAP_CMD_SHIFT) & MLX5_IB_MMAP_CMD_MASK;
  608. }
  609. static int get_arg(unsigned long offset)
  610. {
  611. return offset & ((1 << MLX5_IB_MMAP_CMD_SHIFT) - 1);
  612. }
  613. static int get_index(unsigned long offset)
  614. {
  615. return get_arg(offset);
  616. }
  617. static int mlx5_ib_mmap(struct ib_ucontext *ibcontext, struct vm_area_struct *vma)
  618. {
  619. struct mlx5_ib_ucontext *context = to_mucontext(ibcontext);
  620. struct mlx5_ib_dev *dev = to_mdev(ibcontext->device);
  621. struct mlx5_uuar_info *uuari = &context->uuari;
  622. unsigned long command;
  623. unsigned long idx;
  624. phys_addr_t pfn;
  625. command = get_command(vma->vm_pgoff);
  626. switch (command) {
  627. case MLX5_IB_MMAP_REGULAR_PAGE:
  628. if (vma->vm_end - vma->vm_start != PAGE_SIZE)
  629. return -EINVAL;
  630. idx = get_index(vma->vm_pgoff);
  631. pfn = uar_index2pfn(dev, uuari->uars[idx].index);
  632. mlx5_ib_dbg(dev, "uar idx 0x%lx, pfn 0x%llx\n", idx,
  633. (unsigned long long)pfn);
  634. if (idx >= uuari->num_uars)
  635. return -EINVAL;
  636. vma->vm_page_prot = pgprot_writecombine(vma->vm_page_prot);
  637. if (io_remap_pfn_range(vma, vma->vm_start, pfn,
  638. PAGE_SIZE, vma->vm_page_prot))
  639. return -EAGAIN;
  640. mlx5_ib_dbg(dev, "mapped WC at 0x%lx, PA 0x%llx\n",
  641. vma->vm_start,
  642. (unsigned long long)pfn << PAGE_SHIFT);
  643. break;
  644. case MLX5_IB_MMAP_GET_CONTIGUOUS_PAGES:
  645. return -ENOSYS;
  646. default:
  647. return -EINVAL;
  648. }
  649. return 0;
  650. }
  651. static int alloc_pa_mkey(struct mlx5_ib_dev *dev, u32 *key, u32 pdn)
  652. {
  653. struct mlx5_create_mkey_mbox_in *in;
  654. struct mlx5_mkey_seg *seg;
  655. struct mlx5_core_mr mr;
  656. int err;
  657. in = kzalloc(sizeof(*in), GFP_KERNEL);
  658. if (!in)
  659. return -ENOMEM;
  660. seg = &in->seg;
  661. seg->flags = MLX5_PERM_LOCAL_READ | MLX5_ACCESS_MODE_PA;
  662. seg->flags_pd = cpu_to_be32(pdn | MLX5_MKEY_LEN64);
  663. seg->qpn_mkey7_0 = cpu_to_be32(0xffffff << 8);
  664. seg->start_addr = 0;
  665. err = mlx5_core_create_mkey(&dev->mdev, &mr, in, sizeof(*in),
  666. NULL, NULL, NULL);
  667. if (err) {
  668. mlx5_ib_warn(dev, "failed to create mkey, %d\n", err);
  669. goto err_in;
  670. }
  671. kfree(in);
  672. *key = mr.key;
  673. return 0;
  674. err_in:
  675. kfree(in);
  676. return err;
  677. }
  678. static void free_pa_mkey(struct mlx5_ib_dev *dev, u32 key)
  679. {
  680. struct mlx5_core_mr mr;
  681. int err;
  682. memset(&mr, 0, sizeof(mr));
  683. mr.key = key;
  684. err = mlx5_core_destroy_mkey(&dev->mdev, &mr);
  685. if (err)
  686. mlx5_ib_warn(dev, "failed to destroy mkey 0x%x\n", key);
  687. }
  688. static struct ib_pd *mlx5_ib_alloc_pd(struct ib_device *ibdev,
  689. struct ib_ucontext *context,
  690. struct ib_udata *udata)
  691. {
  692. struct mlx5_ib_alloc_pd_resp resp;
  693. struct mlx5_ib_pd *pd;
  694. int err;
  695. pd = kmalloc(sizeof(*pd), GFP_KERNEL);
  696. if (!pd)
  697. return ERR_PTR(-ENOMEM);
  698. err = mlx5_core_alloc_pd(&to_mdev(ibdev)->mdev, &pd->pdn);
  699. if (err) {
  700. kfree(pd);
  701. return ERR_PTR(err);
  702. }
  703. if (context) {
  704. resp.pdn = pd->pdn;
  705. if (ib_copy_to_udata(udata, &resp, sizeof(resp))) {
  706. mlx5_core_dealloc_pd(&to_mdev(ibdev)->mdev, pd->pdn);
  707. kfree(pd);
  708. return ERR_PTR(-EFAULT);
  709. }
  710. } else {
  711. err = alloc_pa_mkey(to_mdev(ibdev), &pd->pa_lkey, pd->pdn);
  712. if (err) {
  713. mlx5_core_dealloc_pd(&to_mdev(ibdev)->mdev, pd->pdn);
  714. kfree(pd);
  715. return ERR_PTR(err);
  716. }
  717. }
  718. return &pd->ibpd;
  719. }
  720. static int mlx5_ib_dealloc_pd(struct ib_pd *pd)
  721. {
  722. struct mlx5_ib_dev *mdev = to_mdev(pd->device);
  723. struct mlx5_ib_pd *mpd = to_mpd(pd);
  724. if (!pd->uobject)
  725. free_pa_mkey(mdev, mpd->pa_lkey);
  726. mlx5_core_dealloc_pd(&mdev->mdev, mpd->pdn);
  727. kfree(mpd);
  728. return 0;
  729. }
  730. static int mlx5_ib_mcg_attach(struct ib_qp *ibqp, union ib_gid *gid, u16 lid)
  731. {
  732. struct mlx5_ib_dev *dev = to_mdev(ibqp->device);
  733. int err;
  734. err = mlx5_core_attach_mcg(&dev->mdev, gid, ibqp->qp_num);
  735. if (err)
  736. mlx5_ib_warn(dev, "failed attaching QPN 0x%x, MGID %pI6\n",
  737. ibqp->qp_num, gid->raw);
  738. return err;
  739. }
  740. static int mlx5_ib_mcg_detach(struct ib_qp *ibqp, union ib_gid *gid, u16 lid)
  741. {
  742. struct mlx5_ib_dev *dev = to_mdev(ibqp->device);
  743. int err;
  744. err = mlx5_core_detach_mcg(&dev->mdev, gid, ibqp->qp_num);
  745. if (err)
  746. mlx5_ib_warn(dev, "failed detaching QPN 0x%x, MGID %pI6\n",
  747. ibqp->qp_num, gid->raw);
  748. return err;
  749. }
  750. static int init_node_data(struct mlx5_ib_dev *dev)
  751. {
  752. struct ib_smp *in_mad = NULL;
  753. struct ib_smp *out_mad = NULL;
  754. int err = -ENOMEM;
  755. in_mad = kzalloc(sizeof(*in_mad), GFP_KERNEL);
  756. out_mad = kmalloc(sizeof(*out_mad), GFP_KERNEL);
  757. if (!in_mad || !out_mad)
  758. goto out;
  759. init_query_mad(in_mad);
  760. in_mad->attr_id = IB_SMP_ATTR_NODE_DESC;
  761. err = mlx5_MAD_IFC(dev, 1, 1, 1, NULL, NULL, in_mad, out_mad);
  762. if (err)
  763. goto out;
  764. memcpy(dev->ib_dev.node_desc, out_mad->data, 64);
  765. in_mad->attr_id = IB_SMP_ATTR_NODE_INFO;
  766. err = mlx5_MAD_IFC(dev, 1, 1, 1, NULL, NULL, in_mad, out_mad);
  767. if (err)
  768. goto out;
  769. dev->mdev.rev_id = be32_to_cpup((__be32 *)(out_mad->data + 32));
  770. memcpy(&dev->ib_dev.node_guid, out_mad->data + 12, 8);
  771. out:
  772. kfree(in_mad);
  773. kfree(out_mad);
  774. return err;
  775. }
  776. static ssize_t show_fw_pages(struct device *device, struct device_attribute *attr,
  777. char *buf)
  778. {
  779. struct mlx5_ib_dev *dev =
  780. container_of(device, struct mlx5_ib_dev, ib_dev.dev);
  781. return sprintf(buf, "%d\n", dev->mdev.priv.fw_pages);
  782. }
  783. static ssize_t show_reg_pages(struct device *device,
  784. struct device_attribute *attr, char *buf)
  785. {
  786. struct mlx5_ib_dev *dev =
  787. container_of(device, struct mlx5_ib_dev, ib_dev.dev);
  788. return sprintf(buf, "%d\n", dev->mdev.priv.reg_pages);
  789. }
  790. static ssize_t show_hca(struct device *device, struct device_attribute *attr,
  791. char *buf)
  792. {
  793. struct mlx5_ib_dev *dev =
  794. container_of(device, struct mlx5_ib_dev, ib_dev.dev);
  795. return sprintf(buf, "MT%d\n", dev->mdev.pdev->device);
  796. }
  797. static ssize_t show_fw_ver(struct device *device, struct device_attribute *attr,
  798. char *buf)
  799. {
  800. struct mlx5_ib_dev *dev =
  801. container_of(device, struct mlx5_ib_dev, ib_dev.dev);
  802. return sprintf(buf, "%d.%d.%d\n", fw_rev_maj(&dev->mdev),
  803. fw_rev_min(&dev->mdev), fw_rev_sub(&dev->mdev));
  804. }
  805. static ssize_t show_rev(struct device *device, struct device_attribute *attr,
  806. char *buf)
  807. {
  808. struct mlx5_ib_dev *dev =
  809. container_of(device, struct mlx5_ib_dev, ib_dev.dev);
  810. return sprintf(buf, "%x\n", dev->mdev.rev_id);
  811. }
  812. static ssize_t show_board(struct device *device, struct device_attribute *attr,
  813. char *buf)
  814. {
  815. struct mlx5_ib_dev *dev =
  816. container_of(device, struct mlx5_ib_dev, ib_dev.dev);
  817. return sprintf(buf, "%.*s\n", MLX5_BOARD_ID_LEN,
  818. dev->mdev.board_id);
  819. }
  820. static DEVICE_ATTR(hw_rev, S_IRUGO, show_rev, NULL);
  821. static DEVICE_ATTR(fw_ver, S_IRUGO, show_fw_ver, NULL);
  822. static DEVICE_ATTR(hca_type, S_IRUGO, show_hca, NULL);
  823. static DEVICE_ATTR(board_id, S_IRUGO, show_board, NULL);
  824. static DEVICE_ATTR(fw_pages, S_IRUGO, show_fw_pages, NULL);
  825. static DEVICE_ATTR(reg_pages, S_IRUGO, show_reg_pages, NULL);
  826. static struct device_attribute *mlx5_class_attributes[] = {
  827. &dev_attr_hw_rev,
  828. &dev_attr_fw_ver,
  829. &dev_attr_hca_type,
  830. &dev_attr_board_id,
  831. &dev_attr_fw_pages,
  832. &dev_attr_reg_pages,
  833. };
  834. static void mlx5_ib_event(struct mlx5_core_dev *dev, enum mlx5_dev_event event,
  835. void *data)
  836. {
  837. struct mlx5_ib_dev *ibdev = container_of(dev, struct mlx5_ib_dev, mdev);
  838. struct ib_event ibev;
  839. u8 port = 0;
  840. switch (event) {
  841. case MLX5_DEV_EVENT_SYS_ERROR:
  842. ibdev->ib_active = false;
  843. ibev.event = IB_EVENT_DEVICE_FATAL;
  844. break;
  845. case MLX5_DEV_EVENT_PORT_UP:
  846. ibev.event = IB_EVENT_PORT_ACTIVE;
  847. port = *(u8 *)data;
  848. break;
  849. case MLX5_DEV_EVENT_PORT_DOWN:
  850. ibev.event = IB_EVENT_PORT_ERR;
  851. port = *(u8 *)data;
  852. break;
  853. case MLX5_DEV_EVENT_PORT_INITIALIZED:
  854. /* not used by ULPs */
  855. return;
  856. case MLX5_DEV_EVENT_LID_CHANGE:
  857. ibev.event = IB_EVENT_LID_CHANGE;
  858. port = *(u8 *)data;
  859. break;
  860. case MLX5_DEV_EVENT_PKEY_CHANGE:
  861. ibev.event = IB_EVENT_PKEY_CHANGE;
  862. port = *(u8 *)data;
  863. break;
  864. case MLX5_DEV_EVENT_GUID_CHANGE:
  865. ibev.event = IB_EVENT_GID_CHANGE;
  866. port = *(u8 *)data;
  867. break;
  868. case MLX5_DEV_EVENT_CLIENT_REREG:
  869. ibev.event = IB_EVENT_CLIENT_REREGISTER;
  870. port = *(u8 *)data;
  871. break;
  872. }
  873. ibev.device = &ibdev->ib_dev;
  874. ibev.element.port_num = port;
  875. if (port < 1 || port > ibdev->num_ports) {
  876. mlx5_ib_warn(ibdev, "warning: event on port %d\n", port);
  877. return;
  878. }
  879. if (ibdev->ib_active)
  880. ib_dispatch_event(&ibev);
  881. }
  882. static void get_ext_port_caps(struct mlx5_ib_dev *dev)
  883. {
  884. int port;
  885. for (port = 1; port <= dev->mdev.caps.num_ports; port++)
  886. mlx5_query_ext_port_caps(dev, port);
  887. }
  888. static int get_port_caps(struct mlx5_ib_dev *dev)
  889. {
  890. struct ib_device_attr *dprops = NULL;
  891. struct ib_port_attr *pprops = NULL;
  892. int err = 0;
  893. int port;
  894. pprops = kmalloc(sizeof(*pprops), GFP_KERNEL);
  895. if (!pprops)
  896. goto out;
  897. dprops = kmalloc(sizeof(*dprops), GFP_KERNEL);
  898. if (!dprops)
  899. goto out;
  900. err = mlx5_ib_query_device(&dev->ib_dev, dprops);
  901. if (err) {
  902. mlx5_ib_warn(dev, "query_device failed %d\n", err);
  903. goto out;
  904. }
  905. for (port = 1; port <= dev->mdev.caps.num_ports; port++) {
  906. err = mlx5_ib_query_port(&dev->ib_dev, port, pprops);
  907. if (err) {
  908. mlx5_ib_warn(dev, "query_port %d failed %d\n", port, err);
  909. break;
  910. }
  911. dev->mdev.caps.port[port - 1].pkey_table_len = dprops->max_pkeys;
  912. dev->mdev.caps.port[port - 1].gid_table_len = pprops->gid_tbl_len;
  913. mlx5_ib_dbg(dev, "pkey_table_len %d, gid_table_len %d\n",
  914. dprops->max_pkeys, pprops->gid_tbl_len);
  915. }
  916. out:
  917. kfree(pprops);
  918. kfree(dprops);
  919. return err;
  920. }
  921. static void destroy_umrc_res(struct mlx5_ib_dev *dev)
  922. {
  923. int err;
  924. err = mlx5_mr_cache_cleanup(dev);
  925. if (err)
  926. mlx5_ib_warn(dev, "mr cache cleanup failed\n");
  927. mlx5_ib_destroy_qp(dev->umrc.qp);
  928. ib_destroy_cq(dev->umrc.cq);
  929. ib_dereg_mr(dev->umrc.mr);
  930. ib_dealloc_pd(dev->umrc.pd);
  931. }
  932. enum {
  933. MAX_UMR_WR = 128,
  934. };
  935. static int create_umr_res(struct mlx5_ib_dev *dev)
  936. {
  937. struct ib_qp_init_attr *init_attr = NULL;
  938. struct ib_qp_attr *attr = NULL;
  939. struct ib_pd *pd;
  940. struct ib_cq *cq;
  941. struct ib_qp *qp;
  942. struct ib_mr *mr;
  943. int ret;
  944. attr = kzalloc(sizeof(*attr), GFP_KERNEL);
  945. init_attr = kzalloc(sizeof(*init_attr), GFP_KERNEL);
  946. if (!attr || !init_attr) {
  947. ret = -ENOMEM;
  948. goto error_0;
  949. }
  950. pd = ib_alloc_pd(&dev->ib_dev);
  951. if (IS_ERR(pd)) {
  952. mlx5_ib_dbg(dev, "Couldn't create PD for sync UMR QP\n");
  953. ret = PTR_ERR(pd);
  954. goto error_0;
  955. }
  956. mr = ib_get_dma_mr(pd, IB_ACCESS_LOCAL_WRITE);
  957. if (IS_ERR(mr)) {
  958. mlx5_ib_dbg(dev, "Couldn't create DMA MR for sync UMR QP\n");
  959. ret = PTR_ERR(mr);
  960. goto error_1;
  961. }
  962. cq = ib_create_cq(&dev->ib_dev, mlx5_umr_cq_handler, NULL, NULL, 128,
  963. 0);
  964. if (IS_ERR(cq)) {
  965. mlx5_ib_dbg(dev, "Couldn't create CQ for sync UMR QP\n");
  966. ret = PTR_ERR(cq);
  967. goto error_2;
  968. }
  969. ib_req_notify_cq(cq, IB_CQ_NEXT_COMP);
  970. init_attr->send_cq = cq;
  971. init_attr->recv_cq = cq;
  972. init_attr->sq_sig_type = IB_SIGNAL_ALL_WR;
  973. init_attr->cap.max_send_wr = MAX_UMR_WR;
  974. init_attr->cap.max_send_sge = 1;
  975. init_attr->qp_type = MLX5_IB_QPT_REG_UMR;
  976. init_attr->port_num = 1;
  977. qp = mlx5_ib_create_qp(pd, init_attr, NULL);
  978. if (IS_ERR(qp)) {
  979. mlx5_ib_dbg(dev, "Couldn't create sync UMR QP\n");
  980. ret = PTR_ERR(qp);
  981. goto error_3;
  982. }
  983. qp->device = &dev->ib_dev;
  984. qp->real_qp = qp;
  985. qp->uobject = NULL;
  986. qp->qp_type = MLX5_IB_QPT_REG_UMR;
  987. attr->qp_state = IB_QPS_INIT;
  988. attr->port_num = 1;
  989. ret = mlx5_ib_modify_qp(qp, attr, IB_QP_STATE | IB_QP_PKEY_INDEX |
  990. IB_QP_PORT, NULL);
  991. if (ret) {
  992. mlx5_ib_dbg(dev, "Couldn't modify UMR QP\n");
  993. goto error_4;
  994. }
  995. memset(attr, 0, sizeof(*attr));
  996. attr->qp_state = IB_QPS_RTR;
  997. attr->path_mtu = IB_MTU_256;
  998. ret = mlx5_ib_modify_qp(qp, attr, IB_QP_STATE, NULL);
  999. if (ret) {
  1000. mlx5_ib_dbg(dev, "Couldn't modify umr QP to rtr\n");
  1001. goto error_4;
  1002. }
  1003. memset(attr, 0, sizeof(*attr));
  1004. attr->qp_state = IB_QPS_RTS;
  1005. ret = mlx5_ib_modify_qp(qp, attr, IB_QP_STATE, NULL);
  1006. if (ret) {
  1007. mlx5_ib_dbg(dev, "Couldn't modify umr QP to rts\n");
  1008. goto error_4;
  1009. }
  1010. dev->umrc.qp = qp;
  1011. dev->umrc.cq = cq;
  1012. dev->umrc.mr = mr;
  1013. dev->umrc.pd = pd;
  1014. sema_init(&dev->umrc.sem, MAX_UMR_WR);
  1015. ret = mlx5_mr_cache_init(dev);
  1016. if (ret) {
  1017. mlx5_ib_warn(dev, "mr cache init failed %d\n", ret);
  1018. goto error_4;
  1019. }
  1020. kfree(attr);
  1021. kfree(init_attr);
  1022. return 0;
  1023. error_4:
  1024. mlx5_ib_destroy_qp(qp);
  1025. error_3:
  1026. ib_destroy_cq(cq);
  1027. error_2:
  1028. ib_dereg_mr(mr);
  1029. error_1:
  1030. ib_dealloc_pd(pd);
  1031. error_0:
  1032. kfree(attr);
  1033. kfree(init_attr);
  1034. return ret;
  1035. }
  1036. static int create_dev_resources(struct mlx5_ib_resources *devr)
  1037. {
  1038. struct ib_srq_init_attr attr;
  1039. struct mlx5_ib_dev *dev;
  1040. int ret = 0;
  1041. dev = container_of(devr, struct mlx5_ib_dev, devr);
  1042. devr->p0 = mlx5_ib_alloc_pd(&dev->ib_dev, NULL, NULL);
  1043. if (IS_ERR(devr->p0)) {
  1044. ret = PTR_ERR(devr->p0);
  1045. goto error0;
  1046. }
  1047. devr->p0->device = &dev->ib_dev;
  1048. devr->p0->uobject = NULL;
  1049. atomic_set(&devr->p0->usecnt, 0);
  1050. devr->c0 = mlx5_ib_create_cq(&dev->ib_dev, 1, 0, NULL, NULL);
  1051. if (IS_ERR(devr->c0)) {
  1052. ret = PTR_ERR(devr->c0);
  1053. goto error1;
  1054. }
  1055. devr->c0->device = &dev->ib_dev;
  1056. devr->c0->uobject = NULL;
  1057. devr->c0->comp_handler = NULL;
  1058. devr->c0->event_handler = NULL;
  1059. devr->c0->cq_context = NULL;
  1060. atomic_set(&devr->c0->usecnt, 0);
  1061. devr->x0 = mlx5_ib_alloc_xrcd(&dev->ib_dev, NULL, NULL);
  1062. if (IS_ERR(devr->x0)) {
  1063. ret = PTR_ERR(devr->x0);
  1064. goto error2;
  1065. }
  1066. devr->x0->device = &dev->ib_dev;
  1067. devr->x0->inode = NULL;
  1068. atomic_set(&devr->x0->usecnt, 0);
  1069. mutex_init(&devr->x0->tgt_qp_mutex);
  1070. INIT_LIST_HEAD(&devr->x0->tgt_qp_list);
  1071. devr->x1 = mlx5_ib_alloc_xrcd(&dev->ib_dev, NULL, NULL);
  1072. if (IS_ERR(devr->x1)) {
  1073. ret = PTR_ERR(devr->x1);
  1074. goto error3;
  1075. }
  1076. devr->x1->device = &dev->ib_dev;
  1077. devr->x1->inode = NULL;
  1078. atomic_set(&devr->x1->usecnt, 0);
  1079. mutex_init(&devr->x1->tgt_qp_mutex);
  1080. INIT_LIST_HEAD(&devr->x1->tgt_qp_list);
  1081. memset(&attr, 0, sizeof(attr));
  1082. attr.attr.max_sge = 1;
  1083. attr.attr.max_wr = 1;
  1084. attr.srq_type = IB_SRQT_XRC;
  1085. attr.ext.xrc.cq = devr->c0;
  1086. attr.ext.xrc.xrcd = devr->x0;
  1087. devr->s0 = mlx5_ib_create_srq(devr->p0, &attr, NULL);
  1088. if (IS_ERR(devr->s0)) {
  1089. ret = PTR_ERR(devr->s0);
  1090. goto error4;
  1091. }
  1092. devr->s0->device = &dev->ib_dev;
  1093. devr->s0->pd = devr->p0;
  1094. devr->s0->uobject = NULL;
  1095. devr->s0->event_handler = NULL;
  1096. devr->s0->srq_context = NULL;
  1097. devr->s0->srq_type = IB_SRQT_XRC;
  1098. devr->s0->ext.xrc.xrcd = devr->x0;
  1099. devr->s0->ext.xrc.cq = devr->c0;
  1100. atomic_inc(&devr->s0->ext.xrc.xrcd->usecnt);
  1101. atomic_inc(&devr->s0->ext.xrc.cq->usecnt);
  1102. atomic_inc(&devr->p0->usecnt);
  1103. atomic_set(&devr->s0->usecnt, 0);
  1104. return 0;
  1105. error4:
  1106. mlx5_ib_dealloc_xrcd(devr->x1);
  1107. error3:
  1108. mlx5_ib_dealloc_xrcd(devr->x0);
  1109. error2:
  1110. mlx5_ib_destroy_cq(devr->c0);
  1111. error1:
  1112. mlx5_ib_dealloc_pd(devr->p0);
  1113. error0:
  1114. return ret;
  1115. }
  1116. static void destroy_dev_resources(struct mlx5_ib_resources *devr)
  1117. {
  1118. mlx5_ib_destroy_srq(devr->s0);
  1119. mlx5_ib_dealloc_xrcd(devr->x0);
  1120. mlx5_ib_dealloc_xrcd(devr->x1);
  1121. mlx5_ib_destroy_cq(devr->c0);
  1122. mlx5_ib_dealloc_pd(devr->p0);
  1123. }
  1124. static int init_one(struct pci_dev *pdev,
  1125. const struct pci_device_id *id)
  1126. {
  1127. struct mlx5_core_dev *mdev;
  1128. struct mlx5_ib_dev *dev;
  1129. int err;
  1130. int i;
  1131. printk_once(KERN_INFO "%s", mlx5_version);
  1132. dev = (struct mlx5_ib_dev *)ib_alloc_device(sizeof(*dev));
  1133. if (!dev)
  1134. return -ENOMEM;
  1135. mdev = &dev->mdev;
  1136. mdev->event = mlx5_ib_event;
  1137. if (prof_sel >= ARRAY_SIZE(profile)) {
  1138. pr_warn("selected pofile out of range, selceting default\n");
  1139. prof_sel = 0;
  1140. }
  1141. mdev->profile = &profile[prof_sel];
  1142. err = mlx5_dev_init(mdev, pdev);
  1143. if (err)
  1144. goto err_free;
  1145. err = get_port_caps(dev);
  1146. if (err)
  1147. goto err_cleanup;
  1148. get_ext_port_caps(dev);
  1149. err = alloc_comp_eqs(dev);
  1150. if (err)
  1151. goto err_cleanup;
  1152. MLX5_INIT_DOORBELL_LOCK(&dev->uar_lock);
  1153. strlcpy(dev->ib_dev.name, "mlx5_%d", IB_DEVICE_NAME_MAX);
  1154. dev->ib_dev.owner = THIS_MODULE;
  1155. dev->ib_dev.node_type = RDMA_NODE_IB_CA;
  1156. dev->ib_dev.local_dma_lkey = mdev->caps.reserved_lkey;
  1157. dev->num_ports = mdev->caps.num_ports;
  1158. dev->ib_dev.phys_port_cnt = dev->num_ports;
  1159. dev->ib_dev.num_comp_vectors = dev->num_comp_vectors;
  1160. dev->ib_dev.dma_device = &mdev->pdev->dev;
  1161. dev->ib_dev.uverbs_abi_ver = MLX5_IB_UVERBS_ABI_VERSION;
  1162. dev->ib_dev.uverbs_cmd_mask =
  1163. (1ull << IB_USER_VERBS_CMD_GET_CONTEXT) |
  1164. (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE) |
  1165. (1ull << IB_USER_VERBS_CMD_QUERY_PORT) |
  1166. (1ull << IB_USER_VERBS_CMD_ALLOC_PD) |
  1167. (1ull << IB_USER_VERBS_CMD_DEALLOC_PD) |
  1168. (1ull << IB_USER_VERBS_CMD_REG_MR) |
  1169. (1ull << IB_USER_VERBS_CMD_DEREG_MR) |
  1170. (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
  1171. (1ull << IB_USER_VERBS_CMD_CREATE_CQ) |
  1172. (1ull << IB_USER_VERBS_CMD_RESIZE_CQ) |
  1173. (1ull << IB_USER_VERBS_CMD_DESTROY_CQ) |
  1174. (1ull << IB_USER_VERBS_CMD_CREATE_QP) |
  1175. (1ull << IB_USER_VERBS_CMD_MODIFY_QP) |
  1176. (1ull << IB_USER_VERBS_CMD_QUERY_QP) |
  1177. (1ull << IB_USER_VERBS_CMD_DESTROY_QP) |
  1178. (1ull << IB_USER_VERBS_CMD_ATTACH_MCAST) |
  1179. (1ull << IB_USER_VERBS_CMD_DETACH_MCAST) |
  1180. (1ull << IB_USER_VERBS_CMD_CREATE_SRQ) |
  1181. (1ull << IB_USER_VERBS_CMD_MODIFY_SRQ) |
  1182. (1ull << IB_USER_VERBS_CMD_QUERY_SRQ) |
  1183. (1ull << IB_USER_VERBS_CMD_DESTROY_SRQ) |
  1184. (1ull << IB_USER_VERBS_CMD_CREATE_XSRQ) |
  1185. (1ull << IB_USER_VERBS_CMD_OPEN_QP);
  1186. dev->ib_dev.query_device = mlx5_ib_query_device;
  1187. dev->ib_dev.query_port = mlx5_ib_query_port;
  1188. dev->ib_dev.query_gid = mlx5_ib_query_gid;
  1189. dev->ib_dev.query_pkey = mlx5_ib_query_pkey;
  1190. dev->ib_dev.modify_device = mlx5_ib_modify_device;
  1191. dev->ib_dev.modify_port = mlx5_ib_modify_port;
  1192. dev->ib_dev.alloc_ucontext = mlx5_ib_alloc_ucontext;
  1193. dev->ib_dev.dealloc_ucontext = mlx5_ib_dealloc_ucontext;
  1194. dev->ib_dev.mmap = mlx5_ib_mmap;
  1195. dev->ib_dev.alloc_pd = mlx5_ib_alloc_pd;
  1196. dev->ib_dev.dealloc_pd = mlx5_ib_dealloc_pd;
  1197. dev->ib_dev.create_ah = mlx5_ib_create_ah;
  1198. dev->ib_dev.query_ah = mlx5_ib_query_ah;
  1199. dev->ib_dev.destroy_ah = mlx5_ib_destroy_ah;
  1200. dev->ib_dev.create_srq = mlx5_ib_create_srq;
  1201. dev->ib_dev.modify_srq = mlx5_ib_modify_srq;
  1202. dev->ib_dev.query_srq = mlx5_ib_query_srq;
  1203. dev->ib_dev.destroy_srq = mlx5_ib_destroy_srq;
  1204. dev->ib_dev.post_srq_recv = mlx5_ib_post_srq_recv;
  1205. dev->ib_dev.create_qp = mlx5_ib_create_qp;
  1206. dev->ib_dev.modify_qp = mlx5_ib_modify_qp;
  1207. dev->ib_dev.query_qp = mlx5_ib_query_qp;
  1208. dev->ib_dev.destroy_qp = mlx5_ib_destroy_qp;
  1209. dev->ib_dev.post_send = mlx5_ib_post_send;
  1210. dev->ib_dev.post_recv = mlx5_ib_post_recv;
  1211. dev->ib_dev.create_cq = mlx5_ib_create_cq;
  1212. dev->ib_dev.modify_cq = mlx5_ib_modify_cq;
  1213. dev->ib_dev.resize_cq = mlx5_ib_resize_cq;
  1214. dev->ib_dev.destroy_cq = mlx5_ib_destroy_cq;
  1215. dev->ib_dev.poll_cq = mlx5_ib_poll_cq;
  1216. dev->ib_dev.req_notify_cq = mlx5_ib_arm_cq;
  1217. dev->ib_dev.get_dma_mr = mlx5_ib_get_dma_mr;
  1218. dev->ib_dev.reg_user_mr = mlx5_ib_reg_user_mr;
  1219. dev->ib_dev.dereg_mr = mlx5_ib_dereg_mr;
  1220. dev->ib_dev.destroy_mr = mlx5_ib_destroy_mr;
  1221. dev->ib_dev.attach_mcast = mlx5_ib_mcg_attach;
  1222. dev->ib_dev.detach_mcast = mlx5_ib_mcg_detach;
  1223. dev->ib_dev.process_mad = mlx5_ib_process_mad;
  1224. dev->ib_dev.create_mr = mlx5_ib_create_mr;
  1225. dev->ib_dev.alloc_fast_reg_mr = mlx5_ib_alloc_fast_reg_mr;
  1226. dev->ib_dev.alloc_fast_reg_page_list = mlx5_ib_alloc_fast_reg_page_list;
  1227. dev->ib_dev.free_fast_reg_page_list = mlx5_ib_free_fast_reg_page_list;
  1228. dev->ib_dev.check_mr_status = mlx5_ib_check_mr_status;
  1229. if (mdev->caps.flags & MLX5_DEV_CAP_FLAG_XRC) {
  1230. dev->ib_dev.alloc_xrcd = mlx5_ib_alloc_xrcd;
  1231. dev->ib_dev.dealloc_xrcd = mlx5_ib_dealloc_xrcd;
  1232. dev->ib_dev.uverbs_cmd_mask |=
  1233. (1ull << IB_USER_VERBS_CMD_OPEN_XRCD) |
  1234. (1ull << IB_USER_VERBS_CMD_CLOSE_XRCD);
  1235. }
  1236. err = init_node_data(dev);
  1237. if (err)
  1238. goto err_eqs;
  1239. mutex_init(&dev->cap_mask_mutex);
  1240. spin_lock_init(&dev->mr_lock);
  1241. err = create_dev_resources(&dev->devr);
  1242. if (err)
  1243. goto err_eqs;
  1244. err = ib_register_device(&dev->ib_dev, NULL);
  1245. if (err)
  1246. goto err_rsrc;
  1247. err = create_umr_res(dev);
  1248. if (err)
  1249. goto err_dev;
  1250. for (i = 0; i < ARRAY_SIZE(mlx5_class_attributes); i++) {
  1251. err = device_create_file(&dev->ib_dev.dev,
  1252. mlx5_class_attributes[i]);
  1253. if (err)
  1254. goto err_umrc;
  1255. }
  1256. dev->ib_active = true;
  1257. return 0;
  1258. err_umrc:
  1259. destroy_umrc_res(dev);
  1260. err_dev:
  1261. ib_unregister_device(&dev->ib_dev);
  1262. err_rsrc:
  1263. destroy_dev_resources(&dev->devr);
  1264. err_eqs:
  1265. free_comp_eqs(dev);
  1266. err_cleanup:
  1267. mlx5_dev_cleanup(mdev);
  1268. err_free:
  1269. ib_dealloc_device((struct ib_device *)dev);
  1270. return err;
  1271. }
  1272. static void remove_one(struct pci_dev *pdev)
  1273. {
  1274. struct mlx5_ib_dev *dev = mlx5_pci2ibdev(pdev);
  1275. destroy_umrc_res(dev);
  1276. ib_unregister_device(&dev->ib_dev);
  1277. destroy_dev_resources(&dev->devr);
  1278. free_comp_eqs(dev);
  1279. mlx5_dev_cleanup(&dev->mdev);
  1280. ib_dealloc_device(&dev->ib_dev);
  1281. }
  1282. static DEFINE_PCI_DEVICE_TABLE(mlx5_ib_pci_table) = {
  1283. { PCI_VDEVICE(MELLANOX, 4113) }, /* MT4113 Connect-IB */
  1284. { 0, }
  1285. };
  1286. MODULE_DEVICE_TABLE(pci, mlx5_ib_pci_table);
  1287. static struct pci_driver mlx5_ib_driver = {
  1288. .name = DRIVER_NAME,
  1289. .id_table = mlx5_ib_pci_table,
  1290. .probe = init_one,
  1291. .remove = remove_one
  1292. };
  1293. static int __init mlx5_ib_init(void)
  1294. {
  1295. return pci_register_driver(&mlx5_ib_driver);
  1296. }
  1297. static void __exit mlx5_ib_cleanup(void)
  1298. {
  1299. pci_unregister_driver(&mlx5_ib_driver);
  1300. }
  1301. module_init(mlx5_ib_init);
  1302. module_exit(mlx5_ib_cleanup);