hns_roce_mr.c 32 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399
  1. /*
  2. * Copyright (c) 2016 Hisilicon Limited.
  3. * Copyright (c) 2007, 2008 Mellanox Technologies. All rights reserved.
  4. *
  5. * This software is available to you under a choice of one of two
  6. * licenses. You may choose to be licensed under the terms of the GNU
  7. * General Public License (GPL) Version 2, available from the file
  8. * COPYING in the main directory of this source tree, or the
  9. * OpenIB.org BSD license below:
  10. *
  11. * Redistribution and use in source and binary forms, with or
  12. * without modification, are permitted provided that the following
  13. * conditions are met:
  14. *
  15. * - Redistributions of source code must retain the above
  16. * copyright notice, this list of conditions and the following
  17. * disclaimer.
  18. *
  19. * - Redistributions in binary form must reproduce the above
  20. * copyright notice, this list of conditions and the following
  21. * disclaimer in the documentation and/or other materials
  22. * provided with the distribution.
  23. *
  24. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  25. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  26. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  27. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  28. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  29. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  30. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  31. * SOFTWARE.
  32. */
  33. #include <linux/platform_device.h>
  34. #include <linux/vmalloc.h>
  35. #include <rdma/ib_umem.h>
  36. #include "hns_roce_device.h"
  37. #include "hns_roce_cmd.h"
  38. #include "hns_roce_hem.h"
  39. static u32 hw_index_to_key(unsigned long ind)
  40. {
  41. return (u32)(ind >> 24) | (ind << 8);
  42. }
  43. unsigned long key_to_hw_index(u32 key)
  44. {
  45. return (key << 24) | (key >> 8);
  46. }
  47. EXPORT_SYMBOL_GPL(key_to_hw_index);
  48. static int hns_roce_sw2hw_mpt(struct hns_roce_dev *hr_dev,
  49. struct hns_roce_cmd_mailbox *mailbox,
  50. unsigned long mpt_index)
  51. {
  52. return hns_roce_cmd_mbox(hr_dev, mailbox->dma, 0, mpt_index, 0,
  53. HNS_ROCE_CMD_SW2HW_MPT,
  54. HNS_ROCE_CMD_TIMEOUT_MSECS);
  55. }
  56. int hns_roce_hw2sw_mpt(struct hns_roce_dev *hr_dev,
  57. struct hns_roce_cmd_mailbox *mailbox,
  58. unsigned long mpt_index)
  59. {
  60. return hns_roce_cmd_mbox(hr_dev, 0, mailbox ? mailbox->dma : 0,
  61. mpt_index, !mailbox, HNS_ROCE_CMD_HW2SW_MPT,
  62. HNS_ROCE_CMD_TIMEOUT_MSECS);
  63. }
  64. EXPORT_SYMBOL_GPL(hns_roce_hw2sw_mpt);
  65. static int hns_roce_buddy_alloc(struct hns_roce_buddy *buddy, int order,
  66. unsigned long *seg)
  67. {
  68. int o;
  69. u32 m;
  70. spin_lock(&buddy->lock);
  71. for (o = order; o <= buddy->max_order; ++o) {
  72. if (buddy->num_free[o]) {
  73. m = 1 << (buddy->max_order - o);
  74. *seg = find_first_bit(buddy->bits[o], m);
  75. if (*seg < m)
  76. goto found;
  77. }
  78. }
  79. spin_unlock(&buddy->lock);
  80. return -1;
  81. found:
  82. clear_bit(*seg, buddy->bits[o]);
  83. --buddy->num_free[o];
  84. while (o > order) {
  85. --o;
  86. *seg <<= 1;
  87. set_bit(*seg ^ 1, buddy->bits[o]);
  88. ++buddy->num_free[o];
  89. }
  90. spin_unlock(&buddy->lock);
  91. *seg <<= order;
  92. return 0;
  93. }
  94. static void hns_roce_buddy_free(struct hns_roce_buddy *buddy, unsigned long seg,
  95. int order)
  96. {
  97. seg >>= order;
  98. spin_lock(&buddy->lock);
  99. while (test_bit(seg ^ 1, buddy->bits[order])) {
  100. clear_bit(seg ^ 1, buddy->bits[order]);
  101. --buddy->num_free[order];
  102. seg >>= 1;
  103. ++order;
  104. }
  105. set_bit(seg, buddy->bits[order]);
  106. ++buddy->num_free[order];
  107. spin_unlock(&buddy->lock);
  108. }
  109. static int hns_roce_buddy_init(struct hns_roce_buddy *buddy, int max_order)
  110. {
  111. int i, s;
  112. buddy->max_order = max_order;
  113. spin_lock_init(&buddy->lock);
  114. buddy->bits = kcalloc(buddy->max_order + 1,
  115. sizeof(*buddy->bits),
  116. GFP_KERNEL);
  117. buddy->num_free = kcalloc(buddy->max_order + 1,
  118. sizeof(*buddy->num_free),
  119. GFP_KERNEL);
  120. if (!buddy->bits || !buddy->num_free)
  121. goto err_out;
  122. for (i = 0; i <= buddy->max_order; ++i) {
  123. s = BITS_TO_LONGS(1 << (buddy->max_order - i));
  124. buddy->bits[i] = kcalloc(s, sizeof(long), GFP_KERNEL |
  125. __GFP_NOWARN);
  126. if (!buddy->bits[i]) {
  127. buddy->bits[i] = vzalloc(array_size(s, sizeof(long)));
  128. if (!buddy->bits[i])
  129. goto err_out_free;
  130. }
  131. }
  132. set_bit(0, buddy->bits[buddy->max_order]);
  133. buddy->num_free[buddy->max_order] = 1;
  134. return 0;
  135. err_out_free:
  136. for (i = 0; i <= buddy->max_order; ++i)
  137. kvfree(buddy->bits[i]);
  138. err_out:
  139. kfree(buddy->bits);
  140. kfree(buddy->num_free);
  141. return -ENOMEM;
  142. }
  143. static void hns_roce_buddy_cleanup(struct hns_roce_buddy *buddy)
  144. {
  145. int i;
  146. for (i = 0; i <= buddy->max_order; ++i)
  147. kvfree(buddy->bits[i]);
  148. kfree(buddy->bits);
  149. kfree(buddy->num_free);
  150. }
  151. static int hns_roce_alloc_mtt_range(struct hns_roce_dev *hr_dev, int order,
  152. unsigned long *seg, u32 mtt_type)
  153. {
  154. struct hns_roce_mr_table *mr_table = &hr_dev->mr_table;
  155. struct hns_roce_hem_table *table;
  156. struct hns_roce_buddy *buddy;
  157. int ret;
  158. if (mtt_type == MTT_TYPE_WQE) {
  159. buddy = &mr_table->mtt_buddy;
  160. table = &mr_table->mtt_table;
  161. } else {
  162. buddy = &mr_table->mtt_cqe_buddy;
  163. table = &mr_table->mtt_cqe_table;
  164. }
  165. ret = hns_roce_buddy_alloc(buddy, order, seg);
  166. if (ret == -1)
  167. return -1;
  168. if (hns_roce_table_get_range(hr_dev, table, *seg,
  169. *seg + (1 << order) - 1)) {
  170. hns_roce_buddy_free(buddy, *seg, order);
  171. return -1;
  172. }
  173. return 0;
  174. }
  175. int hns_roce_mtt_init(struct hns_roce_dev *hr_dev, int npages, int page_shift,
  176. struct hns_roce_mtt *mtt)
  177. {
  178. int ret;
  179. int i;
  180. /* Page num is zero, correspond to DMA memory register */
  181. if (!npages) {
  182. mtt->order = -1;
  183. mtt->page_shift = HNS_ROCE_HEM_PAGE_SHIFT;
  184. return 0;
  185. }
  186. /* Note: if page_shift is zero, FAST memory register */
  187. mtt->page_shift = page_shift;
  188. /* Compute MTT entry necessary */
  189. for (mtt->order = 0, i = HNS_ROCE_MTT_ENTRY_PER_SEG; i < npages;
  190. i <<= 1)
  191. ++mtt->order;
  192. /* Allocate MTT entry */
  193. ret = hns_roce_alloc_mtt_range(hr_dev, mtt->order, &mtt->first_seg,
  194. mtt->mtt_type);
  195. if (ret == -1)
  196. return -ENOMEM;
  197. return 0;
  198. }
  199. void hns_roce_mtt_cleanup(struct hns_roce_dev *hr_dev, struct hns_roce_mtt *mtt)
  200. {
  201. struct hns_roce_mr_table *mr_table = &hr_dev->mr_table;
  202. if (mtt->order < 0)
  203. return;
  204. if (mtt->mtt_type == MTT_TYPE_WQE) {
  205. hns_roce_buddy_free(&mr_table->mtt_buddy, mtt->first_seg,
  206. mtt->order);
  207. hns_roce_table_put_range(hr_dev, &mr_table->mtt_table,
  208. mtt->first_seg,
  209. mtt->first_seg + (1 << mtt->order) - 1);
  210. } else {
  211. hns_roce_buddy_free(&mr_table->mtt_cqe_buddy, mtt->first_seg,
  212. mtt->order);
  213. hns_roce_table_put_range(hr_dev, &mr_table->mtt_cqe_table,
  214. mtt->first_seg,
  215. mtt->first_seg + (1 << mtt->order) - 1);
  216. }
  217. }
  218. EXPORT_SYMBOL_GPL(hns_roce_mtt_cleanup);
  219. static void hns_roce_loop_free(struct hns_roce_dev *hr_dev,
  220. struct hns_roce_mr *mr, int err_loop_index,
  221. int loop_i, int loop_j)
  222. {
  223. struct device *dev = hr_dev->dev;
  224. u32 mhop_num;
  225. u32 pbl_bt_sz;
  226. u64 bt_idx;
  227. int i, j;
  228. pbl_bt_sz = 1 << (hr_dev->caps.pbl_ba_pg_sz + PAGE_SHIFT);
  229. mhop_num = hr_dev->caps.pbl_hop_num;
  230. i = loop_i;
  231. if (mhop_num == 3 && err_loop_index == 2) {
  232. for (; i >= 0; i--) {
  233. dma_free_coherent(dev, pbl_bt_sz, mr->pbl_bt_l1[i],
  234. mr->pbl_l1_dma_addr[i]);
  235. for (j = 0; j < pbl_bt_sz / 8; j++) {
  236. if (i == loop_i && j >= loop_j)
  237. break;
  238. bt_idx = i * pbl_bt_sz / 8 + j;
  239. dma_free_coherent(dev, pbl_bt_sz,
  240. mr->pbl_bt_l2[bt_idx],
  241. mr->pbl_l2_dma_addr[bt_idx]);
  242. }
  243. }
  244. } else if (mhop_num == 3 && err_loop_index == 1) {
  245. for (i -= 1; i >= 0; i--) {
  246. dma_free_coherent(dev, pbl_bt_sz, mr->pbl_bt_l1[i],
  247. mr->pbl_l1_dma_addr[i]);
  248. for (j = 0; j < pbl_bt_sz / 8; j++) {
  249. bt_idx = i * pbl_bt_sz / 8 + j;
  250. dma_free_coherent(dev, pbl_bt_sz,
  251. mr->pbl_bt_l2[bt_idx],
  252. mr->pbl_l2_dma_addr[bt_idx]);
  253. }
  254. }
  255. } else if (mhop_num == 2 && err_loop_index == 1) {
  256. for (i -= 1; i >= 0; i--)
  257. dma_free_coherent(dev, pbl_bt_sz, mr->pbl_bt_l1[i],
  258. mr->pbl_l1_dma_addr[i]);
  259. } else {
  260. dev_warn(dev, "not support: mhop_num=%d, err_loop_index=%d.",
  261. mhop_num, err_loop_index);
  262. return;
  263. }
  264. dma_free_coherent(dev, pbl_bt_sz, mr->pbl_bt_l0, mr->pbl_l0_dma_addr);
  265. mr->pbl_bt_l0 = NULL;
  266. mr->pbl_l0_dma_addr = 0;
  267. }
  268. /* PBL multi hop addressing */
  269. static int hns_roce_mhop_alloc(struct hns_roce_dev *hr_dev, int npages,
  270. struct hns_roce_mr *mr)
  271. {
  272. struct device *dev = hr_dev->dev;
  273. int mr_alloc_done = 0;
  274. int npages_allocated;
  275. int i = 0, j = 0;
  276. u32 pbl_bt_sz;
  277. u32 mhop_num;
  278. u64 pbl_last_bt_num;
  279. u64 pbl_bt_cnt = 0;
  280. u64 bt_idx;
  281. u64 size;
  282. mhop_num = (mr->type == MR_TYPE_FRMR ? 1 : hr_dev->caps.pbl_hop_num);
  283. pbl_bt_sz = 1 << (hr_dev->caps.pbl_ba_pg_sz + PAGE_SHIFT);
  284. pbl_last_bt_num = (npages + pbl_bt_sz / 8 - 1) / (pbl_bt_sz / 8);
  285. if (mhop_num == HNS_ROCE_HOP_NUM_0)
  286. return 0;
  287. /* hop_num = 1 */
  288. if (mhop_num == 1) {
  289. if (npages > pbl_bt_sz / 8) {
  290. dev_err(dev, "npages %d is larger than buf_pg_sz!",
  291. npages);
  292. return -EINVAL;
  293. }
  294. mr->pbl_buf = dma_alloc_coherent(dev, npages * 8,
  295. &(mr->pbl_dma_addr),
  296. GFP_KERNEL);
  297. if (!mr->pbl_buf)
  298. return -ENOMEM;
  299. mr->pbl_size = npages;
  300. mr->pbl_ba = mr->pbl_dma_addr;
  301. mr->pbl_hop_num = mhop_num;
  302. mr->pbl_ba_pg_sz = hr_dev->caps.pbl_ba_pg_sz;
  303. mr->pbl_buf_pg_sz = hr_dev->caps.pbl_buf_pg_sz;
  304. return 0;
  305. }
  306. mr->pbl_l1_dma_addr = kcalloc(pbl_bt_sz / 8,
  307. sizeof(*mr->pbl_l1_dma_addr),
  308. GFP_KERNEL);
  309. if (!mr->pbl_l1_dma_addr)
  310. return -ENOMEM;
  311. mr->pbl_bt_l1 = kcalloc(pbl_bt_sz / 8, sizeof(*mr->pbl_bt_l1),
  312. GFP_KERNEL);
  313. if (!mr->pbl_bt_l1)
  314. goto err_kcalloc_bt_l1;
  315. if (mhop_num == 3) {
  316. mr->pbl_l2_dma_addr = kcalloc(pbl_last_bt_num,
  317. sizeof(*mr->pbl_l2_dma_addr),
  318. GFP_KERNEL);
  319. if (!mr->pbl_l2_dma_addr)
  320. goto err_kcalloc_l2_dma;
  321. mr->pbl_bt_l2 = kcalloc(pbl_last_bt_num,
  322. sizeof(*mr->pbl_bt_l2),
  323. GFP_KERNEL);
  324. if (!mr->pbl_bt_l2)
  325. goto err_kcalloc_bt_l2;
  326. }
  327. /* alloc L0 BT */
  328. mr->pbl_bt_l0 = dma_alloc_coherent(dev, pbl_bt_sz,
  329. &(mr->pbl_l0_dma_addr),
  330. GFP_KERNEL);
  331. if (!mr->pbl_bt_l0)
  332. goto err_dma_alloc_l0;
  333. if (mhop_num == 2) {
  334. /* alloc L1 BT */
  335. for (i = 0; i < pbl_bt_sz / 8; i++) {
  336. if (pbl_bt_cnt + 1 < pbl_last_bt_num) {
  337. size = pbl_bt_sz;
  338. } else {
  339. npages_allocated = i * (pbl_bt_sz / 8);
  340. size = (npages - npages_allocated) * 8;
  341. }
  342. mr->pbl_bt_l1[i] = dma_alloc_coherent(dev, size,
  343. &(mr->pbl_l1_dma_addr[i]),
  344. GFP_KERNEL);
  345. if (!mr->pbl_bt_l1[i]) {
  346. hns_roce_loop_free(hr_dev, mr, 1, i, 0);
  347. goto err_dma_alloc_l0;
  348. }
  349. *(mr->pbl_bt_l0 + i) = mr->pbl_l1_dma_addr[i];
  350. pbl_bt_cnt++;
  351. if (pbl_bt_cnt >= pbl_last_bt_num)
  352. break;
  353. }
  354. } else if (mhop_num == 3) {
  355. /* alloc L1, L2 BT */
  356. for (i = 0; i < pbl_bt_sz / 8; i++) {
  357. mr->pbl_bt_l1[i] = dma_alloc_coherent(dev, pbl_bt_sz,
  358. &(mr->pbl_l1_dma_addr[i]),
  359. GFP_KERNEL);
  360. if (!mr->pbl_bt_l1[i]) {
  361. hns_roce_loop_free(hr_dev, mr, 1, i, 0);
  362. goto err_dma_alloc_l0;
  363. }
  364. *(mr->pbl_bt_l0 + i) = mr->pbl_l1_dma_addr[i];
  365. for (j = 0; j < pbl_bt_sz / 8; j++) {
  366. bt_idx = i * pbl_bt_sz / 8 + j;
  367. if (pbl_bt_cnt + 1 < pbl_last_bt_num) {
  368. size = pbl_bt_sz;
  369. } else {
  370. npages_allocated = bt_idx *
  371. (pbl_bt_sz / 8);
  372. size = (npages - npages_allocated) * 8;
  373. }
  374. mr->pbl_bt_l2[bt_idx] = dma_alloc_coherent(
  375. dev, size,
  376. &(mr->pbl_l2_dma_addr[bt_idx]),
  377. GFP_KERNEL);
  378. if (!mr->pbl_bt_l2[bt_idx]) {
  379. hns_roce_loop_free(hr_dev, mr, 2, i, j);
  380. goto err_dma_alloc_l0;
  381. }
  382. *(mr->pbl_bt_l1[i] + j) =
  383. mr->pbl_l2_dma_addr[bt_idx];
  384. pbl_bt_cnt++;
  385. if (pbl_bt_cnt >= pbl_last_bt_num) {
  386. mr_alloc_done = 1;
  387. break;
  388. }
  389. }
  390. if (mr_alloc_done)
  391. break;
  392. }
  393. }
  394. mr->l0_chunk_last_num = i + 1;
  395. if (mhop_num == 3)
  396. mr->l1_chunk_last_num = j + 1;
  397. mr->pbl_size = npages;
  398. mr->pbl_ba = mr->pbl_l0_dma_addr;
  399. mr->pbl_hop_num = hr_dev->caps.pbl_hop_num;
  400. mr->pbl_ba_pg_sz = hr_dev->caps.pbl_ba_pg_sz;
  401. mr->pbl_buf_pg_sz = hr_dev->caps.pbl_buf_pg_sz;
  402. return 0;
  403. err_dma_alloc_l0:
  404. kfree(mr->pbl_bt_l2);
  405. mr->pbl_bt_l2 = NULL;
  406. err_kcalloc_bt_l2:
  407. kfree(mr->pbl_l2_dma_addr);
  408. mr->pbl_l2_dma_addr = NULL;
  409. err_kcalloc_l2_dma:
  410. kfree(mr->pbl_bt_l1);
  411. mr->pbl_bt_l1 = NULL;
  412. err_kcalloc_bt_l1:
  413. kfree(mr->pbl_l1_dma_addr);
  414. mr->pbl_l1_dma_addr = NULL;
  415. return -ENOMEM;
  416. }
  417. static int hns_roce_mr_alloc(struct hns_roce_dev *hr_dev, u32 pd, u64 iova,
  418. u64 size, u32 access, int npages,
  419. struct hns_roce_mr *mr)
  420. {
  421. struct device *dev = hr_dev->dev;
  422. unsigned long index = 0;
  423. int ret = 0;
  424. /* Allocate a key for mr from mr_table */
  425. ret = hns_roce_bitmap_alloc(&hr_dev->mr_table.mtpt_bitmap, &index);
  426. if (ret == -1)
  427. return -ENOMEM;
  428. mr->iova = iova; /* MR va starting addr */
  429. mr->size = size; /* MR addr range */
  430. mr->pd = pd; /* MR num */
  431. mr->access = access; /* MR access permit */
  432. mr->enabled = 0; /* MR active status */
  433. mr->key = hw_index_to_key(index); /* MR key */
  434. if (size == ~0ull) {
  435. mr->pbl_buf = NULL;
  436. mr->pbl_dma_addr = 0;
  437. /* PBL multi-hop addressing parameters */
  438. mr->pbl_bt_l2 = NULL;
  439. mr->pbl_bt_l1 = NULL;
  440. mr->pbl_bt_l0 = NULL;
  441. mr->pbl_l2_dma_addr = NULL;
  442. mr->pbl_l1_dma_addr = NULL;
  443. mr->pbl_l0_dma_addr = 0;
  444. } else {
  445. if (!hr_dev->caps.pbl_hop_num) {
  446. mr->pbl_buf = dma_alloc_coherent(dev, npages * 8,
  447. &(mr->pbl_dma_addr),
  448. GFP_KERNEL);
  449. if (!mr->pbl_buf)
  450. return -ENOMEM;
  451. } else {
  452. ret = hns_roce_mhop_alloc(hr_dev, npages, mr);
  453. }
  454. }
  455. return ret;
  456. }
  457. static void hns_roce_mhop_free(struct hns_roce_dev *hr_dev,
  458. struct hns_roce_mr *mr)
  459. {
  460. struct device *dev = hr_dev->dev;
  461. int npages_allocated;
  462. int npages;
  463. int i, j;
  464. u32 pbl_bt_sz;
  465. u32 mhop_num;
  466. u64 bt_idx;
  467. npages = mr->pbl_size;
  468. pbl_bt_sz = 1 << (hr_dev->caps.pbl_ba_pg_sz + PAGE_SHIFT);
  469. mhop_num = (mr->type == MR_TYPE_FRMR) ? 1 : hr_dev->caps.pbl_hop_num;
  470. if (mhop_num == HNS_ROCE_HOP_NUM_0)
  471. return;
  472. /* hop_num = 1 */
  473. if (mhop_num == 1) {
  474. dma_free_coherent(dev, (unsigned int)(npages * 8),
  475. mr->pbl_buf, mr->pbl_dma_addr);
  476. return;
  477. }
  478. dma_free_coherent(dev, pbl_bt_sz, mr->pbl_bt_l0,
  479. mr->pbl_l0_dma_addr);
  480. if (mhop_num == 2) {
  481. for (i = 0; i < mr->l0_chunk_last_num; i++) {
  482. if (i == mr->l0_chunk_last_num - 1) {
  483. npages_allocated = i * (pbl_bt_sz / 8);
  484. dma_free_coherent(dev,
  485. (npages - npages_allocated) * 8,
  486. mr->pbl_bt_l1[i],
  487. mr->pbl_l1_dma_addr[i]);
  488. break;
  489. }
  490. dma_free_coherent(dev, pbl_bt_sz, mr->pbl_bt_l1[i],
  491. mr->pbl_l1_dma_addr[i]);
  492. }
  493. } else if (mhop_num == 3) {
  494. for (i = 0; i < mr->l0_chunk_last_num; i++) {
  495. dma_free_coherent(dev, pbl_bt_sz, mr->pbl_bt_l1[i],
  496. mr->pbl_l1_dma_addr[i]);
  497. for (j = 0; j < pbl_bt_sz / 8; j++) {
  498. bt_idx = i * (pbl_bt_sz / 8) + j;
  499. if ((i == mr->l0_chunk_last_num - 1)
  500. && j == mr->l1_chunk_last_num - 1) {
  501. npages_allocated = bt_idx *
  502. (pbl_bt_sz / 8);
  503. dma_free_coherent(dev,
  504. (npages - npages_allocated) * 8,
  505. mr->pbl_bt_l2[bt_idx],
  506. mr->pbl_l2_dma_addr[bt_idx]);
  507. break;
  508. }
  509. dma_free_coherent(dev, pbl_bt_sz,
  510. mr->pbl_bt_l2[bt_idx],
  511. mr->pbl_l2_dma_addr[bt_idx]);
  512. }
  513. }
  514. }
  515. kfree(mr->pbl_bt_l1);
  516. kfree(mr->pbl_l1_dma_addr);
  517. mr->pbl_bt_l1 = NULL;
  518. mr->pbl_l1_dma_addr = NULL;
  519. if (mhop_num == 3) {
  520. kfree(mr->pbl_bt_l2);
  521. kfree(mr->pbl_l2_dma_addr);
  522. mr->pbl_bt_l2 = NULL;
  523. mr->pbl_l2_dma_addr = NULL;
  524. }
  525. }
  526. static void hns_roce_mr_free(struct hns_roce_dev *hr_dev,
  527. struct hns_roce_mr *mr)
  528. {
  529. struct device *dev = hr_dev->dev;
  530. int npages = 0;
  531. int ret;
  532. if (mr->enabled) {
  533. ret = hns_roce_hw2sw_mpt(hr_dev, NULL, key_to_hw_index(mr->key)
  534. & (hr_dev->caps.num_mtpts - 1));
  535. if (ret)
  536. dev_warn(dev, "HW2SW_MPT failed (%d)\n", ret);
  537. }
  538. if (mr->size != ~0ULL) {
  539. if (mr->type == MR_TYPE_MR)
  540. npages = ib_umem_page_count(mr->umem);
  541. if (!hr_dev->caps.pbl_hop_num)
  542. dma_free_coherent(dev, (unsigned int)(npages * 8),
  543. mr->pbl_buf, mr->pbl_dma_addr);
  544. else
  545. hns_roce_mhop_free(hr_dev, mr);
  546. }
  547. if (mr->enabled)
  548. hns_roce_table_put(hr_dev, &hr_dev->mr_table.mtpt_table,
  549. key_to_hw_index(mr->key));
  550. hns_roce_bitmap_free(&hr_dev->mr_table.mtpt_bitmap,
  551. key_to_hw_index(mr->key), BITMAP_NO_RR);
  552. }
  553. static int hns_roce_mr_enable(struct hns_roce_dev *hr_dev,
  554. struct hns_roce_mr *mr)
  555. {
  556. int ret;
  557. unsigned long mtpt_idx = key_to_hw_index(mr->key);
  558. struct device *dev = hr_dev->dev;
  559. struct hns_roce_cmd_mailbox *mailbox;
  560. struct hns_roce_mr_table *mr_table = &hr_dev->mr_table;
  561. /* Prepare HEM entry memory */
  562. ret = hns_roce_table_get(hr_dev, &mr_table->mtpt_table, mtpt_idx);
  563. if (ret)
  564. return ret;
  565. /* Allocate mailbox memory */
  566. mailbox = hns_roce_alloc_cmd_mailbox(hr_dev);
  567. if (IS_ERR(mailbox)) {
  568. ret = PTR_ERR(mailbox);
  569. goto err_table;
  570. }
  571. if (mr->type != MR_TYPE_FRMR)
  572. ret = hr_dev->hw->write_mtpt(mailbox->buf, mr, mtpt_idx);
  573. else
  574. ret = hr_dev->hw->frmr_write_mtpt(mailbox->buf, mr);
  575. if (ret) {
  576. dev_err(dev, "Write mtpt fail!\n");
  577. goto err_page;
  578. }
  579. ret = hns_roce_sw2hw_mpt(hr_dev, mailbox,
  580. mtpt_idx & (hr_dev->caps.num_mtpts - 1));
  581. if (ret) {
  582. dev_err(dev, "SW2HW_MPT failed (%d)\n", ret);
  583. goto err_page;
  584. }
  585. mr->enabled = 1;
  586. hns_roce_free_cmd_mailbox(hr_dev, mailbox);
  587. return 0;
  588. err_page:
  589. hns_roce_free_cmd_mailbox(hr_dev, mailbox);
  590. err_table:
  591. hns_roce_table_put(hr_dev, &mr_table->mtpt_table, mtpt_idx);
  592. return ret;
  593. }
  594. static int hns_roce_write_mtt_chunk(struct hns_roce_dev *hr_dev,
  595. struct hns_roce_mtt *mtt, u32 start_index,
  596. u32 npages, u64 *page_list)
  597. {
  598. struct hns_roce_hem_table *table;
  599. dma_addr_t dma_handle;
  600. __le64 *mtts;
  601. u32 s = start_index * sizeof(u64);
  602. u32 bt_page_size;
  603. u32 i;
  604. if (mtt->mtt_type == MTT_TYPE_WQE)
  605. bt_page_size = 1 << (hr_dev->caps.mtt_ba_pg_sz + PAGE_SHIFT);
  606. else
  607. bt_page_size = 1 << (hr_dev->caps.cqe_ba_pg_sz + PAGE_SHIFT);
  608. /* All MTTs must fit in the same page */
  609. if (start_index / (bt_page_size / sizeof(u64)) !=
  610. (start_index + npages - 1) / (bt_page_size / sizeof(u64)))
  611. return -EINVAL;
  612. if (start_index & (HNS_ROCE_MTT_ENTRY_PER_SEG - 1))
  613. return -EINVAL;
  614. if (mtt->mtt_type == MTT_TYPE_WQE)
  615. table = &hr_dev->mr_table.mtt_table;
  616. else
  617. table = &hr_dev->mr_table.mtt_cqe_table;
  618. mtts = hns_roce_table_find(hr_dev, table,
  619. mtt->first_seg + s / hr_dev->caps.mtt_entry_sz,
  620. &dma_handle);
  621. if (!mtts)
  622. return -ENOMEM;
  623. /* Save page addr, low 12 bits : 0 */
  624. for (i = 0; i < npages; ++i) {
  625. if (!hr_dev->caps.mtt_hop_num)
  626. mtts[i] = cpu_to_le64(page_list[i] >> PAGE_ADDR_SHIFT);
  627. else
  628. mtts[i] = cpu_to_le64(page_list[i]);
  629. }
  630. return 0;
  631. }
  632. static int hns_roce_write_mtt(struct hns_roce_dev *hr_dev,
  633. struct hns_roce_mtt *mtt, u32 start_index,
  634. u32 npages, u64 *page_list)
  635. {
  636. int chunk;
  637. int ret;
  638. u32 bt_page_size;
  639. if (mtt->order < 0)
  640. return -EINVAL;
  641. if (mtt->mtt_type == MTT_TYPE_WQE)
  642. bt_page_size = 1 << (hr_dev->caps.mtt_ba_pg_sz + PAGE_SHIFT);
  643. else
  644. bt_page_size = 1 << (hr_dev->caps.cqe_ba_pg_sz + PAGE_SHIFT);
  645. while (npages > 0) {
  646. chunk = min_t(int, bt_page_size / sizeof(u64), npages);
  647. ret = hns_roce_write_mtt_chunk(hr_dev, mtt, start_index, chunk,
  648. page_list);
  649. if (ret)
  650. return ret;
  651. npages -= chunk;
  652. start_index += chunk;
  653. page_list += chunk;
  654. }
  655. return 0;
  656. }
  657. int hns_roce_buf_write_mtt(struct hns_roce_dev *hr_dev,
  658. struct hns_roce_mtt *mtt, struct hns_roce_buf *buf)
  659. {
  660. u64 *page_list;
  661. int ret;
  662. u32 i;
  663. page_list = kmalloc_array(buf->npages, sizeof(*page_list), GFP_KERNEL);
  664. if (!page_list)
  665. return -ENOMEM;
  666. for (i = 0; i < buf->npages; ++i) {
  667. if (buf->nbufs == 1)
  668. page_list[i] = buf->direct.map + (i << buf->page_shift);
  669. else
  670. page_list[i] = buf->page_list[i].map;
  671. }
  672. ret = hns_roce_write_mtt(hr_dev, mtt, 0, buf->npages, page_list);
  673. kfree(page_list);
  674. return ret;
  675. }
  676. int hns_roce_init_mr_table(struct hns_roce_dev *hr_dev)
  677. {
  678. struct hns_roce_mr_table *mr_table = &hr_dev->mr_table;
  679. int ret;
  680. ret = hns_roce_bitmap_init(&mr_table->mtpt_bitmap,
  681. hr_dev->caps.num_mtpts,
  682. hr_dev->caps.num_mtpts - 1,
  683. hr_dev->caps.reserved_mrws, 0);
  684. if (ret)
  685. return ret;
  686. ret = hns_roce_buddy_init(&mr_table->mtt_buddy,
  687. ilog2(hr_dev->caps.num_mtt_segs));
  688. if (ret)
  689. goto err_buddy;
  690. if (hns_roce_check_whether_mhop(hr_dev, HEM_TYPE_CQE)) {
  691. ret = hns_roce_buddy_init(&mr_table->mtt_cqe_buddy,
  692. ilog2(hr_dev->caps.num_cqe_segs));
  693. if (ret)
  694. goto err_buddy_cqe;
  695. }
  696. return 0;
  697. err_buddy_cqe:
  698. hns_roce_buddy_cleanup(&mr_table->mtt_buddy);
  699. err_buddy:
  700. hns_roce_bitmap_cleanup(&mr_table->mtpt_bitmap);
  701. return ret;
  702. }
  703. void hns_roce_cleanup_mr_table(struct hns_roce_dev *hr_dev)
  704. {
  705. struct hns_roce_mr_table *mr_table = &hr_dev->mr_table;
  706. hns_roce_buddy_cleanup(&mr_table->mtt_buddy);
  707. if (hns_roce_check_whether_mhop(hr_dev, HEM_TYPE_CQE))
  708. hns_roce_buddy_cleanup(&mr_table->mtt_cqe_buddy);
  709. hns_roce_bitmap_cleanup(&mr_table->mtpt_bitmap);
  710. }
  711. struct ib_mr *hns_roce_get_dma_mr(struct ib_pd *pd, int acc)
  712. {
  713. struct hns_roce_mr *mr;
  714. int ret;
  715. mr = kmalloc(sizeof(*mr), GFP_KERNEL);
  716. if (mr == NULL)
  717. return ERR_PTR(-ENOMEM);
  718. mr->type = MR_TYPE_DMA;
  719. /* Allocate memory region key */
  720. ret = hns_roce_mr_alloc(to_hr_dev(pd->device), to_hr_pd(pd)->pdn, 0,
  721. ~0ULL, acc, 0, mr);
  722. if (ret)
  723. goto err_free;
  724. ret = hns_roce_mr_enable(to_hr_dev(pd->device), mr);
  725. if (ret)
  726. goto err_mr;
  727. mr->ibmr.rkey = mr->ibmr.lkey = mr->key;
  728. mr->umem = NULL;
  729. return &mr->ibmr;
  730. err_mr:
  731. hns_roce_mr_free(to_hr_dev(pd->device), mr);
  732. err_free:
  733. kfree(mr);
  734. return ERR_PTR(ret);
  735. }
  736. int hns_roce_ib_umem_write_mtt(struct hns_roce_dev *hr_dev,
  737. struct hns_roce_mtt *mtt, struct ib_umem *umem)
  738. {
  739. struct device *dev = hr_dev->dev;
  740. struct scatterlist *sg;
  741. unsigned int order;
  742. int i, k, entry;
  743. int npage = 0;
  744. int ret = 0;
  745. int len;
  746. u64 page_addr;
  747. u64 *pages;
  748. u32 bt_page_size;
  749. u32 n;
  750. order = mtt->mtt_type == MTT_TYPE_WQE ? hr_dev->caps.mtt_ba_pg_sz :
  751. hr_dev->caps.cqe_ba_pg_sz;
  752. bt_page_size = 1 << (order + PAGE_SHIFT);
  753. pages = (u64 *) __get_free_pages(GFP_KERNEL, order);
  754. if (!pages)
  755. return -ENOMEM;
  756. i = n = 0;
  757. for_each_sg(umem->sg_head.sgl, sg, umem->nmap, entry) {
  758. len = sg_dma_len(sg) >> PAGE_SHIFT;
  759. for (k = 0; k < len; ++k) {
  760. page_addr =
  761. sg_dma_address(sg) + (k << umem->page_shift);
  762. if (!(npage % (1 << (mtt->page_shift - PAGE_SHIFT)))) {
  763. if (page_addr & ((1 << mtt->page_shift) - 1)) {
  764. dev_err(dev, "page_addr 0x%llx is not page_shift %d alignment!\n",
  765. page_addr, mtt->page_shift);
  766. ret = -EINVAL;
  767. goto out;
  768. }
  769. pages[i++] = page_addr;
  770. }
  771. npage++;
  772. if (i == bt_page_size / sizeof(u64)) {
  773. ret = hns_roce_write_mtt(hr_dev, mtt, n, i,
  774. pages);
  775. if (ret)
  776. goto out;
  777. n += i;
  778. i = 0;
  779. }
  780. }
  781. }
  782. if (i)
  783. ret = hns_roce_write_mtt(hr_dev, mtt, n, i, pages);
  784. out:
  785. free_pages((unsigned long) pages, order);
  786. return ret;
  787. }
  788. static int hns_roce_ib_umem_write_mr(struct hns_roce_dev *hr_dev,
  789. struct hns_roce_mr *mr,
  790. struct ib_umem *umem)
  791. {
  792. struct scatterlist *sg;
  793. int i = 0, j = 0, k;
  794. int entry;
  795. int len;
  796. u64 page_addr;
  797. u32 pbl_bt_sz;
  798. if (hr_dev->caps.pbl_hop_num == HNS_ROCE_HOP_NUM_0)
  799. return 0;
  800. pbl_bt_sz = 1 << (hr_dev->caps.pbl_ba_pg_sz + PAGE_SHIFT);
  801. for_each_sg(umem->sg_head.sgl, sg, umem->nmap, entry) {
  802. len = sg_dma_len(sg) >> PAGE_SHIFT;
  803. for (k = 0; k < len; ++k) {
  804. page_addr = sg_dma_address(sg) +
  805. (k << umem->page_shift);
  806. if (!hr_dev->caps.pbl_hop_num) {
  807. mr->pbl_buf[i++] = page_addr >> 12;
  808. } else if (hr_dev->caps.pbl_hop_num == 1) {
  809. mr->pbl_buf[i++] = page_addr;
  810. } else {
  811. if (hr_dev->caps.pbl_hop_num == 2)
  812. mr->pbl_bt_l1[i][j] = page_addr;
  813. else if (hr_dev->caps.pbl_hop_num == 3)
  814. mr->pbl_bt_l2[i][j] = page_addr;
  815. j++;
  816. if (j >= (pbl_bt_sz / 8)) {
  817. i++;
  818. j = 0;
  819. }
  820. }
  821. }
  822. }
  823. /* Memory barrier */
  824. mb();
  825. return 0;
  826. }
  827. struct ib_mr *hns_roce_reg_user_mr(struct ib_pd *pd, u64 start, u64 length,
  828. u64 virt_addr, int access_flags,
  829. struct ib_udata *udata)
  830. {
  831. struct hns_roce_dev *hr_dev = to_hr_dev(pd->device);
  832. struct device *dev = hr_dev->dev;
  833. struct hns_roce_mr *mr;
  834. int bt_size;
  835. int ret;
  836. int n;
  837. int i;
  838. mr = kmalloc(sizeof(*mr), GFP_KERNEL);
  839. if (!mr)
  840. return ERR_PTR(-ENOMEM);
  841. mr->umem = ib_umem_get(pd->uobject->context, start, length,
  842. access_flags, 0);
  843. if (IS_ERR(mr->umem)) {
  844. ret = PTR_ERR(mr->umem);
  845. goto err_free;
  846. }
  847. n = ib_umem_page_count(mr->umem);
  848. if (!hr_dev->caps.pbl_hop_num) {
  849. if (n > HNS_ROCE_MAX_MTPT_PBL_NUM) {
  850. dev_err(dev,
  851. " MR len %lld err. MR is limited to 4G at most!\n",
  852. length);
  853. ret = -EINVAL;
  854. goto err_umem;
  855. }
  856. } else {
  857. int pbl_size = 1;
  858. bt_size = (1 << (hr_dev->caps.pbl_ba_pg_sz + PAGE_SHIFT)) / 8;
  859. for (i = 0; i < hr_dev->caps.pbl_hop_num; i++)
  860. pbl_size *= bt_size;
  861. if (n > pbl_size) {
  862. dev_err(dev,
  863. " MR len %lld err. MR page num is limited to %d!\n",
  864. length, pbl_size);
  865. ret = -EINVAL;
  866. goto err_umem;
  867. }
  868. }
  869. mr->type = MR_TYPE_MR;
  870. ret = hns_roce_mr_alloc(hr_dev, to_hr_pd(pd)->pdn, virt_addr, length,
  871. access_flags, n, mr);
  872. if (ret)
  873. goto err_umem;
  874. ret = hns_roce_ib_umem_write_mr(hr_dev, mr, mr->umem);
  875. if (ret)
  876. goto err_mr;
  877. ret = hns_roce_mr_enable(hr_dev, mr);
  878. if (ret)
  879. goto err_mr;
  880. mr->ibmr.rkey = mr->ibmr.lkey = mr->key;
  881. return &mr->ibmr;
  882. err_mr:
  883. hns_roce_mr_free(hr_dev, mr);
  884. err_umem:
  885. ib_umem_release(mr->umem);
  886. err_free:
  887. kfree(mr);
  888. return ERR_PTR(ret);
  889. }
  890. int hns_roce_rereg_user_mr(struct ib_mr *ibmr, int flags, u64 start, u64 length,
  891. u64 virt_addr, int mr_access_flags, struct ib_pd *pd,
  892. struct ib_udata *udata)
  893. {
  894. struct hns_roce_dev *hr_dev = to_hr_dev(ibmr->device);
  895. struct hns_roce_mr *mr = to_hr_mr(ibmr);
  896. struct hns_roce_cmd_mailbox *mailbox;
  897. struct device *dev = hr_dev->dev;
  898. unsigned long mtpt_idx;
  899. u32 pdn = 0;
  900. int npages;
  901. int ret;
  902. if (!mr->enabled)
  903. return -EINVAL;
  904. mailbox = hns_roce_alloc_cmd_mailbox(hr_dev);
  905. if (IS_ERR(mailbox))
  906. return PTR_ERR(mailbox);
  907. mtpt_idx = key_to_hw_index(mr->key) & (hr_dev->caps.num_mtpts - 1);
  908. ret = hns_roce_cmd_mbox(hr_dev, 0, mailbox->dma, mtpt_idx, 0,
  909. HNS_ROCE_CMD_QUERY_MPT,
  910. HNS_ROCE_CMD_TIMEOUT_MSECS);
  911. if (ret)
  912. goto free_cmd_mbox;
  913. ret = hns_roce_hw2sw_mpt(hr_dev, NULL, mtpt_idx);
  914. if (ret)
  915. dev_warn(dev, "HW2SW_MPT failed (%d)\n", ret);
  916. mr->enabled = 0;
  917. if (flags & IB_MR_REREG_PD)
  918. pdn = to_hr_pd(pd)->pdn;
  919. if (flags & IB_MR_REREG_TRANS) {
  920. if (mr->size != ~0ULL) {
  921. npages = ib_umem_page_count(mr->umem);
  922. if (hr_dev->caps.pbl_hop_num)
  923. hns_roce_mhop_free(hr_dev, mr);
  924. else
  925. dma_free_coherent(dev, npages * 8, mr->pbl_buf,
  926. mr->pbl_dma_addr);
  927. }
  928. ib_umem_release(mr->umem);
  929. mr->umem = ib_umem_get(ibmr->uobject->context, start, length,
  930. mr_access_flags, 0);
  931. if (IS_ERR(mr->umem)) {
  932. ret = PTR_ERR(mr->umem);
  933. mr->umem = NULL;
  934. goto free_cmd_mbox;
  935. }
  936. npages = ib_umem_page_count(mr->umem);
  937. if (hr_dev->caps.pbl_hop_num) {
  938. ret = hns_roce_mhop_alloc(hr_dev, npages, mr);
  939. if (ret)
  940. goto release_umem;
  941. } else {
  942. mr->pbl_buf = dma_alloc_coherent(dev, npages * 8,
  943. &(mr->pbl_dma_addr),
  944. GFP_KERNEL);
  945. if (!mr->pbl_buf) {
  946. ret = -ENOMEM;
  947. goto release_umem;
  948. }
  949. }
  950. }
  951. ret = hr_dev->hw->rereg_write_mtpt(hr_dev, mr, flags, pdn,
  952. mr_access_flags, virt_addr,
  953. length, mailbox->buf);
  954. if (ret) {
  955. if (flags & IB_MR_REREG_TRANS)
  956. goto release_umem;
  957. else
  958. goto free_cmd_mbox;
  959. }
  960. if (flags & IB_MR_REREG_TRANS) {
  961. ret = hns_roce_ib_umem_write_mr(hr_dev, mr, mr->umem);
  962. if (ret) {
  963. if (mr->size != ~0ULL) {
  964. npages = ib_umem_page_count(mr->umem);
  965. if (hr_dev->caps.pbl_hop_num)
  966. hns_roce_mhop_free(hr_dev, mr);
  967. else
  968. dma_free_coherent(dev, npages * 8,
  969. mr->pbl_buf,
  970. mr->pbl_dma_addr);
  971. }
  972. goto release_umem;
  973. }
  974. }
  975. ret = hns_roce_sw2hw_mpt(hr_dev, mailbox, mtpt_idx);
  976. if (ret) {
  977. dev_err(dev, "SW2HW_MPT failed (%d)\n", ret);
  978. goto release_umem;
  979. }
  980. mr->enabled = 1;
  981. if (flags & IB_MR_REREG_ACCESS)
  982. mr->access = mr_access_flags;
  983. hns_roce_free_cmd_mailbox(hr_dev, mailbox);
  984. return 0;
  985. release_umem:
  986. ib_umem_release(mr->umem);
  987. free_cmd_mbox:
  988. hns_roce_free_cmd_mailbox(hr_dev, mailbox);
  989. return ret;
  990. }
  991. int hns_roce_dereg_mr(struct ib_mr *ibmr)
  992. {
  993. struct hns_roce_dev *hr_dev = to_hr_dev(ibmr->device);
  994. struct hns_roce_mr *mr = to_hr_mr(ibmr);
  995. int ret = 0;
  996. if (hr_dev->hw->dereg_mr) {
  997. ret = hr_dev->hw->dereg_mr(hr_dev, mr);
  998. } else {
  999. hns_roce_mr_free(hr_dev, mr);
  1000. if (mr->umem)
  1001. ib_umem_release(mr->umem);
  1002. kfree(mr);
  1003. }
  1004. return ret;
  1005. }
  1006. struct ib_mr *hns_roce_alloc_mr(struct ib_pd *pd, enum ib_mr_type mr_type,
  1007. u32 max_num_sg)
  1008. {
  1009. struct hns_roce_dev *hr_dev = to_hr_dev(pd->device);
  1010. struct device *dev = hr_dev->dev;
  1011. struct hns_roce_mr *mr;
  1012. u64 length;
  1013. u32 page_size;
  1014. int ret;
  1015. page_size = 1 << (hr_dev->caps.pbl_buf_pg_sz + PAGE_SHIFT);
  1016. length = max_num_sg * page_size;
  1017. if (mr_type != IB_MR_TYPE_MEM_REG)
  1018. return ERR_PTR(-EINVAL);
  1019. if (max_num_sg > HNS_ROCE_FRMR_MAX_PA) {
  1020. dev_err(dev, "max_num_sg larger than %d\n",
  1021. HNS_ROCE_FRMR_MAX_PA);
  1022. return ERR_PTR(-EINVAL);
  1023. }
  1024. mr = kzalloc(sizeof(*mr), GFP_KERNEL);
  1025. if (!mr)
  1026. return ERR_PTR(-ENOMEM);
  1027. mr->type = MR_TYPE_FRMR;
  1028. /* Allocate memory region key */
  1029. ret = hns_roce_mr_alloc(hr_dev, to_hr_pd(pd)->pdn, 0, length,
  1030. 0, max_num_sg, mr);
  1031. if (ret)
  1032. goto err_free;
  1033. ret = hns_roce_mr_enable(hr_dev, mr);
  1034. if (ret)
  1035. goto err_mr;
  1036. mr->ibmr.rkey = mr->ibmr.lkey = mr->key;
  1037. mr->umem = NULL;
  1038. return &mr->ibmr;
  1039. err_mr:
  1040. hns_roce_mr_free(to_hr_dev(pd->device), mr);
  1041. err_free:
  1042. kfree(mr);
  1043. return ERR_PTR(ret);
  1044. }
  1045. static int hns_roce_set_page(struct ib_mr *ibmr, u64 addr)
  1046. {
  1047. struct hns_roce_mr *mr = to_hr_mr(ibmr);
  1048. mr->pbl_buf[mr->npages++] = cpu_to_le64(addr);
  1049. return 0;
  1050. }
  1051. int hns_roce_map_mr_sg(struct ib_mr *ibmr, struct scatterlist *sg, int sg_nents,
  1052. unsigned int *sg_offset)
  1053. {
  1054. struct hns_roce_mr *mr = to_hr_mr(ibmr);
  1055. mr->npages = 0;
  1056. return ib_sg_to_pages(ibmr, sg, sg_nents, sg_offset, hns_roce_set_page);
  1057. }
  1058. static void hns_roce_mw_free(struct hns_roce_dev *hr_dev,
  1059. struct hns_roce_mw *mw)
  1060. {
  1061. struct device *dev = hr_dev->dev;
  1062. int ret;
  1063. if (mw->enabled) {
  1064. ret = hns_roce_hw2sw_mpt(hr_dev, NULL, key_to_hw_index(mw->rkey)
  1065. & (hr_dev->caps.num_mtpts - 1));
  1066. if (ret)
  1067. dev_warn(dev, "MW HW2SW_MPT failed (%d)\n", ret);
  1068. hns_roce_table_put(hr_dev, &hr_dev->mr_table.mtpt_table,
  1069. key_to_hw_index(mw->rkey));
  1070. }
  1071. hns_roce_bitmap_free(&hr_dev->mr_table.mtpt_bitmap,
  1072. key_to_hw_index(mw->rkey), BITMAP_NO_RR);
  1073. }
  1074. static int hns_roce_mw_enable(struct hns_roce_dev *hr_dev,
  1075. struct hns_roce_mw *mw)
  1076. {
  1077. struct hns_roce_mr_table *mr_table = &hr_dev->mr_table;
  1078. struct hns_roce_cmd_mailbox *mailbox;
  1079. struct device *dev = hr_dev->dev;
  1080. unsigned long mtpt_idx = key_to_hw_index(mw->rkey);
  1081. int ret;
  1082. /* prepare HEM entry memory */
  1083. ret = hns_roce_table_get(hr_dev, &mr_table->mtpt_table, mtpt_idx);
  1084. if (ret)
  1085. return ret;
  1086. mailbox = hns_roce_alloc_cmd_mailbox(hr_dev);
  1087. if (IS_ERR(mailbox)) {
  1088. ret = PTR_ERR(mailbox);
  1089. goto err_table;
  1090. }
  1091. ret = hr_dev->hw->mw_write_mtpt(mailbox->buf, mw);
  1092. if (ret) {
  1093. dev_err(dev, "MW write mtpt fail!\n");
  1094. goto err_page;
  1095. }
  1096. ret = hns_roce_sw2hw_mpt(hr_dev, mailbox,
  1097. mtpt_idx & (hr_dev->caps.num_mtpts - 1));
  1098. if (ret) {
  1099. dev_err(dev, "MW sw2hw_mpt failed (%d)\n", ret);
  1100. goto err_page;
  1101. }
  1102. mw->enabled = 1;
  1103. hns_roce_free_cmd_mailbox(hr_dev, mailbox);
  1104. return 0;
  1105. err_page:
  1106. hns_roce_free_cmd_mailbox(hr_dev, mailbox);
  1107. err_table:
  1108. hns_roce_table_put(hr_dev, &mr_table->mtpt_table, mtpt_idx);
  1109. return ret;
  1110. }
  1111. struct ib_mw *hns_roce_alloc_mw(struct ib_pd *ib_pd, enum ib_mw_type type,
  1112. struct ib_udata *udata)
  1113. {
  1114. struct hns_roce_dev *hr_dev = to_hr_dev(ib_pd->device);
  1115. struct hns_roce_mw *mw;
  1116. unsigned long index = 0;
  1117. int ret;
  1118. mw = kmalloc(sizeof(*mw), GFP_KERNEL);
  1119. if (!mw)
  1120. return ERR_PTR(-ENOMEM);
  1121. /* Allocate a key for mw from bitmap */
  1122. ret = hns_roce_bitmap_alloc(&hr_dev->mr_table.mtpt_bitmap, &index);
  1123. if (ret)
  1124. goto err_bitmap;
  1125. mw->rkey = hw_index_to_key(index);
  1126. mw->ibmw.rkey = mw->rkey;
  1127. mw->ibmw.type = type;
  1128. mw->pdn = to_hr_pd(ib_pd)->pdn;
  1129. mw->pbl_hop_num = hr_dev->caps.pbl_hop_num;
  1130. mw->pbl_ba_pg_sz = hr_dev->caps.pbl_ba_pg_sz;
  1131. mw->pbl_buf_pg_sz = hr_dev->caps.pbl_buf_pg_sz;
  1132. ret = hns_roce_mw_enable(hr_dev, mw);
  1133. if (ret)
  1134. goto err_mw;
  1135. return &mw->ibmw;
  1136. err_mw:
  1137. hns_roce_mw_free(hr_dev, mw);
  1138. err_bitmap:
  1139. kfree(mw);
  1140. return ERR_PTR(ret);
  1141. }
  1142. int hns_roce_dealloc_mw(struct ib_mw *ibmw)
  1143. {
  1144. struct hns_roce_dev *hr_dev = to_hr_dev(ibmw->device);
  1145. struct hns_roce_mw *mw = to_hr_mw(ibmw);
  1146. hns_roce_mw_free(hr_dev, mw);
  1147. kfree(mw);
  1148. return 0;
  1149. }