rxe_pool.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501
  1. /*
  2. * Copyright (c) 2016 Mellanox Technologies Ltd. All rights reserved.
  3. * Copyright (c) 2015 System Fabric Works, Inc. All rights reserved.
  4. *
  5. * This software is available to you under a choice of one of two
  6. * licenses. You may choose to be licensed under the terms of the GNU
  7. * General Public License (GPL) Version 2, available from the file
  8. * COPYING in the main directory of this source tree, or the
  9. * OpenIB.org BSD license below:
  10. *
  11. * Redistribution and use in source and binary forms, with or
  12. * without modification, are permitted provided that the following
  13. * conditions are met:
  14. *
  15. * - Redistributions of source code must retain the above
  16. * copyright notice, this list of conditions and the following
  17. * disclaimer.
  18. *
  19. * - Redistributions in binary form must reproduce the above
  20. * copyright notice, this list of conditions and the following
  21. * disclaimer in the documentation and/or other materials
  22. * provided with the distribution.
  23. *
  24. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  25. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  26. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  27. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  28. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  29. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  30. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  31. * SOFTWARE.
  32. */
  33. #include "rxe.h"
  34. #include "rxe_loc.h"
  35. /* info about object pools
  36. * note that mr and mw share a single index space
  37. * so that one can map an lkey to the correct type of object
  38. */
  39. struct rxe_type_info rxe_type_info[RXE_NUM_TYPES] = {
  40. [RXE_TYPE_UC] = {
  41. .name = "rxe-uc",
  42. .size = sizeof(struct rxe_ucontext),
  43. },
  44. [RXE_TYPE_PD] = {
  45. .name = "rxe-pd",
  46. .size = sizeof(struct rxe_pd),
  47. },
  48. [RXE_TYPE_AH] = {
  49. .name = "rxe-ah",
  50. .size = sizeof(struct rxe_ah),
  51. .flags = RXE_POOL_ATOMIC,
  52. },
  53. [RXE_TYPE_SRQ] = {
  54. .name = "rxe-srq",
  55. .size = sizeof(struct rxe_srq),
  56. .flags = RXE_POOL_INDEX,
  57. .min_index = RXE_MIN_SRQ_INDEX,
  58. .max_index = RXE_MAX_SRQ_INDEX,
  59. },
  60. [RXE_TYPE_QP] = {
  61. .name = "rxe-qp",
  62. .size = sizeof(struct rxe_qp),
  63. .cleanup = rxe_qp_cleanup,
  64. .flags = RXE_POOL_INDEX,
  65. .min_index = RXE_MIN_QP_INDEX,
  66. .max_index = RXE_MAX_QP_INDEX,
  67. },
  68. [RXE_TYPE_CQ] = {
  69. .name = "rxe-cq",
  70. .size = sizeof(struct rxe_cq),
  71. .cleanup = rxe_cq_cleanup,
  72. },
  73. [RXE_TYPE_MR] = {
  74. .name = "rxe-mr",
  75. .size = sizeof(struct rxe_mem),
  76. .cleanup = rxe_mem_cleanup,
  77. .flags = RXE_POOL_INDEX,
  78. .max_index = RXE_MAX_MR_INDEX,
  79. .min_index = RXE_MIN_MR_INDEX,
  80. },
  81. [RXE_TYPE_MW] = {
  82. .name = "rxe-mw",
  83. .size = sizeof(struct rxe_mem),
  84. .flags = RXE_POOL_INDEX,
  85. .max_index = RXE_MAX_MW_INDEX,
  86. .min_index = RXE_MIN_MW_INDEX,
  87. },
  88. [RXE_TYPE_MC_GRP] = {
  89. .name = "rxe-mc_grp",
  90. .size = sizeof(struct rxe_mc_grp),
  91. .cleanup = rxe_mc_cleanup,
  92. .flags = RXE_POOL_KEY,
  93. .key_offset = offsetof(struct rxe_mc_grp, mgid),
  94. .key_size = sizeof(union ib_gid),
  95. },
  96. [RXE_TYPE_MC_ELEM] = {
  97. .name = "rxe-mc_elem",
  98. .size = sizeof(struct rxe_mc_elem),
  99. .flags = RXE_POOL_ATOMIC,
  100. },
  101. };
  102. static inline char *pool_name(struct rxe_pool *pool)
  103. {
  104. return rxe_type_info[pool->type].name;
  105. }
  106. static inline struct kmem_cache *pool_cache(struct rxe_pool *pool)
  107. {
  108. return rxe_type_info[pool->type].cache;
  109. }
  110. static inline enum rxe_elem_type rxe_type(void *arg)
  111. {
  112. struct rxe_pool_entry *elem = arg;
  113. return elem->pool->type;
  114. }
  115. int rxe_cache_init(void)
  116. {
  117. int err;
  118. int i;
  119. size_t size;
  120. struct rxe_type_info *type;
  121. for (i = 0; i < RXE_NUM_TYPES; i++) {
  122. type = &rxe_type_info[i];
  123. size = ALIGN(type->size, RXE_POOL_ALIGN);
  124. type->cache = kmem_cache_create(type->name, size,
  125. RXE_POOL_ALIGN,
  126. RXE_POOL_CACHE_FLAGS, NULL);
  127. if (!type->cache) {
  128. pr_err("Unable to init kmem cache for %s\n",
  129. type->name);
  130. err = -ENOMEM;
  131. goto err1;
  132. }
  133. }
  134. return 0;
  135. err1:
  136. while (--i >= 0) {
  137. kmem_cache_destroy(type->cache);
  138. type->cache = NULL;
  139. }
  140. return err;
  141. }
  142. void rxe_cache_exit(void)
  143. {
  144. int i;
  145. struct rxe_type_info *type;
  146. for (i = 0; i < RXE_NUM_TYPES; i++) {
  147. type = &rxe_type_info[i];
  148. kmem_cache_destroy(type->cache);
  149. type->cache = NULL;
  150. }
  151. }
  152. static int rxe_pool_init_index(struct rxe_pool *pool, u32 max, u32 min)
  153. {
  154. int err = 0;
  155. size_t size;
  156. if ((max - min + 1) < pool->max_elem) {
  157. pr_warn("not enough indices for max_elem\n");
  158. err = -EINVAL;
  159. goto out;
  160. }
  161. pool->max_index = max;
  162. pool->min_index = min;
  163. size = BITS_TO_LONGS(max - min + 1) * sizeof(long);
  164. pool->table = kmalloc(size, GFP_KERNEL);
  165. if (!pool->table) {
  166. err = -ENOMEM;
  167. goto out;
  168. }
  169. pool->table_size = size;
  170. bitmap_zero(pool->table, max - min + 1);
  171. out:
  172. return err;
  173. }
  174. int rxe_pool_init(
  175. struct rxe_dev *rxe,
  176. struct rxe_pool *pool,
  177. enum rxe_elem_type type,
  178. unsigned max_elem)
  179. {
  180. int err = 0;
  181. size_t size = rxe_type_info[type].size;
  182. memset(pool, 0, sizeof(*pool));
  183. pool->rxe = rxe;
  184. pool->type = type;
  185. pool->max_elem = max_elem;
  186. pool->elem_size = ALIGN(size, RXE_POOL_ALIGN);
  187. pool->flags = rxe_type_info[type].flags;
  188. pool->tree = RB_ROOT;
  189. pool->cleanup = rxe_type_info[type].cleanup;
  190. atomic_set(&pool->num_elem, 0);
  191. kref_init(&pool->ref_cnt);
  192. spin_lock_init(&pool->pool_lock);
  193. if (rxe_type_info[type].flags & RXE_POOL_INDEX) {
  194. err = rxe_pool_init_index(pool,
  195. rxe_type_info[type].max_index,
  196. rxe_type_info[type].min_index);
  197. if (err)
  198. goto out;
  199. }
  200. if (rxe_type_info[type].flags & RXE_POOL_KEY) {
  201. pool->key_offset = rxe_type_info[type].key_offset;
  202. pool->key_size = rxe_type_info[type].key_size;
  203. }
  204. pool->state = rxe_pool_valid;
  205. out:
  206. return err;
  207. }
  208. static void rxe_pool_release(struct kref *kref)
  209. {
  210. struct rxe_pool *pool = container_of(kref, struct rxe_pool, ref_cnt);
  211. pool->state = rxe_pool_invalid;
  212. kfree(pool->table);
  213. }
  214. static void rxe_pool_put(struct rxe_pool *pool)
  215. {
  216. kref_put(&pool->ref_cnt, rxe_pool_release);
  217. }
  218. int rxe_pool_cleanup(struct rxe_pool *pool)
  219. {
  220. unsigned long flags;
  221. spin_lock_irqsave(&pool->pool_lock, flags);
  222. pool->state = rxe_pool_invalid;
  223. if (atomic_read(&pool->num_elem) > 0)
  224. pr_warn("%s pool destroyed with unfree'd elem\n",
  225. pool_name(pool));
  226. spin_unlock_irqrestore(&pool->pool_lock, flags);
  227. rxe_pool_put(pool);
  228. return 0;
  229. }
  230. static u32 alloc_index(struct rxe_pool *pool)
  231. {
  232. u32 index;
  233. u32 range = pool->max_index - pool->min_index + 1;
  234. index = find_next_zero_bit(pool->table, range, pool->last);
  235. if (index >= range)
  236. index = find_first_zero_bit(pool->table, range);
  237. set_bit(index, pool->table);
  238. pool->last = index;
  239. return index + pool->min_index;
  240. }
  241. static void insert_index(struct rxe_pool *pool, struct rxe_pool_entry *new)
  242. {
  243. struct rb_node **link = &pool->tree.rb_node;
  244. struct rb_node *parent = NULL;
  245. struct rxe_pool_entry *elem;
  246. while (*link) {
  247. parent = *link;
  248. elem = rb_entry(parent, struct rxe_pool_entry, node);
  249. if (elem->index == new->index) {
  250. pr_warn("element already exists!\n");
  251. goto out;
  252. }
  253. if (elem->index > new->index)
  254. link = &(*link)->rb_left;
  255. else
  256. link = &(*link)->rb_right;
  257. }
  258. rb_link_node(&new->node, parent, link);
  259. rb_insert_color(&new->node, &pool->tree);
  260. out:
  261. return;
  262. }
  263. static void insert_key(struct rxe_pool *pool, struct rxe_pool_entry *new)
  264. {
  265. struct rb_node **link = &pool->tree.rb_node;
  266. struct rb_node *parent = NULL;
  267. struct rxe_pool_entry *elem;
  268. int cmp;
  269. while (*link) {
  270. parent = *link;
  271. elem = rb_entry(parent, struct rxe_pool_entry, node);
  272. cmp = memcmp((u8 *)elem + pool->key_offset,
  273. (u8 *)new + pool->key_offset, pool->key_size);
  274. if (cmp == 0) {
  275. pr_warn("key already exists!\n");
  276. goto out;
  277. }
  278. if (cmp > 0)
  279. link = &(*link)->rb_left;
  280. else
  281. link = &(*link)->rb_right;
  282. }
  283. rb_link_node(&new->node, parent, link);
  284. rb_insert_color(&new->node, &pool->tree);
  285. out:
  286. return;
  287. }
  288. void rxe_add_key(void *arg, void *key)
  289. {
  290. struct rxe_pool_entry *elem = arg;
  291. struct rxe_pool *pool = elem->pool;
  292. unsigned long flags;
  293. spin_lock_irqsave(&pool->pool_lock, flags);
  294. memcpy((u8 *)elem + pool->key_offset, key, pool->key_size);
  295. insert_key(pool, elem);
  296. spin_unlock_irqrestore(&pool->pool_lock, flags);
  297. }
  298. void rxe_drop_key(void *arg)
  299. {
  300. struct rxe_pool_entry *elem = arg;
  301. struct rxe_pool *pool = elem->pool;
  302. unsigned long flags;
  303. spin_lock_irqsave(&pool->pool_lock, flags);
  304. rb_erase(&elem->node, &pool->tree);
  305. spin_unlock_irqrestore(&pool->pool_lock, flags);
  306. }
  307. void rxe_add_index(void *arg)
  308. {
  309. struct rxe_pool_entry *elem = arg;
  310. struct rxe_pool *pool = elem->pool;
  311. unsigned long flags;
  312. spin_lock_irqsave(&pool->pool_lock, flags);
  313. elem->index = alloc_index(pool);
  314. insert_index(pool, elem);
  315. spin_unlock_irqrestore(&pool->pool_lock, flags);
  316. }
  317. void rxe_drop_index(void *arg)
  318. {
  319. struct rxe_pool_entry *elem = arg;
  320. struct rxe_pool *pool = elem->pool;
  321. unsigned long flags;
  322. spin_lock_irqsave(&pool->pool_lock, flags);
  323. clear_bit(elem->index - pool->min_index, pool->table);
  324. rb_erase(&elem->node, &pool->tree);
  325. spin_unlock_irqrestore(&pool->pool_lock, flags);
  326. }
  327. void *rxe_alloc(struct rxe_pool *pool)
  328. {
  329. struct rxe_pool_entry *elem;
  330. unsigned long flags;
  331. might_sleep_if(!(pool->flags & RXE_POOL_ATOMIC));
  332. spin_lock_irqsave(&pool->pool_lock, flags);
  333. if (pool->state != rxe_pool_valid) {
  334. spin_unlock_irqrestore(&pool->pool_lock, flags);
  335. return NULL;
  336. }
  337. kref_get(&pool->ref_cnt);
  338. spin_unlock_irqrestore(&pool->pool_lock, flags);
  339. kref_get(&pool->rxe->ref_cnt);
  340. if (atomic_inc_return(&pool->num_elem) > pool->max_elem) {
  341. atomic_dec(&pool->num_elem);
  342. rxe_dev_put(pool->rxe);
  343. rxe_pool_put(pool);
  344. return NULL;
  345. }
  346. elem = kmem_cache_zalloc(pool_cache(pool),
  347. (pool->flags & RXE_POOL_ATOMIC) ?
  348. GFP_ATOMIC : GFP_KERNEL);
  349. elem->pool = pool;
  350. kref_init(&elem->ref_cnt);
  351. return elem;
  352. }
  353. void rxe_elem_release(struct kref *kref)
  354. {
  355. struct rxe_pool_entry *elem =
  356. container_of(kref, struct rxe_pool_entry, ref_cnt);
  357. struct rxe_pool *pool = elem->pool;
  358. if (pool->cleanup)
  359. pool->cleanup(elem);
  360. kmem_cache_free(pool_cache(pool), elem);
  361. atomic_dec(&pool->num_elem);
  362. rxe_dev_put(pool->rxe);
  363. rxe_pool_put(pool);
  364. }
  365. void *rxe_pool_get_index(struct rxe_pool *pool, u32 index)
  366. {
  367. struct rb_node *node = NULL;
  368. struct rxe_pool_entry *elem = NULL;
  369. unsigned long flags;
  370. spin_lock_irqsave(&pool->pool_lock, flags);
  371. if (pool->state != rxe_pool_valid)
  372. goto out;
  373. node = pool->tree.rb_node;
  374. while (node) {
  375. elem = rb_entry(node, struct rxe_pool_entry, node);
  376. if (elem->index > index)
  377. node = node->rb_left;
  378. else if (elem->index < index)
  379. node = node->rb_right;
  380. else
  381. break;
  382. }
  383. if (node)
  384. kref_get(&elem->ref_cnt);
  385. out:
  386. spin_unlock_irqrestore(&pool->pool_lock, flags);
  387. return node ? (void *)elem : NULL;
  388. }
  389. void *rxe_pool_get_key(struct rxe_pool *pool, void *key)
  390. {
  391. struct rb_node *node = NULL;
  392. struct rxe_pool_entry *elem = NULL;
  393. int cmp;
  394. unsigned long flags;
  395. spin_lock_irqsave(&pool->pool_lock, flags);
  396. if (pool->state != rxe_pool_valid)
  397. goto out;
  398. node = pool->tree.rb_node;
  399. while (node) {
  400. elem = rb_entry(node, struct rxe_pool_entry, node);
  401. cmp = memcmp((u8 *)elem + pool->key_offset,
  402. key, pool->key_size);
  403. if (cmp > 0)
  404. node = node->rb_left;
  405. else if (cmp < 0)
  406. node = node->rb_right;
  407. else
  408. break;
  409. }
  410. if (node)
  411. kref_get(&elem->ref_cnt);
  412. out:
  413. spin_unlock_irqrestore(&pool->pool_lock, flags);
  414. return node ? ((void *)elem) : NULL;
  415. }