eq.c 40 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427
  1. /*
  2. * Copyright (c) 2005, 2006, 2007, 2008 Mellanox Technologies. All rights reserved.
  3. * Copyright (c) 2005, 2006, 2007 Cisco Systems, Inc. All rights reserved.
  4. *
  5. * This software is available to you under a choice of one of two
  6. * licenses. You may choose to be licensed under the terms of the GNU
  7. * General Public License (GPL) Version 2, available from the file
  8. * COPYING in the main directory of this source tree, or the
  9. * OpenIB.org BSD license below:
  10. *
  11. * Redistribution and use in source and binary forms, with or
  12. * without modification, are permitted provided that the following
  13. * conditions are met:
  14. *
  15. * - Redistributions of source code must retain the above
  16. * copyright notice, this list of conditions and the following
  17. * disclaimer.
  18. *
  19. * - Redistributions in binary form must reproduce the above
  20. * copyright notice, this list of conditions and the following
  21. * disclaimer in the documentation and/or other materials
  22. * provided with the distribution.
  23. *
  24. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  25. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  26. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  27. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  28. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  29. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  30. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  31. * SOFTWARE.
  32. */
  33. #include <linux/interrupt.h>
  34. #include <linux/slab.h>
  35. #include <linux/export.h>
  36. #include <linux/mm.h>
  37. #include <linux/dma-mapping.h>
  38. #include <linux/mlx4/cmd.h>
  39. #include <linux/cpu_rmap.h>
  40. #include "mlx4.h"
  41. #include "fw.h"
  42. enum {
  43. MLX4_IRQNAME_SIZE = 32
  44. };
  45. enum {
  46. MLX4_NUM_ASYNC_EQE = 0x100,
  47. MLX4_NUM_SPARE_EQE = 0x80,
  48. MLX4_EQ_ENTRY_SIZE = 0x20
  49. };
  50. #define MLX4_EQ_STATUS_OK ( 0 << 28)
  51. #define MLX4_EQ_STATUS_WRITE_FAIL (10 << 28)
  52. #define MLX4_EQ_OWNER_SW ( 0 << 24)
  53. #define MLX4_EQ_OWNER_HW ( 1 << 24)
  54. #define MLX4_EQ_FLAG_EC ( 1 << 18)
  55. #define MLX4_EQ_FLAG_OI ( 1 << 17)
  56. #define MLX4_EQ_STATE_ARMED ( 9 << 8)
  57. #define MLX4_EQ_STATE_FIRED (10 << 8)
  58. #define MLX4_EQ_STATE_ALWAYS_ARMED (11 << 8)
  59. #define MLX4_ASYNC_EVENT_MASK ((1ull << MLX4_EVENT_TYPE_PATH_MIG) | \
  60. (1ull << MLX4_EVENT_TYPE_COMM_EST) | \
  61. (1ull << MLX4_EVENT_TYPE_SQ_DRAINED) | \
  62. (1ull << MLX4_EVENT_TYPE_CQ_ERROR) | \
  63. (1ull << MLX4_EVENT_TYPE_WQ_CATAS_ERROR) | \
  64. (1ull << MLX4_EVENT_TYPE_EEC_CATAS_ERROR) | \
  65. (1ull << MLX4_EVENT_TYPE_PATH_MIG_FAILED) | \
  66. (1ull << MLX4_EVENT_TYPE_WQ_INVAL_REQ_ERROR) | \
  67. (1ull << MLX4_EVENT_TYPE_WQ_ACCESS_ERROR) | \
  68. (1ull << MLX4_EVENT_TYPE_PORT_CHANGE) | \
  69. (1ull << MLX4_EVENT_TYPE_ECC_DETECT) | \
  70. (1ull << MLX4_EVENT_TYPE_SRQ_CATAS_ERROR) | \
  71. (1ull << MLX4_EVENT_TYPE_SRQ_QP_LAST_WQE) | \
  72. (1ull << MLX4_EVENT_TYPE_SRQ_LIMIT) | \
  73. (1ull << MLX4_EVENT_TYPE_CMD) | \
  74. (1ull << MLX4_EVENT_TYPE_OP_REQUIRED) | \
  75. (1ull << MLX4_EVENT_TYPE_COMM_CHANNEL) | \
  76. (1ull << MLX4_EVENT_TYPE_FLR_EVENT) | \
  77. (1ull << MLX4_EVENT_TYPE_FATAL_WARNING))
  78. static u64 get_async_ev_mask(struct mlx4_dev *dev)
  79. {
  80. u64 async_ev_mask = MLX4_ASYNC_EVENT_MASK;
  81. if (dev->caps.flags & MLX4_DEV_CAP_FLAG_PORT_MNG_CHG_EV)
  82. async_ev_mask |= (1ull << MLX4_EVENT_TYPE_PORT_MNG_CHG_EVENT);
  83. return async_ev_mask;
  84. }
  85. static void eq_set_ci(struct mlx4_eq *eq, int req_not)
  86. {
  87. __raw_writel((__force u32) cpu_to_be32((eq->cons_index & 0xffffff) |
  88. req_not << 31),
  89. eq->doorbell);
  90. /* We still want ordering, just not swabbing, so add a barrier */
  91. mb();
  92. }
  93. static struct mlx4_eqe *get_eqe(struct mlx4_eq *eq, u32 entry, u8 eqe_factor,
  94. u8 eqe_size)
  95. {
  96. /* (entry & (eq->nent - 1)) gives us a cyclic array */
  97. unsigned long offset = (entry & (eq->nent - 1)) * eqe_size;
  98. /* CX3 is capable of extending the EQE from 32 to 64 bytes with
  99. * strides of 64B,128B and 256B.
  100. * When 64B EQE is used, the first (in the lower addresses)
  101. * 32 bytes in the 64 byte EQE are reserved and the next 32 bytes
  102. * contain the legacy EQE information.
  103. * In all other cases, the first 32B contains the legacy EQE info.
  104. */
  105. return eq->page_list[offset / PAGE_SIZE].buf + (offset + (eqe_factor ? MLX4_EQ_ENTRY_SIZE : 0)) % PAGE_SIZE;
  106. }
  107. static struct mlx4_eqe *next_eqe_sw(struct mlx4_eq *eq, u8 eqe_factor, u8 size)
  108. {
  109. struct mlx4_eqe *eqe = get_eqe(eq, eq->cons_index, eqe_factor, size);
  110. return !!(eqe->owner & 0x80) ^ !!(eq->cons_index & eq->nent) ? NULL : eqe;
  111. }
  112. static struct mlx4_eqe *next_slave_event_eqe(struct mlx4_slave_event_eq *slave_eq)
  113. {
  114. struct mlx4_eqe *eqe =
  115. &slave_eq->event_eqe[slave_eq->cons & (SLAVE_EVENT_EQ_SIZE - 1)];
  116. return (!!(eqe->owner & 0x80) ^
  117. !!(slave_eq->cons & SLAVE_EVENT_EQ_SIZE)) ?
  118. eqe : NULL;
  119. }
  120. void mlx4_gen_slave_eqe(struct work_struct *work)
  121. {
  122. struct mlx4_mfunc_master_ctx *master =
  123. container_of(work, struct mlx4_mfunc_master_ctx,
  124. slave_event_work);
  125. struct mlx4_mfunc *mfunc =
  126. container_of(master, struct mlx4_mfunc, master);
  127. struct mlx4_priv *priv = container_of(mfunc, struct mlx4_priv, mfunc);
  128. struct mlx4_dev *dev = &priv->dev;
  129. struct mlx4_slave_event_eq *slave_eq = &mfunc->master.slave_eq;
  130. struct mlx4_eqe *eqe;
  131. u8 slave;
  132. int i;
  133. for (eqe = next_slave_event_eqe(slave_eq); eqe;
  134. eqe = next_slave_event_eqe(slave_eq)) {
  135. slave = eqe->slave_id;
  136. /* All active slaves need to receive the event */
  137. if (slave == ALL_SLAVES) {
  138. for (i = 0; i < dev->num_slaves; i++) {
  139. if (i != dev->caps.function &&
  140. master->slave_state[i].active)
  141. if (mlx4_GEN_EQE(dev, i, eqe))
  142. mlx4_warn(dev, "Failed to generate event for slave %d\n",
  143. i);
  144. }
  145. } else {
  146. if (mlx4_GEN_EQE(dev, slave, eqe))
  147. mlx4_warn(dev, "Failed to generate event for slave %d\n",
  148. slave);
  149. }
  150. ++slave_eq->cons;
  151. }
  152. }
  153. static void slave_event(struct mlx4_dev *dev, u8 slave, struct mlx4_eqe *eqe)
  154. {
  155. struct mlx4_priv *priv = mlx4_priv(dev);
  156. struct mlx4_slave_event_eq *slave_eq = &priv->mfunc.master.slave_eq;
  157. struct mlx4_eqe *s_eqe;
  158. unsigned long flags;
  159. spin_lock_irqsave(&slave_eq->event_lock, flags);
  160. s_eqe = &slave_eq->event_eqe[slave_eq->prod & (SLAVE_EVENT_EQ_SIZE - 1)];
  161. if ((!!(s_eqe->owner & 0x80)) ^
  162. (!!(slave_eq->prod & SLAVE_EVENT_EQ_SIZE))) {
  163. mlx4_warn(dev, "Master failed to generate an EQE for slave: %d. No free EQE on slave events queue\n",
  164. slave);
  165. spin_unlock_irqrestore(&slave_eq->event_lock, flags);
  166. return;
  167. }
  168. memcpy(s_eqe, eqe, dev->caps.eqe_size - 1);
  169. s_eqe->slave_id = slave;
  170. /* ensure all information is written before setting the ownersip bit */
  171. wmb();
  172. s_eqe->owner = !!(slave_eq->prod & SLAVE_EVENT_EQ_SIZE) ? 0x0 : 0x80;
  173. ++slave_eq->prod;
  174. queue_work(priv->mfunc.master.comm_wq,
  175. &priv->mfunc.master.slave_event_work);
  176. spin_unlock_irqrestore(&slave_eq->event_lock, flags);
  177. }
  178. static void mlx4_slave_event(struct mlx4_dev *dev, int slave,
  179. struct mlx4_eqe *eqe)
  180. {
  181. struct mlx4_priv *priv = mlx4_priv(dev);
  182. struct mlx4_slave_state *s_slave =
  183. &priv->mfunc.master.slave_state[slave];
  184. if (!s_slave->active) {
  185. /*mlx4_warn(dev, "Trying to pass event to inactive slave\n");*/
  186. return;
  187. }
  188. slave_event(dev, slave, eqe);
  189. }
  190. int mlx4_gen_pkey_eqe(struct mlx4_dev *dev, int slave, u8 port)
  191. {
  192. struct mlx4_eqe eqe;
  193. struct mlx4_priv *priv = mlx4_priv(dev);
  194. struct mlx4_slave_state *s_slave = &priv->mfunc.master.slave_state[slave];
  195. if (!s_slave->active)
  196. return 0;
  197. memset(&eqe, 0, sizeof eqe);
  198. eqe.type = MLX4_EVENT_TYPE_PORT_MNG_CHG_EVENT;
  199. eqe.subtype = MLX4_DEV_PMC_SUBTYPE_PKEY_TABLE;
  200. eqe.event.port_mgmt_change.port = port;
  201. return mlx4_GEN_EQE(dev, slave, &eqe);
  202. }
  203. EXPORT_SYMBOL(mlx4_gen_pkey_eqe);
  204. int mlx4_gen_guid_change_eqe(struct mlx4_dev *dev, int slave, u8 port)
  205. {
  206. struct mlx4_eqe eqe;
  207. /*don't send if we don't have the that slave */
  208. if (dev->num_vfs < slave)
  209. return 0;
  210. memset(&eqe, 0, sizeof eqe);
  211. eqe.type = MLX4_EVENT_TYPE_PORT_MNG_CHG_EVENT;
  212. eqe.subtype = MLX4_DEV_PMC_SUBTYPE_GUID_INFO;
  213. eqe.event.port_mgmt_change.port = port;
  214. return mlx4_GEN_EQE(dev, slave, &eqe);
  215. }
  216. EXPORT_SYMBOL(mlx4_gen_guid_change_eqe);
  217. int mlx4_gen_port_state_change_eqe(struct mlx4_dev *dev, int slave, u8 port,
  218. u8 port_subtype_change)
  219. {
  220. struct mlx4_eqe eqe;
  221. /*don't send if we don't have the that slave */
  222. if (dev->num_vfs < slave)
  223. return 0;
  224. memset(&eqe, 0, sizeof eqe);
  225. eqe.type = MLX4_EVENT_TYPE_PORT_CHANGE;
  226. eqe.subtype = port_subtype_change;
  227. eqe.event.port_change.port = cpu_to_be32(port << 28);
  228. mlx4_dbg(dev, "%s: sending: %d to slave: %d on port: %d\n", __func__,
  229. port_subtype_change, slave, port);
  230. return mlx4_GEN_EQE(dev, slave, &eqe);
  231. }
  232. EXPORT_SYMBOL(mlx4_gen_port_state_change_eqe);
  233. enum slave_port_state mlx4_get_slave_port_state(struct mlx4_dev *dev, int slave, u8 port)
  234. {
  235. struct mlx4_priv *priv = mlx4_priv(dev);
  236. struct mlx4_slave_state *s_state = priv->mfunc.master.slave_state;
  237. struct mlx4_active_ports actv_ports = mlx4_get_active_ports(dev, slave);
  238. if (slave >= dev->num_slaves || port > dev->caps.num_ports ||
  239. port <= 0 || !test_bit(port - 1, actv_ports.ports)) {
  240. pr_err("%s: Error: asking for slave:%d, port:%d\n",
  241. __func__, slave, port);
  242. return SLAVE_PORT_DOWN;
  243. }
  244. return s_state[slave].port_state[port];
  245. }
  246. EXPORT_SYMBOL(mlx4_get_slave_port_state);
  247. static int mlx4_set_slave_port_state(struct mlx4_dev *dev, int slave, u8 port,
  248. enum slave_port_state state)
  249. {
  250. struct mlx4_priv *priv = mlx4_priv(dev);
  251. struct mlx4_slave_state *s_state = priv->mfunc.master.slave_state;
  252. struct mlx4_active_ports actv_ports = mlx4_get_active_ports(dev, slave);
  253. if (slave >= dev->num_slaves || port > dev->caps.num_ports ||
  254. port <= 0 || !test_bit(port - 1, actv_ports.ports)) {
  255. pr_err("%s: Error: asking for slave:%d, port:%d\n",
  256. __func__, slave, port);
  257. return -1;
  258. }
  259. s_state[slave].port_state[port] = state;
  260. return 0;
  261. }
  262. static void set_all_slave_state(struct mlx4_dev *dev, u8 port, int event)
  263. {
  264. int i;
  265. enum slave_port_gen_event gen_event;
  266. struct mlx4_slaves_pport slaves_pport = mlx4_phys_to_slaves_pport(dev,
  267. port);
  268. for (i = 0; i < dev->num_vfs + 1; i++)
  269. if (test_bit(i, slaves_pport.slaves))
  270. set_and_calc_slave_port_state(dev, i, port,
  271. event, &gen_event);
  272. }
  273. /**************************************************************************
  274. The function get as input the new event to that port,
  275. and according to the prev state change the slave's port state.
  276. The events are:
  277. MLX4_PORT_STATE_DEV_EVENT_PORT_DOWN,
  278. MLX4_PORT_STATE_DEV_EVENT_PORT_UP
  279. MLX4_PORT_STATE_IB_EVENT_GID_VALID
  280. MLX4_PORT_STATE_IB_EVENT_GID_INVALID
  281. ***************************************************************************/
  282. int set_and_calc_slave_port_state(struct mlx4_dev *dev, int slave,
  283. u8 port, int event,
  284. enum slave_port_gen_event *gen_event)
  285. {
  286. struct mlx4_priv *priv = mlx4_priv(dev);
  287. struct mlx4_slave_state *ctx = NULL;
  288. unsigned long flags;
  289. int ret = -1;
  290. struct mlx4_active_ports actv_ports = mlx4_get_active_ports(dev, slave);
  291. enum slave_port_state cur_state =
  292. mlx4_get_slave_port_state(dev, slave, port);
  293. *gen_event = SLAVE_PORT_GEN_EVENT_NONE;
  294. if (slave >= dev->num_slaves || port > dev->caps.num_ports ||
  295. port <= 0 || !test_bit(port - 1, actv_ports.ports)) {
  296. pr_err("%s: Error: asking for slave:%d, port:%d\n",
  297. __func__, slave, port);
  298. return ret;
  299. }
  300. ctx = &priv->mfunc.master.slave_state[slave];
  301. spin_lock_irqsave(&ctx->lock, flags);
  302. switch (cur_state) {
  303. case SLAVE_PORT_DOWN:
  304. if (MLX4_PORT_STATE_DEV_EVENT_PORT_UP == event)
  305. mlx4_set_slave_port_state(dev, slave, port,
  306. SLAVE_PENDING_UP);
  307. break;
  308. case SLAVE_PENDING_UP:
  309. if (MLX4_PORT_STATE_DEV_EVENT_PORT_DOWN == event)
  310. mlx4_set_slave_port_state(dev, slave, port,
  311. SLAVE_PORT_DOWN);
  312. else if (MLX4_PORT_STATE_IB_PORT_STATE_EVENT_GID_VALID == event) {
  313. mlx4_set_slave_port_state(dev, slave, port,
  314. SLAVE_PORT_UP);
  315. *gen_event = SLAVE_PORT_GEN_EVENT_UP;
  316. }
  317. break;
  318. case SLAVE_PORT_UP:
  319. if (MLX4_PORT_STATE_DEV_EVENT_PORT_DOWN == event) {
  320. mlx4_set_slave_port_state(dev, slave, port,
  321. SLAVE_PORT_DOWN);
  322. *gen_event = SLAVE_PORT_GEN_EVENT_DOWN;
  323. } else if (MLX4_PORT_STATE_IB_EVENT_GID_INVALID ==
  324. event) {
  325. mlx4_set_slave_port_state(dev, slave, port,
  326. SLAVE_PENDING_UP);
  327. *gen_event = SLAVE_PORT_GEN_EVENT_DOWN;
  328. }
  329. break;
  330. default:
  331. pr_err("%s: BUG!!! UNKNOWN state: slave:%d, port:%d\n",
  332. __func__, slave, port);
  333. goto out;
  334. }
  335. ret = mlx4_get_slave_port_state(dev, slave, port);
  336. out:
  337. spin_unlock_irqrestore(&ctx->lock, flags);
  338. return ret;
  339. }
  340. EXPORT_SYMBOL(set_and_calc_slave_port_state);
  341. int mlx4_gen_slaves_port_mgt_ev(struct mlx4_dev *dev, u8 port, int attr)
  342. {
  343. struct mlx4_eqe eqe;
  344. memset(&eqe, 0, sizeof eqe);
  345. eqe.type = MLX4_EVENT_TYPE_PORT_MNG_CHG_EVENT;
  346. eqe.subtype = MLX4_DEV_PMC_SUBTYPE_PORT_INFO;
  347. eqe.event.port_mgmt_change.port = port;
  348. eqe.event.port_mgmt_change.params.port_info.changed_attr =
  349. cpu_to_be32((u32) attr);
  350. slave_event(dev, ALL_SLAVES, &eqe);
  351. return 0;
  352. }
  353. EXPORT_SYMBOL(mlx4_gen_slaves_port_mgt_ev);
  354. void mlx4_master_handle_slave_flr(struct work_struct *work)
  355. {
  356. struct mlx4_mfunc_master_ctx *master =
  357. container_of(work, struct mlx4_mfunc_master_ctx,
  358. slave_flr_event_work);
  359. struct mlx4_mfunc *mfunc =
  360. container_of(master, struct mlx4_mfunc, master);
  361. struct mlx4_priv *priv =
  362. container_of(mfunc, struct mlx4_priv, mfunc);
  363. struct mlx4_dev *dev = &priv->dev;
  364. struct mlx4_slave_state *slave_state = priv->mfunc.master.slave_state;
  365. int i;
  366. int err;
  367. unsigned long flags;
  368. mlx4_dbg(dev, "mlx4_handle_slave_flr\n");
  369. for (i = 0 ; i < dev->num_slaves; i++) {
  370. if (MLX4_COMM_CMD_FLR == slave_state[i].last_cmd) {
  371. mlx4_dbg(dev, "mlx4_handle_slave_flr: clean slave: %d\n",
  372. i);
  373. mlx4_delete_all_resources_for_slave(dev, i);
  374. /*return the slave to running mode*/
  375. spin_lock_irqsave(&priv->mfunc.master.slave_state_lock, flags);
  376. slave_state[i].last_cmd = MLX4_COMM_CMD_RESET;
  377. slave_state[i].is_slave_going_down = 0;
  378. spin_unlock_irqrestore(&priv->mfunc.master.slave_state_lock, flags);
  379. /*notify the FW:*/
  380. err = mlx4_cmd(dev, 0, i, 0, MLX4_CMD_INFORM_FLR_DONE,
  381. MLX4_CMD_TIME_CLASS_A, MLX4_CMD_WRAPPED);
  382. if (err)
  383. mlx4_warn(dev, "Failed to notify FW on FLR done (slave:%d)\n",
  384. i);
  385. }
  386. }
  387. }
  388. static int mlx4_eq_int(struct mlx4_dev *dev, struct mlx4_eq *eq)
  389. {
  390. struct mlx4_priv *priv = mlx4_priv(dev);
  391. struct mlx4_eqe *eqe;
  392. int cqn = -1;
  393. int eqes_found = 0;
  394. int set_ci = 0;
  395. int port;
  396. int slave = 0;
  397. int ret;
  398. u32 flr_slave;
  399. u8 update_slave_state;
  400. int i;
  401. enum slave_port_gen_event gen_event;
  402. unsigned long flags;
  403. struct mlx4_vport_state *s_info;
  404. int eqe_size = dev->caps.eqe_size;
  405. while ((eqe = next_eqe_sw(eq, dev->caps.eqe_factor, eqe_size))) {
  406. /*
  407. * Make sure we read EQ entry contents after we've
  408. * checked the ownership bit.
  409. */
  410. rmb();
  411. switch (eqe->type) {
  412. case MLX4_EVENT_TYPE_COMP:
  413. cqn = be32_to_cpu(eqe->event.comp.cqn) & 0xffffff;
  414. mlx4_cq_completion(dev, cqn);
  415. break;
  416. case MLX4_EVENT_TYPE_PATH_MIG:
  417. case MLX4_EVENT_TYPE_COMM_EST:
  418. case MLX4_EVENT_TYPE_SQ_DRAINED:
  419. case MLX4_EVENT_TYPE_SRQ_QP_LAST_WQE:
  420. case MLX4_EVENT_TYPE_WQ_CATAS_ERROR:
  421. case MLX4_EVENT_TYPE_PATH_MIG_FAILED:
  422. case MLX4_EVENT_TYPE_WQ_INVAL_REQ_ERROR:
  423. case MLX4_EVENT_TYPE_WQ_ACCESS_ERROR:
  424. mlx4_dbg(dev, "event %d arrived\n", eqe->type);
  425. if (mlx4_is_master(dev)) {
  426. /* forward only to slave owning the QP */
  427. ret = mlx4_get_slave_from_resource_id(dev,
  428. RES_QP,
  429. be32_to_cpu(eqe->event.qp.qpn)
  430. & 0xffffff, &slave);
  431. if (ret && ret != -ENOENT) {
  432. mlx4_dbg(dev, "QP event %02x(%02x) on EQ %d at index %u: could not get slave id (%d)\n",
  433. eqe->type, eqe->subtype,
  434. eq->eqn, eq->cons_index, ret);
  435. break;
  436. }
  437. if (!ret && slave != dev->caps.function) {
  438. mlx4_slave_event(dev, slave, eqe);
  439. break;
  440. }
  441. }
  442. mlx4_qp_event(dev, be32_to_cpu(eqe->event.qp.qpn) &
  443. 0xffffff, eqe->type);
  444. break;
  445. case MLX4_EVENT_TYPE_SRQ_LIMIT:
  446. mlx4_dbg(dev, "%s: MLX4_EVENT_TYPE_SRQ_LIMIT\n",
  447. __func__);
  448. case MLX4_EVENT_TYPE_SRQ_CATAS_ERROR:
  449. if (mlx4_is_master(dev)) {
  450. /* forward only to slave owning the SRQ */
  451. ret = mlx4_get_slave_from_resource_id(dev,
  452. RES_SRQ,
  453. be32_to_cpu(eqe->event.srq.srqn)
  454. & 0xffffff,
  455. &slave);
  456. if (ret && ret != -ENOENT) {
  457. mlx4_warn(dev, "SRQ event %02x(%02x) on EQ %d at index %u: could not get slave id (%d)\n",
  458. eqe->type, eqe->subtype,
  459. eq->eqn, eq->cons_index, ret);
  460. break;
  461. }
  462. mlx4_warn(dev, "%s: slave:%d, srq_no:0x%x, event: %02x(%02x)\n",
  463. __func__, slave,
  464. be32_to_cpu(eqe->event.srq.srqn),
  465. eqe->type, eqe->subtype);
  466. if (!ret && slave != dev->caps.function) {
  467. mlx4_warn(dev, "%s: sending event %02x(%02x) to slave:%d\n",
  468. __func__, eqe->type,
  469. eqe->subtype, slave);
  470. mlx4_slave_event(dev, slave, eqe);
  471. break;
  472. }
  473. }
  474. mlx4_srq_event(dev, be32_to_cpu(eqe->event.srq.srqn) &
  475. 0xffffff, eqe->type);
  476. break;
  477. case MLX4_EVENT_TYPE_CMD:
  478. mlx4_cmd_event(dev,
  479. be16_to_cpu(eqe->event.cmd.token),
  480. eqe->event.cmd.status,
  481. be64_to_cpu(eqe->event.cmd.out_param));
  482. break;
  483. case MLX4_EVENT_TYPE_PORT_CHANGE: {
  484. struct mlx4_slaves_pport slaves_port;
  485. port = be32_to_cpu(eqe->event.port_change.port) >> 28;
  486. slaves_port = mlx4_phys_to_slaves_pport(dev, port);
  487. if (eqe->subtype == MLX4_PORT_CHANGE_SUBTYPE_DOWN) {
  488. mlx4_dispatch_event(dev, MLX4_DEV_EVENT_PORT_DOWN,
  489. port);
  490. mlx4_priv(dev)->sense.do_sense_port[port] = 1;
  491. if (!mlx4_is_master(dev))
  492. break;
  493. for (i = 0; i < dev->num_vfs + 1; i++) {
  494. if (!test_bit(i, slaves_port.slaves))
  495. continue;
  496. if (dev->caps.port_type[port] == MLX4_PORT_TYPE_ETH) {
  497. if (i == mlx4_master_func_num(dev))
  498. continue;
  499. mlx4_dbg(dev, "%s: Sending MLX4_PORT_CHANGE_SUBTYPE_DOWN to slave: %d, port:%d\n",
  500. __func__, i, port);
  501. s_info = &priv->mfunc.master.vf_oper[slave].vport[port].state;
  502. if (IFLA_VF_LINK_STATE_AUTO == s_info->link_state) {
  503. eqe->event.port_change.port =
  504. cpu_to_be32(
  505. (be32_to_cpu(eqe->event.port_change.port) & 0xFFFFFFF)
  506. | (mlx4_phys_to_slave_port(dev, i, port) << 28));
  507. mlx4_slave_event(dev, i, eqe);
  508. }
  509. } else { /* IB port */
  510. set_and_calc_slave_port_state(dev, i, port,
  511. MLX4_PORT_STATE_DEV_EVENT_PORT_DOWN,
  512. &gen_event);
  513. /*we can be in pending state, then do not send port_down event*/
  514. if (SLAVE_PORT_GEN_EVENT_DOWN == gen_event) {
  515. if (i == mlx4_master_func_num(dev))
  516. continue;
  517. mlx4_slave_event(dev, i, eqe);
  518. }
  519. }
  520. }
  521. } else {
  522. mlx4_dispatch_event(dev, MLX4_DEV_EVENT_PORT_UP, port);
  523. mlx4_priv(dev)->sense.do_sense_port[port] = 0;
  524. if (!mlx4_is_master(dev))
  525. break;
  526. if (dev->caps.port_type[port] == MLX4_PORT_TYPE_ETH)
  527. for (i = 0; i < dev->num_vfs + 1; i++) {
  528. if (!test_bit(i, slaves_port.slaves))
  529. continue;
  530. if (i == mlx4_master_func_num(dev))
  531. continue;
  532. s_info = &priv->mfunc.master.vf_oper[slave].vport[port].state;
  533. if (IFLA_VF_LINK_STATE_AUTO == s_info->link_state) {
  534. eqe->event.port_change.port =
  535. cpu_to_be32(
  536. (be32_to_cpu(eqe->event.port_change.port) & 0xFFFFFFF)
  537. | (mlx4_phys_to_slave_port(dev, i, port) << 28));
  538. mlx4_slave_event(dev, i, eqe);
  539. }
  540. }
  541. else /* IB port */
  542. /* port-up event will be sent to a slave when the
  543. * slave's alias-guid is set. This is done in alias_GUID.c
  544. */
  545. set_all_slave_state(dev, port, MLX4_DEV_EVENT_PORT_UP);
  546. }
  547. break;
  548. }
  549. case MLX4_EVENT_TYPE_CQ_ERROR:
  550. mlx4_warn(dev, "CQ %s on CQN %06x\n",
  551. eqe->event.cq_err.syndrome == 1 ?
  552. "overrun" : "access violation",
  553. be32_to_cpu(eqe->event.cq_err.cqn) & 0xffffff);
  554. if (mlx4_is_master(dev)) {
  555. ret = mlx4_get_slave_from_resource_id(dev,
  556. RES_CQ,
  557. be32_to_cpu(eqe->event.cq_err.cqn)
  558. & 0xffffff, &slave);
  559. if (ret && ret != -ENOENT) {
  560. mlx4_dbg(dev, "CQ event %02x(%02x) on EQ %d at index %u: could not get slave id (%d)\n",
  561. eqe->type, eqe->subtype,
  562. eq->eqn, eq->cons_index, ret);
  563. break;
  564. }
  565. if (!ret && slave != dev->caps.function) {
  566. mlx4_slave_event(dev, slave, eqe);
  567. break;
  568. }
  569. }
  570. mlx4_cq_event(dev,
  571. be32_to_cpu(eqe->event.cq_err.cqn)
  572. & 0xffffff,
  573. eqe->type);
  574. break;
  575. case MLX4_EVENT_TYPE_EQ_OVERFLOW:
  576. mlx4_warn(dev, "EQ overrun on EQN %d\n", eq->eqn);
  577. break;
  578. case MLX4_EVENT_TYPE_OP_REQUIRED:
  579. atomic_inc(&priv->opreq_count);
  580. /* FW commands can't be executed from interrupt context
  581. * working in deferred task
  582. */
  583. queue_work(mlx4_wq, &priv->opreq_task);
  584. break;
  585. case MLX4_EVENT_TYPE_COMM_CHANNEL:
  586. if (!mlx4_is_master(dev)) {
  587. mlx4_warn(dev, "Received comm channel event for non master device\n");
  588. break;
  589. }
  590. memcpy(&priv->mfunc.master.comm_arm_bit_vector,
  591. eqe->event.comm_channel_arm.bit_vec,
  592. sizeof eqe->event.comm_channel_arm.bit_vec);
  593. queue_work(priv->mfunc.master.comm_wq,
  594. &priv->mfunc.master.comm_work);
  595. break;
  596. case MLX4_EVENT_TYPE_FLR_EVENT:
  597. flr_slave = be32_to_cpu(eqe->event.flr_event.slave_id);
  598. if (!mlx4_is_master(dev)) {
  599. mlx4_warn(dev, "Non-master function received FLR event\n");
  600. break;
  601. }
  602. mlx4_dbg(dev, "FLR event for slave: %d\n", flr_slave);
  603. if (flr_slave >= dev->num_slaves) {
  604. mlx4_warn(dev,
  605. "Got FLR for unknown function: %d\n",
  606. flr_slave);
  607. update_slave_state = 0;
  608. } else
  609. update_slave_state = 1;
  610. spin_lock_irqsave(&priv->mfunc.master.slave_state_lock, flags);
  611. if (update_slave_state) {
  612. priv->mfunc.master.slave_state[flr_slave].active = false;
  613. priv->mfunc.master.slave_state[flr_slave].last_cmd = MLX4_COMM_CMD_FLR;
  614. priv->mfunc.master.slave_state[flr_slave].is_slave_going_down = 1;
  615. }
  616. spin_unlock_irqrestore(&priv->mfunc.master.slave_state_lock, flags);
  617. queue_work(priv->mfunc.master.comm_wq,
  618. &priv->mfunc.master.slave_flr_event_work);
  619. break;
  620. case MLX4_EVENT_TYPE_FATAL_WARNING:
  621. if (eqe->subtype == MLX4_FATAL_WARNING_SUBTYPE_WARMING) {
  622. if (mlx4_is_master(dev))
  623. for (i = 0; i < dev->num_slaves; i++) {
  624. mlx4_dbg(dev, "%s: Sending MLX4_FATAL_WARNING_SUBTYPE_WARMING to slave: %d\n",
  625. __func__, i);
  626. if (i == dev->caps.function)
  627. continue;
  628. mlx4_slave_event(dev, i, eqe);
  629. }
  630. mlx4_err(dev, "Temperature Threshold was reached! Threshold: %d celsius degrees; Current Temperature: %d\n",
  631. be16_to_cpu(eqe->event.warming.warning_threshold),
  632. be16_to_cpu(eqe->event.warming.current_temperature));
  633. } else
  634. mlx4_warn(dev, "Unhandled event FATAL WARNING (%02x), subtype %02x on EQ %d at index %u. owner=%x, nent=0x%x, slave=%x, ownership=%s\n",
  635. eqe->type, eqe->subtype, eq->eqn,
  636. eq->cons_index, eqe->owner, eq->nent,
  637. eqe->slave_id,
  638. !!(eqe->owner & 0x80) ^
  639. !!(eq->cons_index & eq->nent) ? "HW" : "SW");
  640. break;
  641. case MLX4_EVENT_TYPE_PORT_MNG_CHG_EVENT:
  642. mlx4_dispatch_event(dev, MLX4_DEV_EVENT_PORT_MGMT_CHANGE,
  643. (unsigned long) eqe);
  644. break;
  645. case MLX4_EVENT_TYPE_EEC_CATAS_ERROR:
  646. case MLX4_EVENT_TYPE_ECC_DETECT:
  647. default:
  648. mlx4_warn(dev, "Unhandled event %02x(%02x) on EQ %d at index %u. owner=%x, nent=0x%x, slave=%x, ownership=%s\n",
  649. eqe->type, eqe->subtype, eq->eqn,
  650. eq->cons_index, eqe->owner, eq->nent,
  651. eqe->slave_id,
  652. !!(eqe->owner & 0x80) ^
  653. !!(eq->cons_index & eq->nent) ? "HW" : "SW");
  654. break;
  655. };
  656. ++eq->cons_index;
  657. eqes_found = 1;
  658. ++set_ci;
  659. /*
  660. * The HCA will think the queue has overflowed if we
  661. * don't tell it we've been processing events. We
  662. * create our EQs with MLX4_NUM_SPARE_EQE extra
  663. * entries, so we must update our consumer index at
  664. * least that often.
  665. */
  666. if (unlikely(set_ci >= MLX4_NUM_SPARE_EQE)) {
  667. eq_set_ci(eq, 0);
  668. set_ci = 0;
  669. }
  670. }
  671. eq_set_ci(eq, 1);
  672. /* cqn is 24bit wide but is initialized such that its higher bits
  673. * are ones too. Thus, if we got any event, cqn's high bits should be off
  674. * and we need to schedule the tasklet.
  675. */
  676. if (!(cqn & ~0xffffff))
  677. tasklet_schedule(&eq->tasklet_ctx.task);
  678. return eqes_found;
  679. }
  680. static irqreturn_t mlx4_interrupt(int irq, void *dev_ptr)
  681. {
  682. struct mlx4_dev *dev = dev_ptr;
  683. struct mlx4_priv *priv = mlx4_priv(dev);
  684. int work = 0;
  685. int i;
  686. writel(priv->eq_table.clr_mask, priv->eq_table.clr_int);
  687. for (i = 0; i < dev->caps.num_comp_vectors + 1; ++i)
  688. work |= mlx4_eq_int(dev, &priv->eq_table.eq[i]);
  689. return IRQ_RETVAL(work);
  690. }
  691. static irqreturn_t mlx4_msi_x_interrupt(int irq, void *eq_ptr)
  692. {
  693. struct mlx4_eq *eq = eq_ptr;
  694. struct mlx4_dev *dev = eq->dev;
  695. mlx4_eq_int(dev, eq);
  696. /* MSI-X vectors always belong to us */
  697. return IRQ_HANDLED;
  698. }
  699. int mlx4_MAP_EQ_wrapper(struct mlx4_dev *dev, int slave,
  700. struct mlx4_vhcr *vhcr,
  701. struct mlx4_cmd_mailbox *inbox,
  702. struct mlx4_cmd_mailbox *outbox,
  703. struct mlx4_cmd_info *cmd)
  704. {
  705. struct mlx4_priv *priv = mlx4_priv(dev);
  706. struct mlx4_slave_event_eq_info *event_eq =
  707. priv->mfunc.master.slave_state[slave].event_eq;
  708. u32 in_modifier = vhcr->in_modifier;
  709. u32 eqn = in_modifier & 0x3FF;
  710. u64 in_param = vhcr->in_param;
  711. int err = 0;
  712. int i;
  713. if (slave == dev->caps.function)
  714. err = mlx4_cmd(dev, in_param, (in_modifier & 0x80000000) | eqn,
  715. 0, MLX4_CMD_MAP_EQ, MLX4_CMD_TIME_CLASS_B,
  716. MLX4_CMD_NATIVE);
  717. if (!err)
  718. for (i = 0; i < MLX4_EVENT_TYPES_NUM; ++i)
  719. if (in_param & (1LL << i))
  720. event_eq[i].eqn = in_modifier >> 31 ? -1 : eqn;
  721. return err;
  722. }
  723. static int mlx4_MAP_EQ(struct mlx4_dev *dev, u64 event_mask, int unmap,
  724. int eq_num)
  725. {
  726. return mlx4_cmd(dev, event_mask, (unmap << 31) | eq_num,
  727. 0, MLX4_CMD_MAP_EQ, MLX4_CMD_TIME_CLASS_B,
  728. MLX4_CMD_WRAPPED);
  729. }
  730. static int mlx4_SW2HW_EQ(struct mlx4_dev *dev, struct mlx4_cmd_mailbox *mailbox,
  731. int eq_num)
  732. {
  733. return mlx4_cmd(dev, mailbox->dma, eq_num, 0,
  734. MLX4_CMD_SW2HW_EQ, MLX4_CMD_TIME_CLASS_A,
  735. MLX4_CMD_WRAPPED);
  736. }
  737. static int mlx4_HW2SW_EQ(struct mlx4_dev *dev, struct mlx4_cmd_mailbox *mailbox,
  738. int eq_num)
  739. {
  740. return mlx4_cmd_box(dev, 0, mailbox->dma, eq_num,
  741. 0, MLX4_CMD_HW2SW_EQ, MLX4_CMD_TIME_CLASS_A,
  742. MLX4_CMD_WRAPPED);
  743. }
  744. static int mlx4_num_eq_uar(struct mlx4_dev *dev)
  745. {
  746. /*
  747. * Each UAR holds 4 EQ doorbells. To figure out how many UARs
  748. * we need to map, take the difference of highest index and
  749. * the lowest index we'll use and add 1.
  750. */
  751. return (dev->caps.num_comp_vectors + 1 + dev->caps.reserved_eqs +
  752. dev->caps.comp_pool)/4 - dev->caps.reserved_eqs/4 + 1;
  753. }
  754. static void __iomem *mlx4_get_eq_uar(struct mlx4_dev *dev, struct mlx4_eq *eq)
  755. {
  756. struct mlx4_priv *priv = mlx4_priv(dev);
  757. int index;
  758. index = eq->eqn / 4 - dev->caps.reserved_eqs / 4;
  759. if (!priv->eq_table.uar_map[index]) {
  760. priv->eq_table.uar_map[index] =
  761. ioremap(pci_resource_start(dev->pdev, 2) +
  762. ((eq->eqn / 4) << PAGE_SHIFT),
  763. PAGE_SIZE);
  764. if (!priv->eq_table.uar_map[index]) {
  765. mlx4_err(dev, "Couldn't map EQ doorbell for EQN 0x%06x\n",
  766. eq->eqn);
  767. return NULL;
  768. }
  769. }
  770. return priv->eq_table.uar_map[index] + 0x800 + 8 * (eq->eqn % 4);
  771. }
  772. static void mlx4_unmap_uar(struct mlx4_dev *dev)
  773. {
  774. struct mlx4_priv *priv = mlx4_priv(dev);
  775. int i;
  776. for (i = 0; i < mlx4_num_eq_uar(dev); ++i)
  777. if (priv->eq_table.uar_map[i]) {
  778. iounmap(priv->eq_table.uar_map[i]);
  779. priv->eq_table.uar_map[i] = NULL;
  780. }
  781. }
  782. static int mlx4_create_eq(struct mlx4_dev *dev, int nent,
  783. u8 intr, struct mlx4_eq *eq)
  784. {
  785. struct mlx4_priv *priv = mlx4_priv(dev);
  786. struct mlx4_cmd_mailbox *mailbox;
  787. struct mlx4_eq_context *eq_context;
  788. int npages;
  789. u64 *dma_list = NULL;
  790. dma_addr_t t;
  791. u64 mtt_addr;
  792. int err = -ENOMEM;
  793. int i;
  794. eq->dev = dev;
  795. eq->nent = roundup_pow_of_two(max(nent, 2));
  796. /* CX3 is capable of extending the CQE/EQE from 32 to 64 bytes, with
  797. * strides of 64B,128B and 256B.
  798. */
  799. npages = PAGE_ALIGN(eq->nent * dev->caps.eqe_size) / PAGE_SIZE;
  800. eq->page_list = kmalloc(npages * sizeof *eq->page_list,
  801. GFP_KERNEL);
  802. if (!eq->page_list)
  803. goto err_out;
  804. for (i = 0; i < npages; ++i)
  805. eq->page_list[i].buf = NULL;
  806. dma_list = kmalloc(npages * sizeof *dma_list, GFP_KERNEL);
  807. if (!dma_list)
  808. goto err_out_free;
  809. mailbox = mlx4_alloc_cmd_mailbox(dev);
  810. if (IS_ERR(mailbox))
  811. goto err_out_free;
  812. eq_context = mailbox->buf;
  813. for (i = 0; i < npages; ++i) {
  814. eq->page_list[i].buf = dma_alloc_coherent(&dev->pdev->dev,
  815. PAGE_SIZE, &t, GFP_KERNEL);
  816. if (!eq->page_list[i].buf)
  817. goto err_out_free_pages;
  818. dma_list[i] = t;
  819. eq->page_list[i].map = t;
  820. memset(eq->page_list[i].buf, 0, PAGE_SIZE);
  821. }
  822. eq->eqn = mlx4_bitmap_alloc(&priv->eq_table.bitmap);
  823. if (eq->eqn == -1)
  824. goto err_out_free_pages;
  825. eq->doorbell = mlx4_get_eq_uar(dev, eq);
  826. if (!eq->doorbell) {
  827. err = -ENOMEM;
  828. goto err_out_free_eq;
  829. }
  830. err = mlx4_mtt_init(dev, npages, PAGE_SHIFT, &eq->mtt);
  831. if (err)
  832. goto err_out_free_eq;
  833. err = mlx4_write_mtt(dev, &eq->mtt, 0, npages, dma_list);
  834. if (err)
  835. goto err_out_free_mtt;
  836. eq_context->flags = cpu_to_be32(MLX4_EQ_STATUS_OK |
  837. MLX4_EQ_STATE_ARMED);
  838. eq_context->log_eq_size = ilog2(eq->nent);
  839. eq_context->intr = intr;
  840. eq_context->log_page_size = PAGE_SHIFT - MLX4_ICM_PAGE_SHIFT;
  841. mtt_addr = mlx4_mtt_addr(dev, &eq->mtt);
  842. eq_context->mtt_base_addr_h = mtt_addr >> 32;
  843. eq_context->mtt_base_addr_l = cpu_to_be32(mtt_addr & 0xffffffff);
  844. err = mlx4_SW2HW_EQ(dev, mailbox, eq->eqn);
  845. if (err) {
  846. mlx4_warn(dev, "SW2HW_EQ failed (%d)\n", err);
  847. goto err_out_free_mtt;
  848. }
  849. kfree(dma_list);
  850. mlx4_free_cmd_mailbox(dev, mailbox);
  851. eq->cons_index = 0;
  852. INIT_LIST_HEAD(&eq->tasklet_ctx.list);
  853. INIT_LIST_HEAD(&eq->tasklet_ctx.process_list);
  854. spin_lock_init(&eq->tasklet_ctx.lock);
  855. tasklet_init(&eq->tasklet_ctx.task, mlx4_cq_tasklet_cb,
  856. (unsigned long)&eq->tasklet_ctx);
  857. return err;
  858. err_out_free_mtt:
  859. mlx4_mtt_cleanup(dev, &eq->mtt);
  860. err_out_free_eq:
  861. mlx4_bitmap_free(&priv->eq_table.bitmap, eq->eqn, MLX4_USE_RR);
  862. err_out_free_pages:
  863. for (i = 0; i < npages; ++i)
  864. if (eq->page_list[i].buf)
  865. dma_free_coherent(&dev->pdev->dev, PAGE_SIZE,
  866. eq->page_list[i].buf,
  867. eq->page_list[i].map);
  868. mlx4_free_cmd_mailbox(dev, mailbox);
  869. err_out_free:
  870. kfree(eq->page_list);
  871. kfree(dma_list);
  872. err_out:
  873. return err;
  874. }
  875. static void mlx4_free_eq(struct mlx4_dev *dev,
  876. struct mlx4_eq *eq)
  877. {
  878. struct mlx4_priv *priv = mlx4_priv(dev);
  879. struct mlx4_cmd_mailbox *mailbox;
  880. int err;
  881. int i;
  882. /* CX3 is capable of extending the CQE/EQE from 32 to 64 bytes, with
  883. * strides of 64B,128B and 256B
  884. */
  885. int npages = PAGE_ALIGN(dev->caps.eqe_size * eq->nent) / PAGE_SIZE;
  886. mailbox = mlx4_alloc_cmd_mailbox(dev);
  887. if (IS_ERR(mailbox))
  888. return;
  889. err = mlx4_HW2SW_EQ(dev, mailbox, eq->eqn);
  890. if (err)
  891. mlx4_warn(dev, "HW2SW_EQ failed (%d)\n", err);
  892. if (0) {
  893. mlx4_dbg(dev, "Dumping EQ context %02x:\n", eq->eqn);
  894. for (i = 0; i < sizeof (struct mlx4_eq_context) / 4; ++i) {
  895. if (i % 4 == 0)
  896. pr_cont("[%02x] ", i * 4);
  897. pr_cont(" %08x", be32_to_cpup(mailbox->buf + i * 4));
  898. if ((i + 1) % 4 == 0)
  899. pr_cont("\n");
  900. }
  901. }
  902. synchronize_irq(eq->irq);
  903. tasklet_disable(&eq->tasklet_ctx.task);
  904. mlx4_mtt_cleanup(dev, &eq->mtt);
  905. for (i = 0; i < npages; ++i)
  906. dma_free_coherent(&dev->pdev->dev, PAGE_SIZE,
  907. eq->page_list[i].buf,
  908. eq->page_list[i].map);
  909. kfree(eq->page_list);
  910. mlx4_bitmap_free(&priv->eq_table.bitmap, eq->eqn, MLX4_USE_RR);
  911. mlx4_free_cmd_mailbox(dev, mailbox);
  912. }
  913. static void mlx4_free_irqs(struct mlx4_dev *dev)
  914. {
  915. struct mlx4_eq_table *eq_table = &mlx4_priv(dev)->eq_table;
  916. struct mlx4_priv *priv = mlx4_priv(dev);
  917. int i, vec;
  918. if (eq_table->have_irq)
  919. free_irq(dev->pdev->irq, dev);
  920. for (i = 0; i < dev->caps.num_comp_vectors + 1; ++i)
  921. if (eq_table->eq[i].have_irq) {
  922. free_irq(eq_table->eq[i].irq, eq_table->eq + i);
  923. eq_table->eq[i].have_irq = 0;
  924. }
  925. for (i = 0; i < dev->caps.comp_pool; i++) {
  926. /*
  927. * Freeing the assigned irq's
  928. * all bits should be 0, but we need to validate
  929. */
  930. if (priv->msix_ctl.pool_bm & 1ULL << i) {
  931. /* NO need protecting*/
  932. vec = dev->caps.num_comp_vectors + 1 + i;
  933. free_irq(priv->eq_table.eq[vec].irq,
  934. &priv->eq_table.eq[vec]);
  935. }
  936. }
  937. kfree(eq_table->irq_names);
  938. }
  939. static int mlx4_map_clr_int(struct mlx4_dev *dev)
  940. {
  941. struct mlx4_priv *priv = mlx4_priv(dev);
  942. priv->clr_base = ioremap(pci_resource_start(dev->pdev, priv->fw.clr_int_bar) +
  943. priv->fw.clr_int_base, MLX4_CLR_INT_SIZE);
  944. if (!priv->clr_base) {
  945. mlx4_err(dev, "Couldn't map interrupt clear register, aborting\n");
  946. return -ENOMEM;
  947. }
  948. return 0;
  949. }
  950. static void mlx4_unmap_clr_int(struct mlx4_dev *dev)
  951. {
  952. struct mlx4_priv *priv = mlx4_priv(dev);
  953. iounmap(priv->clr_base);
  954. }
  955. int mlx4_alloc_eq_table(struct mlx4_dev *dev)
  956. {
  957. struct mlx4_priv *priv = mlx4_priv(dev);
  958. priv->eq_table.eq = kcalloc(dev->caps.num_eqs - dev->caps.reserved_eqs,
  959. sizeof *priv->eq_table.eq, GFP_KERNEL);
  960. if (!priv->eq_table.eq)
  961. return -ENOMEM;
  962. return 0;
  963. }
  964. void mlx4_free_eq_table(struct mlx4_dev *dev)
  965. {
  966. kfree(mlx4_priv(dev)->eq_table.eq);
  967. }
  968. int mlx4_init_eq_table(struct mlx4_dev *dev)
  969. {
  970. struct mlx4_priv *priv = mlx4_priv(dev);
  971. int err;
  972. int i;
  973. priv->eq_table.uar_map = kcalloc(mlx4_num_eq_uar(dev),
  974. sizeof *priv->eq_table.uar_map,
  975. GFP_KERNEL);
  976. if (!priv->eq_table.uar_map) {
  977. err = -ENOMEM;
  978. goto err_out_free;
  979. }
  980. err = mlx4_bitmap_init(&priv->eq_table.bitmap,
  981. roundup_pow_of_two(dev->caps.num_eqs),
  982. dev->caps.num_eqs - 1,
  983. dev->caps.reserved_eqs,
  984. roundup_pow_of_two(dev->caps.num_eqs) -
  985. dev->caps.num_eqs);
  986. if (err)
  987. goto err_out_free;
  988. for (i = 0; i < mlx4_num_eq_uar(dev); ++i)
  989. priv->eq_table.uar_map[i] = NULL;
  990. if (!mlx4_is_slave(dev)) {
  991. err = mlx4_map_clr_int(dev);
  992. if (err)
  993. goto err_out_bitmap;
  994. priv->eq_table.clr_mask =
  995. swab32(1 << (priv->eq_table.inta_pin & 31));
  996. priv->eq_table.clr_int = priv->clr_base +
  997. (priv->eq_table.inta_pin < 32 ? 4 : 0);
  998. }
  999. priv->eq_table.irq_names =
  1000. kmalloc(MLX4_IRQNAME_SIZE * (dev->caps.num_comp_vectors + 1 +
  1001. dev->caps.comp_pool),
  1002. GFP_KERNEL);
  1003. if (!priv->eq_table.irq_names) {
  1004. err = -ENOMEM;
  1005. goto err_out_bitmap;
  1006. }
  1007. for (i = 0; i < dev->caps.num_comp_vectors; ++i) {
  1008. err = mlx4_create_eq(dev, dev->caps.num_cqs -
  1009. dev->caps.reserved_cqs +
  1010. MLX4_NUM_SPARE_EQE,
  1011. (dev->flags & MLX4_FLAG_MSI_X) ? i : 0,
  1012. &priv->eq_table.eq[i]);
  1013. if (err) {
  1014. --i;
  1015. goto err_out_unmap;
  1016. }
  1017. }
  1018. err = mlx4_create_eq(dev, MLX4_NUM_ASYNC_EQE + MLX4_NUM_SPARE_EQE,
  1019. (dev->flags & MLX4_FLAG_MSI_X) ? dev->caps.num_comp_vectors : 0,
  1020. &priv->eq_table.eq[dev->caps.num_comp_vectors]);
  1021. if (err)
  1022. goto err_out_comp;
  1023. /*if additional completion vectors poolsize is 0 this loop will not run*/
  1024. for (i = dev->caps.num_comp_vectors + 1;
  1025. i < dev->caps.num_comp_vectors + dev->caps.comp_pool + 1; ++i) {
  1026. err = mlx4_create_eq(dev, dev->caps.num_cqs -
  1027. dev->caps.reserved_cqs +
  1028. MLX4_NUM_SPARE_EQE,
  1029. (dev->flags & MLX4_FLAG_MSI_X) ? i : 0,
  1030. &priv->eq_table.eq[i]);
  1031. if (err) {
  1032. --i;
  1033. goto err_out_unmap;
  1034. }
  1035. }
  1036. if (dev->flags & MLX4_FLAG_MSI_X) {
  1037. const char *eq_name;
  1038. for (i = 0; i < dev->caps.num_comp_vectors + 1; ++i) {
  1039. if (i < dev->caps.num_comp_vectors) {
  1040. snprintf(priv->eq_table.irq_names +
  1041. i * MLX4_IRQNAME_SIZE,
  1042. MLX4_IRQNAME_SIZE,
  1043. "mlx4-comp-%d@pci:%s", i,
  1044. pci_name(dev->pdev));
  1045. } else {
  1046. snprintf(priv->eq_table.irq_names +
  1047. i * MLX4_IRQNAME_SIZE,
  1048. MLX4_IRQNAME_SIZE,
  1049. "mlx4-async@pci:%s",
  1050. pci_name(dev->pdev));
  1051. }
  1052. eq_name = priv->eq_table.irq_names +
  1053. i * MLX4_IRQNAME_SIZE;
  1054. err = request_irq(priv->eq_table.eq[i].irq,
  1055. mlx4_msi_x_interrupt, 0, eq_name,
  1056. priv->eq_table.eq + i);
  1057. if (err)
  1058. goto err_out_async;
  1059. priv->eq_table.eq[i].have_irq = 1;
  1060. }
  1061. } else {
  1062. snprintf(priv->eq_table.irq_names,
  1063. MLX4_IRQNAME_SIZE,
  1064. DRV_NAME "@pci:%s",
  1065. pci_name(dev->pdev));
  1066. err = request_irq(dev->pdev->irq, mlx4_interrupt,
  1067. IRQF_SHARED, priv->eq_table.irq_names, dev);
  1068. if (err)
  1069. goto err_out_async;
  1070. priv->eq_table.have_irq = 1;
  1071. }
  1072. err = mlx4_MAP_EQ(dev, get_async_ev_mask(dev), 0,
  1073. priv->eq_table.eq[dev->caps.num_comp_vectors].eqn);
  1074. if (err)
  1075. mlx4_warn(dev, "MAP_EQ for async EQ %d failed (%d)\n",
  1076. priv->eq_table.eq[dev->caps.num_comp_vectors].eqn, err);
  1077. for (i = 0; i < dev->caps.num_comp_vectors + 1; ++i)
  1078. eq_set_ci(&priv->eq_table.eq[i], 1);
  1079. return 0;
  1080. err_out_async:
  1081. mlx4_free_eq(dev, &priv->eq_table.eq[dev->caps.num_comp_vectors]);
  1082. err_out_comp:
  1083. i = dev->caps.num_comp_vectors - 1;
  1084. err_out_unmap:
  1085. while (i >= 0) {
  1086. mlx4_free_eq(dev, &priv->eq_table.eq[i]);
  1087. --i;
  1088. }
  1089. if (!mlx4_is_slave(dev))
  1090. mlx4_unmap_clr_int(dev);
  1091. mlx4_free_irqs(dev);
  1092. err_out_bitmap:
  1093. mlx4_unmap_uar(dev);
  1094. mlx4_bitmap_cleanup(&priv->eq_table.bitmap);
  1095. err_out_free:
  1096. kfree(priv->eq_table.uar_map);
  1097. return err;
  1098. }
  1099. void mlx4_cleanup_eq_table(struct mlx4_dev *dev)
  1100. {
  1101. struct mlx4_priv *priv = mlx4_priv(dev);
  1102. int i;
  1103. mlx4_MAP_EQ(dev, get_async_ev_mask(dev), 1,
  1104. priv->eq_table.eq[dev->caps.num_comp_vectors].eqn);
  1105. mlx4_free_irqs(dev);
  1106. for (i = 0; i < dev->caps.num_comp_vectors + dev->caps.comp_pool + 1; ++i)
  1107. mlx4_free_eq(dev, &priv->eq_table.eq[i]);
  1108. if (!mlx4_is_slave(dev))
  1109. mlx4_unmap_clr_int(dev);
  1110. mlx4_unmap_uar(dev);
  1111. mlx4_bitmap_cleanup(&priv->eq_table.bitmap);
  1112. kfree(priv->eq_table.uar_map);
  1113. }
  1114. /* A test that verifies that we can accept interrupts on all
  1115. * the irq vectors of the device.
  1116. * Interrupts are checked using the NOP command.
  1117. */
  1118. int mlx4_test_interrupts(struct mlx4_dev *dev)
  1119. {
  1120. struct mlx4_priv *priv = mlx4_priv(dev);
  1121. int i;
  1122. int err;
  1123. err = mlx4_NOP(dev);
  1124. /* When not in MSI_X, there is only one irq to check */
  1125. if (!(dev->flags & MLX4_FLAG_MSI_X) || mlx4_is_slave(dev))
  1126. return err;
  1127. /* A loop over all completion vectors, for each vector we will check
  1128. * whether it works by mapping command completions to that vector
  1129. * and performing a NOP command
  1130. */
  1131. for(i = 0; !err && (i < dev->caps.num_comp_vectors); ++i) {
  1132. /* Temporary use polling for command completions */
  1133. mlx4_cmd_use_polling(dev);
  1134. /* Map the new eq to handle all asynchronous events */
  1135. err = mlx4_MAP_EQ(dev, get_async_ev_mask(dev), 0,
  1136. priv->eq_table.eq[i].eqn);
  1137. if (err) {
  1138. mlx4_warn(dev, "Failed mapping eq for interrupt test\n");
  1139. mlx4_cmd_use_events(dev);
  1140. break;
  1141. }
  1142. /* Go back to using events */
  1143. mlx4_cmd_use_events(dev);
  1144. err = mlx4_NOP(dev);
  1145. }
  1146. /* Return to default */
  1147. mlx4_MAP_EQ(dev, get_async_ev_mask(dev), 0,
  1148. priv->eq_table.eq[dev->caps.num_comp_vectors].eqn);
  1149. return err;
  1150. }
  1151. EXPORT_SYMBOL(mlx4_test_interrupts);
  1152. int mlx4_assign_eq(struct mlx4_dev *dev, char *name, struct cpu_rmap *rmap,
  1153. int *vector)
  1154. {
  1155. struct mlx4_priv *priv = mlx4_priv(dev);
  1156. int vec = 0, err = 0, i;
  1157. mutex_lock(&priv->msix_ctl.pool_lock);
  1158. for (i = 0; !vec && i < dev->caps.comp_pool; i++) {
  1159. if (~priv->msix_ctl.pool_bm & 1ULL << i) {
  1160. priv->msix_ctl.pool_bm |= 1ULL << i;
  1161. vec = dev->caps.num_comp_vectors + 1 + i;
  1162. snprintf(priv->eq_table.irq_names +
  1163. vec * MLX4_IRQNAME_SIZE,
  1164. MLX4_IRQNAME_SIZE, "%s", name);
  1165. #ifdef CONFIG_RFS_ACCEL
  1166. if (rmap) {
  1167. err = irq_cpu_rmap_add(rmap,
  1168. priv->eq_table.eq[vec].irq);
  1169. if (err)
  1170. mlx4_warn(dev, "Failed adding irq rmap\n");
  1171. }
  1172. #endif
  1173. err = request_irq(priv->eq_table.eq[vec].irq,
  1174. mlx4_msi_x_interrupt, 0,
  1175. &priv->eq_table.irq_names[vec<<5],
  1176. priv->eq_table.eq + vec);
  1177. if (err) {
  1178. /*zero out bit by fliping it*/
  1179. priv->msix_ctl.pool_bm ^= 1 << i;
  1180. vec = 0;
  1181. continue;
  1182. /*we dont want to break here*/
  1183. }
  1184. eq_set_ci(&priv->eq_table.eq[vec], 1);
  1185. }
  1186. }
  1187. mutex_unlock(&priv->msix_ctl.pool_lock);
  1188. if (vec) {
  1189. *vector = vec;
  1190. } else {
  1191. *vector = 0;
  1192. err = (i == dev->caps.comp_pool) ? -ENOSPC : err;
  1193. }
  1194. return err;
  1195. }
  1196. EXPORT_SYMBOL(mlx4_assign_eq);
  1197. int mlx4_eq_get_irq(struct mlx4_dev *dev, int vec)
  1198. {
  1199. struct mlx4_priv *priv = mlx4_priv(dev);
  1200. return priv->eq_table.eq[vec].irq;
  1201. }
  1202. EXPORT_SYMBOL(mlx4_eq_get_irq);
  1203. void mlx4_release_eq(struct mlx4_dev *dev, int vec)
  1204. {
  1205. struct mlx4_priv *priv = mlx4_priv(dev);
  1206. /*bm index*/
  1207. int i = vec - dev->caps.num_comp_vectors - 1;
  1208. if (likely(i >= 0)) {
  1209. /*sanity check , making sure were not trying to free irq's
  1210. Belonging to a legacy EQ*/
  1211. mutex_lock(&priv->msix_ctl.pool_lock);
  1212. if (priv->msix_ctl.pool_bm & 1ULL << i) {
  1213. free_irq(priv->eq_table.eq[vec].irq,
  1214. &priv->eq_table.eq[vec]);
  1215. priv->msix_ctl.pool_bm &= ~(1ULL << i);
  1216. }
  1217. mutex_unlock(&priv->msix_ctl.pool_lock);
  1218. }
  1219. }
  1220. EXPORT_SYMBOL(mlx4_release_eq);