switchdev.c 35 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385
  1. /*
  2. * net/switchdev/switchdev.c - Switch device API
  3. * Copyright (c) 2014-2015 Jiri Pirko <jiri@resnulli.us>
  4. * Copyright (c) 2014-2015 Scott Feldman <sfeldma@gmail.com>
  5. *
  6. * This program is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU General Public License as published by
  8. * the Free Software Foundation; either version 2 of the License, or
  9. * (at your option) any later version.
  10. */
  11. #include <linux/kernel.h>
  12. #include <linux/types.h>
  13. #include <linux/init.h>
  14. #include <linux/mutex.h>
  15. #include <linux/notifier.h>
  16. #include <linux/netdevice.h>
  17. #include <linux/etherdevice.h>
  18. #include <linux/if_bridge.h>
  19. #include <linux/list.h>
  20. #include <linux/workqueue.h>
  21. #include <linux/if_vlan.h>
  22. #include <net/ip_fib.h>
  23. #include <net/switchdev.h>
  24. /**
  25. * switchdev_trans_item_enqueue - Enqueue data item to transaction queue
  26. *
  27. * @trans: transaction
  28. * @data: pointer to data being queued
  29. * @destructor: data destructor
  30. * @tritem: transaction item being queued
  31. *
  32. * Enqeueue data item to transaction queue. tritem is typically placed in
  33. * cointainter pointed at by data pointer. Destructor is called on
  34. * transaction abort and after successful commit phase in case
  35. * the caller did not dequeue the item before.
  36. */
  37. void switchdev_trans_item_enqueue(struct switchdev_trans *trans,
  38. void *data, void (*destructor)(void const *),
  39. struct switchdev_trans_item *tritem)
  40. {
  41. tritem->data = data;
  42. tritem->destructor = destructor;
  43. list_add_tail(&tritem->list, &trans->item_list);
  44. }
  45. EXPORT_SYMBOL_GPL(switchdev_trans_item_enqueue);
  46. static struct switchdev_trans_item *
  47. __switchdev_trans_item_dequeue(struct switchdev_trans *trans)
  48. {
  49. struct switchdev_trans_item *tritem;
  50. if (list_empty(&trans->item_list))
  51. return NULL;
  52. tritem = list_first_entry(&trans->item_list,
  53. struct switchdev_trans_item, list);
  54. list_del(&tritem->list);
  55. return tritem;
  56. }
  57. /**
  58. * switchdev_trans_item_dequeue - Dequeue data item from transaction queue
  59. *
  60. * @trans: transaction
  61. */
  62. void *switchdev_trans_item_dequeue(struct switchdev_trans *trans)
  63. {
  64. struct switchdev_trans_item *tritem;
  65. tritem = __switchdev_trans_item_dequeue(trans);
  66. BUG_ON(!tritem);
  67. return tritem->data;
  68. }
  69. EXPORT_SYMBOL_GPL(switchdev_trans_item_dequeue);
  70. static void switchdev_trans_init(struct switchdev_trans *trans)
  71. {
  72. INIT_LIST_HEAD(&trans->item_list);
  73. }
  74. static void switchdev_trans_items_destroy(struct switchdev_trans *trans)
  75. {
  76. struct switchdev_trans_item *tritem;
  77. while ((tritem = __switchdev_trans_item_dequeue(trans)))
  78. tritem->destructor(tritem->data);
  79. }
  80. static void switchdev_trans_items_warn_destroy(struct net_device *dev,
  81. struct switchdev_trans *trans)
  82. {
  83. WARN(!list_empty(&trans->item_list), "%s: transaction item queue is not empty.\n",
  84. dev->name);
  85. switchdev_trans_items_destroy(trans);
  86. }
  87. static LIST_HEAD(deferred);
  88. static DEFINE_SPINLOCK(deferred_lock);
  89. typedef void switchdev_deferred_func_t(struct net_device *dev,
  90. const void *data);
  91. struct switchdev_deferred_item {
  92. struct list_head list;
  93. struct net_device *dev;
  94. switchdev_deferred_func_t *func;
  95. unsigned long data[0];
  96. };
  97. static struct switchdev_deferred_item *switchdev_deferred_dequeue(void)
  98. {
  99. struct switchdev_deferred_item *dfitem;
  100. spin_lock_bh(&deferred_lock);
  101. if (list_empty(&deferred)) {
  102. dfitem = NULL;
  103. goto unlock;
  104. }
  105. dfitem = list_first_entry(&deferred,
  106. struct switchdev_deferred_item, list);
  107. list_del(&dfitem->list);
  108. unlock:
  109. spin_unlock_bh(&deferred_lock);
  110. return dfitem;
  111. }
  112. /**
  113. * switchdev_deferred_process - Process ops in deferred queue
  114. *
  115. * Called to flush the ops currently queued in deferred ops queue.
  116. * rtnl_lock must be held.
  117. */
  118. void switchdev_deferred_process(void)
  119. {
  120. struct switchdev_deferred_item *dfitem;
  121. ASSERT_RTNL();
  122. while ((dfitem = switchdev_deferred_dequeue())) {
  123. dfitem->func(dfitem->dev, dfitem->data);
  124. dev_put(dfitem->dev);
  125. kfree(dfitem);
  126. }
  127. }
  128. EXPORT_SYMBOL_GPL(switchdev_deferred_process);
  129. static void switchdev_deferred_process_work(struct work_struct *work)
  130. {
  131. rtnl_lock();
  132. switchdev_deferred_process();
  133. rtnl_unlock();
  134. }
  135. static DECLARE_WORK(deferred_process_work, switchdev_deferred_process_work);
  136. static int switchdev_deferred_enqueue(struct net_device *dev,
  137. const void *data, size_t data_len,
  138. switchdev_deferred_func_t *func)
  139. {
  140. struct switchdev_deferred_item *dfitem;
  141. dfitem = kmalloc(sizeof(*dfitem) + data_len, GFP_ATOMIC);
  142. if (!dfitem)
  143. return -ENOMEM;
  144. dfitem->dev = dev;
  145. dfitem->func = func;
  146. memcpy(dfitem->data, data, data_len);
  147. dev_hold(dev);
  148. spin_lock_bh(&deferred_lock);
  149. list_add_tail(&dfitem->list, &deferred);
  150. spin_unlock_bh(&deferred_lock);
  151. schedule_work(&deferred_process_work);
  152. return 0;
  153. }
  154. /**
  155. * switchdev_port_attr_get - Get port attribute
  156. *
  157. * @dev: port device
  158. * @attr: attribute to get
  159. */
  160. int switchdev_port_attr_get(struct net_device *dev, struct switchdev_attr *attr)
  161. {
  162. const struct switchdev_ops *ops = dev->switchdev_ops;
  163. struct net_device *lower_dev;
  164. struct list_head *iter;
  165. struct switchdev_attr first = {
  166. .id = SWITCHDEV_ATTR_ID_UNDEFINED
  167. };
  168. int err = -EOPNOTSUPP;
  169. if (ops && ops->switchdev_port_attr_get)
  170. return ops->switchdev_port_attr_get(dev, attr);
  171. if (attr->flags & SWITCHDEV_F_NO_RECURSE)
  172. return err;
  173. /* Switch device port(s) may be stacked under
  174. * bond/team/vlan dev, so recurse down to get attr on
  175. * each port. Return -ENODATA if attr values don't
  176. * compare across ports.
  177. */
  178. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  179. err = switchdev_port_attr_get(lower_dev, attr);
  180. if (err)
  181. break;
  182. if (first.id == SWITCHDEV_ATTR_ID_UNDEFINED)
  183. first = *attr;
  184. else if (memcmp(&first, attr, sizeof(*attr)))
  185. return -ENODATA;
  186. }
  187. return err;
  188. }
  189. EXPORT_SYMBOL_GPL(switchdev_port_attr_get);
  190. static int __switchdev_port_attr_set(struct net_device *dev,
  191. const struct switchdev_attr *attr,
  192. struct switchdev_trans *trans)
  193. {
  194. const struct switchdev_ops *ops = dev->switchdev_ops;
  195. struct net_device *lower_dev;
  196. struct list_head *iter;
  197. int err = -EOPNOTSUPP;
  198. if (ops && ops->switchdev_port_attr_set) {
  199. err = ops->switchdev_port_attr_set(dev, attr, trans);
  200. goto done;
  201. }
  202. if (attr->flags & SWITCHDEV_F_NO_RECURSE)
  203. goto done;
  204. /* Switch device port(s) may be stacked under
  205. * bond/team/vlan dev, so recurse down to set attr on
  206. * each port.
  207. */
  208. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  209. err = __switchdev_port_attr_set(lower_dev, attr, trans);
  210. if (err)
  211. break;
  212. }
  213. done:
  214. if (err == -EOPNOTSUPP && attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
  215. err = 0;
  216. return err;
  217. }
  218. static int switchdev_port_attr_set_now(struct net_device *dev,
  219. const struct switchdev_attr *attr)
  220. {
  221. struct switchdev_trans trans;
  222. int err;
  223. switchdev_trans_init(&trans);
  224. /* Phase I: prepare for attr set. Driver/device should fail
  225. * here if there are going to be issues in the commit phase,
  226. * such as lack of resources or support. The driver/device
  227. * should reserve resources needed for the commit phase here,
  228. * but should not commit the attr.
  229. */
  230. trans.ph_prepare = true;
  231. err = __switchdev_port_attr_set(dev, attr, &trans);
  232. if (err) {
  233. /* Prepare phase failed: abort the transaction. Any
  234. * resources reserved in the prepare phase are
  235. * released.
  236. */
  237. if (err != -EOPNOTSUPP)
  238. switchdev_trans_items_destroy(&trans);
  239. return err;
  240. }
  241. /* Phase II: commit attr set. This cannot fail as a fault
  242. * of driver/device. If it does, it's a bug in the driver/device
  243. * because the driver said everythings was OK in phase I.
  244. */
  245. trans.ph_prepare = false;
  246. err = __switchdev_port_attr_set(dev, attr, &trans);
  247. WARN(err, "%s: Commit of attribute (id=%d) failed.\n",
  248. dev->name, attr->id);
  249. switchdev_trans_items_warn_destroy(dev, &trans);
  250. return err;
  251. }
  252. static void switchdev_port_attr_set_deferred(struct net_device *dev,
  253. const void *data)
  254. {
  255. const struct switchdev_attr *attr = data;
  256. int err;
  257. err = switchdev_port_attr_set_now(dev, attr);
  258. if (err && err != -EOPNOTSUPP)
  259. netdev_err(dev, "failed (err=%d) to set attribute (id=%d)\n",
  260. err, attr->id);
  261. }
  262. static int switchdev_port_attr_set_defer(struct net_device *dev,
  263. const struct switchdev_attr *attr)
  264. {
  265. return switchdev_deferred_enqueue(dev, attr, sizeof(*attr),
  266. switchdev_port_attr_set_deferred);
  267. }
  268. /**
  269. * switchdev_port_attr_set - Set port attribute
  270. *
  271. * @dev: port device
  272. * @attr: attribute to set
  273. *
  274. * Use a 2-phase prepare-commit transaction model to ensure
  275. * system is not left in a partially updated state due to
  276. * failure from driver/device.
  277. *
  278. * rtnl_lock must be held and must not be in atomic section,
  279. * in case SWITCHDEV_F_DEFER flag is not set.
  280. */
  281. int switchdev_port_attr_set(struct net_device *dev,
  282. const struct switchdev_attr *attr)
  283. {
  284. if (attr->flags & SWITCHDEV_F_DEFER)
  285. return switchdev_port_attr_set_defer(dev, attr);
  286. ASSERT_RTNL();
  287. return switchdev_port_attr_set_now(dev, attr);
  288. }
  289. EXPORT_SYMBOL_GPL(switchdev_port_attr_set);
  290. static size_t switchdev_obj_size(const struct switchdev_obj *obj)
  291. {
  292. switch (obj->id) {
  293. case SWITCHDEV_OBJ_ID_PORT_VLAN:
  294. return sizeof(struct switchdev_obj_port_vlan);
  295. case SWITCHDEV_OBJ_ID_IPV4_FIB:
  296. return sizeof(struct switchdev_obj_ipv4_fib);
  297. case SWITCHDEV_OBJ_ID_PORT_FDB:
  298. return sizeof(struct switchdev_obj_port_fdb);
  299. case SWITCHDEV_OBJ_ID_PORT_MDB:
  300. return sizeof(struct switchdev_obj_port_mdb);
  301. default:
  302. BUG();
  303. }
  304. return 0;
  305. }
  306. static int __switchdev_port_obj_add(struct net_device *dev,
  307. const struct switchdev_obj *obj,
  308. struct switchdev_trans *trans)
  309. {
  310. const struct switchdev_ops *ops = dev->switchdev_ops;
  311. struct net_device *lower_dev;
  312. struct list_head *iter;
  313. int err = -EOPNOTSUPP;
  314. if (ops && ops->switchdev_port_obj_add)
  315. return ops->switchdev_port_obj_add(dev, obj, trans);
  316. /* Switch device port(s) may be stacked under
  317. * bond/team/vlan dev, so recurse down to add object on
  318. * each port.
  319. */
  320. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  321. err = __switchdev_port_obj_add(lower_dev, obj, trans);
  322. if (err)
  323. break;
  324. }
  325. return err;
  326. }
  327. static int switchdev_port_obj_add_now(struct net_device *dev,
  328. const struct switchdev_obj *obj)
  329. {
  330. struct switchdev_trans trans;
  331. int err;
  332. ASSERT_RTNL();
  333. switchdev_trans_init(&trans);
  334. /* Phase I: prepare for obj add. Driver/device should fail
  335. * here if there are going to be issues in the commit phase,
  336. * such as lack of resources or support. The driver/device
  337. * should reserve resources needed for the commit phase here,
  338. * but should not commit the obj.
  339. */
  340. trans.ph_prepare = true;
  341. err = __switchdev_port_obj_add(dev, obj, &trans);
  342. if (err) {
  343. /* Prepare phase failed: abort the transaction. Any
  344. * resources reserved in the prepare phase are
  345. * released.
  346. */
  347. if (err != -EOPNOTSUPP)
  348. switchdev_trans_items_destroy(&trans);
  349. return err;
  350. }
  351. /* Phase II: commit obj add. This cannot fail as a fault
  352. * of driver/device. If it does, it's a bug in the driver/device
  353. * because the driver said everythings was OK in phase I.
  354. */
  355. trans.ph_prepare = false;
  356. err = __switchdev_port_obj_add(dev, obj, &trans);
  357. WARN(err, "%s: Commit of object (id=%d) failed.\n", dev->name, obj->id);
  358. switchdev_trans_items_warn_destroy(dev, &trans);
  359. return err;
  360. }
  361. static void switchdev_port_obj_add_deferred(struct net_device *dev,
  362. const void *data)
  363. {
  364. const struct switchdev_obj *obj = data;
  365. int err;
  366. err = switchdev_port_obj_add_now(dev, obj);
  367. if (err && err != -EOPNOTSUPP)
  368. netdev_err(dev, "failed (err=%d) to add object (id=%d)\n",
  369. err, obj->id);
  370. }
  371. static int switchdev_port_obj_add_defer(struct net_device *dev,
  372. const struct switchdev_obj *obj)
  373. {
  374. return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
  375. switchdev_port_obj_add_deferred);
  376. }
  377. /**
  378. * switchdev_port_obj_add - Add port object
  379. *
  380. * @dev: port device
  381. * @id: object ID
  382. * @obj: object to add
  383. *
  384. * Use a 2-phase prepare-commit transaction model to ensure
  385. * system is not left in a partially updated state due to
  386. * failure from driver/device.
  387. *
  388. * rtnl_lock must be held and must not be in atomic section,
  389. * in case SWITCHDEV_F_DEFER flag is not set.
  390. */
  391. int switchdev_port_obj_add(struct net_device *dev,
  392. const struct switchdev_obj *obj)
  393. {
  394. if (obj->flags & SWITCHDEV_F_DEFER)
  395. return switchdev_port_obj_add_defer(dev, obj);
  396. ASSERT_RTNL();
  397. return switchdev_port_obj_add_now(dev, obj);
  398. }
  399. EXPORT_SYMBOL_GPL(switchdev_port_obj_add);
  400. static int switchdev_port_obj_del_now(struct net_device *dev,
  401. const struct switchdev_obj *obj)
  402. {
  403. const struct switchdev_ops *ops = dev->switchdev_ops;
  404. struct net_device *lower_dev;
  405. struct list_head *iter;
  406. int err = -EOPNOTSUPP;
  407. if (ops && ops->switchdev_port_obj_del)
  408. return ops->switchdev_port_obj_del(dev, obj);
  409. /* Switch device port(s) may be stacked under
  410. * bond/team/vlan dev, so recurse down to delete object on
  411. * each port.
  412. */
  413. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  414. err = switchdev_port_obj_del_now(lower_dev, obj);
  415. if (err)
  416. break;
  417. }
  418. return err;
  419. }
  420. static void switchdev_port_obj_del_deferred(struct net_device *dev,
  421. const void *data)
  422. {
  423. const struct switchdev_obj *obj = data;
  424. int err;
  425. err = switchdev_port_obj_del_now(dev, obj);
  426. if (err && err != -EOPNOTSUPP)
  427. netdev_err(dev, "failed (err=%d) to del object (id=%d)\n",
  428. err, obj->id);
  429. }
  430. static int switchdev_port_obj_del_defer(struct net_device *dev,
  431. const struct switchdev_obj *obj)
  432. {
  433. return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
  434. switchdev_port_obj_del_deferred);
  435. }
  436. /**
  437. * switchdev_port_obj_del - Delete port object
  438. *
  439. * @dev: port device
  440. * @id: object ID
  441. * @obj: object to delete
  442. *
  443. * rtnl_lock must be held and must not be in atomic section,
  444. * in case SWITCHDEV_F_DEFER flag is not set.
  445. */
  446. int switchdev_port_obj_del(struct net_device *dev,
  447. const struct switchdev_obj *obj)
  448. {
  449. if (obj->flags & SWITCHDEV_F_DEFER)
  450. return switchdev_port_obj_del_defer(dev, obj);
  451. ASSERT_RTNL();
  452. return switchdev_port_obj_del_now(dev, obj);
  453. }
  454. EXPORT_SYMBOL_GPL(switchdev_port_obj_del);
  455. /**
  456. * switchdev_port_obj_dump - Dump port objects
  457. *
  458. * @dev: port device
  459. * @id: object ID
  460. * @obj: object to dump
  461. * @cb: function to call with a filled object
  462. *
  463. * rtnl_lock must be held.
  464. */
  465. int switchdev_port_obj_dump(struct net_device *dev, struct switchdev_obj *obj,
  466. switchdev_obj_dump_cb_t *cb)
  467. {
  468. const struct switchdev_ops *ops = dev->switchdev_ops;
  469. struct net_device *lower_dev;
  470. struct list_head *iter;
  471. int err = -EOPNOTSUPP;
  472. ASSERT_RTNL();
  473. if (ops && ops->switchdev_port_obj_dump)
  474. return ops->switchdev_port_obj_dump(dev, obj, cb);
  475. /* Switch device port(s) may be stacked under
  476. * bond/team/vlan dev, so recurse down to dump objects on
  477. * first port at bottom of stack.
  478. */
  479. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  480. err = switchdev_port_obj_dump(lower_dev, obj, cb);
  481. break;
  482. }
  483. return err;
  484. }
  485. EXPORT_SYMBOL_GPL(switchdev_port_obj_dump);
  486. static DEFINE_MUTEX(switchdev_mutex);
  487. static RAW_NOTIFIER_HEAD(switchdev_notif_chain);
  488. /**
  489. * register_switchdev_notifier - Register notifier
  490. * @nb: notifier_block
  491. *
  492. * Register switch device notifier. This should be used by code
  493. * which needs to monitor events happening in particular device.
  494. * Return values are same as for atomic_notifier_chain_register().
  495. */
  496. int register_switchdev_notifier(struct notifier_block *nb)
  497. {
  498. int err;
  499. mutex_lock(&switchdev_mutex);
  500. err = raw_notifier_chain_register(&switchdev_notif_chain, nb);
  501. mutex_unlock(&switchdev_mutex);
  502. return err;
  503. }
  504. EXPORT_SYMBOL_GPL(register_switchdev_notifier);
  505. /**
  506. * unregister_switchdev_notifier - Unregister notifier
  507. * @nb: notifier_block
  508. *
  509. * Unregister switch device notifier.
  510. * Return values are same as for atomic_notifier_chain_unregister().
  511. */
  512. int unregister_switchdev_notifier(struct notifier_block *nb)
  513. {
  514. int err;
  515. mutex_lock(&switchdev_mutex);
  516. err = raw_notifier_chain_unregister(&switchdev_notif_chain, nb);
  517. mutex_unlock(&switchdev_mutex);
  518. return err;
  519. }
  520. EXPORT_SYMBOL_GPL(unregister_switchdev_notifier);
  521. /**
  522. * call_switchdev_notifiers - Call notifiers
  523. * @val: value passed unmodified to notifier function
  524. * @dev: port device
  525. * @info: notifier information data
  526. *
  527. * Call all network notifier blocks. This should be called by driver
  528. * when it needs to propagate hardware event.
  529. * Return values are same as for atomic_notifier_call_chain().
  530. */
  531. int call_switchdev_notifiers(unsigned long val, struct net_device *dev,
  532. struct switchdev_notifier_info *info)
  533. {
  534. int err;
  535. info->dev = dev;
  536. mutex_lock(&switchdev_mutex);
  537. err = raw_notifier_call_chain(&switchdev_notif_chain, val, info);
  538. mutex_unlock(&switchdev_mutex);
  539. return err;
  540. }
  541. EXPORT_SYMBOL_GPL(call_switchdev_notifiers);
  542. struct switchdev_vlan_dump {
  543. struct switchdev_obj_port_vlan vlan;
  544. struct sk_buff *skb;
  545. u32 filter_mask;
  546. u16 flags;
  547. u16 begin;
  548. u16 end;
  549. };
  550. static int switchdev_port_vlan_dump_put(struct switchdev_vlan_dump *dump)
  551. {
  552. struct bridge_vlan_info vinfo;
  553. vinfo.flags = dump->flags;
  554. if (dump->begin == 0 && dump->end == 0) {
  555. return 0;
  556. } else if (dump->begin == dump->end) {
  557. vinfo.vid = dump->begin;
  558. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  559. sizeof(vinfo), &vinfo))
  560. return -EMSGSIZE;
  561. } else {
  562. vinfo.vid = dump->begin;
  563. vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_BEGIN;
  564. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  565. sizeof(vinfo), &vinfo))
  566. return -EMSGSIZE;
  567. vinfo.vid = dump->end;
  568. vinfo.flags &= ~BRIDGE_VLAN_INFO_RANGE_BEGIN;
  569. vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_END;
  570. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  571. sizeof(vinfo), &vinfo))
  572. return -EMSGSIZE;
  573. }
  574. return 0;
  575. }
  576. static int switchdev_port_vlan_dump_cb(struct switchdev_obj *obj)
  577. {
  578. struct switchdev_obj_port_vlan *vlan = SWITCHDEV_OBJ_PORT_VLAN(obj);
  579. struct switchdev_vlan_dump *dump =
  580. container_of(vlan, struct switchdev_vlan_dump, vlan);
  581. int err = 0;
  582. if (vlan->vid_begin > vlan->vid_end)
  583. return -EINVAL;
  584. if (dump->filter_mask & RTEXT_FILTER_BRVLAN) {
  585. dump->flags = vlan->flags;
  586. for (dump->begin = dump->end = vlan->vid_begin;
  587. dump->begin <= vlan->vid_end;
  588. dump->begin++, dump->end++) {
  589. err = switchdev_port_vlan_dump_put(dump);
  590. if (err)
  591. return err;
  592. }
  593. } else if (dump->filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED) {
  594. if (dump->begin > vlan->vid_begin &&
  595. dump->begin >= vlan->vid_end) {
  596. if ((dump->begin - 1) == vlan->vid_end &&
  597. dump->flags == vlan->flags) {
  598. /* prepend */
  599. dump->begin = vlan->vid_begin;
  600. } else {
  601. err = switchdev_port_vlan_dump_put(dump);
  602. dump->flags = vlan->flags;
  603. dump->begin = vlan->vid_begin;
  604. dump->end = vlan->vid_end;
  605. }
  606. } else if (dump->end <= vlan->vid_begin &&
  607. dump->end < vlan->vid_end) {
  608. if ((dump->end + 1) == vlan->vid_begin &&
  609. dump->flags == vlan->flags) {
  610. /* append */
  611. dump->end = vlan->vid_end;
  612. } else {
  613. err = switchdev_port_vlan_dump_put(dump);
  614. dump->flags = vlan->flags;
  615. dump->begin = vlan->vid_begin;
  616. dump->end = vlan->vid_end;
  617. }
  618. } else {
  619. err = -EINVAL;
  620. }
  621. }
  622. return err;
  623. }
  624. static int switchdev_port_vlan_fill(struct sk_buff *skb, struct net_device *dev,
  625. u32 filter_mask)
  626. {
  627. struct switchdev_vlan_dump dump = {
  628. .vlan.obj.orig_dev = dev,
  629. .vlan.obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
  630. .skb = skb,
  631. .filter_mask = filter_mask,
  632. };
  633. int err = 0;
  634. if ((filter_mask & RTEXT_FILTER_BRVLAN) ||
  635. (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)) {
  636. err = switchdev_port_obj_dump(dev, &dump.vlan.obj,
  637. switchdev_port_vlan_dump_cb);
  638. if (err)
  639. goto err_out;
  640. if (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)
  641. /* last one */
  642. err = switchdev_port_vlan_dump_put(&dump);
  643. }
  644. err_out:
  645. return err == -EOPNOTSUPP ? 0 : err;
  646. }
  647. /**
  648. * switchdev_port_bridge_getlink - Get bridge port attributes
  649. *
  650. * @dev: port device
  651. *
  652. * Called for SELF on rtnl_bridge_getlink to get bridge port
  653. * attributes.
  654. */
  655. int switchdev_port_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
  656. struct net_device *dev, u32 filter_mask,
  657. int nlflags)
  658. {
  659. struct switchdev_attr attr = {
  660. .orig_dev = dev,
  661. .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
  662. };
  663. u16 mode = BRIDGE_MODE_UNDEF;
  664. u32 mask = BR_LEARNING | BR_LEARNING_SYNC | BR_FLOOD;
  665. int err;
  666. err = switchdev_port_attr_get(dev, &attr);
  667. if (err && err != -EOPNOTSUPP)
  668. return err;
  669. return ndo_dflt_bridge_getlink(skb, pid, seq, dev, mode,
  670. attr.u.brport_flags, mask, nlflags,
  671. filter_mask, switchdev_port_vlan_fill);
  672. }
  673. EXPORT_SYMBOL_GPL(switchdev_port_bridge_getlink);
  674. static int switchdev_port_br_setflag(struct net_device *dev,
  675. struct nlattr *nlattr,
  676. unsigned long brport_flag)
  677. {
  678. struct switchdev_attr attr = {
  679. .orig_dev = dev,
  680. .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
  681. };
  682. u8 flag = nla_get_u8(nlattr);
  683. int err;
  684. err = switchdev_port_attr_get(dev, &attr);
  685. if (err)
  686. return err;
  687. if (flag)
  688. attr.u.brport_flags |= brport_flag;
  689. else
  690. attr.u.brport_flags &= ~brport_flag;
  691. return switchdev_port_attr_set(dev, &attr);
  692. }
  693. static const struct nla_policy
  694. switchdev_port_bridge_policy[IFLA_BRPORT_MAX + 1] = {
  695. [IFLA_BRPORT_STATE] = { .type = NLA_U8 },
  696. [IFLA_BRPORT_COST] = { .type = NLA_U32 },
  697. [IFLA_BRPORT_PRIORITY] = { .type = NLA_U16 },
  698. [IFLA_BRPORT_MODE] = { .type = NLA_U8 },
  699. [IFLA_BRPORT_GUARD] = { .type = NLA_U8 },
  700. [IFLA_BRPORT_PROTECT] = { .type = NLA_U8 },
  701. [IFLA_BRPORT_FAST_LEAVE] = { .type = NLA_U8 },
  702. [IFLA_BRPORT_LEARNING] = { .type = NLA_U8 },
  703. [IFLA_BRPORT_LEARNING_SYNC] = { .type = NLA_U8 },
  704. [IFLA_BRPORT_UNICAST_FLOOD] = { .type = NLA_U8 },
  705. };
  706. static int switchdev_port_br_setlink_protinfo(struct net_device *dev,
  707. struct nlattr *protinfo)
  708. {
  709. struct nlattr *attr;
  710. int rem;
  711. int err;
  712. err = nla_validate_nested(protinfo, IFLA_BRPORT_MAX,
  713. switchdev_port_bridge_policy);
  714. if (err)
  715. return err;
  716. nla_for_each_nested(attr, protinfo, rem) {
  717. switch (nla_type(attr)) {
  718. case IFLA_BRPORT_LEARNING:
  719. err = switchdev_port_br_setflag(dev, attr,
  720. BR_LEARNING);
  721. break;
  722. case IFLA_BRPORT_LEARNING_SYNC:
  723. err = switchdev_port_br_setflag(dev, attr,
  724. BR_LEARNING_SYNC);
  725. break;
  726. case IFLA_BRPORT_UNICAST_FLOOD:
  727. err = switchdev_port_br_setflag(dev, attr, BR_FLOOD);
  728. break;
  729. default:
  730. err = -EOPNOTSUPP;
  731. break;
  732. }
  733. if (err)
  734. return err;
  735. }
  736. return 0;
  737. }
  738. static int switchdev_port_br_afspec(struct net_device *dev,
  739. struct nlattr *afspec,
  740. int (*f)(struct net_device *dev,
  741. const struct switchdev_obj *obj))
  742. {
  743. struct nlattr *attr;
  744. struct bridge_vlan_info *vinfo;
  745. struct switchdev_obj_port_vlan vlan = {
  746. .obj.orig_dev = dev,
  747. .obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
  748. };
  749. int rem;
  750. int err;
  751. nla_for_each_nested(attr, afspec, rem) {
  752. if (nla_type(attr) != IFLA_BRIDGE_VLAN_INFO)
  753. continue;
  754. if (nla_len(attr) != sizeof(struct bridge_vlan_info))
  755. return -EINVAL;
  756. vinfo = nla_data(attr);
  757. if (!vinfo->vid || vinfo->vid >= VLAN_VID_MASK)
  758. return -EINVAL;
  759. vlan.flags = vinfo->flags;
  760. if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_BEGIN) {
  761. if (vlan.vid_begin)
  762. return -EINVAL;
  763. vlan.vid_begin = vinfo->vid;
  764. /* don't allow range of pvids */
  765. if (vlan.flags & BRIDGE_VLAN_INFO_PVID)
  766. return -EINVAL;
  767. } else if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_END) {
  768. if (!vlan.vid_begin)
  769. return -EINVAL;
  770. vlan.vid_end = vinfo->vid;
  771. if (vlan.vid_end <= vlan.vid_begin)
  772. return -EINVAL;
  773. err = f(dev, &vlan.obj);
  774. if (err)
  775. return err;
  776. vlan.vid_begin = 0;
  777. } else {
  778. if (vlan.vid_begin)
  779. return -EINVAL;
  780. vlan.vid_begin = vinfo->vid;
  781. vlan.vid_end = vinfo->vid;
  782. err = f(dev, &vlan.obj);
  783. if (err)
  784. return err;
  785. vlan.vid_begin = 0;
  786. }
  787. }
  788. return 0;
  789. }
  790. /**
  791. * switchdev_port_bridge_setlink - Set bridge port attributes
  792. *
  793. * @dev: port device
  794. * @nlh: netlink header
  795. * @flags: netlink flags
  796. *
  797. * Called for SELF on rtnl_bridge_setlink to set bridge port
  798. * attributes.
  799. */
  800. int switchdev_port_bridge_setlink(struct net_device *dev,
  801. struct nlmsghdr *nlh, u16 flags)
  802. {
  803. struct nlattr *protinfo;
  804. struct nlattr *afspec;
  805. int err = 0;
  806. protinfo = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  807. IFLA_PROTINFO);
  808. if (protinfo) {
  809. err = switchdev_port_br_setlink_protinfo(dev, protinfo);
  810. if (err)
  811. return err;
  812. }
  813. afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  814. IFLA_AF_SPEC);
  815. if (afspec)
  816. err = switchdev_port_br_afspec(dev, afspec,
  817. switchdev_port_obj_add);
  818. return err;
  819. }
  820. EXPORT_SYMBOL_GPL(switchdev_port_bridge_setlink);
  821. /**
  822. * switchdev_port_bridge_dellink - Set bridge port attributes
  823. *
  824. * @dev: port device
  825. * @nlh: netlink header
  826. * @flags: netlink flags
  827. *
  828. * Called for SELF on rtnl_bridge_dellink to set bridge port
  829. * attributes.
  830. */
  831. int switchdev_port_bridge_dellink(struct net_device *dev,
  832. struct nlmsghdr *nlh, u16 flags)
  833. {
  834. struct nlattr *afspec;
  835. afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  836. IFLA_AF_SPEC);
  837. if (afspec)
  838. return switchdev_port_br_afspec(dev, afspec,
  839. switchdev_port_obj_del);
  840. return 0;
  841. }
  842. EXPORT_SYMBOL_GPL(switchdev_port_bridge_dellink);
  843. /**
  844. * switchdev_port_fdb_add - Add FDB (MAC/VLAN) entry to port
  845. *
  846. * @ndmsg: netlink hdr
  847. * @nlattr: netlink attributes
  848. * @dev: port device
  849. * @addr: MAC address to add
  850. * @vid: VLAN to add
  851. *
  852. * Add FDB entry to switch device.
  853. */
  854. int switchdev_port_fdb_add(struct ndmsg *ndm, struct nlattr *tb[],
  855. struct net_device *dev, const unsigned char *addr,
  856. u16 vid, u16 nlm_flags)
  857. {
  858. struct switchdev_obj_port_fdb fdb = {
  859. .obj.orig_dev = dev,
  860. .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  861. .vid = vid,
  862. };
  863. ether_addr_copy(fdb.addr, addr);
  864. return switchdev_port_obj_add(dev, &fdb.obj);
  865. }
  866. EXPORT_SYMBOL_GPL(switchdev_port_fdb_add);
  867. /**
  868. * switchdev_port_fdb_del - Delete FDB (MAC/VLAN) entry from port
  869. *
  870. * @ndmsg: netlink hdr
  871. * @nlattr: netlink attributes
  872. * @dev: port device
  873. * @addr: MAC address to delete
  874. * @vid: VLAN to delete
  875. *
  876. * Delete FDB entry from switch device.
  877. */
  878. int switchdev_port_fdb_del(struct ndmsg *ndm, struct nlattr *tb[],
  879. struct net_device *dev, const unsigned char *addr,
  880. u16 vid)
  881. {
  882. struct switchdev_obj_port_fdb fdb = {
  883. .obj.orig_dev = dev,
  884. .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  885. .vid = vid,
  886. };
  887. ether_addr_copy(fdb.addr, addr);
  888. return switchdev_port_obj_del(dev, &fdb.obj);
  889. }
  890. EXPORT_SYMBOL_GPL(switchdev_port_fdb_del);
  891. struct switchdev_fdb_dump {
  892. struct switchdev_obj_port_fdb fdb;
  893. struct net_device *dev;
  894. struct sk_buff *skb;
  895. struct netlink_callback *cb;
  896. int idx;
  897. };
  898. static int switchdev_port_fdb_dump_cb(struct switchdev_obj *obj)
  899. {
  900. struct switchdev_obj_port_fdb *fdb = SWITCHDEV_OBJ_PORT_FDB(obj);
  901. struct switchdev_fdb_dump *dump =
  902. container_of(fdb, struct switchdev_fdb_dump, fdb);
  903. u32 portid = NETLINK_CB(dump->cb->skb).portid;
  904. u32 seq = dump->cb->nlh->nlmsg_seq;
  905. struct nlmsghdr *nlh;
  906. struct ndmsg *ndm;
  907. if (dump->idx < dump->cb->args[0])
  908. goto skip;
  909. nlh = nlmsg_put(dump->skb, portid, seq, RTM_NEWNEIGH,
  910. sizeof(*ndm), NLM_F_MULTI);
  911. if (!nlh)
  912. return -EMSGSIZE;
  913. ndm = nlmsg_data(nlh);
  914. ndm->ndm_family = AF_BRIDGE;
  915. ndm->ndm_pad1 = 0;
  916. ndm->ndm_pad2 = 0;
  917. ndm->ndm_flags = NTF_SELF;
  918. ndm->ndm_type = 0;
  919. ndm->ndm_ifindex = dump->dev->ifindex;
  920. ndm->ndm_state = fdb->ndm_state;
  921. if (nla_put(dump->skb, NDA_LLADDR, ETH_ALEN, fdb->addr))
  922. goto nla_put_failure;
  923. if (fdb->vid && nla_put_u16(dump->skb, NDA_VLAN, fdb->vid))
  924. goto nla_put_failure;
  925. nlmsg_end(dump->skb, nlh);
  926. skip:
  927. dump->idx++;
  928. return 0;
  929. nla_put_failure:
  930. nlmsg_cancel(dump->skb, nlh);
  931. return -EMSGSIZE;
  932. }
  933. /**
  934. * switchdev_port_fdb_dump - Dump port FDB (MAC/VLAN) entries
  935. *
  936. * @skb: netlink skb
  937. * @cb: netlink callback
  938. * @dev: port device
  939. * @filter_dev: filter device
  940. * @idx:
  941. *
  942. * Delete FDB entry from switch device.
  943. */
  944. int switchdev_port_fdb_dump(struct sk_buff *skb, struct netlink_callback *cb,
  945. struct net_device *dev,
  946. struct net_device *filter_dev, int idx)
  947. {
  948. struct switchdev_fdb_dump dump = {
  949. .fdb.obj.orig_dev = dev,
  950. .fdb.obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  951. .dev = dev,
  952. .skb = skb,
  953. .cb = cb,
  954. .idx = idx,
  955. };
  956. switchdev_port_obj_dump(dev, &dump.fdb.obj, switchdev_port_fdb_dump_cb);
  957. return dump.idx;
  958. }
  959. EXPORT_SYMBOL_GPL(switchdev_port_fdb_dump);
  960. static struct net_device *switchdev_get_lowest_dev(struct net_device *dev)
  961. {
  962. const struct switchdev_ops *ops = dev->switchdev_ops;
  963. struct net_device *lower_dev;
  964. struct net_device *port_dev;
  965. struct list_head *iter;
  966. /* Recusively search down until we find a sw port dev.
  967. * (A sw port dev supports switchdev_port_attr_get).
  968. */
  969. if (ops && ops->switchdev_port_attr_get)
  970. return dev;
  971. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  972. port_dev = switchdev_get_lowest_dev(lower_dev);
  973. if (port_dev)
  974. return port_dev;
  975. }
  976. return NULL;
  977. }
  978. static struct net_device *switchdev_get_dev_by_nhs(struct fib_info *fi)
  979. {
  980. struct switchdev_attr attr = {
  981. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  982. };
  983. struct switchdev_attr prev_attr;
  984. struct net_device *dev = NULL;
  985. int nhsel;
  986. ASSERT_RTNL();
  987. /* For this route, all nexthop devs must be on the same switch. */
  988. for (nhsel = 0; nhsel < fi->fib_nhs; nhsel++) {
  989. const struct fib_nh *nh = &fi->fib_nh[nhsel];
  990. if (!nh->nh_dev)
  991. return NULL;
  992. dev = switchdev_get_lowest_dev(nh->nh_dev);
  993. if (!dev)
  994. return NULL;
  995. attr.orig_dev = dev;
  996. if (switchdev_port_attr_get(dev, &attr))
  997. return NULL;
  998. if (nhsel > 0 &&
  999. !netdev_phys_item_id_same(&prev_attr.u.ppid, &attr.u.ppid))
  1000. return NULL;
  1001. prev_attr = attr;
  1002. }
  1003. return dev;
  1004. }
  1005. /**
  1006. * switchdev_fib_ipv4_add - Add/modify switch IPv4 route entry
  1007. *
  1008. * @dst: route's IPv4 destination address
  1009. * @dst_len: destination address length (prefix length)
  1010. * @fi: route FIB info structure
  1011. * @tos: route TOS
  1012. * @type: route type
  1013. * @nlflags: netlink flags passed in (NLM_F_*)
  1014. * @tb_id: route table ID
  1015. *
  1016. * Add/modify switch IPv4 route entry.
  1017. */
  1018. int switchdev_fib_ipv4_add(u32 dst, int dst_len, struct fib_info *fi,
  1019. u8 tos, u8 type, u32 nlflags, u32 tb_id)
  1020. {
  1021. struct switchdev_obj_ipv4_fib ipv4_fib = {
  1022. .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
  1023. .dst = dst,
  1024. .dst_len = dst_len,
  1025. .tos = tos,
  1026. .type = type,
  1027. .nlflags = nlflags,
  1028. .tb_id = tb_id,
  1029. };
  1030. struct net_device *dev;
  1031. int err = 0;
  1032. memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
  1033. /* Don't offload route if using custom ip rules or if
  1034. * IPv4 FIB offloading has been disabled completely.
  1035. */
  1036. #ifdef CONFIG_IP_MULTIPLE_TABLES
  1037. if (fi->fib_net->ipv4.fib_has_custom_rules)
  1038. return 0;
  1039. #endif
  1040. if (fi->fib_net->ipv4.fib_offload_disabled)
  1041. return 0;
  1042. dev = switchdev_get_dev_by_nhs(fi);
  1043. if (!dev)
  1044. return 0;
  1045. ipv4_fib.obj.orig_dev = dev;
  1046. err = switchdev_port_obj_add(dev, &ipv4_fib.obj);
  1047. if (!err)
  1048. fi->fib_flags |= RTNH_F_OFFLOAD;
  1049. return err == -EOPNOTSUPP ? 0 : err;
  1050. }
  1051. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_add);
  1052. /**
  1053. * switchdev_fib_ipv4_del - Delete IPv4 route entry from switch
  1054. *
  1055. * @dst: route's IPv4 destination address
  1056. * @dst_len: destination address length (prefix length)
  1057. * @fi: route FIB info structure
  1058. * @tos: route TOS
  1059. * @type: route type
  1060. * @tb_id: route table ID
  1061. *
  1062. * Delete IPv4 route entry from switch device.
  1063. */
  1064. int switchdev_fib_ipv4_del(u32 dst, int dst_len, struct fib_info *fi,
  1065. u8 tos, u8 type, u32 tb_id)
  1066. {
  1067. struct switchdev_obj_ipv4_fib ipv4_fib = {
  1068. .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
  1069. .dst = dst,
  1070. .dst_len = dst_len,
  1071. .tos = tos,
  1072. .type = type,
  1073. .nlflags = 0,
  1074. .tb_id = tb_id,
  1075. };
  1076. struct net_device *dev;
  1077. int err = 0;
  1078. memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
  1079. if (!(fi->fib_flags & RTNH_F_OFFLOAD))
  1080. return 0;
  1081. dev = switchdev_get_dev_by_nhs(fi);
  1082. if (!dev)
  1083. return 0;
  1084. ipv4_fib.obj.orig_dev = dev;
  1085. err = switchdev_port_obj_del(dev, &ipv4_fib.obj);
  1086. if (!err)
  1087. fi->fib_flags &= ~RTNH_F_OFFLOAD;
  1088. return err == -EOPNOTSUPP ? 0 : err;
  1089. }
  1090. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_del);
  1091. /**
  1092. * switchdev_fib_ipv4_abort - Abort an IPv4 FIB operation
  1093. *
  1094. * @fi: route FIB info structure
  1095. */
  1096. void switchdev_fib_ipv4_abort(struct fib_info *fi)
  1097. {
  1098. /* There was a problem installing this route to the offload
  1099. * device. For now, until we come up with more refined
  1100. * policy handling, abruptly end IPv4 fib offloading for
  1101. * for entire net by flushing offload device(s) of all
  1102. * IPv4 routes, and mark IPv4 fib offloading broken from
  1103. * this point forward.
  1104. */
  1105. fib_flush_external(fi->fib_net);
  1106. fi->fib_net->ipv4.fib_offload_disabled = true;
  1107. }
  1108. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_abort);
  1109. static bool switchdev_port_same_parent_id(struct net_device *a,
  1110. struct net_device *b)
  1111. {
  1112. struct switchdev_attr a_attr = {
  1113. .orig_dev = a,
  1114. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  1115. .flags = SWITCHDEV_F_NO_RECURSE,
  1116. };
  1117. struct switchdev_attr b_attr = {
  1118. .orig_dev = b,
  1119. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  1120. .flags = SWITCHDEV_F_NO_RECURSE,
  1121. };
  1122. if (switchdev_port_attr_get(a, &a_attr) ||
  1123. switchdev_port_attr_get(b, &b_attr))
  1124. return false;
  1125. return netdev_phys_item_id_same(&a_attr.u.ppid, &b_attr.u.ppid);
  1126. }
  1127. static u32 switchdev_port_fwd_mark_get(struct net_device *dev,
  1128. struct net_device *group_dev)
  1129. {
  1130. struct net_device *lower_dev;
  1131. struct list_head *iter;
  1132. netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
  1133. if (lower_dev == dev)
  1134. continue;
  1135. if (switchdev_port_same_parent_id(dev, lower_dev))
  1136. return lower_dev->offload_fwd_mark;
  1137. return switchdev_port_fwd_mark_get(dev, lower_dev);
  1138. }
  1139. return dev->ifindex;
  1140. }
  1141. static void switchdev_port_fwd_mark_reset(struct net_device *group_dev,
  1142. u32 old_mark, u32 *reset_mark)
  1143. {
  1144. struct net_device *lower_dev;
  1145. struct list_head *iter;
  1146. netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
  1147. if (lower_dev->offload_fwd_mark == old_mark) {
  1148. if (!*reset_mark)
  1149. *reset_mark = lower_dev->ifindex;
  1150. lower_dev->offload_fwd_mark = *reset_mark;
  1151. }
  1152. switchdev_port_fwd_mark_reset(lower_dev, old_mark, reset_mark);
  1153. }
  1154. }
  1155. /**
  1156. * switchdev_port_fwd_mark_set - Set port offload forwarding mark
  1157. *
  1158. * @dev: port device
  1159. * @group_dev: containing device
  1160. * @joining: true if dev is joining group; false if leaving group
  1161. *
  1162. * An ungrouped port's offload mark is just its ifindex. A grouped
  1163. * port's (member of a bridge, for example) offload mark is the ifindex
  1164. * of one of the ports in the group with the same parent (switch) ID.
  1165. * Ports on the same device in the same group will have the same mark.
  1166. *
  1167. * Example:
  1168. *
  1169. * br0 ifindex=9
  1170. * sw1p1 ifindex=2 mark=2
  1171. * sw1p2 ifindex=3 mark=2
  1172. * sw2p1 ifindex=4 mark=5
  1173. * sw2p2 ifindex=5 mark=5
  1174. *
  1175. * If sw2p2 leaves the bridge, we'll have:
  1176. *
  1177. * br0 ifindex=9
  1178. * sw1p1 ifindex=2 mark=2
  1179. * sw1p2 ifindex=3 mark=2
  1180. * sw2p1 ifindex=4 mark=4
  1181. * sw2p2 ifindex=5 mark=5
  1182. */
  1183. void switchdev_port_fwd_mark_set(struct net_device *dev,
  1184. struct net_device *group_dev,
  1185. bool joining)
  1186. {
  1187. u32 mark = dev->ifindex;
  1188. u32 reset_mark = 0;
  1189. if (group_dev) {
  1190. ASSERT_RTNL();
  1191. if (joining)
  1192. mark = switchdev_port_fwd_mark_get(dev, group_dev);
  1193. else if (dev->offload_fwd_mark == mark)
  1194. /* Ohoh, this port was the mark reference port,
  1195. * but it's leaving the group, so reset the
  1196. * mark for the remaining ports in the group.
  1197. */
  1198. switchdev_port_fwd_mark_reset(group_dev, mark,
  1199. &reset_mark);
  1200. }
  1201. dev->offload_fwd_mark = mark;
  1202. }
  1203. EXPORT_SYMBOL_GPL(switchdev_port_fwd_mark_set);