switchdev.c 34 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372
  1. /*
  2. * net/switchdev/switchdev.c - Switch device API
  3. * Copyright (c) 2014-2015 Jiri Pirko <jiri@resnulli.us>
  4. * Copyright (c) 2014-2015 Scott Feldman <sfeldma@gmail.com>
  5. *
  6. * This program is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU General Public License as published by
  8. * the Free Software Foundation; either version 2 of the License, or
  9. * (at your option) any later version.
  10. */
  11. #include <linux/kernel.h>
  12. #include <linux/types.h>
  13. #include <linux/init.h>
  14. #include <linux/mutex.h>
  15. #include <linux/notifier.h>
  16. #include <linux/netdevice.h>
  17. #include <linux/etherdevice.h>
  18. #include <linux/if_bridge.h>
  19. #include <linux/list.h>
  20. #include <linux/workqueue.h>
  21. #include <linux/if_vlan.h>
  22. #include <net/ip_fib.h>
  23. #include <net/switchdev.h>
  24. /**
  25. * switchdev_trans_item_enqueue - Enqueue data item to transaction queue
  26. *
  27. * @trans: transaction
  28. * @data: pointer to data being queued
  29. * @destructor: data destructor
  30. * @tritem: transaction item being queued
  31. *
  32. * Enqeueue data item to transaction queue. tritem is typically placed in
  33. * cointainter pointed at by data pointer. Destructor is called on
  34. * transaction abort and after successful commit phase in case
  35. * the caller did not dequeue the item before.
  36. */
  37. void switchdev_trans_item_enqueue(struct switchdev_trans *trans,
  38. void *data, void (*destructor)(void const *),
  39. struct switchdev_trans_item *tritem)
  40. {
  41. tritem->data = data;
  42. tritem->destructor = destructor;
  43. list_add_tail(&tritem->list, &trans->item_list);
  44. }
  45. EXPORT_SYMBOL_GPL(switchdev_trans_item_enqueue);
  46. static struct switchdev_trans_item *
  47. __switchdev_trans_item_dequeue(struct switchdev_trans *trans)
  48. {
  49. struct switchdev_trans_item *tritem;
  50. if (list_empty(&trans->item_list))
  51. return NULL;
  52. tritem = list_first_entry(&trans->item_list,
  53. struct switchdev_trans_item, list);
  54. list_del(&tritem->list);
  55. return tritem;
  56. }
  57. /**
  58. * switchdev_trans_item_dequeue - Dequeue data item from transaction queue
  59. *
  60. * @trans: transaction
  61. */
  62. void *switchdev_trans_item_dequeue(struct switchdev_trans *trans)
  63. {
  64. struct switchdev_trans_item *tritem;
  65. tritem = __switchdev_trans_item_dequeue(trans);
  66. BUG_ON(!tritem);
  67. return tritem->data;
  68. }
  69. EXPORT_SYMBOL_GPL(switchdev_trans_item_dequeue);
  70. static void switchdev_trans_init(struct switchdev_trans *trans)
  71. {
  72. INIT_LIST_HEAD(&trans->item_list);
  73. }
  74. static void switchdev_trans_items_destroy(struct switchdev_trans *trans)
  75. {
  76. struct switchdev_trans_item *tritem;
  77. while ((tritem = __switchdev_trans_item_dequeue(trans)))
  78. tritem->destructor(tritem->data);
  79. }
  80. static void switchdev_trans_items_warn_destroy(struct net_device *dev,
  81. struct switchdev_trans *trans)
  82. {
  83. WARN(!list_empty(&trans->item_list), "%s: transaction item queue is not empty.\n",
  84. dev->name);
  85. switchdev_trans_items_destroy(trans);
  86. }
  87. static LIST_HEAD(deferred);
  88. static DEFINE_SPINLOCK(deferred_lock);
  89. typedef void switchdev_deferred_func_t(struct net_device *dev,
  90. const void *data);
  91. struct switchdev_deferred_item {
  92. struct list_head list;
  93. struct net_device *dev;
  94. switchdev_deferred_func_t *func;
  95. unsigned long data[0];
  96. };
  97. static struct switchdev_deferred_item *switchdev_deferred_dequeue(void)
  98. {
  99. struct switchdev_deferred_item *dfitem;
  100. spin_lock_bh(&deferred_lock);
  101. if (list_empty(&deferred)) {
  102. dfitem = NULL;
  103. goto unlock;
  104. }
  105. dfitem = list_first_entry(&deferred,
  106. struct switchdev_deferred_item, list);
  107. list_del(&dfitem->list);
  108. unlock:
  109. spin_unlock_bh(&deferred_lock);
  110. return dfitem;
  111. }
  112. /**
  113. * switchdev_deferred_process - Process ops in deferred queue
  114. *
  115. * Called to flush the ops currently queued in deferred ops queue.
  116. * rtnl_lock must be held.
  117. */
  118. void switchdev_deferred_process(void)
  119. {
  120. struct switchdev_deferred_item *dfitem;
  121. ASSERT_RTNL();
  122. while ((dfitem = switchdev_deferred_dequeue())) {
  123. dfitem->func(dfitem->dev, dfitem->data);
  124. dev_put(dfitem->dev);
  125. kfree(dfitem);
  126. }
  127. }
  128. EXPORT_SYMBOL_GPL(switchdev_deferred_process);
  129. static void switchdev_deferred_process_work(struct work_struct *work)
  130. {
  131. rtnl_lock();
  132. switchdev_deferred_process();
  133. rtnl_unlock();
  134. }
  135. static DECLARE_WORK(deferred_process_work, switchdev_deferred_process_work);
  136. static int switchdev_deferred_enqueue(struct net_device *dev,
  137. const void *data, size_t data_len,
  138. switchdev_deferred_func_t *func)
  139. {
  140. struct switchdev_deferred_item *dfitem;
  141. dfitem = kmalloc(sizeof(*dfitem) + data_len, GFP_ATOMIC);
  142. if (!dfitem)
  143. return -ENOMEM;
  144. dfitem->dev = dev;
  145. dfitem->func = func;
  146. memcpy(dfitem->data, data, data_len);
  147. dev_hold(dev);
  148. spin_lock_bh(&deferred_lock);
  149. list_add_tail(&dfitem->list, &deferred);
  150. spin_unlock_bh(&deferred_lock);
  151. schedule_work(&deferred_process_work);
  152. return 0;
  153. }
  154. /**
  155. * switchdev_port_attr_get - Get port attribute
  156. *
  157. * @dev: port device
  158. * @attr: attribute to get
  159. */
  160. int switchdev_port_attr_get(struct net_device *dev, struct switchdev_attr *attr)
  161. {
  162. const struct switchdev_ops *ops = dev->switchdev_ops;
  163. struct net_device *lower_dev;
  164. struct list_head *iter;
  165. struct switchdev_attr first = {
  166. .id = SWITCHDEV_ATTR_ID_UNDEFINED
  167. };
  168. int err = -EOPNOTSUPP;
  169. if (ops && ops->switchdev_port_attr_get)
  170. return ops->switchdev_port_attr_get(dev, attr);
  171. if (attr->flags & SWITCHDEV_F_NO_RECURSE)
  172. return err;
  173. /* Switch device port(s) may be stacked under
  174. * bond/team/vlan dev, so recurse down to get attr on
  175. * each port. Return -ENODATA if attr values don't
  176. * compare across ports.
  177. */
  178. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  179. err = switchdev_port_attr_get(lower_dev, attr);
  180. if (err)
  181. break;
  182. if (first.id == SWITCHDEV_ATTR_ID_UNDEFINED)
  183. first = *attr;
  184. else if (memcmp(&first, attr, sizeof(*attr)))
  185. return -ENODATA;
  186. }
  187. return err;
  188. }
  189. EXPORT_SYMBOL_GPL(switchdev_port_attr_get);
  190. static int __switchdev_port_attr_set(struct net_device *dev,
  191. const struct switchdev_attr *attr,
  192. struct switchdev_trans *trans)
  193. {
  194. const struct switchdev_ops *ops = dev->switchdev_ops;
  195. struct net_device *lower_dev;
  196. struct list_head *iter;
  197. int err = -EOPNOTSUPP;
  198. if (ops && ops->switchdev_port_attr_set)
  199. return ops->switchdev_port_attr_set(dev, attr, trans);
  200. if (attr->flags & SWITCHDEV_F_NO_RECURSE)
  201. goto done;
  202. /* Switch device port(s) may be stacked under
  203. * bond/team/vlan dev, so recurse down to set attr on
  204. * each port.
  205. */
  206. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  207. err = __switchdev_port_attr_set(lower_dev, attr, trans);
  208. if (err == -EOPNOTSUPP &&
  209. attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
  210. continue;
  211. if (err)
  212. break;
  213. }
  214. done:
  215. if (err == -EOPNOTSUPP && attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
  216. err = 0;
  217. return err;
  218. }
  219. static int switchdev_port_attr_set_now(struct net_device *dev,
  220. const struct switchdev_attr *attr)
  221. {
  222. struct switchdev_trans trans;
  223. int err;
  224. switchdev_trans_init(&trans);
  225. /* Phase I: prepare for attr set. Driver/device should fail
  226. * here if there are going to be issues in the commit phase,
  227. * such as lack of resources or support. The driver/device
  228. * should reserve resources needed for the commit phase here,
  229. * but should not commit the attr.
  230. */
  231. trans.ph_prepare = true;
  232. err = __switchdev_port_attr_set(dev, attr, &trans);
  233. if (err) {
  234. /* Prepare phase failed: abort the transaction. Any
  235. * resources reserved in the prepare phase are
  236. * released.
  237. */
  238. if (err != -EOPNOTSUPP)
  239. switchdev_trans_items_destroy(&trans);
  240. return err;
  241. }
  242. /* Phase II: commit attr set. This cannot fail as a fault
  243. * of driver/device. If it does, it's a bug in the driver/device
  244. * because the driver said everythings was OK in phase I.
  245. */
  246. trans.ph_prepare = false;
  247. err = __switchdev_port_attr_set(dev, attr, &trans);
  248. WARN(err, "%s: Commit of attribute (id=%d) failed.\n",
  249. dev->name, attr->id);
  250. switchdev_trans_items_warn_destroy(dev, &trans);
  251. return err;
  252. }
  253. static void switchdev_port_attr_set_deferred(struct net_device *dev,
  254. const void *data)
  255. {
  256. const struct switchdev_attr *attr = data;
  257. int err;
  258. err = switchdev_port_attr_set_now(dev, attr);
  259. if (err && err != -EOPNOTSUPP)
  260. netdev_err(dev, "failed (err=%d) to set attribute (id=%d)\n",
  261. err, attr->id);
  262. }
  263. static int switchdev_port_attr_set_defer(struct net_device *dev,
  264. const struct switchdev_attr *attr)
  265. {
  266. return switchdev_deferred_enqueue(dev, attr, sizeof(*attr),
  267. switchdev_port_attr_set_deferred);
  268. }
  269. /**
  270. * switchdev_port_attr_set - Set port attribute
  271. *
  272. * @dev: port device
  273. * @attr: attribute to set
  274. *
  275. * Use a 2-phase prepare-commit transaction model to ensure
  276. * system is not left in a partially updated state due to
  277. * failure from driver/device.
  278. *
  279. * rtnl_lock must be held and must not be in atomic section,
  280. * in case SWITCHDEV_F_DEFER flag is not set.
  281. */
  282. int switchdev_port_attr_set(struct net_device *dev,
  283. const struct switchdev_attr *attr)
  284. {
  285. if (attr->flags & SWITCHDEV_F_DEFER)
  286. return switchdev_port_attr_set_defer(dev, attr);
  287. ASSERT_RTNL();
  288. return switchdev_port_attr_set_now(dev, attr);
  289. }
  290. EXPORT_SYMBOL_GPL(switchdev_port_attr_set);
  291. static size_t switchdev_obj_size(const struct switchdev_obj *obj)
  292. {
  293. switch (obj->id) {
  294. case SWITCHDEV_OBJ_ID_PORT_VLAN:
  295. return sizeof(struct switchdev_obj_port_vlan);
  296. case SWITCHDEV_OBJ_ID_IPV4_FIB:
  297. return sizeof(struct switchdev_obj_ipv4_fib);
  298. case SWITCHDEV_OBJ_ID_PORT_FDB:
  299. return sizeof(struct switchdev_obj_port_fdb);
  300. default:
  301. BUG();
  302. }
  303. return 0;
  304. }
  305. static int __switchdev_port_obj_add(struct net_device *dev,
  306. const struct switchdev_obj *obj,
  307. struct switchdev_trans *trans)
  308. {
  309. const struct switchdev_ops *ops = dev->switchdev_ops;
  310. struct net_device *lower_dev;
  311. struct list_head *iter;
  312. int err = -EOPNOTSUPP;
  313. if (ops && ops->switchdev_port_obj_add)
  314. return ops->switchdev_port_obj_add(dev, obj, trans);
  315. /* Switch device port(s) may be stacked under
  316. * bond/team/vlan dev, so recurse down to add object on
  317. * each port.
  318. */
  319. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  320. err = __switchdev_port_obj_add(lower_dev, obj, trans);
  321. if (err)
  322. break;
  323. }
  324. return err;
  325. }
  326. static int switchdev_port_obj_add_now(struct net_device *dev,
  327. const struct switchdev_obj *obj)
  328. {
  329. struct switchdev_trans trans;
  330. int err;
  331. ASSERT_RTNL();
  332. switchdev_trans_init(&trans);
  333. /* Phase I: prepare for obj add. Driver/device should fail
  334. * here if there are going to be issues in the commit phase,
  335. * such as lack of resources or support. The driver/device
  336. * should reserve resources needed for the commit phase here,
  337. * but should not commit the obj.
  338. */
  339. trans.ph_prepare = true;
  340. err = __switchdev_port_obj_add(dev, obj, &trans);
  341. if (err) {
  342. /* Prepare phase failed: abort the transaction. Any
  343. * resources reserved in the prepare phase are
  344. * released.
  345. */
  346. if (err != -EOPNOTSUPP)
  347. switchdev_trans_items_destroy(&trans);
  348. return err;
  349. }
  350. /* Phase II: commit obj add. This cannot fail as a fault
  351. * of driver/device. If it does, it's a bug in the driver/device
  352. * because the driver said everythings was OK in phase I.
  353. */
  354. trans.ph_prepare = false;
  355. err = __switchdev_port_obj_add(dev, obj, &trans);
  356. WARN(err, "%s: Commit of object (id=%d) failed.\n", dev->name, obj->id);
  357. switchdev_trans_items_warn_destroy(dev, &trans);
  358. return err;
  359. }
  360. static void switchdev_port_obj_add_deferred(struct net_device *dev,
  361. const void *data)
  362. {
  363. const struct switchdev_obj *obj = data;
  364. int err;
  365. err = switchdev_port_obj_add_now(dev, obj);
  366. if (err && err != -EOPNOTSUPP)
  367. netdev_err(dev, "failed (err=%d) to add object (id=%d)\n",
  368. err, obj->id);
  369. }
  370. static int switchdev_port_obj_add_defer(struct net_device *dev,
  371. const struct switchdev_obj *obj)
  372. {
  373. return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
  374. switchdev_port_obj_add_deferred);
  375. }
  376. /**
  377. * switchdev_port_obj_add - Add port object
  378. *
  379. * @dev: port device
  380. * @id: object ID
  381. * @obj: object to add
  382. *
  383. * Use a 2-phase prepare-commit transaction model to ensure
  384. * system is not left in a partially updated state due to
  385. * failure from driver/device.
  386. *
  387. * rtnl_lock must be held and must not be in atomic section,
  388. * in case SWITCHDEV_F_DEFER flag is not set.
  389. */
  390. int switchdev_port_obj_add(struct net_device *dev,
  391. const struct switchdev_obj *obj)
  392. {
  393. if (obj->flags & SWITCHDEV_F_DEFER)
  394. return switchdev_port_obj_add_defer(dev, obj);
  395. ASSERT_RTNL();
  396. return switchdev_port_obj_add_now(dev, obj);
  397. }
  398. EXPORT_SYMBOL_GPL(switchdev_port_obj_add);
  399. static int switchdev_port_obj_del_now(struct net_device *dev,
  400. const struct switchdev_obj *obj)
  401. {
  402. const struct switchdev_ops *ops = dev->switchdev_ops;
  403. struct net_device *lower_dev;
  404. struct list_head *iter;
  405. int err = -EOPNOTSUPP;
  406. if (ops && ops->switchdev_port_obj_del)
  407. return ops->switchdev_port_obj_del(dev, obj);
  408. /* Switch device port(s) may be stacked under
  409. * bond/team/vlan dev, so recurse down to delete object on
  410. * each port.
  411. */
  412. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  413. err = switchdev_port_obj_del_now(lower_dev, obj);
  414. if (err)
  415. break;
  416. }
  417. return err;
  418. }
  419. static void switchdev_port_obj_del_deferred(struct net_device *dev,
  420. const void *data)
  421. {
  422. const struct switchdev_obj *obj = data;
  423. int err;
  424. err = switchdev_port_obj_del_now(dev, obj);
  425. if (err && err != -EOPNOTSUPP)
  426. netdev_err(dev, "failed (err=%d) to del object (id=%d)\n",
  427. err, obj->id);
  428. }
  429. static int switchdev_port_obj_del_defer(struct net_device *dev,
  430. const struct switchdev_obj *obj)
  431. {
  432. return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
  433. switchdev_port_obj_del_deferred);
  434. }
  435. /**
  436. * switchdev_port_obj_del - Delete port object
  437. *
  438. * @dev: port device
  439. * @id: object ID
  440. * @obj: object to delete
  441. *
  442. * rtnl_lock must be held and must not be in atomic section,
  443. * in case SWITCHDEV_F_DEFER flag is not set.
  444. */
  445. int switchdev_port_obj_del(struct net_device *dev,
  446. const struct switchdev_obj *obj)
  447. {
  448. if (obj->flags & SWITCHDEV_F_DEFER)
  449. return switchdev_port_obj_del_defer(dev, obj);
  450. ASSERT_RTNL();
  451. return switchdev_port_obj_del_now(dev, obj);
  452. }
  453. EXPORT_SYMBOL_GPL(switchdev_port_obj_del);
  454. /**
  455. * switchdev_port_obj_dump - Dump port objects
  456. *
  457. * @dev: port device
  458. * @id: object ID
  459. * @obj: object to dump
  460. * @cb: function to call with a filled object
  461. *
  462. * rtnl_lock must be held.
  463. */
  464. int switchdev_port_obj_dump(struct net_device *dev, struct switchdev_obj *obj,
  465. switchdev_obj_dump_cb_t *cb)
  466. {
  467. const struct switchdev_ops *ops = dev->switchdev_ops;
  468. struct net_device *lower_dev;
  469. struct list_head *iter;
  470. int err = -EOPNOTSUPP;
  471. ASSERT_RTNL();
  472. if (ops && ops->switchdev_port_obj_dump)
  473. return ops->switchdev_port_obj_dump(dev, obj, cb);
  474. /* Switch device port(s) may be stacked under
  475. * bond/team/vlan dev, so recurse down to dump objects on
  476. * first port at bottom of stack.
  477. */
  478. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  479. err = switchdev_port_obj_dump(lower_dev, obj, cb);
  480. break;
  481. }
  482. return err;
  483. }
  484. EXPORT_SYMBOL_GPL(switchdev_port_obj_dump);
  485. static DEFINE_MUTEX(switchdev_mutex);
  486. static RAW_NOTIFIER_HEAD(switchdev_notif_chain);
  487. /**
  488. * register_switchdev_notifier - Register notifier
  489. * @nb: notifier_block
  490. *
  491. * Register switch device notifier. This should be used by code
  492. * which needs to monitor events happening in particular device.
  493. * Return values are same as for atomic_notifier_chain_register().
  494. */
  495. int register_switchdev_notifier(struct notifier_block *nb)
  496. {
  497. int err;
  498. mutex_lock(&switchdev_mutex);
  499. err = raw_notifier_chain_register(&switchdev_notif_chain, nb);
  500. mutex_unlock(&switchdev_mutex);
  501. return err;
  502. }
  503. EXPORT_SYMBOL_GPL(register_switchdev_notifier);
  504. /**
  505. * unregister_switchdev_notifier - Unregister notifier
  506. * @nb: notifier_block
  507. *
  508. * Unregister switch device notifier.
  509. * Return values are same as for atomic_notifier_chain_unregister().
  510. */
  511. int unregister_switchdev_notifier(struct notifier_block *nb)
  512. {
  513. int err;
  514. mutex_lock(&switchdev_mutex);
  515. err = raw_notifier_chain_unregister(&switchdev_notif_chain, nb);
  516. mutex_unlock(&switchdev_mutex);
  517. return err;
  518. }
  519. EXPORT_SYMBOL_GPL(unregister_switchdev_notifier);
  520. /**
  521. * call_switchdev_notifiers - Call notifiers
  522. * @val: value passed unmodified to notifier function
  523. * @dev: port device
  524. * @info: notifier information data
  525. *
  526. * Call all network notifier blocks. This should be called by driver
  527. * when it needs to propagate hardware event.
  528. * Return values are same as for atomic_notifier_call_chain().
  529. */
  530. int call_switchdev_notifiers(unsigned long val, struct net_device *dev,
  531. struct switchdev_notifier_info *info)
  532. {
  533. int err;
  534. info->dev = dev;
  535. mutex_lock(&switchdev_mutex);
  536. err = raw_notifier_call_chain(&switchdev_notif_chain, val, info);
  537. mutex_unlock(&switchdev_mutex);
  538. return err;
  539. }
  540. EXPORT_SYMBOL_GPL(call_switchdev_notifiers);
  541. struct switchdev_vlan_dump {
  542. struct switchdev_obj_port_vlan vlan;
  543. struct sk_buff *skb;
  544. u32 filter_mask;
  545. u16 flags;
  546. u16 begin;
  547. u16 end;
  548. };
  549. static int switchdev_port_vlan_dump_put(struct switchdev_vlan_dump *dump)
  550. {
  551. struct bridge_vlan_info vinfo;
  552. vinfo.flags = dump->flags;
  553. if (dump->begin == 0 && dump->end == 0) {
  554. return 0;
  555. } else if (dump->begin == dump->end) {
  556. vinfo.vid = dump->begin;
  557. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  558. sizeof(vinfo), &vinfo))
  559. return -EMSGSIZE;
  560. } else {
  561. vinfo.vid = dump->begin;
  562. vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_BEGIN;
  563. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  564. sizeof(vinfo), &vinfo))
  565. return -EMSGSIZE;
  566. vinfo.vid = dump->end;
  567. vinfo.flags &= ~BRIDGE_VLAN_INFO_RANGE_BEGIN;
  568. vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_END;
  569. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  570. sizeof(vinfo), &vinfo))
  571. return -EMSGSIZE;
  572. }
  573. return 0;
  574. }
  575. static int switchdev_port_vlan_dump_cb(struct switchdev_obj *obj)
  576. {
  577. struct switchdev_obj_port_vlan *vlan = SWITCHDEV_OBJ_PORT_VLAN(obj);
  578. struct switchdev_vlan_dump *dump =
  579. container_of(vlan, struct switchdev_vlan_dump, vlan);
  580. int err = 0;
  581. if (vlan->vid_begin > vlan->vid_end)
  582. return -EINVAL;
  583. if (dump->filter_mask & RTEXT_FILTER_BRVLAN) {
  584. dump->flags = vlan->flags;
  585. for (dump->begin = dump->end = vlan->vid_begin;
  586. dump->begin <= vlan->vid_end;
  587. dump->begin++, dump->end++) {
  588. err = switchdev_port_vlan_dump_put(dump);
  589. if (err)
  590. return err;
  591. }
  592. } else if (dump->filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED) {
  593. if (dump->begin > vlan->vid_begin &&
  594. dump->begin >= vlan->vid_end) {
  595. if ((dump->begin - 1) == vlan->vid_end &&
  596. dump->flags == vlan->flags) {
  597. /* prepend */
  598. dump->begin = vlan->vid_begin;
  599. } else {
  600. err = switchdev_port_vlan_dump_put(dump);
  601. dump->flags = vlan->flags;
  602. dump->begin = vlan->vid_begin;
  603. dump->end = vlan->vid_end;
  604. }
  605. } else if (dump->end <= vlan->vid_begin &&
  606. dump->end < vlan->vid_end) {
  607. if ((dump->end + 1) == vlan->vid_begin &&
  608. dump->flags == vlan->flags) {
  609. /* append */
  610. dump->end = vlan->vid_end;
  611. } else {
  612. err = switchdev_port_vlan_dump_put(dump);
  613. dump->flags = vlan->flags;
  614. dump->begin = vlan->vid_begin;
  615. dump->end = vlan->vid_end;
  616. }
  617. } else {
  618. err = -EINVAL;
  619. }
  620. }
  621. return err;
  622. }
  623. static int switchdev_port_vlan_fill(struct sk_buff *skb, struct net_device *dev,
  624. u32 filter_mask)
  625. {
  626. struct switchdev_vlan_dump dump = {
  627. .vlan.obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
  628. .skb = skb,
  629. .filter_mask = filter_mask,
  630. };
  631. int err = 0;
  632. if ((filter_mask & RTEXT_FILTER_BRVLAN) ||
  633. (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)) {
  634. err = switchdev_port_obj_dump(dev, &dump.vlan.obj,
  635. switchdev_port_vlan_dump_cb);
  636. if (err)
  637. goto err_out;
  638. if (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)
  639. /* last one */
  640. err = switchdev_port_vlan_dump_put(&dump);
  641. }
  642. err_out:
  643. return err == -EOPNOTSUPP ? 0 : err;
  644. }
  645. /**
  646. * switchdev_port_bridge_getlink - Get bridge port attributes
  647. *
  648. * @dev: port device
  649. *
  650. * Called for SELF on rtnl_bridge_getlink to get bridge port
  651. * attributes.
  652. */
  653. int switchdev_port_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
  654. struct net_device *dev, u32 filter_mask,
  655. int nlflags)
  656. {
  657. struct switchdev_attr attr = {
  658. .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
  659. };
  660. u16 mode = BRIDGE_MODE_UNDEF;
  661. u32 mask = BR_LEARNING | BR_LEARNING_SYNC | BR_FLOOD;
  662. int err;
  663. err = switchdev_port_attr_get(dev, &attr);
  664. if (err && err != -EOPNOTSUPP)
  665. return err;
  666. return ndo_dflt_bridge_getlink(skb, pid, seq, dev, mode,
  667. attr.u.brport_flags, mask, nlflags,
  668. filter_mask, switchdev_port_vlan_fill);
  669. }
  670. EXPORT_SYMBOL_GPL(switchdev_port_bridge_getlink);
  671. static int switchdev_port_br_setflag(struct net_device *dev,
  672. struct nlattr *nlattr,
  673. unsigned long brport_flag)
  674. {
  675. struct switchdev_attr attr = {
  676. .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
  677. };
  678. u8 flag = nla_get_u8(nlattr);
  679. int err;
  680. err = switchdev_port_attr_get(dev, &attr);
  681. if (err)
  682. return err;
  683. if (flag)
  684. attr.u.brport_flags |= brport_flag;
  685. else
  686. attr.u.brport_flags &= ~brport_flag;
  687. return switchdev_port_attr_set(dev, &attr);
  688. }
  689. static const struct nla_policy
  690. switchdev_port_bridge_policy[IFLA_BRPORT_MAX + 1] = {
  691. [IFLA_BRPORT_STATE] = { .type = NLA_U8 },
  692. [IFLA_BRPORT_COST] = { .type = NLA_U32 },
  693. [IFLA_BRPORT_PRIORITY] = { .type = NLA_U16 },
  694. [IFLA_BRPORT_MODE] = { .type = NLA_U8 },
  695. [IFLA_BRPORT_GUARD] = { .type = NLA_U8 },
  696. [IFLA_BRPORT_PROTECT] = { .type = NLA_U8 },
  697. [IFLA_BRPORT_FAST_LEAVE] = { .type = NLA_U8 },
  698. [IFLA_BRPORT_LEARNING] = { .type = NLA_U8 },
  699. [IFLA_BRPORT_LEARNING_SYNC] = { .type = NLA_U8 },
  700. [IFLA_BRPORT_UNICAST_FLOOD] = { .type = NLA_U8 },
  701. };
  702. static int switchdev_port_br_setlink_protinfo(struct net_device *dev,
  703. struct nlattr *protinfo)
  704. {
  705. struct nlattr *attr;
  706. int rem;
  707. int err;
  708. err = nla_validate_nested(protinfo, IFLA_BRPORT_MAX,
  709. switchdev_port_bridge_policy);
  710. if (err)
  711. return err;
  712. nla_for_each_nested(attr, protinfo, rem) {
  713. switch (nla_type(attr)) {
  714. case IFLA_BRPORT_LEARNING:
  715. err = switchdev_port_br_setflag(dev, attr,
  716. BR_LEARNING);
  717. break;
  718. case IFLA_BRPORT_LEARNING_SYNC:
  719. err = switchdev_port_br_setflag(dev, attr,
  720. BR_LEARNING_SYNC);
  721. break;
  722. case IFLA_BRPORT_UNICAST_FLOOD:
  723. err = switchdev_port_br_setflag(dev, attr, BR_FLOOD);
  724. break;
  725. default:
  726. err = -EOPNOTSUPP;
  727. break;
  728. }
  729. if (err)
  730. return err;
  731. }
  732. return 0;
  733. }
  734. static int switchdev_port_br_afspec(struct net_device *dev,
  735. struct nlattr *afspec,
  736. int (*f)(struct net_device *dev,
  737. const struct switchdev_obj *obj))
  738. {
  739. struct nlattr *attr;
  740. struct bridge_vlan_info *vinfo;
  741. struct switchdev_obj_port_vlan vlan = {
  742. .obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
  743. };
  744. int rem;
  745. int err;
  746. nla_for_each_nested(attr, afspec, rem) {
  747. if (nla_type(attr) != IFLA_BRIDGE_VLAN_INFO)
  748. continue;
  749. if (nla_len(attr) != sizeof(struct bridge_vlan_info))
  750. return -EINVAL;
  751. vinfo = nla_data(attr);
  752. if (!vinfo->vid || vinfo->vid >= VLAN_VID_MASK)
  753. return -EINVAL;
  754. vlan.flags = vinfo->flags;
  755. if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_BEGIN) {
  756. if (vlan.vid_begin)
  757. return -EINVAL;
  758. vlan.vid_begin = vinfo->vid;
  759. /* don't allow range of pvids */
  760. if (vlan.flags & BRIDGE_VLAN_INFO_PVID)
  761. return -EINVAL;
  762. } else if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_END) {
  763. if (!vlan.vid_begin)
  764. return -EINVAL;
  765. vlan.vid_end = vinfo->vid;
  766. if (vlan.vid_end <= vlan.vid_begin)
  767. return -EINVAL;
  768. err = f(dev, &vlan.obj);
  769. if (err)
  770. return err;
  771. vlan.vid_begin = 0;
  772. } else {
  773. if (vlan.vid_begin)
  774. return -EINVAL;
  775. vlan.vid_begin = vinfo->vid;
  776. vlan.vid_end = vinfo->vid;
  777. err = f(dev, &vlan.obj);
  778. if (err)
  779. return err;
  780. vlan.vid_begin = 0;
  781. }
  782. }
  783. return 0;
  784. }
  785. /**
  786. * switchdev_port_bridge_setlink - Set bridge port attributes
  787. *
  788. * @dev: port device
  789. * @nlh: netlink header
  790. * @flags: netlink flags
  791. *
  792. * Called for SELF on rtnl_bridge_setlink to set bridge port
  793. * attributes.
  794. */
  795. int switchdev_port_bridge_setlink(struct net_device *dev,
  796. struct nlmsghdr *nlh, u16 flags)
  797. {
  798. struct nlattr *protinfo;
  799. struct nlattr *afspec;
  800. int err = 0;
  801. protinfo = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  802. IFLA_PROTINFO);
  803. if (protinfo) {
  804. err = switchdev_port_br_setlink_protinfo(dev, protinfo);
  805. if (err)
  806. return err;
  807. }
  808. afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  809. IFLA_AF_SPEC);
  810. if (afspec)
  811. err = switchdev_port_br_afspec(dev, afspec,
  812. switchdev_port_obj_add);
  813. return err;
  814. }
  815. EXPORT_SYMBOL_GPL(switchdev_port_bridge_setlink);
  816. /**
  817. * switchdev_port_bridge_dellink - Set bridge port attributes
  818. *
  819. * @dev: port device
  820. * @nlh: netlink header
  821. * @flags: netlink flags
  822. *
  823. * Called for SELF on rtnl_bridge_dellink to set bridge port
  824. * attributes.
  825. */
  826. int switchdev_port_bridge_dellink(struct net_device *dev,
  827. struct nlmsghdr *nlh, u16 flags)
  828. {
  829. struct nlattr *afspec;
  830. afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  831. IFLA_AF_SPEC);
  832. if (afspec)
  833. return switchdev_port_br_afspec(dev, afspec,
  834. switchdev_port_obj_del);
  835. return 0;
  836. }
  837. EXPORT_SYMBOL_GPL(switchdev_port_bridge_dellink);
  838. /**
  839. * switchdev_port_fdb_add - Add FDB (MAC/VLAN) entry to port
  840. *
  841. * @ndmsg: netlink hdr
  842. * @nlattr: netlink attributes
  843. * @dev: port device
  844. * @addr: MAC address to add
  845. * @vid: VLAN to add
  846. *
  847. * Add FDB entry to switch device.
  848. */
  849. int switchdev_port_fdb_add(struct ndmsg *ndm, struct nlattr *tb[],
  850. struct net_device *dev, const unsigned char *addr,
  851. u16 vid, u16 nlm_flags)
  852. {
  853. struct switchdev_obj_port_fdb fdb = {
  854. .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  855. .vid = vid,
  856. };
  857. ether_addr_copy(fdb.addr, addr);
  858. return switchdev_port_obj_add(dev, &fdb.obj);
  859. }
  860. EXPORT_SYMBOL_GPL(switchdev_port_fdb_add);
  861. /**
  862. * switchdev_port_fdb_del - Delete FDB (MAC/VLAN) entry from port
  863. *
  864. * @ndmsg: netlink hdr
  865. * @nlattr: netlink attributes
  866. * @dev: port device
  867. * @addr: MAC address to delete
  868. * @vid: VLAN to delete
  869. *
  870. * Delete FDB entry from switch device.
  871. */
  872. int switchdev_port_fdb_del(struct ndmsg *ndm, struct nlattr *tb[],
  873. struct net_device *dev, const unsigned char *addr,
  874. u16 vid)
  875. {
  876. struct switchdev_obj_port_fdb fdb = {
  877. .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  878. .vid = vid,
  879. };
  880. ether_addr_copy(fdb.addr, addr);
  881. return switchdev_port_obj_del(dev, &fdb.obj);
  882. }
  883. EXPORT_SYMBOL_GPL(switchdev_port_fdb_del);
  884. struct switchdev_fdb_dump {
  885. struct switchdev_obj_port_fdb fdb;
  886. struct net_device *dev;
  887. struct sk_buff *skb;
  888. struct netlink_callback *cb;
  889. int idx;
  890. };
  891. static int switchdev_port_fdb_dump_cb(struct switchdev_obj *obj)
  892. {
  893. struct switchdev_obj_port_fdb *fdb = SWITCHDEV_OBJ_PORT_FDB(obj);
  894. struct switchdev_fdb_dump *dump =
  895. container_of(fdb, struct switchdev_fdb_dump, fdb);
  896. u32 portid = NETLINK_CB(dump->cb->skb).portid;
  897. u32 seq = dump->cb->nlh->nlmsg_seq;
  898. struct nlmsghdr *nlh;
  899. struct ndmsg *ndm;
  900. if (dump->idx < dump->cb->args[0])
  901. goto skip;
  902. nlh = nlmsg_put(dump->skb, portid, seq, RTM_NEWNEIGH,
  903. sizeof(*ndm), NLM_F_MULTI);
  904. if (!nlh)
  905. return -EMSGSIZE;
  906. ndm = nlmsg_data(nlh);
  907. ndm->ndm_family = AF_BRIDGE;
  908. ndm->ndm_pad1 = 0;
  909. ndm->ndm_pad2 = 0;
  910. ndm->ndm_flags = NTF_SELF;
  911. ndm->ndm_type = 0;
  912. ndm->ndm_ifindex = dump->dev->ifindex;
  913. ndm->ndm_state = fdb->ndm_state;
  914. if (nla_put(dump->skb, NDA_LLADDR, ETH_ALEN, fdb->addr))
  915. goto nla_put_failure;
  916. if (fdb->vid && nla_put_u16(dump->skb, NDA_VLAN, fdb->vid))
  917. goto nla_put_failure;
  918. nlmsg_end(dump->skb, nlh);
  919. skip:
  920. dump->idx++;
  921. return 0;
  922. nla_put_failure:
  923. nlmsg_cancel(dump->skb, nlh);
  924. return -EMSGSIZE;
  925. }
  926. /**
  927. * switchdev_port_fdb_dump - Dump port FDB (MAC/VLAN) entries
  928. *
  929. * @skb: netlink skb
  930. * @cb: netlink callback
  931. * @dev: port device
  932. * @filter_dev: filter device
  933. * @idx:
  934. *
  935. * Delete FDB entry from switch device.
  936. */
  937. int switchdev_port_fdb_dump(struct sk_buff *skb, struct netlink_callback *cb,
  938. struct net_device *dev,
  939. struct net_device *filter_dev, int idx)
  940. {
  941. struct switchdev_fdb_dump dump = {
  942. .fdb.obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  943. .dev = dev,
  944. .skb = skb,
  945. .cb = cb,
  946. .idx = idx,
  947. };
  948. switchdev_port_obj_dump(dev, &dump.fdb.obj, switchdev_port_fdb_dump_cb);
  949. return dump.idx;
  950. }
  951. EXPORT_SYMBOL_GPL(switchdev_port_fdb_dump);
  952. static struct net_device *switchdev_get_lowest_dev(struct net_device *dev)
  953. {
  954. const struct switchdev_ops *ops = dev->switchdev_ops;
  955. struct net_device *lower_dev;
  956. struct net_device *port_dev;
  957. struct list_head *iter;
  958. /* Recusively search down until we find a sw port dev.
  959. * (A sw port dev supports switchdev_port_attr_get).
  960. */
  961. if (ops && ops->switchdev_port_attr_get)
  962. return dev;
  963. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  964. port_dev = switchdev_get_lowest_dev(lower_dev);
  965. if (port_dev)
  966. return port_dev;
  967. }
  968. return NULL;
  969. }
  970. static struct net_device *switchdev_get_dev_by_nhs(struct fib_info *fi)
  971. {
  972. struct switchdev_attr attr = {
  973. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  974. };
  975. struct switchdev_attr prev_attr;
  976. struct net_device *dev = NULL;
  977. int nhsel;
  978. ASSERT_RTNL();
  979. /* For this route, all nexthop devs must be on the same switch. */
  980. for (nhsel = 0; nhsel < fi->fib_nhs; nhsel++) {
  981. const struct fib_nh *nh = &fi->fib_nh[nhsel];
  982. if (!nh->nh_dev)
  983. return NULL;
  984. dev = switchdev_get_lowest_dev(nh->nh_dev);
  985. if (!dev)
  986. return NULL;
  987. if (switchdev_port_attr_get(dev, &attr))
  988. return NULL;
  989. if (nhsel > 0 &&
  990. !netdev_phys_item_id_same(&prev_attr.u.ppid, &attr.u.ppid))
  991. return NULL;
  992. prev_attr = attr;
  993. }
  994. return dev;
  995. }
  996. /**
  997. * switchdev_fib_ipv4_add - Add/modify switch IPv4 route entry
  998. *
  999. * @dst: route's IPv4 destination address
  1000. * @dst_len: destination address length (prefix length)
  1001. * @fi: route FIB info structure
  1002. * @tos: route TOS
  1003. * @type: route type
  1004. * @nlflags: netlink flags passed in (NLM_F_*)
  1005. * @tb_id: route table ID
  1006. *
  1007. * Add/modify switch IPv4 route entry.
  1008. */
  1009. int switchdev_fib_ipv4_add(u32 dst, int dst_len, struct fib_info *fi,
  1010. u8 tos, u8 type, u32 nlflags, u32 tb_id)
  1011. {
  1012. struct switchdev_obj_ipv4_fib ipv4_fib = {
  1013. .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
  1014. .dst = dst,
  1015. .dst_len = dst_len,
  1016. .tos = tos,
  1017. .type = type,
  1018. .nlflags = nlflags,
  1019. .tb_id = tb_id,
  1020. };
  1021. struct net_device *dev;
  1022. int err = 0;
  1023. memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
  1024. /* Don't offload route if using custom ip rules or if
  1025. * IPv4 FIB offloading has been disabled completely.
  1026. */
  1027. #ifdef CONFIG_IP_MULTIPLE_TABLES
  1028. if (fi->fib_net->ipv4.fib_has_custom_rules)
  1029. return 0;
  1030. #endif
  1031. if (fi->fib_net->ipv4.fib_offload_disabled)
  1032. return 0;
  1033. dev = switchdev_get_dev_by_nhs(fi);
  1034. if (!dev)
  1035. return 0;
  1036. err = switchdev_port_obj_add(dev, &ipv4_fib.obj);
  1037. if (!err)
  1038. fi->fib_flags |= RTNH_F_OFFLOAD;
  1039. return err == -EOPNOTSUPP ? 0 : err;
  1040. }
  1041. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_add);
  1042. /**
  1043. * switchdev_fib_ipv4_del - Delete IPv4 route entry from switch
  1044. *
  1045. * @dst: route's IPv4 destination address
  1046. * @dst_len: destination address length (prefix length)
  1047. * @fi: route FIB info structure
  1048. * @tos: route TOS
  1049. * @type: route type
  1050. * @tb_id: route table ID
  1051. *
  1052. * Delete IPv4 route entry from switch device.
  1053. */
  1054. int switchdev_fib_ipv4_del(u32 dst, int dst_len, struct fib_info *fi,
  1055. u8 tos, u8 type, u32 tb_id)
  1056. {
  1057. struct switchdev_obj_ipv4_fib ipv4_fib = {
  1058. .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
  1059. .dst = dst,
  1060. .dst_len = dst_len,
  1061. .tos = tos,
  1062. .type = type,
  1063. .nlflags = 0,
  1064. .tb_id = tb_id,
  1065. };
  1066. struct net_device *dev;
  1067. int err = 0;
  1068. memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
  1069. if (!(fi->fib_flags & RTNH_F_OFFLOAD))
  1070. return 0;
  1071. dev = switchdev_get_dev_by_nhs(fi);
  1072. if (!dev)
  1073. return 0;
  1074. err = switchdev_port_obj_del(dev, &ipv4_fib.obj);
  1075. if (!err)
  1076. fi->fib_flags &= ~RTNH_F_OFFLOAD;
  1077. return err == -EOPNOTSUPP ? 0 : err;
  1078. }
  1079. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_del);
  1080. /**
  1081. * switchdev_fib_ipv4_abort - Abort an IPv4 FIB operation
  1082. *
  1083. * @fi: route FIB info structure
  1084. */
  1085. void switchdev_fib_ipv4_abort(struct fib_info *fi)
  1086. {
  1087. /* There was a problem installing this route to the offload
  1088. * device. For now, until we come up with more refined
  1089. * policy handling, abruptly end IPv4 fib offloading for
  1090. * for entire net by flushing offload device(s) of all
  1091. * IPv4 routes, and mark IPv4 fib offloading broken from
  1092. * this point forward.
  1093. */
  1094. fib_flush_external(fi->fib_net);
  1095. fi->fib_net->ipv4.fib_offload_disabled = true;
  1096. }
  1097. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_abort);
  1098. static bool switchdev_port_same_parent_id(struct net_device *a,
  1099. struct net_device *b)
  1100. {
  1101. struct switchdev_attr a_attr = {
  1102. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  1103. .flags = SWITCHDEV_F_NO_RECURSE,
  1104. };
  1105. struct switchdev_attr b_attr = {
  1106. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  1107. .flags = SWITCHDEV_F_NO_RECURSE,
  1108. };
  1109. if (switchdev_port_attr_get(a, &a_attr) ||
  1110. switchdev_port_attr_get(b, &b_attr))
  1111. return false;
  1112. return netdev_phys_item_id_same(&a_attr.u.ppid, &b_attr.u.ppid);
  1113. }
  1114. static u32 switchdev_port_fwd_mark_get(struct net_device *dev,
  1115. struct net_device *group_dev)
  1116. {
  1117. struct net_device *lower_dev;
  1118. struct list_head *iter;
  1119. netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
  1120. if (lower_dev == dev)
  1121. continue;
  1122. if (switchdev_port_same_parent_id(dev, lower_dev))
  1123. return lower_dev->offload_fwd_mark;
  1124. return switchdev_port_fwd_mark_get(dev, lower_dev);
  1125. }
  1126. return dev->ifindex;
  1127. }
  1128. static void switchdev_port_fwd_mark_reset(struct net_device *group_dev,
  1129. u32 old_mark, u32 *reset_mark)
  1130. {
  1131. struct net_device *lower_dev;
  1132. struct list_head *iter;
  1133. netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
  1134. if (lower_dev->offload_fwd_mark == old_mark) {
  1135. if (!*reset_mark)
  1136. *reset_mark = lower_dev->ifindex;
  1137. lower_dev->offload_fwd_mark = *reset_mark;
  1138. }
  1139. switchdev_port_fwd_mark_reset(lower_dev, old_mark, reset_mark);
  1140. }
  1141. }
  1142. /**
  1143. * switchdev_port_fwd_mark_set - Set port offload forwarding mark
  1144. *
  1145. * @dev: port device
  1146. * @group_dev: containing device
  1147. * @joining: true if dev is joining group; false if leaving group
  1148. *
  1149. * An ungrouped port's offload mark is just its ifindex. A grouped
  1150. * port's (member of a bridge, for example) offload mark is the ifindex
  1151. * of one of the ports in the group with the same parent (switch) ID.
  1152. * Ports on the same device in the same group will have the same mark.
  1153. *
  1154. * Example:
  1155. *
  1156. * br0 ifindex=9
  1157. * sw1p1 ifindex=2 mark=2
  1158. * sw1p2 ifindex=3 mark=2
  1159. * sw2p1 ifindex=4 mark=5
  1160. * sw2p2 ifindex=5 mark=5
  1161. *
  1162. * If sw2p2 leaves the bridge, we'll have:
  1163. *
  1164. * br0 ifindex=9
  1165. * sw1p1 ifindex=2 mark=2
  1166. * sw1p2 ifindex=3 mark=2
  1167. * sw2p1 ifindex=4 mark=4
  1168. * sw2p2 ifindex=5 mark=5
  1169. */
  1170. void switchdev_port_fwd_mark_set(struct net_device *dev,
  1171. struct net_device *group_dev,
  1172. bool joining)
  1173. {
  1174. u32 mark = dev->ifindex;
  1175. u32 reset_mark = 0;
  1176. if (group_dev) {
  1177. ASSERT_RTNL();
  1178. if (joining)
  1179. mark = switchdev_port_fwd_mark_get(dev, group_dev);
  1180. else if (dev->offload_fwd_mark == mark)
  1181. /* Ohoh, this port was the mark reference port,
  1182. * but it's leaving the group, so reset the
  1183. * mark for the remaining ports in the group.
  1184. */
  1185. switchdev_port_fwd_mark_reset(group_dev, mark,
  1186. &reset_mark);
  1187. }
  1188. dev->offload_fwd_mark = mark;
  1189. }
  1190. EXPORT_SYMBOL_GPL(switchdev_port_fwd_mark_set);