switchdev.c 34 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357
  1. /*
  2. * net/switchdev/switchdev.c - Switch device API
  3. * Copyright (c) 2014-2015 Jiri Pirko <jiri@resnulli.us>
  4. * Copyright (c) 2014-2015 Scott Feldman <sfeldma@gmail.com>
  5. *
  6. * This program is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU General Public License as published by
  8. * the Free Software Foundation; either version 2 of the License, or
  9. * (at your option) any later version.
  10. */
  11. #include <linux/kernel.h>
  12. #include <linux/types.h>
  13. #include <linux/init.h>
  14. #include <linux/mutex.h>
  15. #include <linux/notifier.h>
  16. #include <linux/netdevice.h>
  17. #include <linux/etherdevice.h>
  18. #include <linux/if_bridge.h>
  19. #include <linux/list.h>
  20. #include <linux/workqueue.h>
  21. #include <linux/if_vlan.h>
  22. #include <net/ip_fib.h>
  23. #include <net/switchdev.h>
  24. /**
  25. * switchdev_trans_item_enqueue - Enqueue data item to transaction queue
  26. *
  27. * @trans: transaction
  28. * @data: pointer to data being queued
  29. * @destructor: data destructor
  30. * @tritem: transaction item being queued
  31. *
  32. * Enqeueue data item to transaction queue. tritem is typically placed in
  33. * cointainter pointed at by data pointer. Destructor is called on
  34. * transaction abort and after successful commit phase in case
  35. * the caller did not dequeue the item before.
  36. */
  37. void switchdev_trans_item_enqueue(struct switchdev_trans *trans,
  38. void *data, void (*destructor)(void const *),
  39. struct switchdev_trans_item *tritem)
  40. {
  41. tritem->data = data;
  42. tritem->destructor = destructor;
  43. list_add_tail(&tritem->list, &trans->item_list);
  44. }
  45. EXPORT_SYMBOL_GPL(switchdev_trans_item_enqueue);
  46. static struct switchdev_trans_item *
  47. __switchdev_trans_item_dequeue(struct switchdev_trans *trans)
  48. {
  49. struct switchdev_trans_item *tritem;
  50. if (list_empty(&trans->item_list))
  51. return NULL;
  52. tritem = list_first_entry(&trans->item_list,
  53. struct switchdev_trans_item, list);
  54. list_del(&tritem->list);
  55. return tritem;
  56. }
  57. /**
  58. * switchdev_trans_item_dequeue - Dequeue data item from transaction queue
  59. *
  60. * @trans: transaction
  61. */
  62. void *switchdev_trans_item_dequeue(struct switchdev_trans *trans)
  63. {
  64. struct switchdev_trans_item *tritem;
  65. tritem = __switchdev_trans_item_dequeue(trans);
  66. BUG_ON(!tritem);
  67. return tritem->data;
  68. }
  69. EXPORT_SYMBOL_GPL(switchdev_trans_item_dequeue);
  70. static void switchdev_trans_init(struct switchdev_trans *trans)
  71. {
  72. INIT_LIST_HEAD(&trans->item_list);
  73. }
  74. static void switchdev_trans_items_destroy(struct switchdev_trans *trans)
  75. {
  76. struct switchdev_trans_item *tritem;
  77. while ((tritem = __switchdev_trans_item_dequeue(trans)))
  78. tritem->destructor(tritem->data);
  79. }
  80. static void switchdev_trans_items_warn_destroy(struct net_device *dev,
  81. struct switchdev_trans *trans)
  82. {
  83. WARN(!list_empty(&trans->item_list), "%s: transaction item queue is not empty.\n",
  84. dev->name);
  85. switchdev_trans_items_destroy(trans);
  86. }
  87. static LIST_HEAD(deferred);
  88. static DEFINE_SPINLOCK(deferred_lock);
  89. typedef void switchdev_deferred_func_t(struct net_device *dev,
  90. const void *data);
  91. struct switchdev_deferred_item {
  92. struct list_head list;
  93. struct net_device *dev;
  94. switchdev_deferred_func_t *func;
  95. unsigned long data[0];
  96. };
  97. static struct switchdev_deferred_item *switchdev_deferred_dequeue(void)
  98. {
  99. struct switchdev_deferred_item *dfitem;
  100. spin_lock_bh(&deferred_lock);
  101. if (list_empty(&deferred)) {
  102. dfitem = NULL;
  103. goto unlock;
  104. }
  105. dfitem = list_first_entry(&deferred,
  106. struct switchdev_deferred_item, list);
  107. list_del(&dfitem->list);
  108. unlock:
  109. spin_unlock_bh(&deferred_lock);
  110. return dfitem;
  111. }
  112. /**
  113. * switchdev_deferred_process - Process ops in deferred queue
  114. *
  115. * Called to flush the ops currently queued in deferred ops queue.
  116. * rtnl_lock must be held.
  117. */
  118. void switchdev_deferred_process(void)
  119. {
  120. struct switchdev_deferred_item *dfitem;
  121. ASSERT_RTNL();
  122. while ((dfitem = switchdev_deferred_dequeue())) {
  123. dfitem->func(dfitem->dev, dfitem->data);
  124. dev_put(dfitem->dev);
  125. kfree(dfitem);
  126. }
  127. }
  128. EXPORT_SYMBOL_GPL(switchdev_deferred_process);
  /* Work handler: flush the deferred queue while holding rtnl_lock, which
   * switchdev_deferred_process() asserts.
   */
  static void switchdev_deferred_process_work(struct work_struct *work)
  {
  	rtnl_lock();
  	switchdev_deferred_process();
  	rtnl_unlock();
  }

  /* Work item scheduled whenever a new deferred operation is queued. */
  static DECLARE_WORK(deferred_process_work, switchdev_deferred_process_work);
  136. static int switchdev_deferred_enqueue(struct net_device *dev,
  137. const void *data, size_t data_len,
  138. switchdev_deferred_func_t *func)
  139. {
  140. struct switchdev_deferred_item *dfitem;
  141. dfitem = kmalloc(sizeof(*dfitem) + data_len, GFP_ATOMIC);
  142. if (!dfitem)
  143. return -ENOMEM;
  144. dfitem->dev = dev;
  145. dfitem->func = func;
  146. memcpy(dfitem->data, data, data_len);
  147. dev_hold(dev);
  148. spin_lock_bh(&deferred_lock);
  149. list_add_tail(&dfitem->list, &deferred);
  150. spin_unlock_bh(&deferred_lock);
  151. schedule_work(&deferred_process_work);
  152. return 0;
  153. }
  154. /**
  155. * switchdev_port_attr_get - Get port attribute
  156. *
  157. * @dev: port device
  158. * @attr: attribute to get
  159. */
  160. int switchdev_port_attr_get(struct net_device *dev, struct switchdev_attr *attr)
  161. {
  162. const struct switchdev_ops *ops = dev->switchdev_ops;
  163. struct net_device *lower_dev;
  164. struct list_head *iter;
  165. struct switchdev_attr first = {
  166. .id = SWITCHDEV_ATTR_ID_UNDEFINED
  167. };
  168. int err = -EOPNOTSUPP;
  169. if (ops && ops->switchdev_port_attr_get)
  170. return ops->switchdev_port_attr_get(dev, attr);
  171. if (attr->flags & SWITCHDEV_F_NO_RECURSE)
  172. return err;
  173. /* Switch device port(s) may be stacked under
  174. * bond/team/vlan dev, so recurse down to get attr on
  175. * each port. Return -ENODATA if attr values don't
  176. * compare across ports.
  177. */
  178. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  179. err = switchdev_port_attr_get(lower_dev, attr);
  180. if (err)
  181. break;
  182. if (first.id == SWITCHDEV_ATTR_ID_UNDEFINED)
  183. first = *attr;
  184. else if (memcmp(&first, attr, sizeof(*attr)))
  185. return -ENODATA;
  186. }
  187. return err;
  188. }
  189. EXPORT_SYMBOL_GPL(switchdev_port_attr_get);
  190. static int __switchdev_port_attr_set(struct net_device *dev,
  191. const struct switchdev_attr *attr,
  192. struct switchdev_trans *trans)
  193. {
  194. const struct switchdev_ops *ops = dev->switchdev_ops;
  195. struct net_device *lower_dev;
  196. struct list_head *iter;
  197. int err = -EOPNOTSUPP;
  198. if (ops && ops->switchdev_port_attr_set)
  199. return ops->switchdev_port_attr_set(dev, attr, trans);
  200. if (attr->flags & SWITCHDEV_F_NO_RECURSE)
  201. goto done;
  202. /* Switch device port(s) may be stacked under
  203. * bond/team/vlan dev, so recurse down to set attr on
  204. * each port.
  205. */
  206. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  207. err = __switchdev_port_attr_set(lower_dev, attr, trans);
  208. if (err == -EOPNOTSUPP &&
  209. attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
  210. continue;
  211. if (err)
  212. break;
  213. }
  214. done:
  215. if (err == -EOPNOTSUPP && attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
  216. err = 0;
  217. return err;
  218. }
  219. static int switchdev_port_attr_set_now(struct net_device *dev,
  220. const struct switchdev_attr *attr)
  221. {
  222. struct switchdev_trans trans;
  223. int err;
  224. switchdev_trans_init(&trans);
  225. /* Phase I: prepare for attr set. Driver/device should fail
  226. * here if there are going to be issues in the commit phase,
  227. * such as lack of resources or support. The driver/device
  228. * should reserve resources needed for the commit phase here,
  229. * but should not commit the attr.
  230. */
  231. trans.ph_prepare = true;
  232. err = __switchdev_port_attr_set(dev, attr, &trans);
  233. if (err) {
  234. /* Prepare phase failed: abort the transaction. Any
  235. * resources reserved in the prepare phase are
  236. * released.
  237. */
  238. if (err != -EOPNOTSUPP)
  239. switchdev_trans_items_destroy(&trans);
  240. return err;
  241. }
  242. /* Phase II: commit attr set. This cannot fail as a fault
  243. * of driver/device. If it does, it's a bug in the driver/device
  244. * because the driver said everythings was OK in phase I.
  245. */
  246. trans.ph_prepare = false;
  247. err = __switchdev_port_attr_set(dev, attr, &trans);
  248. WARN(err, "%s: Commit of attribute (id=%d) failed.\n",
  249. dev->name, attr->id);
  250. switchdev_trans_items_warn_destroy(dev, &trans);
  251. return err;
  252. }
  253. static void switchdev_port_attr_set_deferred(struct net_device *dev,
  254. const void *data)
  255. {
  256. const struct switchdev_attr *attr = data;
  257. int err;
  258. err = switchdev_port_attr_set_now(dev, attr);
  259. if (err && err != -EOPNOTSUPP)
  260. netdev_err(dev, "failed (err=%d) to set attribute (id=%d)\n",
  261. err, attr->id);
  262. }
  263. static int switchdev_port_attr_set_defer(struct net_device *dev,
  264. const struct switchdev_attr *attr)
  265. {
  266. return switchdev_deferred_enqueue(dev, attr, sizeof(*attr),
  267. switchdev_port_attr_set_deferred);
  268. }
  269. /**
  270. * switchdev_port_attr_set - Set port attribute
  271. *
  272. * @dev: port device
  273. * @attr: attribute to set
  274. *
  275. * Use a 2-phase prepare-commit transaction model to ensure
  276. * system is not left in a partially updated state due to
  277. * failure from driver/device.
  278. *
  279. * rtnl_lock must be held and must not be in atomic section,
  280. * in case SWITCHDEV_F_DEFER flag is not set.
  281. */
  282. int switchdev_port_attr_set(struct net_device *dev,
  283. const struct switchdev_attr *attr)
  284. {
  285. if (attr->flags & SWITCHDEV_F_DEFER)
  286. return switchdev_port_attr_set_defer(dev, attr);
  287. ASSERT_RTNL();
  288. return switchdev_port_attr_set_now(dev, attr);
  289. }
  290. EXPORT_SYMBOL_GPL(switchdev_port_attr_set);
  291. static int __switchdev_port_obj_add(struct net_device *dev,
  292. const struct switchdev_obj *obj,
  293. struct switchdev_trans *trans)
  294. {
  295. const struct switchdev_ops *ops = dev->switchdev_ops;
  296. struct net_device *lower_dev;
  297. struct list_head *iter;
  298. int err = -EOPNOTSUPP;
  299. if (ops && ops->switchdev_port_obj_add)
  300. return ops->switchdev_port_obj_add(dev, obj, trans);
  301. /* Switch device port(s) may be stacked under
  302. * bond/team/vlan dev, so recurse down to add object on
  303. * each port.
  304. */
  305. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  306. err = __switchdev_port_obj_add(lower_dev, obj, trans);
  307. if (err)
  308. break;
  309. }
  310. return err;
  311. }
  312. static int switchdev_port_obj_add_now(struct net_device *dev,
  313. const struct switchdev_obj *obj)
  314. {
  315. struct switchdev_trans trans;
  316. int err;
  317. ASSERT_RTNL();
  318. switchdev_trans_init(&trans);
  319. /* Phase I: prepare for obj add. Driver/device should fail
  320. * here if there are going to be issues in the commit phase,
  321. * such as lack of resources or support. The driver/device
  322. * should reserve resources needed for the commit phase here,
  323. * but should not commit the obj.
  324. */
  325. trans.ph_prepare = true;
  326. err = __switchdev_port_obj_add(dev, obj, &trans);
  327. if (err) {
  328. /* Prepare phase failed: abort the transaction. Any
  329. * resources reserved in the prepare phase are
  330. * released.
  331. */
  332. if (err != -EOPNOTSUPP)
  333. switchdev_trans_items_destroy(&trans);
  334. return err;
  335. }
  336. /* Phase II: commit obj add. This cannot fail as a fault
  337. * of driver/device. If it does, it's a bug in the driver/device
  338. * because the driver said everythings was OK in phase I.
  339. */
  340. trans.ph_prepare = false;
  341. err = __switchdev_port_obj_add(dev, obj, &trans);
  342. WARN(err, "%s: Commit of object (id=%d) failed.\n", dev->name, obj->id);
  343. switchdev_trans_items_warn_destroy(dev, &trans);
  344. return err;
  345. }
  346. static void switchdev_port_obj_add_deferred(struct net_device *dev,
  347. const void *data)
  348. {
  349. const struct switchdev_obj *obj = data;
  350. int err;
  351. err = switchdev_port_obj_add_now(dev, obj);
  352. if (err && err != -EOPNOTSUPP)
  353. netdev_err(dev, "failed (err=%d) to add object (id=%d)\n",
  354. err, obj->id);
  355. }
  356. static int switchdev_port_obj_add_defer(struct net_device *dev,
  357. const struct switchdev_obj *obj)
  358. {
  359. return switchdev_deferred_enqueue(dev, obj, sizeof(*obj),
  360. switchdev_port_obj_add_deferred);
  361. }
  362. /**
  363. * switchdev_port_obj_add - Add port object
  364. *
  365. * @dev: port device
  366. * @id: object ID
  367. * @obj: object to add
  368. *
  369. * Use a 2-phase prepare-commit transaction model to ensure
  370. * system is not left in a partially updated state due to
  371. * failure from driver/device.
  372. *
  373. * rtnl_lock must be held and must not be in atomic section,
  374. * in case SWITCHDEV_F_DEFER flag is not set.
  375. */
  376. int switchdev_port_obj_add(struct net_device *dev,
  377. const struct switchdev_obj *obj)
  378. {
  379. if (obj->flags & SWITCHDEV_F_DEFER)
  380. return switchdev_port_obj_add_defer(dev, obj);
  381. ASSERT_RTNL();
  382. return switchdev_port_obj_add_now(dev, obj);
  383. }
  384. EXPORT_SYMBOL_GPL(switchdev_port_obj_add);
  385. static int switchdev_port_obj_del_now(struct net_device *dev,
  386. const struct switchdev_obj *obj)
  387. {
  388. const struct switchdev_ops *ops = dev->switchdev_ops;
  389. struct net_device *lower_dev;
  390. struct list_head *iter;
  391. int err = -EOPNOTSUPP;
  392. if (ops && ops->switchdev_port_obj_del)
  393. return ops->switchdev_port_obj_del(dev, obj);
  394. /* Switch device port(s) may be stacked under
  395. * bond/team/vlan dev, so recurse down to delete object on
  396. * each port.
  397. */
  398. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  399. err = switchdev_port_obj_del_now(lower_dev, obj);
  400. if (err)
  401. break;
  402. }
  403. return err;
  404. }
  405. static void switchdev_port_obj_del_deferred(struct net_device *dev,
  406. const void *data)
  407. {
  408. const struct switchdev_obj *obj = data;
  409. int err;
  410. err = switchdev_port_obj_del_now(dev, obj);
  411. if (err && err != -EOPNOTSUPP)
  412. netdev_err(dev, "failed (err=%d) to del object (id=%d)\n",
  413. err, obj->id);
  414. }
  415. static int switchdev_port_obj_del_defer(struct net_device *dev,
  416. const struct switchdev_obj *obj)
  417. {
  418. return switchdev_deferred_enqueue(dev, obj, sizeof(*obj),
  419. switchdev_port_obj_del_deferred);
  420. }
  421. /**
  422. * switchdev_port_obj_del - Delete port object
  423. *
  424. * @dev: port device
  425. * @id: object ID
  426. * @obj: object to delete
  427. *
  428. * rtnl_lock must be held and must not be in atomic section,
  429. * in case SWITCHDEV_F_DEFER flag is not set.
  430. */
  431. int switchdev_port_obj_del(struct net_device *dev,
  432. const struct switchdev_obj *obj)
  433. {
  434. if (obj->flags & SWITCHDEV_F_DEFER)
  435. return switchdev_port_obj_del_defer(dev, obj);
  436. ASSERT_RTNL();
  437. return switchdev_port_obj_del_now(dev, obj);
  438. }
  439. EXPORT_SYMBOL_GPL(switchdev_port_obj_del);
  440. /**
  441. * switchdev_port_obj_dump - Dump port objects
  442. *
  443. * @dev: port device
  444. * @id: object ID
  445. * @obj: object to dump
  446. * @cb: function to call with a filled object
  447. *
  448. * rtnl_lock must be held.
  449. */
  450. int switchdev_port_obj_dump(struct net_device *dev, struct switchdev_obj *obj,
  451. switchdev_obj_dump_cb_t *cb)
  452. {
  453. const struct switchdev_ops *ops = dev->switchdev_ops;
  454. struct net_device *lower_dev;
  455. struct list_head *iter;
  456. int err = -EOPNOTSUPP;
  457. ASSERT_RTNL();
  458. if (ops && ops->switchdev_port_obj_dump)
  459. return ops->switchdev_port_obj_dump(dev, obj, cb);
  460. /* Switch device port(s) may be stacked under
  461. * bond/team/vlan dev, so recurse down to dump objects on
  462. * first port at bottom of stack.
  463. */
  464. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  465. err = switchdev_port_obj_dump(lower_dev, obj, cb);
  466. break;
  467. }
  468. return err;
  469. }
  470. EXPORT_SYMBOL_GPL(switchdev_port_obj_dump);
  471. static DEFINE_MUTEX(switchdev_mutex);
  472. static RAW_NOTIFIER_HEAD(switchdev_notif_chain);
  473. /**
  474. * register_switchdev_notifier - Register notifier
  475. * @nb: notifier_block
  476. *
  477. * Register switch device notifier. This should be used by code
  478. * which needs to monitor events happening in particular device.
  479. * Return values are same as for atomic_notifier_chain_register().
  480. */
  481. int register_switchdev_notifier(struct notifier_block *nb)
  482. {
  483. int err;
  484. mutex_lock(&switchdev_mutex);
  485. err = raw_notifier_chain_register(&switchdev_notif_chain, nb);
  486. mutex_unlock(&switchdev_mutex);
  487. return err;
  488. }
  489. EXPORT_SYMBOL_GPL(register_switchdev_notifier);
  490. /**
  491. * unregister_switchdev_notifier - Unregister notifier
  492. * @nb: notifier_block
  493. *
  494. * Unregister switch device notifier.
  495. * Return values are same as for atomic_notifier_chain_unregister().
  496. */
  497. int unregister_switchdev_notifier(struct notifier_block *nb)
  498. {
  499. int err;
  500. mutex_lock(&switchdev_mutex);
  501. err = raw_notifier_chain_unregister(&switchdev_notif_chain, nb);
  502. mutex_unlock(&switchdev_mutex);
  503. return err;
  504. }
  505. EXPORT_SYMBOL_GPL(unregister_switchdev_notifier);
  506. /**
  507. * call_switchdev_notifiers - Call notifiers
  508. * @val: value passed unmodified to notifier function
  509. * @dev: port device
  510. * @info: notifier information data
  511. *
  512. * Call all network notifier blocks. This should be called by driver
  513. * when it needs to propagate hardware event.
  514. * Return values are same as for atomic_notifier_call_chain().
  515. */
  516. int call_switchdev_notifiers(unsigned long val, struct net_device *dev,
  517. struct switchdev_notifier_info *info)
  518. {
  519. int err;
  520. info->dev = dev;
  521. mutex_lock(&switchdev_mutex);
  522. err = raw_notifier_call_chain(&switchdev_notif_chain, val, info);
  523. mutex_unlock(&switchdev_mutex);
  524. return err;
  525. }
  526. EXPORT_SYMBOL_GPL(call_switchdev_notifiers);
  527. struct switchdev_vlan_dump {
  528. struct switchdev_obj_port_vlan vlan;
  529. struct sk_buff *skb;
  530. u32 filter_mask;
  531. u16 flags;
  532. u16 begin;
  533. u16 end;
  534. };
  535. static int switchdev_port_vlan_dump_put(struct switchdev_vlan_dump *dump)
  536. {
  537. struct bridge_vlan_info vinfo;
  538. vinfo.flags = dump->flags;
  539. if (dump->begin == 0 && dump->end == 0) {
  540. return 0;
  541. } else if (dump->begin == dump->end) {
  542. vinfo.vid = dump->begin;
  543. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  544. sizeof(vinfo), &vinfo))
  545. return -EMSGSIZE;
  546. } else {
  547. vinfo.vid = dump->begin;
  548. vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_BEGIN;
  549. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  550. sizeof(vinfo), &vinfo))
  551. return -EMSGSIZE;
  552. vinfo.vid = dump->end;
  553. vinfo.flags &= ~BRIDGE_VLAN_INFO_RANGE_BEGIN;
  554. vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_END;
  555. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  556. sizeof(vinfo), &vinfo))
  557. return -EMSGSIZE;
  558. }
  559. return 0;
  560. }
  561. static int switchdev_port_vlan_dump_cb(struct switchdev_obj *obj)
  562. {
  563. struct switchdev_obj_port_vlan *vlan = SWITCHDEV_OBJ_PORT_VLAN(obj);
  564. struct switchdev_vlan_dump *dump =
  565. container_of(vlan, struct switchdev_vlan_dump, vlan);
  566. int err = 0;
  567. if (vlan->vid_begin > vlan->vid_end)
  568. return -EINVAL;
  569. if (dump->filter_mask & RTEXT_FILTER_BRVLAN) {
  570. dump->flags = vlan->flags;
  571. for (dump->begin = dump->end = vlan->vid_begin;
  572. dump->begin <= vlan->vid_end;
  573. dump->begin++, dump->end++) {
  574. err = switchdev_port_vlan_dump_put(dump);
  575. if (err)
  576. return err;
  577. }
  578. } else if (dump->filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED) {
  579. if (dump->begin > vlan->vid_begin &&
  580. dump->begin >= vlan->vid_end) {
  581. if ((dump->begin - 1) == vlan->vid_end &&
  582. dump->flags == vlan->flags) {
  583. /* prepend */
  584. dump->begin = vlan->vid_begin;
  585. } else {
  586. err = switchdev_port_vlan_dump_put(dump);
  587. dump->flags = vlan->flags;
  588. dump->begin = vlan->vid_begin;
  589. dump->end = vlan->vid_end;
  590. }
  591. } else if (dump->end <= vlan->vid_begin &&
  592. dump->end < vlan->vid_end) {
  593. if ((dump->end + 1) == vlan->vid_begin &&
  594. dump->flags == vlan->flags) {
  595. /* append */
  596. dump->end = vlan->vid_end;
  597. } else {
  598. err = switchdev_port_vlan_dump_put(dump);
  599. dump->flags = vlan->flags;
  600. dump->begin = vlan->vid_begin;
  601. dump->end = vlan->vid_end;
  602. }
  603. } else {
  604. err = -EINVAL;
  605. }
  606. }
  607. return err;
  608. }
  609. static int switchdev_port_vlan_fill(struct sk_buff *skb, struct net_device *dev,
  610. u32 filter_mask)
  611. {
  612. struct switchdev_vlan_dump dump = {
  613. .vlan.obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
  614. .skb = skb,
  615. .filter_mask = filter_mask,
  616. };
  617. int err = 0;
  618. if ((filter_mask & RTEXT_FILTER_BRVLAN) ||
  619. (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)) {
  620. err = switchdev_port_obj_dump(dev, &dump.vlan.obj,
  621. switchdev_port_vlan_dump_cb);
  622. if (err)
  623. goto err_out;
  624. if (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)
  625. /* last one */
  626. err = switchdev_port_vlan_dump_put(&dump);
  627. }
  628. err_out:
  629. return err == -EOPNOTSUPP ? 0 : err;
  630. }
  631. /**
  632. * switchdev_port_bridge_getlink - Get bridge port attributes
  633. *
  634. * @dev: port device
  635. *
  636. * Called for SELF on rtnl_bridge_getlink to get bridge port
  637. * attributes.
  638. */
  639. int switchdev_port_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
  640. struct net_device *dev, u32 filter_mask,
  641. int nlflags)
  642. {
  643. struct switchdev_attr attr = {
  644. .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
  645. };
  646. u16 mode = BRIDGE_MODE_UNDEF;
  647. u32 mask = BR_LEARNING | BR_LEARNING_SYNC | BR_FLOOD;
  648. int err;
  649. err = switchdev_port_attr_get(dev, &attr);
  650. if (err && err != -EOPNOTSUPP)
  651. return err;
  652. return ndo_dflt_bridge_getlink(skb, pid, seq, dev, mode,
  653. attr.u.brport_flags, mask, nlflags,
  654. filter_mask, switchdev_port_vlan_fill);
  655. }
  656. EXPORT_SYMBOL_GPL(switchdev_port_bridge_getlink);
  657. static int switchdev_port_br_setflag(struct net_device *dev,
  658. struct nlattr *nlattr,
  659. unsigned long brport_flag)
  660. {
  661. struct switchdev_attr attr = {
  662. .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
  663. };
  664. u8 flag = nla_get_u8(nlattr);
  665. int err;
  666. err = switchdev_port_attr_get(dev, &attr);
  667. if (err)
  668. return err;
  669. if (flag)
  670. attr.u.brport_flags |= brport_flag;
  671. else
  672. attr.u.brport_flags &= ~brport_flag;
  673. return switchdev_port_attr_set(dev, &attr);
  674. }
  675. static const struct nla_policy
  676. switchdev_port_bridge_policy[IFLA_BRPORT_MAX + 1] = {
  677. [IFLA_BRPORT_STATE] = { .type = NLA_U8 },
  678. [IFLA_BRPORT_COST] = { .type = NLA_U32 },
  679. [IFLA_BRPORT_PRIORITY] = { .type = NLA_U16 },
  680. [IFLA_BRPORT_MODE] = { .type = NLA_U8 },
  681. [IFLA_BRPORT_GUARD] = { .type = NLA_U8 },
  682. [IFLA_BRPORT_PROTECT] = { .type = NLA_U8 },
  683. [IFLA_BRPORT_FAST_LEAVE] = { .type = NLA_U8 },
  684. [IFLA_BRPORT_LEARNING] = { .type = NLA_U8 },
  685. [IFLA_BRPORT_LEARNING_SYNC] = { .type = NLA_U8 },
  686. [IFLA_BRPORT_UNICAST_FLOOD] = { .type = NLA_U8 },
  687. };
  688. static int switchdev_port_br_setlink_protinfo(struct net_device *dev,
  689. struct nlattr *protinfo)
  690. {
  691. struct nlattr *attr;
  692. int rem;
  693. int err;
  694. err = nla_validate_nested(protinfo, IFLA_BRPORT_MAX,
  695. switchdev_port_bridge_policy);
  696. if (err)
  697. return err;
  698. nla_for_each_nested(attr, protinfo, rem) {
  699. switch (nla_type(attr)) {
  700. case IFLA_BRPORT_LEARNING:
  701. err = switchdev_port_br_setflag(dev, attr,
  702. BR_LEARNING);
  703. break;
  704. case IFLA_BRPORT_LEARNING_SYNC:
  705. err = switchdev_port_br_setflag(dev, attr,
  706. BR_LEARNING_SYNC);
  707. break;
  708. case IFLA_BRPORT_UNICAST_FLOOD:
  709. err = switchdev_port_br_setflag(dev, attr, BR_FLOOD);
  710. break;
  711. default:
  712. err = -EOPNOTSUPP;
  713. break;
  714. }
  715. if (err)
  716. return err;
  717. }
  718. return 0;
  719. }
  720. static int switchdev_port_br_afspec(struct net_device *dev,
  721. struct nlattr *afspec,
  722. int (*f)(struct net_device *dev,
  723. const struct switchdev_obj *obj))
  724. {
  725. struct nlattr *attr;
  726. struct bridge_vlan_info *vinfo;
  727. struct switchdev_obj_port_vlan vlan = {
  728. .obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
  729. };
  730. int rem;
  731. int err;
  732. nla_for_each_nested(attr, afspec, rem) {
  733. if (nla_type(attr) != IFLA_BRIDGE_VLAN_INFO)
  734. continue;
  735. if (nla_len(attr) != sizeof(struct bridge_vlan_info))
  736. return -EINVAL;
  737. vinfo = nla_data(attr);
  738. if (!vinfo->vid || vinfo->vid >= VLAN_VID_MASK)
  739. return -EINVAL;
  740. vlan.flags = vinfo->flags;
  741. if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_BEGIN) {
  742. if (vlan.vid_begin)
  743. return -EINVAL;
  744. vlan.vid_begin = vinfo->vid;
  745. /* don't allow range of pvids */
  746. if (vlan.flags & BRIDGE_VLAN_INFO_PVID)
  747. return -EINVAL;
  748. } else if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_END) {
  749. if (!vlan.vid_begin)
  750. return -EINVAL;
  751. vlan.vid_end = vinfo->vid;
  752. if (vlan.vid_end <= vlan.vid_begin)
  753. return -EINVAL;
  754. err = f(dev, &vlan.obj);
  755. if (err)
  756. return err;
  757. memset(&vlan, 0, sizeof(vlan));
  758. } else {
  759. if (vlan.vid_begin)
  760. return -EINVAL;
  761. vlan.vid_begin = vinfo->vid;
  762. vlan.vid_end = vinfo->vid;
  763. err = f(dev, &vlan.obj);
  764. if (err)
  765. return err;
  766. memset(&vlan, 0, sizeof(vlan));
  767. }
  768. }
  769. return 0;
  770. }
  771. /**
  772. * switchdev_port_bridge_setlink - Set bridge port attributes
  773. *
  774. * @dev: port device
  775. * @nlh: netlink header
  776. * @flags: netlink flags
  777. *
  778. * Called for SELF on rtnl_bridge_setlink to set bridge port
  779. * attributes.
  780. */
  781. int switchdev_port_bridge_setlink(struct net_device *dev,
  782. struct nlmsghdr *nlh, u16 flags)
  783. {
  784. struct nlattr *protinfo;
  785. struct nlattr *afspec;
  786. int err = 0;
  787. protinfo = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  788. IFLA_PROTINFO);
  789. if (protinfo) {
  790. err = switchdev_port_br_setlink_protinfo(dev, protinfo);
  791. if (err)
  792. return err;
  793. }
  794. afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  795. IFLA_AF_SPEC);
  796. if (afspec)
  797. err = switchdev_port_br_afspec(dev, afspec,
  798. switchdev_port_obj_add);
  799. return err;
  800. }
  801. EXPORT_SYMBOL_GPL(switchdev_port_bridge_setlink);
  802. /**
  803. * switchdev_port_bridge_dellink - Set bridge port attributes
  804. *
  805. * @dev: port device
  806. * @nlh: netlink header
  807. * @flags: netlink flags
  808. *
  809. * Called for SELF on rtnl_bridge_dellink to set bridge port
  810. * attributes.
  811. */
  812. int switchdev_port_bridge_dellink(struct net_device *dev,
  813. struct nlmsghdr *nlh, u16 flags)
  814. {
  815. struct nlattr *afspec;
  816. afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  817. IFLA_AF_SPEC);
  818. if (afspec)
  819. return switchdev_port_br_afspec(dev, afspec,
  820. switchdev_port_obj_del);
  821. return 0;
  822. }
  823. EXPORT_SYMBOL_GPL(switchdev_port_bridge_dellink);
  824. /**
  825. * switchdev_port_fdb_add - Add FDB (MAC/VLAN) entry to port
  826. *
  827. * @ndmsg: netlink hdr
  828. * @nlattr: netlink attributes
  829. * @dev: port device
  830. * @addr: MAC address to add
  831. * @vid: VLAN to add
  832. *
  833. * Add FDB entry to switch device.
  834. */
  835. int switchdev_port_fdb_add(struct ndmsg *ndm, struct nlattr *tb[],
  836. struct net_device *dev, const unsigned char *addr,
  837. u16 vid, u16 nlm_flags)
  838. {
  839. struct switchdev_obj_port_fdb fdb = {
  840. .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  841. .vid = vid,
  842. };
  843. ether_addr_copy(fdb.addr, addr);
  844. return switchdev_port_obj_add(dev, &fdb.obj);
  845. }
  846. EXPORT_SYMBOL_GPL(switchdev_port_fdb_add);
  847. /**
  848. * switchdev_port_fdb_del - Delete FDB (MAC/VLAN) entry from port
  849. *
  850. * @ndmsg: netlink hdr
  851. * @nlattr: netlink attributes
  852. * @dev: port device
  853. * @addr: MAC address to delete
  854. * @vid: VLAN to delete
  855. *
  856. * Delete FDB entry from switch device.
  857. */
  858. int switchdev_port_fdb_del(struct ndmsg *ndm, struct nlattr *tb[],
  859. struct net_device *dev, const unsigned char *addr,
  860. u16 vid)
  861. {
  862. struct switchdev_obj_port_fdb fdb = {
  863. .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  864. .vid = vid,
  865. };
  866. ether_addr_copy(fdb.addr, addr);
  867. return switchdev_port_obj_del(dev, &fdb.obj);
  868. }
  869. EXPORT_SYMBOL_GPL(switchdev_port_fdb_del);
/* State shared between switchdev_port_fdb_dump() and its per-entry
 * callback.  The callback is handed a pointer to the embedded @fdb object
 * and recovers this structure from it with container_of().
 */
struct switchdev_fdb_dump {
	struct switchdev_obj_port_fdb fdb;	/* object passed to the dump op */
	struct net_device *dev;			/* port whose ifindex is reported */
	struct sk_buff *skb;			/* skb the messages are written to */
	struct netlink_callback *cb;		/* supplies portid, seq and args[0] */
	int idx;				/* running count of entries visited */
};
  877. static int switchdev_port_fdb_dump_cb(struct switchdev_obj *obj)
  878. {
  879. struct switchdev_obj_port_fdb *fdb = SWITCHDEV_OBJ_PORT_FDB(obj);
  880. struct switchdev_fdb_dump *dump =
  881. container_of(fdb, struct switchdev_fdb_dump, fdb);
  882. u32 portid = NETLINK_CB(dump->cb->skb).portid;
  883. u32 seq = dump->cb->nlh->nlmsg_seq;
  884. struct nlmsghdr *nlh;
  885. struct ndmsg *ndm;
  886. if (dump->idx < dump->cb->args[0])
  887. goto skip;
  888. nlh = nlmsg_put(dump->skb, portid, seq, RTM_NEWNEIGH,
  889. sizeof(*ndm), NLM_F_MULTI);
  890. if (!nlh)
  891. return -EMSGSIZE;
  892. ndm = nlmsg_data(nlh);
  893. ndm->ndm_family = AF_BRIDGE;
  894. ndm->ndm_pad1 = 0;
  895. ndm->ndm_pad2 = 0;
  896. ndm->ndm_flags = NTF_SELF;
  897. ndm->ndm_type = 0;
  898. ndm->ndm_ifindex = dump->dev->ifindex;
  899. ndm->ndm_state = fdb->ndm_state;
  900. if (nla_put(dump->skb, NDA_LLADDR, ETH_ALEN, fdb->addr))
  901. goto nla_put_failure;
  902. if (fdb->vid && nla_put_u16(dump->skb, NDA_VLAN, fdb->vid))
  903. goto nla_put_failure;
  904. nlmsg_end(dump->skb, nlh);
  905. skip:
  906. dump->idx++;
  907. return 0;
  908. nla_put_failure:
  909. nlmsg_cancel(dump->skb, nlh);
  910. return -EMSGSIZE;
  911. }
  912. /**
  913. * switchdev_port_fdb_dump - Dump port FDB (MAC/VLAN) entries
  914. *
  915. * @skb: netlink skb
  916. * @cb: netlink callback
  917. * @dev: port device
  918. * @filter_dev: filter device
  919. * @idx:
  920. *
  921. * Delete FDB entry from switch device.
  922. */
  923. int switchdev_port_fdb_dump(struct sk_buff *skb, struct netlink_callback *cb,
  924. struct net_device *dev,
  925. struct net_device *filter_dev, int idx)
  926. {
  927. struct switchdev_fdb_dump dump = {
  928. .fdb.obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  929. .dev = dev,
  930. .skb = skb,
  931. .cb = cb,
  932. .idx = idx,
  933. };
  934. switchdev_port_obj_dump(dev, &dump.fdb.obj, switchdev_port_fdb_dump_cb);
  935. return dump.idx;
  936. }
  937. EXPORT_SYMBOL_GPL(switchdev_port_fdb_dump);
  938. static struct net_device *switchdev_get_lowest_dev(struct net_device *dev)
  939. {
  940. const struct switchdev_ops *ops = dev->switchdev_ops;
  941. struct net_device *lower_dev;
  942. struct net_device *port_dev;
  943. struct list_head *iter;
  944. /* Recusively search down until we find a sw port dev.
  945. * (A sw port dev supports switchdev_port_attr_get).
  946. */
  947. if (ops && ops->switchdev_port_attr_get)
  948. return dev;
  949. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  950. port_dev = switchdev_get_lowest_dev(lower_dev);
  951. if (port_dev)
  952. return port_dev;
  953. }
  954. return NULL;
  955. }
  956. static struct net_device *switchdev_get_dev_by_nhs(struct fib_info *fi)
  957. {
  958. struct switchdev_attr attr = {
  959. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  960. };
  961. struct switchdev_attr prev_attr;
  962. struct net_device *dev = NULL;
  963. int nhsel;
  964. ASSERT_RTNL();
  965. /* For this route, all nexthop devs must be on the same switch. */
  966. for (nhsel = 0; nhsel < fi->fib_nhs; nhsel++) {
  967. const struct fib_nh *nh = &fi->fib_nh[nhsel];
  968. if (!nh->nh_dev)
  969. return NULL;
  970. dev = switchdev_get_lowest_dev(nh->nh_dev);
  971. if (!dev)
  972. return NULL;
  973. if (switchdev_port_attr_get(dev, &attr))
  974. return NULL;
  975. if (nhsel > 0 &&
  976. !netdev_phys_item_id_same(&prev_attr.u.ppid, &attr.u.ppid))
  977. return NULL;
  978. prev_attr = attr;
  979. }
  980. return dev;
  981. }
  982. /**
  983. * switchdev_fib_ipv4_add - Add/modify switch IPv4 route entry
  984. *
  985. * @dst: route's IPv4 destination address
  986. * @dst_len: destination address length (prefix length)
  987. * @fi: route FIB info structure
  988. * @tos: route TOS
  989. * @type: route type
  990. * @nlflags: netlink flags passed in (NLM_F_*)
  991. * @tb_id: route table ID
  992. *
  993. * Add/modify switch IPv4 route entry.
  994. */
  995. int switchdev_fib_ipv4_add(u32 dst, int dst_len, struct fib_info *fi,
  996. u8 tos, u8 type, u32 nlflags, u32 tb_id)
  997. {
  998. struct switchdev_obj_ipv4_fib ipv4_fib = {
  999. .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
  1000. .dst = dst,
  1001. .dst_len = dst_len,
  1002. .tos = tos,
  1003. .type = type,
  1004. .nlflags = nlflags,
  1005. .tb_id = tb_id,
  1006. };
  1007. struct net_device *dev;
  1008. int err = 0;
  1009. memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
  1010. /* Don't offload route if using custom ip rules or if
  1011. * IPv4 FIB offloading has been disabled completely.
  1012. */
  1013. #ifdef CONFIG_IP_MULTIPLE_TABLES
  1014. if (fi->fib_net->ipv4.fib_has_custom_rules)
  1015. return 0;
  1016. #endif
  1017. if (fi->fib_net->ipv4.fib_offload_disabled)
  1018. return 0;
  1019. dev = switchdev_get_dev_by_nhs(fi);
  1020. if (!dev)
  1021. return 0;
  1022. err = switchdev_port_obj_add(dev, &ipv4_fib.obj);
  1023. if (!err)
  1024. fi->fib_flags |= RTNH_F_OFFLOAD;
  1025. return err == -EOPNOTSUPP ? 0 : err;
  1026. }
  1027. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_add);
  1028. /**
  1029. * switchdev_fib_ipv4_del - Delete IPv4 route entry from switch
  1030. *
  1031. * @dst: route's IPv4 destination address
  1032. * @dst_len: destination address length (prefix length)
  1033. * @fi: route FIB info structure
  1034. * @tos: route TOS
  1035. * @type: route type
  1036. * @tb_id: route table ID
  1037. *
  1038. * Delete IPv4 route entry from switch device.
  1039. */
  1040. int switchdev_fib_ipv4_del(u32 dst, int dst_len, struct fib_info *fi,
  1041. u8 tos, u8 type, u32 tb_id)
  1042. {
  1043. struct switchdev_obj_ipv4_fib ipv4_fib = {
  1044. .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
  1045. .dst = dst,
  1046. .dst_len = dst_len,
  1047. .tos = tos,
  1048. .type = type,
  1049. .nlflags = 0,
  1050. .tb_id = tb_id,
  1051. };
  1052. struct net_device *dev;
  1053. int err = 0;
  1054. memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
  1055. if (!(fi->fib_flags & RTNH_F_OFFLOAD))
  1056. return 0;
  1057. dev = switchdev_get_dev_by_nhs(fi);
  1058. if (!dev)
  1059. return 0;
  1060. err = switchdev_port_obj_del(dev, &ipv4_fib.obj);
  1061. if (!err)
  1062. fi->fib_flags &= ~RTNH_F_OFFLOAD;
  1063. return err == -EOPNOTSUPP ? 0 : err;
  1064. }
  1065. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_del);
  1066. /**
  1067. * switchdev_fib_ipv4_abort - Abort an IPv4 FIB operation
  1068. *
  1069. * @fi: route FIB info structure
  1070. */
  1071. void switchdev_fib_ipv4_abort(struct fib_info *fi)
  1072. {
  1073. /* There was a problem installing this route to the offload
  1074. * device. For now, until we come up with more refined
  1075. * policy handling, abruptly end IPv4 fib offloading for
  1076. * for entire net by flushing offload device(s) of all
  1077. * IPv4 routes, and mark IPv4 fib offloading broken from
  1078. * this point forward.
  1079. */
  1080. fib_flush_external(fi->fib_net);
  1081. fi->fib_net->ipv4.fib_offload_disabled = true;
  1082. }
  1083. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_abort);
  1084. static bool switchdev_port_same_parent_id(struct net_device *a,
  1085. struct net_device *b)
  1086. {
  1087. struct switchdev_attr a_attr = {
  1088. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  1089. .flags = SWITCHDEV_F_NO_RECURSE,
  1090. };
  1091. struct switchdev_attr b_attr = {
  1092. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  1093. .flags = SWITCHDEV_F_NO_RECURSE,
  1094. };
  1095. if (switchdev_port_attr_get(a, &a_attr) ||
  1096. switchdev_port_attr_get(b, &b_attr))
  1097. return false;
  1098. return netdev_phys_item_id_same(&a_attr.u.ppid, &b_attr.u.ppid);
  1099. }
  1100. static u32 switchdev_port_fwd_mark_get(struct net_device *dev,
  1101. struct net_device *group_dev)
  1102. {
  1103. struct net_device *lower_dev;
  1104. struct list_head *iter;
  1105. netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
  1106. if (lower_dev == dev)
  1107. continue;
  1108. if (switchdev_port_same_parent_id(dev, lower_dev))
  1109. return lower_dev->offload_fwd_mark;
  1110. return switchdev_port_fwd_mark_get(dev, lower_dev);
  1111. }
  1112. return dev->ifindex;
  1113. }
  1114. static void switchdev_port_fwd_mark_reset(struct net_device *group_dev,
  1115. u32 old_mark, u32 *reset_mark)
  1116. {
  1117. struct net_device *lower_dev;
  1118. struct list_head *iter;
  1119. netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
  1120. if (lower_dev->offload_fwd_mark == old_mark) {
  1121. if (!*reset_mark)
  1122. *reset_mark = lower_dev->ifindex;
  1123. lower_dev->offload_fwd_mark = *reset_mark;
  1124. }
  1125. switchdev_port_fwd_mark_reset(lower_dev, old_mark, reset_mark);
  1126. }
  1127. }
  1128. /**
  1129. * switchdev_port_fwd_mark_set - Set port offload forwarding mark
  1130. *
  1131. * @dev: port device
  1132. * @group_dev: containing device
  1133. * @joining: true if dev is joining group; false if leaving group
  1134. *
  1135. * An ungrouped port's offload mark is just its ifindex. A grouped
  1136. * port's (member of a bridge, for example) offload mark is the ifindex
  1137. * of one of the ports in the group with the same parent (switch) ID.
  1138. * Ports on the same device in the same group will have the same mark.
  1139. *
  1140. * Example:
  1141. *
  1142. * br0 ifindex=9
  1143. * sw1p1 ifindex=2 mark=2
  1144. * sw1p2 ifindex=3 mark=2
  1145. * sw2p1 ifindex=4 mark=5
  1146. * sw2p2 ifindex=5 mark=5
  1147. *
  1148. * If sw2p2 leaves the bridge, we'll have:
  1149. *
  1150. * br0 ifindex=9
  1151. * sw1p1 ifindex=2 mark=2
  1152. * sw1p2 ifindex=3 mark=2
  1153. * sw2p1 ifindex=4 mark=4
  1154. * sw2p2 ifindex=5 mark=5
  1155. */
  1156. void switchdev_port_fwd_mark_set(struct net_device *dev,
  1157. struct net_device *group_dev,
  1158. bool joining)
  1159. {
  1160. u32 mark = dev->ifindex;
  1161. u32 reset_mark = 0;
  1162. if (group_dev) {
  1163. ASSERT_RTNL();
  1164. if (joining)
  1165. mark = switchdev_port_fwd_mark_get(dev, group_dev);
  1166. else if (dev->offload_fwd_mark == mark)
  1167. /* Ohoh, this port was the mark reference port,
  1168. * but it's leaving the group, so reset the
  1169. * mark for the remaining ports in the group.
  1170. */
  1171. switchdev_port_fwd_mark_reset(group_dev, mark,
  1172. &reset_mark);
  1173. }
  1174. dev->offload_fwd_mark = mark;
  1175. }
  1176. EXPORT_SYMBOL_GPL(switchdev_port_fwd_mark_set);