switchdev.c 35 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386
  1. /*
  2. * net/switchdev/switchdev.c - Switch device API
  3. * Copyright (c) 2014-2015 Jiri Pirko <jiri@resnulli.us>
  4. * Copyright (c) 2014-2015 Scott Feldman <sfeldma@gmail.com>
  5. *
  6. * This program is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU General Public License as published by
  8. * the Free Software Foundation; either version 2 of the License, or
  9. * (at your option) any later version.
  10. */
  11. #include <linux/kernel.h>
  12. #include <linux/types.h>
  13. #include <linux/init.h>
  14. #include <linux/mutex.h>
  15. #include <linux/notifier.h>
  16. #include <linux/netdevice.h>
  17. #include <linux/etherdevice.h>
  18. #include <linux/if_bridge.h>
  19. #include <linux/list.h>
  20. #include <linux/workqueue.h>
  21. #include <linux/if_vlan.h>
  22. #include <linux/rtnetlink.h>
  23. #include <net/ip_fib.h>
  24. #include <net/switchdev.h>
  25. /**
  26. * switchdev_trans_item_enqueue - Enqueue data item to transaction queue
  27. *
  28. * @trans: transaction
  29. * @data: pointer to data being queued
  30. * @destructor: data destructor
  31. * @tritem: transaction item being queued
  32. *
  33. * Enqeueue data item to transaction queue. tritem is typically placed in
  34. * cointainter pointed at by data pointer. Destructor is called on
  35. * transaction abort and after successful commit phase in case
  36. * the caller did not dequeue the item before.
  37. */
  38. void switchdev_trans_item_enqueue(struct switchdev_trans *trans,
  39. void *data, void (*destructor)(void const *),
  40. struct switchdev_trans_item *tritem)
  41. {
  42. tritem->data = data;
  43. tritem->destructor = destructor;
  44. list_add_tail(&tritem->list, &trans->item_list);
  45. }
  46. EXPORT_SYMBOL_GPL(switchdev_trans_item_enqueue);
  47. static struct switchdev_trans_item *
  48. __switchdev_trans_item_dequeue(struct switchdev_trans *trans)
  49. {
  50. struct switchdev_trans_item *tritem;
  51. if (list_empty(&trans->item_list))
  52. return NULL;
  53. tritem = list_first_entry(&trans->item_list,
  54. struct switchdev_trans_item, list);
  55. list_del(&tritem->list);
  56. return tritem;
  57. }
  58. /**
  59. * switchdev_trans_item_dequeue - Dequeue data item from transaction queue
  60. *
  61. * @trans: transaction
  62. */
  63. void *switchdev_trans_item_dequeue(struct switchdev_trans *trans)
  64. {
  65. struct switchdev_trans_item *tritem;
  66. tritem = __switchdev_trans_item_dequeue(trans);
  67. BUG_ON(!tritem);
  68. return tritem->data;
  69. }
  70. EXPORT_SYMBOL_GPL(switchdev_trans_item_dequeue);
  71. static void switchdev_trans_init(struct switchdev_trans *trans)
  72. {
  73. INIT_LIST_HEAD(&trans->item_list);
  74. }
  75. static void switchdev_trans_items_destroy(struct switchdev_trans *trans)
  76. {
  77. struct switchdev_trans_item *tritem;
  78. while ((tritem = __switchdev_trans_item_dequeue(trans)))
  79. tritem->destructor(tritem->data);
  80. }
  81. static void switchdev_trans_items_warn_destroy(struct net_device *dev,
  82. struct switchdev_trans *trans)
  83. {
  84. WARN(!list_empty(&trans->item_list), "%s: transaction item queue is not empty.\n",
  85. dev->name);
  86. switchdev_trans_items_destroy(trans);
  87. }
  88. static LIST_HEAD(deferred);
  89. static DEFINE_SPINLOCK(deferred_lock);
  90. typedef void switchdev_deferred_func_t(struct net_device *dev,
  91. const void *data);
  92. struct switchdev_deferred_item {
  93. struct list_head list;
  94. struct net_device *dev;
  95. switchdev_deferred_func_t *func;
  96. unsigned long data[0];
  97. };
  98. static struct switchdev_deferred_item *switchdev_deferred_dequeue(void)
  99. {
  100. struct switchdev_deferred_item *dfitem;
  101. spin_lock_bh(&deferred_lock);
  102. if (list_empty(&deferred)) {
  103. dfitem = NULL;
  104. goto unlock;
  105. }
  106. dfitem = list_first_entry(&deferred,
  107. struct switchdev_deferred_item, list);
  108. list_del(&dfitem->list);
  109. unlock:
  110. spin_unlock_bh(&deferred_lock);
  111. return dfitem;
  112. }
  113. /**
  114. * switchdev_deferred_process - Process ops in deferred queue
  115. *
  116. * Called to flush the ops currently queued in deferred ops queue.
  117. * rtnl_lock must be held.
  118. */
  119. void switchdev_deferred_process(void)
  120. {
  121. struct switchdev_deferred_item *dfitem;
  122. ASSERT_RTNL();
  123. while ((dfitem = switchdev_deferred_dequeue())) {
  124. dfitem->func(dfitem->dev, dfitem->data);
  125. dev_put(dfitem->dev);
  126. kfree(dfitem);
  127. }
  128. }
  129. EXPORT_SYMBOL_GPL(switchdev_deferred_process);
  130. static void switchdev_deferred_process_work(struct work_struct *work)
  131. {
  132. rtnl_lock();
  133. switchdev_deferred_process();
  134. rtnl_unlock();
  135. }
  136. static DECLARE_WORK(deferred_process_work, switchdev_deferred_process_work);
  137. static int switchdev_deferred_enqueue(struct net_device *dev,
  138. const void *data, size_t data_len,
  139. switchdev_deferred_func_t *func)
  140. {
  141. struct switchdev_deferred_item *dfitem;
  142. dfitem = kmalloc(sizeof(*dfitem) + data_len, GFP_ATOMIC);
  143. if (!dfitem)
  144. return -ENOMEM;
  145. dfitem->dev = dev;
  146. dfitem->func = func;
  147. memcpy(dfitem->data, data, data_len);
  148. dev_hold(dev);
  149. spin_lock_bh(&deferred_lock);
  150. list_add_tail(&dfitem->list, &deferred);
  151. spin_unlock_bh(&deferred_lock);
  152. schedule_work(&deferred_process_work);
  153. return 0;
  154. }
  155. /**
  156. * switchdev_port_attr_get - Get port attribute
  157. *
  158. * @dev: port device
  159. * @attr: attribute to get
  160. */
  161. int switchdev_port_attr_get(struct net_device *dev, struct switchdev_attr *attr)
  162. {
  163. const struct switchdev_ops *ops = dev->switchdev_ops;
  164. struct net_device *lower_dev;
  165. struct list_head *iter;
  166. struct switchdev_attr first = {
  167. .id = SWITCHDEV_ATTR_ID_UNDEFINED
  168. };
  169. int err = -EOPNOTSUPP;
  170. if (ops && ops->switchdev_port_attr_get)
  171. return ops->switchdev_port_attr_get(dev, attr);
  172. if (attr->flags & SWITCHDEV_F_NO_RECURSE)
  173. return err;
  174. /* Switch device port(s) may be stacked under
  175. * bond/team/vlan dev, so recurse down to get attr on
  176. * each port. Return -ENODATA if attr values don't
  177. * compare across ports.
  178. */
  179. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  180. err = switchdev_port_attr_get(lower_dev, attr);
  181. if (err)
  182. break;
  183. if (first.id == SWITCHDEV_ATTR_ID_UNDEFINED)
  184. first = *attr;
  185. else if (memcmp(&first, attr, sizeof(*attr)))
  186. return -ENODATA;
  187. }
  188. return err;
  189. }
  190. EXPORT_SYMBOL_GPL(switchdev_port_attr_get);
  191. static int __switchdev_port_attr_set(struct net_device *dev,
  192. const struct switchdev_attr *attr,
  193. struct switchdev_trans *trans)
  194. {
  195. const struct switchdev_ops *ops = dev->switchdev_ops;
  196. struct net_device *lower_dev;
  197. struct list_head *iter;
  198. int err = -EOPNOTSUPP;
  199. if (ops && ops->switchdev_port_attr_set) {
  200. err = ops->switchdev_port_attr_set(dev, attr, trans);
  201. goto done;
  202. }
  203. if (attr->flags & SWITCHDEV_F_NO_RECURSE)
  204. goto done;
  205. /* Switch device port(s) may be stacked under
  206. * bond/team/vlan dev, so recurse down to set attr on
  207. * each port.
  208. */
  209. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  210. err = __switchdev_port_attr_set(lower_dev, attr, trans);
  211. if (err)
  212. break;
  213. }
  214. done:
  215. if (err == -EOPNOTSUPP && attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
  216. err = 0;
  217. return err;
  218. }
  219. static int switchdev_port_attr_set_now(struct net_device *dev,
  220. const struct switchdev_attr *attr)
  221. {
  222. struct switchdev_trans trans;
  223. int err;
  224. switchdev_trans_init(&trans);
  225. /* Phase I: prepare for attr set. Driver/device should fail
  226. * here if there are going to be issues in the commit phase,
  227. * such as lack of resources or support. The driver/device
  228. * should reserve resources needed for the commit phase here,
  229. * but should not commit the attr.
  230. */
  231. trans.ph_prepare = true;
  232. err = __switchdev_port_attr_set(dev, attr, &trans);
  233. if (err) {
  234. /* Prepare phase failed: abort the transaction. Any
  235. * resources reserved in the prepare phase are
  236. * released.
  237. */
  238. if (err != -EOPNOTSUPP)
  239. switchdev_trans_items_destroy(&trans);
  240. return err;
  241. }
  242. /* Phase II: commit attr set. This cannot fail as a fault
  243. * of driver/device. If it does, it's a bug in the driver/device
  244. * because the driver said everythings was OK in phase I.
  245. */
  246. trans.ph_prepare = false;
  247. err = __switchdev_port_attr_set(dev, attr, &trans);
  248. WARN(err, "%s: Commit of attribute (id=%d) failed.\n",
  249. dev->name, attr->id);
  250. switchdev_trans_items_warn_destroy(dev, &trans);
  251. return err;
  252. }
  253. static void switchdev_port_attr_set_deferred(struct net_device *dev,
  254. const void *data)
  255. {
  256. const struct switchdev_attr *attr = data;
  257. int err;
  258. err = switchdev_port_attr_set_now(dev, attr);
  259. if (err && err != -EOPNOTSUPP)
  260. netdev_err(dev, "failed (err=%d) to set attribute (id=%d)\n",
  261. err, attr->id);
  262. }
  263. static int switchdev_port_attr_set_defer(struct net_device *dev,
  264. const struct switchdev_attr *attr)
  265. {
  266. return switchdev_deferred_enqueue(dev, attr, sizeof(*attr),
  267. switchdev_port_attr_set_deferred);
  268. }
  269. /**
  270. * switchdev_port_attr_set - Set port attribute
  271. *
  272. * @dev: port device
  273. * @attr: attribute to set
  274. *
  275. * Use a 2-phase prepare-commit transaction model to ensure
  276. * system is not left in a partially updated state due to
  277. * failure from driver/device.
  278. *
  279. * rtnl_lock must be held and must not be in atomic section,
  280. * in case SWITCHDEV_F_DEFER flag is not set.
  281. */
  282. int switchdev_port_attr_set(struct net_device *dev,
  283. const struct switchdev_attr *attr)
  284. {
  285. if (attr->flags & SWITCHDEV_F_DEFER)
  286. return switchdev_port_attr_set_defer(dev, attr);
  287. ASSERT_RTNL();
  288. return switchdev_port_attr_set_now(dev, attr);
  289. }
  290. EXPORT_SYMBOL_GPL(switchdev_port_attr_set);
  291. static size_t switchdev_obj_size(const struct switchdev_obj *obj)
  292. {
  293. switch (obj->id) {
  294. case SWITCHDEV_OBJ_ID_PORT_VLAN:
  295. return sizeof(struct switchdev_obj_port_vlan);
  296. case SWITCHDEV_OBJ_ID_IPV4_FIB:
  297. return sizeof(struct switchdev_obj_ipv4_fib);
  298. case SWITCHDEV_OBJ_ID_PORT_FDB:
  299. return sizeof(struct switchdev_obj_port_fdb);
  300. case SWITCHDEV_OBJ_ID_PORT_MDB:
  301. return sizeof(struct switchdev_obj_port_mdb);
  302. default:
  303. BUG();
  304. }
  305. return 0;
  306. }
  307. static int __switchdev_port_obj_add(struct net_device *dev,
  308. const struct switchdev_obj *obj,
  309. struct switchdev_trans *trans)
  310. {
  311. const struct switchdev_ops *ops = dev->switchdev_ops;
  312. struct net_device *lower_dev;
  313. struct list_head *iter;
  314. int err = -EOPNOTSUPP;
  315. if (ops && ops->switchdev_port_obj_add)
  316. return ops->switchdev_port_obj_add(dev, obj, trans);
  317. /* Switch device port(s) may be stacked under
  318. * bond/team/vlan dev, so recurse down to add object on
  319. * each port.
  320. */
  321. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  322. err = __switchdev_port_obj_add(lower_dev, obj, trans);
  323. if (err)
  324. break;
  325. }
  326. return err;
  327. }
  328. static int switchdev_port_obj_add_now(struct net_device *dev,
  329. const struct switchdev_obj *obj)
  330. {
  331. struct switchdev_trans trans;
  332. int err;
  333. ASSERT_RTNL();
  334. switchdev_trans_init(&trans);
  335. /* Phase I: prepare for obj add. Driver/device should fail
  336. * here if there are going to be issues in the commit phase,
  337. * such as lack of resources or support. The driver/device
  338. * should reserve resources needed for the commit phase here,
  339. * but should not commit the obj.
  340. */
  341. trans.ph_prepare = true;
  342. err = __switchdev_port_obj_add(dev, obj, &trans);
  343. if (err) {
  344. /* Prepare phase failed: abort the transaction. Any
  345. * resources reserved in the prepare phase are
  346. * released.
  347. */
  348. if (err != -EOPNOTSUPP)
  349. switchdev_trans_items_destroy(&trans);
  350. return err;
  351. }
  352. /* Phase II: commit obj add. This cannot fail as a fault
  353. * of driver/device. If it does, it's a bug in the driver/device
  354. * because the driver said everythings was OK in phase I.
  355. */
  356. trans.ph_prepare = false;
  357. err = __switchdev_port_obj_add(dev, obj, &trans);
  358. WARN(err, "%s: Commit of object (id=%d) failed.\n", dev->name, obj->id);
  359. switchdev_trans_items_warn_destroy(dev, &trans);
  360. return err;
  361. }
  362. static void switchdev_port_obj_add_deferred(struct net_device *dev,
  363. const void *data)
  364. {
  365. const struct switchdev_obj *obj = data;
  366. int err;
  367. err = switchdev_port_obj_add_now(dev, obj);
  368. if (err && err != -EOPNOTSUPP)
  369. netdev_err(dev, "failed (err=%d) to add object (id=%d)\n",
  370. err, obj->id);
  371. }
  372. static int switchdev_port_obj_add_defer(struct net_device *dev,
  373. const struct switchdev_obj *obj)
  374. {
  375. return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
  376. switchdev_port_obj_add_deferred);
  377. }
  378. /**
  379. * switchdev_port_obj_add - Add port object
  380. *
  381. * @dev: port device
  382. * @id: object ID
  383. * @obj: object to add
  384. *
  385. * Use a 2-phase prepare-commit transaction model to ensure
  386. * system is not left in a partially updated state due to
  387. * failure from driver/device.
  388. *
  389. * rtnl_lock must be held and must not be in atomic section,
  390. * in case SWITCHDEV_F_DEFER flag is not set.
  391. */
  392. int switchdev_port_obj_add(struct net_device *dev,
  393. const struct switchdev_obj *obj)
  394. {
  395. if (obj->flags & SWITCHDEV_F_DEFER)
  396. return switchdev_port_obj_add_defer(dev, obj);
  397. ASSERT_RTNL();
  398. return switchdev_port_obj_add_now(dev, obj);
  399. }
  400. EXPORT_SYMBOL_GPL(switchdev_port_obj_add);
  401. static int switchdev_port_obj_del_now(struct net_device *dev,
  402. const struct switchdev_obj *obj)
  403. {
  404. const struct switchdev_ops *ops = dev->switchdev_ops;
  405. struct net_device *lower_dev;
  406. struct list_head *iter;
  407. int err = -EOPNOTSUPP;
  408. if (ops && ops->switchdev_port_obj_del)
  409. return ops->switchdev_port_obj_del(dev, obj);
  410. /* Switch device port(s) may be stacked under
  411. * bond/team/vlan dev, so recurse down to delete object on
  412. * each port.
  413. */
  414. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  415. err = switchdev_port_obj_del_now(lower_dev, obj);
  416. if (err)
  417. break;
  418. }
  419. return err;
  420. }
  421. static void switchdev_port_obj_del_deferred(struct net_device *dev,
  422. const void *data)
  423. {
  424. const struct switchdev_obj *obj = data;
  425. int err;
  426. err = switchdev_port_obj_del_now(dev, obj);
  427. if (err && err != -EOPNOTSUPP)
  428. netdev_err(dev, "failed (err=%d) to del object (id=%d)\n",
  429. err, obj->id);
  430. }
  431. static int switchdev_port_obj_del_defer(struct net_device *dev,
  432. const struct switchdev_obj *obj)
  433. {
  434. return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
  435. switchdev_port_obj_del_deferred);
  436. }
  437. /**
  438. * switchdev_port_obj_del - Delete port object
  439. *
  440. * @dev: port device
  441. * @id: object ID
  442. * @obj: object to delete
  443. *
  444. * rtnl_lock must be held and must not be in atomic section,
  445. * in case SWITCHDEV_F_DEFER flag is not set.
  446. */
  447. int switchdev_port_obj_del(struct net_device *dev,
  448. const struct switchdev_obj *obj)
  449. {
  450. if (obj->flags & SWITCHDEV_F_DEFER)
  451. return switchdev_port_obj_del_defer(dev, obj);
  452. ASSERT_RTNL();
  453. return switchdev_port_obj_del_now(dev, obj);
  454. }
  455. EXPORT_SYMBOL_GPL(switchdev_port_obj_del);
  456. /**
  457. * switchdev_port_obj_dump - Dump port objects
  458. *
  459. * @dev: port device
  460. * @id: object ID
  461. * @obj: object to dump
  462. * @cb: function to call with a filled object
  463. *
  464. * rtnl_lock must be held.
  465. */
  466. int switchdev_port_obj_dump(struct net_device *dev, struct switchdev_obj *obj,
  467. switchdev_obj_dump_cb_t *cb)
  468. {
  469. const struct switchdev_ops *ops = dev->switchdev_ops;
  470. struct net_device *lower_dev;
  471. struct list_head *iter;
  472. int err = -EOPNOTSUPP;
  473. ASSERT_RTNL();
  474. if (ops && ops->switchdev_port_obj_dump)
  475. return ops->switchdev_port_obj_dump(dev, obj, cb);
  476. /* Switch device port(s) may be stacked under
  477. * bond/team/vlan dev, so recurse down to dump objects on
  478. * first port at bottom of stack.
  479. */
  480. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  481. err = switchdev_port_obj_dump(lower_dev, obj, cb);
  482. break;
  483. }
  484. return err;
  485. }
  486. EXPORT_SYMBOL_GPL(switchdev_port_obj_dump);
  487. static RAW_NOTIFIER_HEAD(switchdev_notif_chain);
  488. /**
  489. * register_switchdev_notifier - Register notifier
  490. * @nb: notifier_block
  491. *
  492. * Register switch device notifier. This should be used by code
  493. * which needs to monitor events happening in particular device.
  494. * Return values are same as for atomic_notifier_chain_register().
  495. */
  496. int register_switchdev_notifier(struct notifier_block *nb)
  497. {
  498. int err;
  499. rtnl_lock();
  500. err = raw_notifier_chain_register(&switchdev_notif_chain, nb);
  501. rtnl_unlock();
  502. return err;
  503. }
  504. EXPORT_SYMBOL_GPL(register_switchdev_notifier);
  505. /**
  506. * unregister_switchdev_notifier - Unregister notifier
  507. * @nb: notifier_block
  508. *
  509. * Unregister switch device notifier.
  510. * Return values are same as for atomic_notifier_chain_unregister().
  511. */
  512. int unregister_switchdev_notifier(struct notifier_block *nb)
  513. {
  514. int err;
  515. rtnl_lock();
  516. err = raw_notifier_chain_unregister(&switchdev_notif_chain, nb);
  517. rtnl_unlock();
  518. return err;
  519. }
  520. EXPORT_SYMBOL_GPL(unregister_switchdev_notifier);
  521. /**
  522. * call_switchdev_notifiers - Call notifiers
  523. * @val: value passed unmodified to notifier function
  524. * @dev: port device
  525. * @info: notifier information data
  526. *
  527. * Call all network notifier blocks. This should be called by driver
  528. * when it needs to propagate hardware event.
  529. * Return values are same as for atomic_notifier_call_chain().
  530. * rtnl_lock must be held.
  531. */
  532. int call_switchdev_notifiers(unsigned long val, struct net_device *dev,
  533. struct switchdev_notifier_info *info)
  534. {
  535. int err;
  536. ASSERT_RTNL();
  537. info->dev = dev;
  538. err = raw_notifier_call_chain(&switchdev_notif_chain, val, info);
  539. return err;
  540. }
  541. EXPORT_SYMBOL_GPL(call_switchdev_notifiers);
  542. struct switchdev_vlan_dump {
  543. struct switchdev_obj_port_vlan vlan;
  544. struct sk_buff *skb;
  545. u32 filter_mask;
  546. u16 flags;
  547. u16 begin;
  548. u16 end;
  549. };
  550. static int switchdev_port_vlan_dump_put(struct switchdev_vlan_dump *dump)
  551. {
  552. struct bridge_vlan_info vinfo;
  553. vinfo.flags = dump->flags;
  554. if (dump->begin == 0 && dump->end == 0) {
  555. return 0;
  556. } else if (dump->begin == dump->end) {
  557. vinfo.vid = dump->begin;
  558. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  559. sizeof(vinfo), &vinfo))
  560. return -EMSGSIZE;
  561. } else {
  562. vinfo.vid = dump->begin;
  563. vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_BEGIN;
  564. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  565. sizeof(vinfo), &vinfo))
  566. return -EMSGSIZE;
  567. vinfo.vid = dump->end;
  568. vinfo.flags &= ~BRIDGE_VLAN_INFO_RANGE_BEGIN;
  569. vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_END;
  570. if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
  571. sizeof(vinfo), &vinfo))
  572. return -EMSGSIZE;
  573. }
  574. return 0;
  575. }
  576. static int switchdev_port_vlan_dump_cb(struct switchdev_obj *obj)
  577. {
  578. struct switchdev_obj_port_vlan *vlan = SWITCHDEV_OBJ_PORT_VLAN(obj);
  579. struct switchdev_vlan_dump *dump =
  580. container_of(vlan, struct switchdev_vlan_dump, vlan);
  581. int err = 0;
  582. if (vlan->vid_begin > vlan->vid_end)
  583. return -EINVAL;
  584. if (dump->filter_mask & RTEXT_FILTER_BRVLAN) {
  585. dump->flags = vlan->flags;
  586. for (dump->begin = dump->end = vlan->vid_begin;
  587. dump->begin <= vlan->vid_end;
  588. dump->begin++, dump->end++) {
  589. err = switchdev_port_vlan_dump_put(dump);
  590. if (err)
  591. return err;
  592. }
  593. } else if (dump->filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED) {
  594. if (dump->begin > vlan->vid_begin &&
  595. dump->begin >= vlan->vid_end) {
  596. if ((dump->begin - 1) == vlan->vid_end &&
  597. dump->flags == vlan->flags) {
  598. /* prepend */
  599. dump->begin = vlan->vid_begin;
  600. } else {
  601. err = switchdev_port_vlan_dump_put(dump);
  602. dump->flags = vlan->flags;
  603. dump->begin = vlan->vid_begin;
  604. dump->end = vlan->vid_end;
  605. }
  606. } else if (dump->end <= vlan->vid_begin &&
  607. dump->end < vlan->vid_end) {
  608. if ((dump->end + 1) == vlan->vid_begin &&
  609. dump->flags == vlan->flags) {
  610. /* append */
  611. dump->end = vlan->vid_end;
  612. } else {
  613. err = switchdev_port_vlan_dump_put(dump);
  614. dump->flags = vlan->flags;
  615. dump->begin = vlan->vid_begin;
  616. dump->end = vlan->vid_end;
  617. }
  618. } else {
  619. err = -EINVAL;
  620. }
  621. }
  622. return err;
  623. }
  624. static int switchdev_port_vlan_fill(struct sk_buff *skb, struct net_device *dev,
  625. u32 filter_mask)
  626. {
  627. struct switchdev_vlan_dump dump = {
  628. .vlan.obj.orig_dev = dev,
  629. .vlan.obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
  630. .skb = skb,
  631. .filter_mask = filter_mask,
  632. };
  633. int err = 0;
  634. if ((filter_mask & RTEXT_FILTER_BRVLAN) ||
  635. (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)) {
  636. err = switchdev_port_obj_dump(dev, &dump.vlan.obj,
  637. switchdev_port_vlan_dump_cb);
  638. if (err)
  639. goto err_out;
  640. if (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)
  641. /* last one */
  642. err = switchdev_port_vlan_dump_put(&dump);
  643. }
  644. err_out:
  645. return err == -EOPNOTSUPP ? 0 : err;
  646. }
  647. /**
  648. * switchdev_port_bridge_getlink - Get bridge port attributes
  649. *
  650. * @dev: port device
  651. *
  652. * Called for SELF on rtnl_bridge_getlink to get bridge port
  653. * attributes.
  654. */
  655. int switchdev_port_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
  656. struct net_device *dev, u32 filter_mask,
  657. int nlflags)
  658. {
  659. struct switchdev_attr attr = {
  660. .orig_dev = dev,
  661. .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
  662. };
  663. u16 mode = BRIDGE_MODE_UNDEF;
  664. u32 mask = BR_LEARNING | BR_LEARNING_SYNC | BR_FLOOD;
  665. int err;
  666. err = switchdev_port_attr_get(dev, &attr);
  667. if (err && err != -EOPNOTSUPP)
  668. return err;
  669. return ndo_dflt_bridge_getlink(skb, pid, seq, dev, mode,
  670. attr.u.brport_flags, mask, nlflags,
  671. filter_mask, switchdev_port_vlan_fill);
  672. }
  673. EXPORT_SYMBOL_GPL(switchdev_port_bridge_getlink);
  674. static int switchdev_port_br_setflag(struct net_device *dev,
  675. struct nlattr *nlattr,
  676. unsigned long brport_flag)
  677. {
  678. struct switchdev_attr attr = {
  679. .orig_dev = dev,
  680. .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
  681. };
  682. u8 flag = nla_get_u8(nlattr);
  683. int err;
  684. err = switchdev_port_attr_get(dev, &attr);
  685. if (err)
  686. return err;
  687. if (flag)
  688. attr.u.brport_flags |= brport_flag;
  689. else
  690. attr.u.brport_flags &= ~brport_flag;
  691. return switchdev_port_attr_set(dev, &attr);
  692. }
  693. static const struct nla_policy
  694. switchdev_port_bridge_policy[IFLA_BRPORT_MAX + 1] = {
  695. [IFLA_BRPORT_STATE] = { .type = NLA_U8 },
  696. [IFLA_BRPORT_COST] = { .type = NLA_U32 },
  697. [IFLA_BRPORT_PRIORITY] = { .type = NLA_U16 },
  698. [IFLA_BRPORT_MODE] = { .type = NLA_U8 },
  699. [IFLA_BRPORT_GUARD] = { .type = NLA_U8 },
  700. [IFLA_BRPORT_PROTECT] = { .type = NLA_U8 },
  701. [IFLA_BRPORT_FAST_LEAVE] = { .type = NLA_U8 },
  702. [IFLA_BRPORT_LEARNING] = { .type = NLA_U8 },
  703. [IFLA_BRPORT_LEARNING_SYNC] = { .type = NLA_U8 },
  704. [IFLA_BRPORT_UNICAST_FLOOD] = { .type = NLA_U8 },
  705. };
  706. static int switchdev_port_br_setlink_protinfo(struct net_device *dev,
  707. struct nlattr *protinfo)
  708. {
  709. struct nlattr *attr;
  710. int rem;
  711. int err;
  712. err = nla_validate_nested(protinfo, IFLA_BRPORT_MAX,
  713. switchdev_port_bridge_policy);
  714. if (err)
  715. return err;
  716. nla_for_each_nested(attr, protinfo, rem) {
  717. switch (nla_type(attr)) {
  718. case IFLA_BRPORT_LEARNING:
  719. err = switchdev_port_br_setflag(dev, attr,
  720. BR_LEARNING);
  721. break;
  722. case IFLA_BRPORT_LEARNING_SYNC:
  723. err = switchdev_port_br_setflag(dev, attr,
  724. BR_LEARNING_SYNC);
  725. break;
  726. case IFLA_BRPORT_UNICAST_FLOOD:
  727. err = switchdev_port_br_setflag(dev, attr, BR_FLOOD);
  728. break;
  729. default:
  730. err = -EOPNOTSUPP;
  731. break;
  732. }
  733. if (err)
  734. return err;
  735. }
  736. return 0;
  737. }
  738. static int switchdev_port_br_afspec(struct net_device *dev,
  739. struct nlattr *afspec,
  740. int (*f)(struct net_device *dev,
  741. const struct switchdev_obj *obj))
  742. {
  743. struct nlattr *attr;
  744. struct bridge_vlan_info *vinfo;
  745. struct switchdev_obj_port_vlan vlan = {
  746. .obj.orig_dev = dev,
  747. .obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
  748. };
  749. int rem;
  750. int err;
  751. nla_for_each_nested(attr, afspec, rem) {
  752. if (nla_type(attr) != IFLA_BRIDGE_VLAN_INFO)
  753. continue;
  754. if (nla_len(attr) != sizeof(struct bridge_vlan_info))
  755. return -EINVAL;
  756. vinfo = nla_data(attr);
  757. if (!vinfo->vid || vinfo->vid >= VLAN_VID_MASK)
  758. return -EINVAL;
  759. vlan.flags = vinfo->flags;
  760. if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_BEGIN) {
  761. if (vlan.vid_begin)
  762. return -EINVAL;
  763. vlan.vid_begin = vinfo->vid;
  764. /* don't allow range of pvids */
  765. if (vlan.flags & BRIDGE_VLAN_INFO_PVID)
  766. return -EINVAL;
  767. } else if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_END) {
  768. if (!vlan.vid_begin)
  769. return -EINVAL;
  770. vlan.vid_end = vinfo->vid;
  771. if (vlan.vid_end <= vlan.vid_begin)
  772. return -EINVAL;
  773. err = f(dev, &vlan.obj);
  774. if (err)
  775. return err;
  776. vlan.vid_begin = 0;
  777. } else {
  778. if (vlan.vid_begin)
  779. return -EINVAL;
  780. vlan.vid_begin = vinfo->vid;
  781. vlan.vid_end = vinfo->vid;
  782. err = f(dev, &vlan.obj);
  783. if (err)
  784. return err;
  785. vlan.vid_begin = 0;
  786. }
  787. }
  788. return 0;
  789. }
  790. /**
  791. * switchdev_port_bridge_setlink - Set bridge port attributes
  792. *
  793. * @dev: port device
  794. * @nlh: netlink header
  795. * @flags: netlink flags
  796. *
  797. * Called for SELF on rtnl_bridge_setlink to set bridge port
  798. * attributes.
  799. */
  800. int switchdev_port_bridge_setlink(struct net_device *dev,
  801. struct nlmsghdr *nlh, u16 flags)
  802. {
  803. struct nlattr *protinfo;
  804. struct nlattr *afspec;
  805. int err = 0;
  806. protinfo = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  807. IFLA_PROTINFO);
  808. if (protinfo) {
  809. err = switchdev_port_br_setlink_protinfo(dev, protinfo);
  810. if (err)
  811. return err;
  812. }
  813. afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  814. IFLA_AF_SPEC);
  815. if (afspec)
  816. err = switchdev_port_br_afspec(dev, afspec,
  817. switchdev_port_obj_add);
  818. return err;
  819. }
  820. EXPORT_SYMBOL_GPL(switchdev_port_bridge_setlink);
  821. /**
  822. * switchdev_port_bridge_dellink - Set bridge port attributes
  823. *
  824. * @dev: port device
  825. * @nlh: netlink header
  826. * @flags: netlink flags
  827. *
  828. * Called for SELF on rtnl_bridge_dellink to set bridge port
  829. * attributes.
  830. */
  831. int switchdev_port_bridge_dellink(struct net_device *dev,
  832. struct nlmsghdr *nlh, u16 flags)
  833. {
  834. struct nlattr *afspec;
  835. afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
  836. IFLA_AF_SPEC);
  837. if (afspec)
  838. return switchdev_port_br_afspec(dev, afspec,
  839. switchdev_port_obj_del);
  840. return 0;
  841. }
  842. EXPORT_SYMBOL_GPL(switchdev_port_bridge_dellink);
  843. /**
  844. * switchdev_port_fdb_add - Add FDB (MAC/VLAN) entry to port
  845. *
  846. * @ndmsg: netlink hdr
  847. * @nlattr: netlink attributes
  848. * @dev: port device
  849. * @addr: MAC address to add
  850. * @vid: VLAN to add
  851. *
  852. * Add FDB entry to switch device.
  853. */
  854. int switchdev_port_fdb_add(struct ndmsg *ndm, struct nlattr *tb[],
  855. struct net_device *dev, const unsigned char *addr,
  856. u16 vid, u16 nlm_flags)
  857. {
  858. struct switchdev_obj_port_fdb fdb = {
  859. .obj.orig_dev = dev,
  860. .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  861. .vid = vid,
  862. };
  863. ether_addr_copy(fdb.addr, addr);
  864. return switchdev_port_obj_add(dev, &fdb.obj);
  865. }
  866. EXPORT_SYMBOL_GPL(switchdev_port_fdb_add);
  867. /**
  868. * switchdev_port_fdb_del - Delete FDB (MAC/VLAN) entry from port
  869. *
  870. * @ndmsg: netlink hdr
  871. * @nlattr: netlink attributes
  872. * @dev: port device
  873. * @addr: MAC address to delete
  874. * @vid: VLAN to delete
  875. *
  876. * Delete FDB entry from switch device.
  877. */
  878. int switchdev_port_fdb_del(struct ndmsg *ndm, struct nlattr *tb[],
  879. struct net_device *dev, const unsigned char *addr,
  880. u16 vid)
  881. {
  882. struct switchdev_obj_port_fdb fdb = {
  883. .obj.orig_dev = dev,
  884. .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  885. .vid = vid,
  886. };
  887. ether_addr_copy(fdb.addr, addr);
  888. return switchdev_port_obj_del(dev, &fdb.obj);
  889. }
  890. EXPORT_SYMBOL_GPL(switchdev_port_fdb_del);
  891. struct switchdev_fdb_dump {
  892. struct switchdev_obj_port_fdb fdb;
  893. struct net_device *dev;
  894. struct sk_buff *skb;
  895. struct netlink_callback *cb;
  896. int idx;
  897. };
  898. static int switchdev_port_fdb_dump_cb(struct switchdev_obj *obj)
  899. {
  900. struct switchdev_obj_port_fdb *fdb = SWITCHDEV_OBJ_PORT_FDB(obj);
  901. struct switchdev_fdb_dump *dump =
  902. container_of(fdb, struct switchdev_fdb_dump, fdb);
  903. u32 portid = NETLINK_CB(dump->cb->skb).portid;
  904. u32 seq = dump->cb->nlh->nlmsg_seq;
  905. struct nlmsghdr *nlh;
  906. struct ndmsg *ndm;
  907. if (dump->idx < dump->cb->args[0])
  908. goto skip;
  909. nlh = nlmsg_put(dump->skb, portid, seq, RTM_NEWNEIGH,
  910. sizeof(*ndm), NLM_F_MULTI);
  911. if (!nlh)
  912. return -EMSGSIZE;
  913. ndm = nlmsg_data(nlh);
  914. ndm->ndm_family = AF_BRIDGE;
  915. ndm->ndm_pad1 = 0;
  916. ndm->ndm_pad2 = 0;
  917. ndm->ndm_flags = NTF_SELF;
  918. ndm->ndm_type = 0;
  919. ndm->ndm_ifindex = dump->dev->ifindex;
  920. ndm->ndm_state = fdb->ndm_state;
  921. if (nla_put(dump->skb, NDA_LLADDR, ETH_ALEN, fdb->addr))
  922. goto nla_put_failure;
  923. if (fdb->vid && nla_put_u16(dump->skb, NDA_VLAN, fdb->vid))
  924. goto nla_put_failure;
  925. nlmsg_end(dump->skb, nlh);
  926. skip:
  927. dump->idx++;
  928. return 0;
  929. nla_put_failure:
  930. nlmsg_cancel(dump->skb, nlh);
  931. return -EMSGSIZE;
  932. }
  933. /**
  934. * switchdev_port_fdb_dump - Dump port FDB (MAC/VLAN) entries
  935. *
  936. * @skb: netlink skb
  937. * @cb: netlink callback
  938. * @dev: port device
  939. * @filter_dev: filter device
  940. * @idx:
  941. *
  942. * Delete FDB entry from switch device.
  943. */
  944. int switchdev_port_fdb_dump(struct sk_buff *skb, struct netlink_callback *cb,
  945. struct net_device *dev,
  946. struct net_device *filter_dev, int idx)
  947. {
  948. struct switchdev_fdb_dump dump = {
  949. .fdb.obj.orig_dev = dev,
  950. .fdb.obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
  951. .dev = dev,
  952. .skb = skb,
  953. .cb = cb,
  954. .idx = idx,
  955. };
  956. switchdev_port_obj_dump(dev, &dump.fdb.obj, switchdev_port_fdb_dump_cb);
  957. return dump.idx;
  958. }
  959. EXPORT_SYMBOL_GPL(switchdev_port_fdb_dump);
  960. static struct net_device *switchdev_get_lowest_dev(struct net_device *dev)
  961. {
  962. const struct switchdev_ops *ops = dev->switchdev_ops;
  963. struct net_device *lower_dev;
  964. struct net_device *port_dev;
  965. struct list_head *iter;
  966. /* Recusively search down until we find a sw port dev.
  967. * (A sw port dev supports switchdev_port_attr_get).
  968. */
  969. if (ops && ops->switchdev_port_attr_get)
  970. return dev;
  971. netdev_for_each_lower_dev(dev, lower_dev, iter) {
  972. port_dev = switchdev_get_lowest_dev(lower_dev);
  973. if (port_dev)
  974. return port_dev;
  975. }
  976. return NULL;
  977. }
  978. static struct net_device *switchdev_get_dev_by_nhs(struct fib_info *fi)
  979. {
  980. struct switchdev_attr attr = {
  981. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  982. };
  983. struct switchdev_attr prev_attr;
  984. struct net_device *dev = NULL;
  985. int nhsel;
  986. ASSERT_RTNL();
  987. /* For this route, all nexthop devs must be on the same switch. */
  988. for (nhsel = 0; nhsel < fi->fib_nhs; nhsel++) {
  989. const struct fib_nh *nh = &fi->fib_nh[nhsel];
  990. if (!nh->nh_dev)
  991. return NULL;
  992. dev = switchdev_get_lowest_dev(nh->nh_dev);
  993. if (!dev)
  994. return NULL;
  995. attr.orig_dev = dev;
  996. if (switchdev_port_attr_get(dev, &attr))
  997. return NULL;
  998. if (nhsel > 0 &&
  999. !netdev_phys_item_id_same(&prev_attr.u.ppid, &attr.u.ppid))
  1000. return NULL;
  1001. prev_attr = attr;
  1002. }
  1003. return dev;
  1004. }
  1005. /**
  1006. * switchdev_fib_ipv4_add - Add/modify switch IPv4 route entry
  1007. *
  1008. * @dst: route's IPv4 destination address
  1009. * @dst_len: destination address length (prefix length)
  1010. * @fi: route FIB info structure
  1011. * @tos: route TOS
  1012. * @type: route type
  1013. * @nlflags: netlink flags passed in (NLM_F_*)
  1014. * @tb_id: route table ID
  1015. *
  1016. * Add/modify switch IPv4 route entry.
  1017. */
  1018. int switchdev_fib_ipv4_add(u32 dst, int dst_len, struct fib_info *fi,
  1019. u8 tos, u8 type, u32 nlflags, u32 tb_id)
  1020. {
  1021. struct switchdev_obj_ipv4_fib ipv4_fib = {
  1022. .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
  1023. .dst = dst,
  1024. .dst_len = dst_len,
  1025. .tos = tos,
  1026. .type = type,
  1027. .nlflags = nlflags,
  1028. .tb_id = tb_id,
  1029. };
  1030. struct net_device *dev;
  1031. int err = 0;
  1032. memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
  1033. /* Don't offload route if using custom ip rules or if
  1034. * IPv4 FIB offloading has been disabled completely.
  1035. */
  1036. #ifdef CONFIG_IP_MULTIPLE_TABLES
  1037. if (fi->fib_net->ipv4.fib_has_custom_rules)
  1038. return 0;
  1039. #endif
  1040. if (fi->fib_net->ipv4.fib_offload_disabled)
  1041. return 0;
  1042. dev = switchdev_get_dev_by_nhs(fi);
  1043. if (!dev)
  1044. return 0;
  1045. ipv4_fib.obj.orig_dev = dev;
  1046. err = switchdev_port_obj_add(dev, &ipv4_fib.obj);
  1047. if (!err)
  1048. fi->fib_flags |= RTNH_F_OFFLOAD;
  1049. return err == -EOPNOTSUPP ? 0 : err;
  1050. }
  1051. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_add);
  1052. /**
  1053. * switchdev_fib_ipv4_del - Delete IPv4 route entry from switch
  1054. *
  1055. * @dst: route's IPv4 destination address
  1056. * @dst_len: destination address length (prefix length)
  1057. * @fi: route FIB info structure
  1058. * @tos: route TOS
  1059. * @type: route type
  1060. * @tb_id: route table ID
  1061. *
  1062. * Delete IPv4 route entry from switch device.
  1063. */
  1064. int switchdev_fib_ipv4_del(u32 dst, int dst_len, struct fib_info *fi,
  1065. u8 tos, u8 type, u32 tb_id)
  1066. {
  1067. struct switchdev_obj_ipv4_fib ipv4_fib = {
  1068. .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
  1069. .dst = dst,
  1070. .dst_len = dst_len,
  1071. .tos = tos,
  1072. .type = type,
  1073. .nlflags = 0,
  1074. .tb_id = tb_id,
  1075. };
  1076. struct net_device *dev;
  1077. int err = 0;
  1078. memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
  1079. if (!(fi->fib_flags & RTNH_F_OFFLOAD))
  1080. return 0;
  1081. dev = switchdev_get_dev_by_nhs(fi);
  1082. if (!dev)
  1083. return 0;
  1084. ipv4_fib.obj.orig_dev = dev;
  1085. err = switchdev_port_obj_del(dev, &ipv4_fib.obj);
  1086. if (!err)
  1087. fi->fib_flags &= ~RTNH_F_OFFLOAD;
  1088. return err == -EOPNOTSUPP ? 0 : err;
  1089. }
  1090. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_del);
  1091. /**
  1092. * switchdev_fib_ipv4_abort - Abort an IPv4 FIB operation
  1093. *
  1094. * @fi: route FIB info structure
  1095. */
  1096. void switchdev_fib_ipv4_abort(struct fib_info *fi)
  1097. {
  1098. /* There was a problem installing this route to the offload
  1099. * device. For now, until we come up with more refined
  1100. * policy handling, abruptly end IPv4 fib offloading for
  1101. * for entire net by flushing offload device(s) of all
  1102. * IPv4 routes, and mark IPv4 fib offloading broken from
  1103. * this point forward.
  1104. */
  1105. fib_flush_external(fi->fib_net);
  1106. fi->fib_net->ipv4.fib_offload_disabled = true;
  1107. }
  1108. EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_abort);
  1109. static bool switchdev_port_same_parent_id(struct net_device *a,
  1110. struct net_device *b)
  1111. {
  1112. struct switchdev_attr a_attr = {
  1113. .orig_dev = a,
  1114. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  1115. .flags = SWITCHDEV_F_NO_RECURSE,
  1116. };
  1117. struct switchdev_attr b_attr = {
  1118. .orig_dev = b,
  1119. .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
  1120. .flags = SWITCHDEV_F_NO_RECURSE,
  1121. };
  1122. if (switchdev_port_attr_get(a, &a_attr) ||
  1123. switchdev_port_attr_get(b, &b_attr))
  1124. return false;
  1125. return netdev_phys_item_id_same(&a_attr.u.ppid, &b_attr.u.ppid);
  1126. }
  1127. static u32 switchdev_port_fwd_mark_get(struct net_device *dev,
  1128. struct net_device *group_dev)
  1129. {
  1130. struct net_device *lower_dev;
  1131. struct list_head *iter;
  1132. netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
  1133. if (lower_dev == dev)
  1134. continue;
  1135. if (switchdev_port_same_parent_id(dev, lower_dev))
  1136. return lower_dev->offload_fwd_mark;
  1137. return switchdev_port_fwd_mark_get(dev, lower_dev);
  1138. }
  1139. return dev->ifindex;
  1140. }
  1141. static void switchdev_port_fwd_mark_reset(struct net_device *group_dev,
  1142. u32 old_mark, u32 *reset_mark)
  1143. {
  1144. struct net_device *lower_dev;
  1145. struct list_head *iter;
  1146. netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
  1147. if (lower_dev->offload_fwd_mark == old_mark) {
  1148. if (!*reset_mark)
  1149. *reset_mark = lower_dev->ifindex;
  1150. lower_dev->offload_fwd_mark = *reset_mark;
  1151. }
  1152. switchdev_port_fwd_mark_reset(lower_dev, old_mark, reset_mark);
  1153. }
  1154. }
  1155. /**
  1156. * switchdev_port_fwd_mark_set - Set port offload forwarding mark
  1157. *
  1158. * @dev: port device
  1159. * @group_dev: containing device
  1160. * @joining: true if dev is joining group; false if leaving group
  1161. *
  1162. * An ungrouped port's offload mark is just its ifindex. A grouped
  1163. * port's (member of a bridge, for example) offload mark is the ifindex
  1164. * of one of the ports in the group with the same parent (switch) ID.
  1165. * Ports on the same device in the same group will have the same mark.
  1166. *
  1167. * Example:
  1168. *
  1169. * br0 ifindex=9
  1170. * sw1p1 ifindex=2 mark=2
  1171. * sw1p2 ifindex=3 mark=2
  1172. * sw2p1 ifindex=4 mark=5
  1173. * sw2p2 ifindex=5 mark=5
  1174. *
  1175. * If sw2p2 leaves the bridge, we'll have:
  1176. *
  1177. * br0 ifindex=9
  1178. * sw1p1 ifindex=2 mark=2
  1179. * sw1p2 ifindex=3 mark=2
  1180. * sw2p1 ifindex=4 mark=4
  1181. * sw2p2 ifindex=5 mark=5
  1182. */
  1183. void switchdev_port_fwd_mark_set(struct net_device *dev,
  1184. struct net_device *group_dev,
  1185. bool joining)
  1186. {
  1187. u32 mark = dev->ifindex;
  1188. u32 reset_mark = 0;
  1189. if (group_dev) {
  1190. ASSERT_RTNL();
  1191. if (joining)
  1192. mark = switchdev_port_fwd_mark_get(dev, group_dev);
  1193. else if (dev->offload_fwd_mark == mark)
  1194. /* Ohoh, this port was the mark reference port,
  1195. * but it's leaving the group, so reset the
  1196. * mark for the remaining ports in the group.
  1197. */
  1198. switchdev_port_fwd_mark_reset(group_dev, mark,
  1199. &reset_mark);
  1200. }
  1201. dev->offload_fwd_mark = mark;
  1202. }
  1203. EXPORT_SYMBOL_GPL(switchdev_port_fwd_mark_set);