]> git.proxmox.com Git - mirror_ubuntu-zesty-kernel.git/blame - net/switchdev/switchdev.c
Merge tag 'sound-fix-4.5-rc1' of git://git.kernel.org/pub/scm/linux/kernel/git/tiwai...
[mirror_ubuntu-zesty-kernel.git] / net / switchdev / switchdev.c
CommitLineData
007f790c
JP
1/*
2 * net/switchdev/switchdev.c - Switch device API
7ea6eb3f 3 * Copyright (c) 2014-2015 Jiri Pirko <jiri@resnulli.us>
f8f21471 4 * Copyright (c) 2014-2015 Scott Feldman <sfeldma@gmail.com>
007f790c
JP
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 */
11
12#include <linux/kernel.h>
13#include <linux/types.h>
14#include <linux/init.h>
03bf0c28
JP
15#include <linux/mutex.h>
16#include <linux/notifier.h>
007f790c 17#include <linux/netdevice.h>
850d0cbc 18#include <linux/etherdevice.h>
47f8328b 19#include <linux/if_bridge.h>
7ea6eb3f 20#include <linux/list.h>
793f4014 21#include <linux/workqueue.h>
87aaf2ca 22#include <linux/if_vlan.h>
5e8d9049 23#include <net/ip_fib.h>
007f790c
JP
24#include <net/switchdev.h>
25
7ea6eb3f
JP
26/**
27 * switchdev_trans_item_enqueue - Enqueue data item to transaction queue
28 *
29 * @trans: transaction
30 * @data: pointer to data being queued
31 * @destructor: data destructor
32 * @tritem: transaction item being queued
33 *
34 * Enqeueue data item to transaction queue. tritem is typically placed in
35 * cointainter pointed at by data pointer. Destructor is called on
36 * transaction abort and after successful commit phase in case
37 * the caller did not dequeue the item before.
38 */
39void switchdev_trans_item_enqueue(struct switchdev_trans *trans,
40 void *data, void (*destructor)(void const *),
41 struct switchdev_trans_item *tritem)
42{
43 tritem->data = data;
44 tritem->destructor = destructor;
45 list_add_tail(&tritem->list, &trans->item_list);
46}
47EXPORT_SYMBOL_GPL(switchdev_trans_item_enqueue);
48
49static struct switchdev_trans_item *
50__switchdev_trans_item_dequeue(struct switchdev_trans *trans)
51{
52 struct switchdev_trans_item *tritem;
53
54 if (list_empty(&trans->item_list))
55 return NULL;
56 tritem = list_first_entry(&trans->item_list,
57 struct switchdev_trans_item, list);
58 list_del(&tritem->list);
59 return tritem;
60}
61
62/**
63 * switchdev_trans_item_dequeue - Dequeue data item from transaction queue
64 *
65 * @trans: transaction
66 */
67void *switchdev_trans_item_dequeue(struct switchdev_trans *trans)
68{
69 struct switchdev_trans_item *tritem;
70
71 tritem = __switchdev_trans_item_dequeue(trans);
72 BUG_ON(!tritem);
73 return tritem->data;
74}
75EXPORT_SYMBOL_GPL(switchdev_trans_item_dequeue);
76
77static void switchdev_trans_init(struct switchdev_trans *trans)
78{
79 INIT_LIST_HEAD(&trans->item_list);
80}
81
82static void switchdev_trans_items_destroy(struct switchdev_trans *trans)
83{
84 struct switchdev_trans_item *tritem;
85
86 while ((tritem = __switchdev_trans_item_dequeue(trans)))
87 tritem->destructor(tritem->data);
88}
89
90static void switchdev_trans_items_warn_destroy(struct net_device *dev,
91 struct switchdev_trans *trans)
92{
93 WARN(!list_empty(&trans->item_list), "%s: transaction item queue is not empty.\n",
94 dev->name);
95 switchdev_trans_items_destroy(trans);
96}
97
793f4014
JP
98static LIST_HEAD(deferred);
99static DEFINE_SPINLOCK(deferred_lock);
100
101typedef void switchdev_deferred_func_t(struct net_device *dev,
102 const void *data);
103
104struct switchdev_deferred_item {
105 struct list_head list;
106 struct net_device *dev;
107 switchdev_deferred_func_t *func;
108 unsigned long data[0];
109};
110
111static struct switchdev_deferred_item *switchdev_deferred_dequeue(void)
112{
113 struct switchdev_deferred_item *dfitem;
114
115 spin_lock_bh(&deferred_lock);
116 if (list_empty(&deferred)) {
117 dfitem = NULL;
118 goto unlock;
119 }
120 dfitem = list_first_entry(&deferred,
121 struct switchdev_deferred_item, list);
122 list_del(&dfitem->list);
123unlock:
124 spin_unlock_bh(&deferred_lock);
125 return dfitem;
126}
127
128/**
129 * switchdev_deferred_process - Process ops in deferred queue
130 *
131 * Called to flush the ops currently queued in deferred ops queue.
132 * rtnl_lock must be held.
133 */
134void switchdev_deferred_process(void)
135{
136 struct switchdev_deferred_item *dfitem;
137
138 ASSERT_RTNL();
139
140 while ((dfitem = switchdev_deferred_dequeue())) {
141 dfitem->func(dfitem->dev, dfitem->data);
142 dev_put(dfitem->dev);
143 kfree(dfitem);
144 }
145}
146EXPORT_SYMBOL_GPL(switchdev_deferred_process);
147
148static void switchdev_deferred_process_work(struct work_struct *work)
149{
150 rtnl_lock();
151 switchdev_deferred_process();
152 rtnl_unlock();
153}
154
155static DECLARE_WORK(deferred_process_work, switchdev_deferred_process_work);
156
157static int switchdev_deferred_enqueue(struct net_device *dev,
158 const void *data, size_t data_len,
159 switchdev_deferred_func_t *func)
160{
161 struct switchdev_deferred_item *dfitem;
162
163 dfitem = kmalloc(sizeof(*dfitem) + data_len, GFP_ATOMIC);
164 if (!dfitem)
165 return -ENOMEM;
166 dfitem->dev = dev;
167 dfitem->func = func;
168 memcpy(dfitem->data, data, data_len);
169 dev_hold(dev);
170 spin_lock_bh(&deferred_lock);
171 list_add_tail(&dfitem->list, &deferred);
172 spin_unlock_bh(&deferred_lock);
173 schedule_work(&deferred_process_work);
174 return 0;
175}
176
3094333d
SF
177/**
178 * switchdev_port_attr_get - Get port attribute
179 *
180 * @dev: port device
181 * @attr: attribute to get
182 */
183int switchdev_port_attr_get(struct net_device *dev, struct switchdev_attr *attr)
184{
185 const struct switchdev_ops *ops = dev->switchdev_ops;
186 struct net_device *lower_dev;
187 struct list_head *iter;
188 struct switchdev_attr first = {
1f868398 189 .id = SWITCHDEV_ATTR_ID_UNDEFINED
3094333d
SF
190 };
191 int err = -EOPNOTSUPP;
192
193 if (ops && ops->switchdev_port_attr_get)
194 return ops->switchdev_port_attr_get(dev, attr);
195
196 if (attr->flags & SWITCHDEV_F_NO_RECURSE)
197 return err;
198
199 /* Switch device port(s) may be stacked under
200 * bond/team/vlan dev, so recurse down to get attr on
201 * each port. Return -ENODATA if attr values don't
202 * compare across ports.
203 */
204
205 netdev_for_each_lower_dev(dev, lower_dev, iter) {
206 err = switchdev_port_attr_get(lower_dev, attr);
207 if (err)
208 break;
1f868398 209 if (first.id == SWITCHDEV_ATTR_ID_UNDEFINED)
3094333d
SF
210 first = *attr;
211 else if (memcmp(&first, attr, sizeof(*attr)))
212 return -ENODATA;
213 }
214
215 return err;
216}
217EXPORT_SYMBOL_GPL(switchdev_port_attr_get);
218
219static int __switchdev_port_attr_set(struct net_device *dev,
f7fadf30 220 const struct switchdev_attr *attr,
7ea6eb3f 221 struct switchdev_trans *trans)
3094333d
SF
222{
223 const struct switchdev_ops *ops = dev->switchdev_ops;
224 struct net_device *lower_dev;
225 struct list_head *iter;
226 int err = -EOPNOTSUPP;
227
0c63d80c
JP
228 if (ops && ops->switchdev_port_attr_set) {
229 err = ops->switchdev_port_attr_set(dev, attr, trans);
230 goto done;
231 }
3094333d
SF
232
233 if (attr->flags & SWITCHDEV_F_NO_RECURSE)
464314ea 234 goto done;
3094333d
SF
235
236 /* Switch device port(s) may be stacked under
237 * bond/team/vlan dev, so recurse down to set attr on
238 * each port.
239 */
240
241 netdev_for_each_lower_dev(dev, lower_dev, iter) {
7ea6eb3f 242 err = __switchdev_port_attr_set(lower_dev, attr, trans);
3094333d
SF
243 if (err)
244 break;
245 }
246
464314ea
SF
247done:
248 if (err == -EOPNOTSUPP && attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
249 err = 0;
250
3094333d
SF
251 return err;
252}
253
0bc05d58
JP
254static int switchdev_port_attr_set_now(struct net_device *dev,
255 const struct switchdev_attr *attr)
3094333d 256{
7ea6eb3f 257 struct switchdev_trans trans;
3094333d
SF
258 int err;
259
7ea6eb3f
JP
260 switchdev_trans_init(&trans);
261
3094333d
SF
262 /* Phase I: prepare for attr set. Driver/device should fail
263 * here if there are going to be issues in the commit phase,
264 * such as lack of resources or support. The driver/device
265 * should reserve resources needed for the commit phase here,
266 * but should not commit the attr.
267 */
268
f623ab7f 269 trans.ph_prepare = true;
7ea6eb3f 270 err = __switchdev_port_attr_set(dev, attr, &trans);
3094333d
SF
271 if (err) {
272 /* Prepare phase failed: abort the transaction. Any
273 * resources reserved in the prepare phase are
274 * released.
275 */
276
9f6467cf 277 if (err != -EOPNOTSUPP)
7ea6eb3f 278 switchdev_trans_items_destroy(&trans);
3094333d
SF
279
280 return err;
281 }
282
283 /* Phase II: commit attr set. This cannot fail as a fault
284 * of driver/device. If it does, it's a bug in the driver/device
285 * because the driver said everythings was OK in phase I.
286 */
287
f623ab7f 288 trans.ph_prepare = false;
7ea6eb3f 289 err = __switchdev_port_attr_set(dev, attr, &trans);
e9fdaec0
SF
290 WARN(err, "%s: Commit of attribute (id=%d) failed.\n",
291 dev->name, attr->id);
7ea6eb3f 292 switchdev_trans_items_warn_destroy(dev, &trans);
3094333d
SF
293
294 return err;
295}
0bc05d58
JP
296
297static void switchdev_port_attr_set_deferred(struct net_device *dev,
298 const void *data)
299{
300 const struct switchdev_attr *attr = data;
301 int err;
302
303 err = switchdev_port_attr_set_now(dev, attr);
304 if (err && err != -EOPNOTSUPP)
305 netdev_err(dev, "failed (err=%d) to set attribute (id=%d)\n",
306 err, attr->id);
307}
308
309static int switchdev_port_attr_set_defer(struct net_device *dev,
310 const struct switchdev_attr *attr)
311{
312 return switchdev_deferred_enqueue(dev, attr, sizeof(*attr),
313 switchdev_port_attr_set_deferred);
314}
315
316/**
317 * switchdev_port_attr_set - Set port attribute
318 *
319 * @dev: port device
320 * @attr: attribute to set
321 *
322 * Use a 2-phase prepare-commit transaction model to ensure
323 * system is not left in a partially updated state due to
324 * failure from driver/device.
325 *
326 * rtnl_lock must be held and must not be in atomic section,
327 * in case SWITCHDEV_F_DEFER flag is not set.
328 */
329int switchdev_port_attr_set(struct net_device *dev,
330 const struct switchdev_attr *attr)
331{
332 if (attr->flags & SWITCHDEV_F_DEFER)
333 return switchdev_port_attr_set_defer(dev, attr);
334 ASSERT_RTNL();
335 return switchdev_port_attr_set_now(dev, attr);
336}
3094333d
SF
337EXPORT_SYMBOL_GPL(switchdev_port_attr_set);
338
e258d919
SF
339static size_t switchdev_obj_size(const struct switchdev_obj *obj)
340{
341 switch (obj->id) {
342 case SWITCHDEV_OBJ_ID_PORT_VLAN:
343 return sizeof(struct switchdev_obj_port_vlan);
344 case SWITCHDEV_OBJ_ID_IPV4_FIB:
345 return sizeof(struct switchdev_obj_ipv4_fib);
346 case SWITCHDEV_OBJ_ID_PORT_FDB:
347 return sizeof(struct switchdev_obj_port_fdb);
4d41e125
ER
348 case SWITCHDEV_OBJ_ID_PORT_MDB:
349 return sizeof(struct switchdev_obj_port_mdb);
e258d919
SF
350 default:
351 BUG();
352 }
353 return 0;
354}
355
22c1f67e 356static int __switchdev_port_obj_add(struct net_device *dev,
648b4a99 357 const struct switchdev_obj *obj,
7ea6eb3f 358 struct switchdev_trans *trans)
491d0f15
SF
359{
360 const struct switchdev_ops *ops = dev->switchdev_ops;
361 struct net_device *lower_dev;
362 struct list_head *iter;
363 int err = -EOPNOTSUPP;
364
365 if (ops && ops->switchdev_port_obj_add)
9e8f4a54 366 return ops->switchdev_port_obj_add(dev, obj, trans);
491d0f15
SF
367
368 /* Switch device port(s) may be stacked under
369 * bond/team/vlan dev, so recurse down to add object on
370 * each port.
371 */
372
373 netdev_for_each_lower_dev(dev, lower_dev, iter) {
9e8f4a54 374 err = __switchdev_port_obj_add(lower_dev, obj, trans);
491d0f15
SF
375 if (err)
376 break;
377 }
378
379 return err;
380}
381
4d429c5d
JP
382static int switchdev_port_obj_add_now(struct net_device *dev,
383 const struct switchdev_obj *obj)
491d0f15 384{
7ea6eb3f 385 struct switchdev_trans trans;
491d0f15
SF
386 int err;
387
388 ASSERT_RTNL();
389
7ea6eb3f
JP
390 switchdev_trans_init(&trans);
391
491d0f15
SF
392 /* Phase I: prepare for obj add. Driver/device should fail
393 * here if there are going to be issues in the commit phase,
394 * such as lack of resources or support. The driver/device
395 * should reserve resources needed for the commit phase here,
396 * but should not commit the obj.
397 */
398
f623ab7f 399 trans.ph_prepare = true;
9e8f4a54 400 err = __switchdev_port_obj_add(dev, obj, &trans);
491d0f15
SF
401 if (err) {
402 /* Prepare phase failed: abort the transaction. Any
403 * resources reserved in the prepare phase are
404 * released.
405 */
406
9f6467cf 407 if (err != -EOPNOTSUPP)
7ea6eb3f 408 switchdev_trans_items_destroy(&trans);
491d0f15
SF
409
410 return err;
411 }
412
413 /* Phase II: commit obj add. This cannot fail as a fault
414 * of driver/device. If it does, it's a bug in the driver/device
415 * because the driver said everythings was OK in phase I.
416 */
417
f623ab7f 418 trans.ph_prepare = false;
9e8f4a54
JP
419 err = __switchdev_port_obj_add(dev, obj, &trans);
420 WARN(err, "%s: Commit of object (id=%d) failed.\n", dev->name, obj->id);
7ea6eb3f 421 switchdev_trans_items_warn_destroy(dev, &trans);
491d0f15
SF
422
423 return err;
424}
4d429c5d
JP
425
426static void switchdev_port_obj_add_deferred(struct net_device *dev,
427 const void *data)
428{
429 const struct switchdev_obj *obj = data;
430 int err;
431
432 err = switchdev_port_obj_add_now(dev, obj);
433 if (err && err != -EOPNOTSUPP)
434 netdev_err(dev, "failed (err=%d) to add object (id=%d)\n",
435 err, obj->id);
436}
437
438static int switchdev_port_obj_add_defer(struct net_device *dev,
439 const struct switchdev_obj *obj)
440{
e258d919 441 return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
4d429c5d
JP
442 switchdev_port_obj_add_deferred);
443}
491d0f15
SF
444
445/**
4d429c5d 446 * switchdev_port_obj_add - Add port object
491d0f15
SF
447 *
448 * @dev: port device
ab069002 449 * @id: object ID
4d429c5d
JP
450 * @obj: object to add
451 *
452 * Use a 2-phase prepare-commit transaction model to ensure
453 * system is not left in a partially updated state due to
454 * failure from driver/device.
455 *
456 * rtnl_lock must be held and must not be in atomic section,
457 * in case SWITCHDEV_F_DEFER flag is not set.
491d0f15 458 */
4d429c5d 459int switchdev_port_obj_add(struct net_device *dev,
648b4a99 460 const struct switchdev_obj *obj)
4d429c5d
JP
461{
462 if (obj->flags & SWITCHDEV_F_DEFER)
463 return switchdev_port_obj_add_defer(dev, obj);
464 ASSERT_RTNL();
465 return switchdev_port_obj_add_now(dev, obj);
466}
467EXPORT_SYMBOL_GPL(switchdev_port_obj_add);
468
469static int switchdev_port_obj_del_now(struct net_device *dev,
470 const struct switchdev_obj *obj)
491d0f15
SF
471{
472 const struct switchdev_ops *ops = dev->switchdev_ops;
473 struct net_device *lower_dev;
474 struct list_head *iter;
475 int err = -EOPNOTSUPP;
476
477 if (ops && ops->switchdev_port_obj_del)
9e8f4a54 478 return ops->switchdev_port_obj_del(dev, obj);
491d0f15
SF
479
480 /* Switch device port(s) may be stacked under
481 * bond/team/vlan dev, so recurse down to delete object on
482 * each port.
483 */
484
485 netdev_for_each_lower_dev(dev, lower_dev, iter) {
4d429c5d 486 err = switchdev_port_obj_del_now(lower_dev, obj);
491d0f15
SF
487 if (err)
488 break;
489 }
490
491 return err;
492}
4d429c5d
JP
493
494static void switchdev_port_obj_del_deferred(struct net_device *dev,
495 const void *data)
496{
497 const struct switchdev_obj *obj = data;
498 int err;
499
500 err = switchdev_port_obj_del_now(dev, obj);
501 if (err && err != -EOPNOTSUPP)
502 netdev_err(dev, "failed (err=%d) to del object (id=%d)\n",
503 err, obj->id);
504}
505
506static int switchdev_port_obj_del_defer(struct net_device *dev,
507 const struct switchdev_obj *obj)
508{
e258d919 509 return switchdev_deferred_enqueue(dev, obj, switchdev_obj_size(obj),
4d429c5d
JP
510 switchdev_port_obj_del_deferred);
511}
512
513/**
514 * switchdev_port_obj_del - Delete port object
515 *
516 * @dev: port device
517 * @id: object ID
518 * @obj: object to delete
519 *
520 * rtnl_lock must be held and must not be in atomic section,
521 * in case SWITCHDEV_F_DEFER flag is not set.
522 */
523int switchdev_port_obj_del(struct net_device *dev,
524 const struct switchdev_obj *obj)
525{
526 if (obj->flags & SWITCHDEV_F_DEFER)
527 return switchdev_port_obj_del_defer(dev, obj);
528 ASSERT_RTNL();
529 return switchdev_port_obj_del_now(dev, obj);
530}
491d0f15
SF
531EXPORT_SYMBOL_GPL(switchdev_port_obj_del);
532
45d4122c
SS
533/**
534 * switchdev_port_obj_dump - Dump port objects
535 *
536 * @dev: port device
25f07adc 537 * @id: object ID
45d4122c 538 * @obj: object to dump
25f07adc 539 * @cb: function to call with a filled object
771acac2
JP
540 *
541 * rtnl_lock must be held.
45d4122c 542 */
9e8f4a54 543int switchdev_port_obj_dump(struct net_device *dev, struct switchdev_obj *obj,
648b4a99 544 switchdev_obj_dump_cb_t *cb)
45d4122c
SS
545{
546 const struct switchdev_ops *ops = dev->switchdev_ops;
547 struct net_device *lower_dev;
548 struct list_head *iter;
549 int err = -EOPNOTSUPP;
550
771acac2
JP
551 ASSERT_RTNL();
552
45d4122c 553 if (ops && ops->switchdev_port_obj_dump)
9e8f4a54 554 return ops->switchdev_port_obj_dump(dev, obj, cb);
45d4122c
SS
555
556 /* Switch device port(s) may be stacked under
557 * bond/team/vlan dev, so recurse down to dump objects on
558 * first port at bottom of stack.
559 */
560
561 netdev_for_each_lower_dev(dev, lower_dev, iter) {
9e8f4a54 562 err = switchdev_port_obj_dump(lower_dev, obj, cb);
45d4122c
SS
563 break;
564 }
565
566 return err;
567}
568EXPORT_SYMBOL_GPL(switchdev_port_obj_dump);
569
ebb9a03a
JP
570static DEFINE_MUTEX(switchdev_mutex);
571static RAW_NOTIFIER_HEAD(switchdev_notif_chain);
03bf0c28
JP
572
573/**
ebb9a03a 574 * register_switchdev_notifier - Register notifier
03bf0c28
JP
575 * @nb: notifier_block
576 *
577 * Register switch device notifier. This should be used by code
578 * which needs to monitor events happening in particular device.
579 * Return values are same as for atomic_notifier_chain_register().
580 */
ebb9a03a 581int register_switchdev_notifier(struct notifier_block *nb)
03bf0c28
JP
582{
583 int err;
584
ebb9a03a
JP
585 mutex_lock(&switchdev_mutex);
586 err = raw_notifier_chain_register(&switchdev_notif_chain, nb);
587 mutex_unlock(&switchdev_mutex);
03bf0c28
JP
588 return err;
589}
ebb9a03a 590EXPORT_SYMBOL_GPL(register_switchdev_notifier);
03bf0c28
JP
591
592/**
ebb9a03a 593 * unregister_switchdev_notifier - Unregister notifier
03bf0c28
JP
594 * @nb: notifier_block
595 *
596 * Unregister switch device notifier.
597 * Return values are same as for atomic_notifier_chain_unregister().
598 */
ebb9a03a 599int unregister_switchdev_notifier(struct notifier_block *nb)
03bf0c28
JP
600{
601 int err;
602
ebb9a03a
JP
603 mutex_lock(&switchdev_mutex);
604 err = raw_notifier_chain_unregister(&switchdev_notif_chain, nb);
605 mutex_unlock(&switchdev_mutex);
03bf0c28
JP
606 return err;
607}
ebb9a03a 608EXPORT_SYMBOL_GPL(unregister_switchdev_notifier);
03bf0c28
JP
609
610/**
ebb9a03a 611 * call_switchdev_notifiers - Call notifiers
03bf0c28
JP
612 * @val: value passed unmodified to notifier function
613 * @dev: port device
614 * @info: notifier information data
615 *
616 * Call all network notifier blocks. This should be called by driver
617 * when it needs to propagate hardware event.
618 * Return values are same as for atomic_notifier_call_chain().
619 */
ebb9a03a
JP
620int call_switchdev_notifiers(unsigned long val, struct net_device *dev,
621 struct switchdev_notifier_info *info)
03bf0c28
JP
622{
623 int err;
624
625 info->dev = dev;
ebb9a03a
JP
626 mutex_lock(&switchdev_mutex);
627 err = raw_notifier_call_chain(&switchdev_notif_chain, val, info);
628 mutex_unlock(&switchdev_mutex);
03bf0c28
JP
629 return err;
630}
ebb9a03a 631EXPORT_SYMBOL_GPL(call_switchdev_notifiers);
8a44dbb2 632
7d4f8d87 633struct switchdev_vlan_dump {
8f24f309 634 struct switchdev_obj_port_vlan vlan;
7d4f8d87
SF
635 struct sk_buff *skb;
636 u32 filter_mask;
637 u16 flags;
638 u16 begin;
639 u16 end;
640};
641
e23b002b 642static int switchdev_port_vlan_dump_put(struct switchdev_vlan_dump *dump)
7d4f8d87
SF
643{
644 struct bridge_vlan_info vinfo;
645
646 vinfo.flags = dump->flags;
647
648 if (dump->begin == 0 && dump->end == 0) {
649 return 0;
650 } else if (dump->begin == dump->end) {
651 vinfo.vid = dump->begin;
652 if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
653 sizeof(vinfo), &vinfo))
654 return -EMSGSIZE;
655 } else {
656 vinfo.vid = dump->begin;
657 vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_BEGIN;
658 if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
659 sizeof(vinfo), &vinfo))
660 return -EMSGSIZE;
661 vinfo.vid = dump->end;
662 vinfo.flags &= ~BRIDGE_VLAN_INFO_RANGE_BEGIN;
663 vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_END;
664 if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
665 sizeof(vinfo), &vinfo))
666 return -EMSGSIZE;
667 }
668
669 return 0;
670}
671
648b4a99 672static int switchdev_port_vlan_dump_cb(struct switchdev_obj *obj)
7d4f8d87 673{
648b4a99 674 struct switchdev_obj_port_vlan *vlan = SWITCHDEV_OBJ_PORT_VLAN(obj);
7d4f8d87 675 struct switchdev_vlan_dump *dump =
25f07adc 676 container_of(vlan, struct switchdev_vlan_dump, vlan);
7d4f8d87
SF
677 int err = 0;
678
679 if (vlan->vid_begin > vlan->vid_end)
680 return -EINVAL;
681
682 if (dump->filter_mask & RTEXT_FILTER_BRVLAN) {
683 dump->flags = vlan->flags;
684 for (dump->begin = dump->end = vlan->vid_begin;
685 dump->begin <= vlan->vid_end;
686 dump->begin++, dump->end++) {
e23b002b 687 err = switchdev_port_vlan_dump_put(dump);
7d4f8d87
SF
688 if (err)
689 return err;
690 }
691 } else if (dump->filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED) {
692 if (dump->begin > vlan->vid_begin &&
693 dump->begin >= vlan->vid_end) {
694 if ((dump->begin - 1) == vlan->vid_end &&
695 dump->flags == vlan->flags) {
696 /* prepend */
697 dump->begin = vlan->vid_begin;
698 } else {
e23b002b 699 err = switchdev_port_vlan_dump_put(dump);
7d4f8d87
SF
700 dump->flags = vlan->flags;
701 dump->begin = vlan->vid_begin;
702 dump->end = vlan->vid_end;
703 }
704 } else if (dump->end <= vlan->vid_begin &&
705 dump->end < vlan->vid_end) {
706 if ((dump->end + 1) == vlan->vid_begin &&
707 dump->flags == vlan->flags) {
708 /* append */
709 dump->end = vlan->vid_end;
710 } else {
e23b002b 711 err = switchdev_port_vlan_dump_put(dump);
7d4f8d87
SF
712 dump->flags = vlan->flags;
713 dump->begin = vlan->vid_begin;
714 dump->end = vlan->vid_end;
715 }
716 } else {
717 err = -EINVAL;
718 }
719 }
720
721 return err;
722}
723
724static int switchdev_port_vlan_fill(struct sk_buff *skb, struct net_device *dev,
725 u32 filter_mask)
726{
727 struct switchdev_vlan_dump dump = {
6ff64f6f 728 .vlan.obj.orig_dev = dev,
9e8f4a54 729 .vlan.obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
7d4f8d87
SF
730 .skb = skb,
731 .filter_mask = filter_mask,
732 };
733 int err = 0;
734
735 if ((filter_mask & RTEXT_FILTER_BRVLAN) ||
736 (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)) {
9e8f4a54 737 err = switchdev_port_obj_dump(dev, &dump.vlan.obj,
25f07adc 738 switchdev_port_vlan_dump_cb);
7d4f8d87
SF
739 if (err)
740 goto err_out;
741 if (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)
742 /* last one */
e23b002b 743 err = switchdev_port_vlan_dump_put(&dump);
7d4f8d87
SF
744 }
745
746err_out:
747 return err == -EOPNOTSUPP ? 0 : err;
748}
749
8793d0a6
SF
750/**
751 * switchdev_port_bridge_getlink - Get bridge port attributes
752 *
753 * @dev: port device
754 *
755 * Called for SELF on rtnl_bridge_getlink to get bridge port
756 * attributes.
757 */
758int switchdev_port_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
759 struct net_device *dev, u32 filter_mask,
760 int nlflags)
761{
762 struct switchdev_attr attr = {
6ff64f6f 763 .orig_dev = dev,
1f868398 764 .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
8793d0a6
SF
765 };
766 u16 mode = BRIDGE_MODE_UNDEF;
741af005 767 u32 mask = BR_LEARNING | BR_LEARNING_SYNC | BR_FLOOD;
8793d0a6
SF
768 int err;
769
770 err = switchdev_port_attr_get(dev, &attr);
5c8079d0 771 if (err && err != -EOPNOTSUPP)
8793d0a6
SF
772 return err;
773
774 return ndo_dflt_bridge_getlink(skb, pid, seq, dev, mode,
7d4f8d87
SF
775 attr.u.brport_flags, mask, nlflags,
776 filter_mask, switchdev_port_vlan_fill);
8793d0a6
SF
777}
778EXPORT_SYMBOL_GPL(switchdev_port_bridge_getlink);
779
47f8328b
SF
780static int switchdev_port_br_setflag(struct net_device *dev,
781 struct nlattr *nlattr,
782 unsigned long brport_flag)
783{
784 struct switchdev_attr attr = {
6ff64f6f 785 .orig_dev = dev,
1f868398 786 .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
47f8328b
SF
787 };
788 u8 flag = nla_get_u8(nlattr);
789 int err;
790
791 err = switchdev_port_attr_get(dev, &attr);
792 if (err)
793 return err;
794
795 if (flag)
42275bd8 796 attr.u.brport_flags |= brport_flag;
47f8328b 797 else
42275bd8 798 attr.u.brport_flags &= ~brport_flag;
47f8328b
SF
799
800 return switchdev_port_attr_set(dev, &attr);
801}
802
803static const struct nla_policy
804switchdev_port_bridge_policy[IFLA_BRPORT_MAX + 1] = {
805 [IFLA_BRPORT_STATE] = { .type = NLA_U8 },
806 [IFLA_BRPORT_COST] = { .type = NLA_U32 },
807 [IFLA_BRPORT_PRIORITY] = { .type = NLA_U16 },
808 [IFLA_BRPORT_MODE] = { .type = NLA_U8 },
809 [IFLA_BRPORT_GUARD] = { .type = NLA_U8 },
810 [IFLA_BRPORT_PROTECT] = { .type = NLA_U8 },
811 [IFLA_BRPORT_FAST_LEAVE] = { .type = NLA_U8 },
812 [IFLA_BRPORT_LEARNING] = { .type = NLA_U8 },
813 [IFLA_BRPORT_LEARNING_SYNC] = { .type = NLA_U8 },
814 [IFLA_BRPORT_UNICAST_FLOOD] = { .type = NLA_U8 },
815};
816
817static int switchdev_port_br_setlink_protinfo(struct net_device *dev,
818 struct nlattr *protinfo)
819{
820 struct nlattr *attr;
821 int rem;
822 int err;
823
824 err = nla_validate_nested(protinfo, IFLA_BRPORT_MAX,
825 switchdev_port_bridge_policy);
826 if (err)
827 return err;
828
829 nla_for_each_nested(attr, protinfo, rem) {
830 switch (nla_type(attr)) {
831 case IFLA_BRPORT_LEARNING:
832 err = switchdev_port_br_setflag(dev, attr,
833 BR_LEARNING);
834 break;
835 case IFLA_BRPORT_LEARNING_SYNC:
836 err = switchdev_port_br_setflag(dev, attr,
837 BR_LEARNING_SYNC);
838 break;
741af005
IS
839 case IFLA_BRPORT_UNICAST_FLOOD:
840 err = switchdev_port_br_setflag(dev, attr, BR_FLOOD);
841 break;
47f8328b
SF
842 default:
843 err = -EOPNOTSUPP;
844 break;
845 }
846 if (err)
847 return err;
848 }
849
850 return 0;
851}
852
853static int switchdev_port_br_afspec(struct net_device *dev,
854 struct nlattr *afspec,
855 int (*f)(struct net_device *dev,
648b4a99 856 const struct switchdev_obj *obj))
47f8328b
SF
857{
858 struct nlattr *attr;
859 struct bridge_vlan_info *vinfo;
9e8f4a54 860 struct switchdev_obj_port_vlan vlan = {
6ff64f6f 861 .obj.orig_dev = dev,
9e8f4a54
JP
862 .obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
863 };
47f8328b
SF
864 int rem;
865 int err;
866
867 nla_for_each_nested(attr, afspec, rem) {
868 if (nla_type(attr) != IFLA_BRIDGE_VLAN_INFO)
869 continue;
870 if (nla_len(attr) != sizeof(struct bridge_vlan_info))
871 return -EINVAL;
872 vinfo = nla_data(attr);
87aaf2ca
NA
873 if (!vinfo->vid || vinfo->vid >= VLAN_VID_MASK)
874 return -EINVAL;
ab069002 875 vlan.flags = vinfo->flags;
47f8328b 876 if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_BEGIN) {
ab069002 877 if (vlan.vid_begin)
47f8328b 878 return -EINVAL;
ab069002 879 vlan.vid_begin = vinfo->vid;
cc02aa8e
NA
880 /* don't allow range of pvids */
881 if (vlan.flags & BRIDGE_VLAN_INFO_PVID)
882 return -EINVAL;
47f8328b 883 } else if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_END) {
ab069002 884 if (!vlan.vid_begin)
47f8328b 885 return -EINVAL;
ab069002
VD
886 vlan.vid_end = vinfo->vid;
887 if (vlan.vid_end <= vlan.vid_begin)
47f8328b 888 return -EINVAL;
9e8f4a54 889 err = f(dev, &vlan.obj);
47f8328b
SF
890 if (err)
891 return err;
3a7bde55 892 vlan.vid_begin = 0;
47f8328b 893 } else {
ab069002 894 if (vlan.vid_begin)
47f8328b 895 return -EINVAL;
ab069002
VD
896 vlan.vid_begin = vinfo->vid;
897 vlan.vid_end = vinfo->vid;
9e8f4a54 898 err = f(dev, &vlan.obj);
47f8328b
SF
899 if (err)
900 return err;
3a7bde55 901 vlan.vid_begin = 0;
47f8328b
SF
902 }
903 }
904
905 return 0;
906}
907
8a44dbb2 908/**
47f8328b 909 * switchdev_port_bridge_setlink - Set bridge port attributes
8a44dbb2
RP
910 *
911 * @dev: port device
47f8328b
SF
912 * @nlh: netlink header
913 * @flags: netlink flags
8a44dbb2 914 *
47f8328b
SF
915 * Called for SELF on rtnl_bridge_setlink to set bridge port
916 * attributes.
8a44dbb2 917 */
ebb9a03a
JP
918int switchdev_port_bridge_setlink(struct net_device *dev,
919 struct nlmsghdr *nlh, u16 flags)
8a44dbb2 920{
47f8328b
SF
921 struct nlattr *protinfo;
922 struct nlattr *afspec;
923 int err = 0;
924
925 protinfo = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
926 IFLA_PROTINFO);
927 if (protinfo) {
928 err = switchdev_port_br_setlink_protinfo(dev, protinfo);
929 if (err)
930 return err;
931 }
8a44dbb2 932
47f8328b
SF
933 afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
934 IFLA_AF_SPEC);
935 if (afspec)
936 err = switchdev_port_br_afspec(dev, afspec,
937 switchdev_port_obj_add);
8a44dbb2 938
47f8328b 939 return err;
8a44dbb2 940}
ebb9a03a 941EXPORT_SYMBOL_GPL(switchdev_port_bridge_setlink);
8a44dbb2
RP
942
943/**
5c34e022 944 * switchdev_port_bridge_dellink - Set bridge port attributes
8a44dbb2
RP
945 *
946 * @dev: port device
5c34e022
SF
947 * @nlh: netlink header
948 * @flags: netlink flags
8a44dbb2 949 *
5c34e022
SF
950 * Called for SELF on rtnl_bridge_dellink to set bridge port
951 * attributes.
8a44dbb2 952 */
ebb9a03a
JP
953int switchdev_port_bridge_dellink(struct net_device *dev,
954 struct nlmsghdr *nlh, u16 flags)
8a44dbb2 955{
5c34e022 956 struct nlattr *afspec;
8a44dbb2 957
5c34e022
SF
958 afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
959 IFLA_AF_SPEC);
960 if (afspec)
961 return switchdev_port_br_afspec(dev, afspec,
962 switchdev_port_obj_del);
8a44dbb2 963
5c34e022 964 return 0;
8a44dbb2 965}
ebb9a03a 966EXPORT_SYMBOL_GPL(switchdev_port_bridge_dellink);
8a44dbb2 967
45d4122c
SS
968/**
969 * switchdev_port_fdb_add - Add FDB (MAC/VLAN) entry to port
970 *
971 * @ndmsg: netlink hdr
972 * @nlattr: netlink attributes
973 * @dev: port device
974 * @addr: MAC address to add
975 * @vid: VLAN to add
976 *
977 * Add FDB entry to switch device.
978 */
979int switchdev_port_fdb_add(struct ndmsg *ndm, struct nlattr *tb[],
980 struct net_device *dev, const unsigned char *addr,
981 u16 vid, u16 nlm_flags)
982{
52ba57cf 983 struct switchdev_obj_port_fdb fdb = {
6ff64f6f 984 .obj.orig_dev = dev,
9e8f4a54 985 .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
ab069002 986 .vid = vid,
45d4122c
SS
987 };
988
850d0cbc 989 ether_addr_copy(fdb.addr, addr);
9e8f4a54 990 return switchdev_port_obj_add(dev, &fdb.obj);
45d4122c
SS
991}
992EXPORT_SYMBOL_GPL(switchdev_port_fdb_add);
993
994/**
995 * switchdev_port_fdb_del - Delete FDB (MAC/VLAN) entry from port
996 *
997 * @ndmsg: netlink hdr
998 * @nlattr: netlink attributes
999 * @dev: port device
1000 * @addr: MAC address to delete
1001 * @vid: VLAN to delete
1002 *
1003 * Delete FDB entry from switch device.
1004 */
1005int switchdev_port_fdb_del(struct ndmsg *ndm, struct nlattr *tb[],
1006 struct net_device *dev, const unsigned char *addr,
1007 u16 vid)
1008{
52ba57cf 1009 struct switchdev_obj_port_fdb fdb = {
6ff64f6f 1010 .obj.orig_dev = dev,
9e8f4a54 1011 .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
ab069002 1012 .vid = vid,
45d4122c
SS
1013 };
1014
850d0cbc 1015 ether_addr_copy(fdb.addr, addr);
9e8f4a54 1016 return switchdev_port_obj_del(dev, &fdb.obj);
45d4122c
SS
1017}
1018EXPORT_SYMBOL_GPL(switchdev_port_fdb_del);
1019
1020struct switchdev_fdb_dump {
52ba57cf 1021 struct switchdev_obj_port_fdb fdb;
e02a06b2 1022 struct net_device *dev;
45d4122c
SS
1023 struct sk_buff *skb;
1024 struct netlink_callback *cb;
45d4122c
SS
1025 int idx;
1026};
1027
648b4a99 1028static int switchdev_port_fdb_dump_cb(struct switchdev_obj *obj)
45d4122c 1029{
648b4a99 1030 struct switchdev_obj_port_fdb *fdb = SWITCHDEV_OBJ_PORT_FDB(obj);
45d4122c 1031 struct switchdev_fdb_dump *dump =
25f07adc 1032 container_of(fdb, struct switchdev_fdb_dump, fdb);
45d4122c
SS
1033 u32 portid = NETLINK_CB(dump->cb->skb).portid;
1034 u32 seq = dump->cb->nlh->nlmsg_seq;
1035 struct nlmsghdr *nlh;
1036 struct ndmsg *ndm;
45d4122c
SS
1037
1038 if (dump->idx < dump->cb->args[0])
1039 goto skip;
1040
45d4122c
SS
1041 nlh = nlmsg_put(dump->skb, portid, seq, RTM_NEWNEIGH,
1042 sizeof(*ndm), NLM_F_MULTI);
1043 if (!nlh)
1044 return -EMSGSIZE;
1045
1046 ndm = nlmsg_data(nlh);
1047 ndm->ndm_family = AF_BRIDGE;
1048 ndm->ndm_pad1 = 0;
1049 ndm->ndm_pad2 = 0;
1050 ndm->ndm_flags = NTF_SELF;
1051 ndm->ndm_type = 0;
e02a06b2 1052 ndm->ndm_ifindex = dump->dev->ifindex;
25f07adc 1053 ndm->ndm_state = fdb->ndm_state;
45d4122c 1054
25f07adc 1055 if (nla_put(dump->skb, NDA_LLADDR, ETH_ALEN, fdb->addr))
45d4122c
SS
1056 goto nla_put_failure;
1057
25f07adc 1058 if (fdb->vid && nla_put_u16(dump->skb, NDA_VLAN, fdb->vid))
45d4122c
SS
1059 goto nla_put_failure;
1060
1061 nlmsg_end(dump->skb, nlh);
1062
1063skip:
1064 dump->idx++;
1065 return 0;
1066
1067nla_put_failure:
1068 nlmsg_cancel(dump->skb, nlh);
1069 return -EMSGSIZE;
1070}
1071
1072/**
1073 * switchdev_port_fdb_dump - Dump port FDB (MAC/VLAN) entries
1074 *
1075 * @skb: netlink skb
1076 * @cb: netlink callback
1077 * @dev: port device
1078 * @filter_dev: filter device
1079 * @idx:
1080 *
1081 * Delete FDB entry from switch device.
1082 */
1083int switchdev_port_fdb_dump(struct sk_buff *skb, struct netlink_callback *cb,
1084 struct net_device *dev,
1085 struct net_device *filter_dev, int idx)
1086{
1087 struct switchdev_fdb_dump dump = {
6ff64f6f 1088 .fdb.obj.orig_dev = dev,
9e8f4a54 1089 .fdb.obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
e02a06b2 1090 .dev = dev,
45d4122c
SS
1091 .skb = skb,
1092 .cb = cb,
45d4122c
SS
1093 .idx = idx,
1094 };
45d4122c 1095
9e8f4a54 1096 switchdev_port_obj_dump(dev, &dump.fdb.obj, switchdev_port_fdb_dump_cb);
45d4122c
SS
1097 return dump.idx;
1098}
1099EXPORT_SYMBOL_GPL(switchdev_port_fdb_dump);
1100
ebb9a03a 1101static struct net_device *switchdev_get_lowest_dev(struct net_device *dev)
b5d6fbde 1102{
9d47c0a2 1103 const struct switchdev_ops *ops = dev->switchdev_ops;
b5d6fbde
SF
1104 struct net_device *lower_dev;
1105 struct net_device *port_dev;
1106 struct list_head *iter;
1107
1108 /* Recusively search down until we find a sw port dev.
f8e20a9f 1109 * (A sw port dev supports switchdev_port_attr_get).
b5d6fbde
SF
1110 */
1111
f8e20a9f 1112 if (ops && ops->switchdev_port_attr_get)
b5d6fbde
SF
1113 return dev;
1114
1115 netdev_for_each_lower_dev(dev, lower_dev, iter) {
ebb9a03a 1116 port_dev = switchdev_get_lowest_dev(lower_dev);
b5d6fbde
SF
1117 if (port_dev)
1118 return port_dev;
1119 }
1120
1121 return NULL;
1122}
1123
ebb9a03a 1124static struct net_device *switchdev_get_dev_by_nhs(struct fib_info *fi)
b5d6fbde 1125{
f8e20a9f 1126 struct switchdev_attr attr = {
1f868398 1127 .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
f8e20a9f
SF
1128 };
1129 struct switchdev_attr prev_attr;
b5d6fbde
SF
1130 struct net_device *dev = NULL;
1131 int nhsel;
1132
771acac2
JP
1133 ASSERT_RTNL();
1134
b5d6fbde
SF
1135 /* For this route, all nexthop devs must be on the same switch. */
1136
1137 for (nhsel = 0; nhsel < fi->fib_nhs; nhsel++) {
1138 const struct fib_nh *nh = &fi->fib_nh[nhsel];
1139
1140 if (!nh->nh_dev)
1141 return NULL;
1142
ebb9a03a 1143 dev = switchdev_get_lowest_dev(nh->nh_dev);
b5d6fbde
SF
1144 if (!dev)
1145 return NULL;
1146
6ff64f6f 1147 attr.orig_dev = dev;
f8e20a9f 1148 if (switchdev_port_attr_get(dev, &attr))
b5d6fbde
SF
1149 return NULL;
1150
d754f98b
SF
1151 if (nhsel > 0 &&
1152 !netdev_phys_item_id_same(&prev_attr.u.ppid, &attr.u.ppid))
b5d6fbde 1153 return NULL;
b5d6fbde 1154
f8e20a9f 1155 prev_attr = attr;
b5d6fbde
SF
1156 }
1157
1158 return dev;
1159}
1160
5e8d9049 1161/**
7616dcbb 1162 * switchdev_fib_ipv4_add - Add/modify switch IPv4 route entry
5e8d9049
SF
1163 *
1164 * @dst: route's IPv4 destination address
1165 * @dst_len: destination address length (prefix length)
1166 * @fi: route FIB info structure
1167 * @tos: route TOS
1168 * @type: route type
f8f21471 1169 * @nlflags: netlink flags passed in (NLM_F_*)
5e8d9049
SF
1170 * @tb_id: route table ID
1171 *
7616dcbb 1172 * Add/modify switch IPv4 route entry.
5e8d9049 1173 */
ebb9a03a
JP
1174int switchdev_fib_ipv4_add(u32 dst, int dst_len, struct fib_info *fi,
1175 u8 tos, u8 type, u32 nlflags, u32 tb_id)
5e8d9049 1176{
ab069002 1177 struct switchdev_obj_ipv4_fib ipv4_fib = {
9e8f4a54 1178 .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
ab069002
VD
1179 .dst = dst,
1180 .dst_len = dst_len,
ab069002
VD
1181 .tos = tos,
1182 .type = type,
1183 .nlflags = nlflags,
1184 .tb_id = tb_id,
58c2cb16 1185 };
b5d6fbde 1186 struct net_device *dev;
b5d6fbde
SF
1187 int err = 0;
1188
850d0cbc
JP
1189 memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
1190
8e05fd71
SF
1191 /* Don't offload route if using custom ip rules or if
1192 * IPv4 FIB offloading has been disabled completely.
1193 */
1194
e1315db1
SF
1195#ifdef CONFIG_IP_MULTIPLE_TABLES
1196 if (fi->fib_net->ipv4.fib_has_custom_rules)
1197 return 0;
1198#endif
1199
1200 if (fi->fib_net->ipv4.fib_offload_disabled)
104616e7
SF
1201 return 0;
1202
ebb9a03a 1203 dev = switchdev_get_dev_by_nhs(fi);
b5d6fbde
SF
1204 if (!dev)
1205 return 0;
58c2cb16 1206
6ff64f6f 1207 ipv4_fib.obj.orig_dev = dev;
9e8f4a54 1208 err = switchdev_port_obj_add(dev, &ipv4_fib.obj);
58c2cb16 1209 if (!err)
36583eb5 1210 fi->fib_flags |= RTNH_F_OFFLOAD;
b5d6fbde 1211
af201f72 1212 return err == -EOPNOTSUPP ? 0 : err;
5e8d9049 1213}
ebb9a03a 1214EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_add);
5e8d9049
SF
1215
1216/**
ebb9a03a 1217 * switchdev_fib_ipv4_del - Delete IPv4 route entry from switch
5e8d9049
SF
1218 *
1219 * @dst: route's IPv4 destination address
1220 * @dst_len: destination address length (prefix length)
1221 * @fi: route FIB info structure
1222 * @tos: route TOS
1223 * @type: route type
1224 * @tb_id: route table ID
1225 *
1226 * Delete IPv4 route entry from switch device.
1227 */
ebb9a03a
JP
1228int switchdev_fib_ipv4_del(u32 dst, int dst_len, struct fib_info *fi,
1229 u8 tos, u8 type, u32 tb_id)
5e8d9049 1230{
ab069002 1231 struct switchdev_obj_ipv4_fib ipv4_fib = {
9e8f4a54 1232 .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
ab069002
VD
1233 .dst = dst,
1234 .dst_len = dst_len,
ab069002
VD
1235 .tos = tos,
1236 .type = type,
1237 .nlflags = 0,
1238 .tb_id = tb_id,
58c2cb16 1239 };
b5d6fbde 1240 struct net_device *dev;
b5d6fbde
SF
1241 int err = 0;
1242
850d0cbc
JP
1243 memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
1244
eea39946 1245 if (!(fi->fib_flags & RTNH_F_OFFLOAD))
b5d6fbde
SF
1246 return 0;
1247
ebb9a03a 1248 dev = switchdev_get_dev_by_nhs(fi);
b5d6fbde
SF
1249 if (!dev)
1250 return 0;
b5d6fbde 1251
6ff64f6f 1252 ipv4_fib.obj.orig_dev = dev;
9e8f4a54 1253 err = switchdev_port_obj_del(dev, &ipv4_fib.obj);
58c2cb16 1254 if (!err)
36583eb5 1255 fi->fib_flags &= ~RTNH_F_OFFLOAD;
b5d6fbde 1256
af201f72 1257 return err == -EOPNOTSUPP ? 0 : err;
5e8d9049 1258}
ebb9a03a 1259EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_del);
8e05fd71
SF
1260
1261/**
ebb9a03a 1262 * switchdev_fib_ipv4_abort - Abort an IPv4 FIB operation
8e05fd71
SF
1263 *
1264 * @fi: route FIB info structure
1265 */
ebb9a03a 1266void switchdev_fib_ipv4_abort(struct fib_info *fi)
8e05fd71
SF
1267{
1268 /* There was a problem installing this route to the offload
1269 * device. For now, until we come up with more refined
1270 * policy handling, abruptly end IPv4 fib offloading for
1271 * for entire net by flushing offload device(s) of all
1272 * IPv4 routes, and mark IPv4 fib offloading broken from
1273 * this point forward.
1274 */
1275
1276 fib_flush_external(fi->fib_net);
1277 fi->fib_net->ipv4.fib_offload_disabled = true;
1278}
ebb9a03a 1279EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_abort);
1a3b2ec9
SF
1280
1281static bool switchdev_port_same_parent_id(struct net_device *a,
1282 struct net_device *b)
1283{
1284 struct switchdev_attr a_attr = {
6ff64f6f 1285 .orig_dev = a,
1f868398 1286 .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
1a3b2ec9
SF
1287 .flags = SWITCHDEV_F_NO_RECURSE,
1288 };
1289 struct switchdev_attr b_attr = {
6ff64f6f 1290 .orig_dev = b,
1f868398 1291 .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
1a3b2ec9
SF
1292 .flags = SWITCHDEV_F_NO_RECURSE,
1293 };
1294
1295 if (switchdev_port_attr_get(a, &a_attr) ||
1296 switchdev_port_attr_get(b, &b_attr))
1297 return false;
1298
1299 return netdev_phys_item_id_same(&a_attr.u.ppid, &b_attr.u.ppid);
1300}
1301
1302static u32 switchdev_port_fwd_mark_get(struct net_device *dev,
1303 struct net_device *group_dev)
1304{
1305 struct net_device *lower_dev;
1306 struct list_head *iter;
1307
1308 netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
1309 if (lower_dev == dev)
1310 continue;
1311 if (switchdev_port_same_parent_id(dev, lower_dev))
1312 return lower_dev->offload_fwd_mark;
1313 return switchdev_port_fwd_mark_get(dev, lower_dev);
1314 }
1315
1316 return dev->ifindex;
1317}
1318
1319static void switchdev_port_fwd_mark_reset(struct net_device *group_dev,
1320 u32 old_mark, u32 *reset_mark)
1321{
1322 struct net_device *lower_dev;
1323 struct list_head *iter;
1324
1325 netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
1326 if (lower_dev->offload_fwd_mark == old_mark) {
1327 if (!*reset_mark)
1328 *reset_mark = lower_dev->ifindex;
1329 lower_dev->offload_fwd_mark = *reset_mark;
1330 }
1331 switchdev_port_fwd_mark_reset(lower_dev, old_mark, reset_mark);
1332 }
1333}
1334
1335/**
1336 * switchdev_port_fwd_mark_set - Set port offload forwarding mark
1337 *
1338 * @dev: port device
1339 * @group_dev: containing device
1340 * @joining: true if dev is joining group; false if leaving group
1341 *
1342 * An ungrouped port's offload mark is just its ifindex. A grouped
1343 * port's (member of a bridge, for example) offload mark is the ifindex
1344 * of one of the ports in the group with the same parent (switch) ID.
1345 * Ports on the same device in the same group will have the same mark.
1346 *
1347 * Example:
1348 *
1349 * br0 ifindex=9
1350 * sw1p1 ifindex=2 mark=2
1351 * sw1p2 ifindex=3 mark=2
1352 * sw2p1 ifindex=4 mark=5
1353 * sw2p2 ifindex=5 mark=5
1354 *
1355 * If sw2p2 leaves the bridge, we'll have:
1356 *
1357 * br0 ifindex=9
1358 * sw1p1 ifindex=2 mark=2
1359 * sw1p2 ifindex=3 mark=2
1360 * sw2p1 ifindex=4 mark=4
1361 * sw2p2 ifindex=5 mark=5
1362 */
1363void switchdev_port_fwd_mark_set(struct net_device *dev,
1364 struct net_device *group_dev,
1365 bool joining)
1366{
1367 u32 mark = dev->ifindex;
1368 u32 reset_mark = 0;
1369
771acac2
JP
1370 if (group_dev) {
1371 ASSERT_RTNL();
1372 if (joining)
1373 mark = switchdev_port_fwd_mark_get(dev, group_dev);
1374 else if (dev->offload_fwd_mark == mark)
1a3b2ec9
SF
1375 /* Ohoh, this port was the mark reference port,
1376 * but it's leaving the group, so reset the
1377 * mark for the remaining ports in the group.
1378 */
1379 switchdev_port_fwd_mark_reset(group_dev, mark,
1380 &reset_mark);
1381 }
1382
1383 dev->offload_fwd_mark = mark;
1384}
1385EXPORT_SYMBOL_GPL(switchdev_port_fwd_mark_set);