blob: 1eb76956b4390fef09825f38bda1f1b29a1ab352 [file] [log] [blame]
Jiri Pirko007f7902014-11-28 14:34:17 +01001/*
2 * net/switchdev/switchdev.c - Switch device API
Jiri Pirko7ea6eb32015-09-24 10:02:41 +02003 * Copyright (c) 2014-2015 Jiri Pirko <jiri@resnulli.us>
Scott Feldmanf8f21472015-03-09 13:59:09 -07004 * Copyright (c) 2014-2015 Scott Feldman <sfeldma@gmail.com>
Jiri Pirko007f7902014-11-28 14:34:17 +01005 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 */
11
12#include <linux/kernel.h>
13#include <linux/types.h>
14#include <linux/init.h>
Jiri Pirko03bf0c22015-01-15 23:49:36 +010015#include <linux/mutex.h>
16#include <linux/notifier.h>
Jiri Pirko007f7902014-11-28 14:34:17 +010017#include <linux/netdevice.h>
Jiri Pirko850d0cb2015-10-14 19:40:51 +020018#include <linux/etherdevice.h>
Scott Feldman47f83282015-05-10 09:47:56 -070019#include <linux/if_bridge.h>
Jiri Pirko7ea6eb32015-09-24 10:02:41 +020020#include <linux/list.h>
Jiri Pirko793f4012015-10-14 19:40:48 +020021#include <linux/workqueue.h>
Nikolay Aleksandrov87aaf2c2015-10-12 14:31:01 +020022#include <linux/if_vlan.h>
Scott Feldman5e8d9042015-03-05 21:21:15 -080023#include <net/ip_fib.h>
Jiri Pirko007f7902014-11-28 14:34:17 +010024#include <net/switchdev.h>
25
26/**
Jiri Pirko7ea6eb32015-09-24 10:02:41 +020027 * switchdev_trans_item_enqueue - Enqueue data item to transaction queue
28 *
29 * @trans: transaction
30 * @data: pointer to data being queued
31 * @destructor: data destructor
32 * @tritem: transaction item being queued
33 *
34 * Enqeueue data item to transaction queue. tritem is typically placed in
35 * cointainter pointed at by data pointer. Destructor is called on
36 * transaction abort and after successful commit phase in case
37 * the caller did not dequeue the item before.
38 */
39void switchdev_trans_item_enqueue(struct switchdev_trans *trans,
40 void *data, void (*destructor)(void const *),
41 struct switchdev_trans_item *tritem)
42{
43 tritem->data = data;
44 tritem->destructor = destructor;
45 list_add_tail(&tritem->list, &trans->item_list);
46}
47EXPORT_SYMBOL_GPL(switchdev_trans_item_enqueue);
48
49static struct switchdev_trans_item *
50__switchdev_trans_item_dequeue(struct switchdev_trans *trans)
51{
52 struct switchdev_trans_item *tritem;
53
54 if (list_empty(&trans->item_list))
55 return NULL;
56 tritem = list_first_entry(&trans->item_list,
57 struct switchdev_trans_item, list);
58 list_del(&tritem->list);
59 return tritem;
60}
61
62/**
63 * switchdev_trans_item_dequeue - Dequeue data item from transaction queue
64 *
65 * @trans: transaction
66 */
67void *switchdev_trans_item_dequeue(struct switchdev_trans *trans)
68{
69 struct switchdev_trans_item *tritem;
70
71 tritem = __switchdev_trans_item_dequeue(trans);
72 BUG_ON(!tritem);
73 return tritem->data;
74}
75EXPORT_SYMBOL_GPL(switchdev_trans_item_dequeue);
76
77static void switchdev_trans_init(struct switchdev_trans *trans)
78{
79 INIT_LIST_HEAD(&trans->item_list);
80}
81
82static void switchdev_trans_items_destroy(struct switchdev_trans *trans)
83{
84 struct switchdev_trans_item *tritem;
85
86 while ((tritem = __switchdev_trans_item_dequeue(trans)))
87 tritem->destructor(tritem->data);
88}
89
90static void switchdev_trans_items_warn_destroy(struct net_device *dev,
91 struct switchdev_trans *trans)
92{
93 WARN(!list_empty(&trans->item_list), "%s: transaction item queue is not empty.\n",
94 dev->name);
95 switchdev_trans_items_destroy(trans);
96}
97
Jiri Pirko793f4012015-10-14 19:40:48 +020098static LIST_HEAD(deferred);
99static DEFINE_SPINLOCK(deferred_lock);
100
101typedef void switchdev_deferred_func_t(struct net_device *dev,
102 const void *data);
103
104struct switchdev_deferred_item {
105 struct list_head list;
106 struct net_device *dev;
107 switchdev_deferred_func_t *func;
108 unsigned long data[0];
109};
110
111static struct switchdev_deferred_item *switchdev_deferred_dequeue(void)
112{
113 struct switchdev_deferred_item *dfitem;
114
115 spin_lock_bh(&deferred_lock);
116 if (list_empty(&deferred)) {
117 dfitem = NULL;
118 goto unlock;
119 }
120 dfitem = list_first_entry(&deferred,
121 struct switchdev_deferred_item, list);
122 list_del(&dfitem->list);
123unlock:
124 spin_unlock_bh(&deferred_lock);
125 return dfitem;
126}
127
128/**
129 * switchdev_deferred_process - Process ops in deferred queue
130 *
131 * Called to flush the ops currently queued in deferred ops queue.
132 * rtnl_lock must be held.
133 */
134void switchdev_deferred_process(void)
135{
136 struct switchdev_deferred_item *dfitem;
137
138 ASSERT_RTNL();
139
140 while ((dfitem = switchdev_deferred_dequeue())) {
141 dfitem->func(dfitem->dev, dfitem->data);
142 dev_put(dfitem->dev);
143 kfree(dfitem);
144 }
145}
146EXPORT_SYMBOL_GPL(switchdev_deferred_process);
147
/* Work handler: flush the deferred queue with rtnl_lock taken, as
 * switchdev_deferred_process() requires.
 */
static void switchdev_deferred_process_work(struct work_struct *work)
{
	rtnl_lock();
	switchdev_deferred_process();
	rtnl_unlock();
}

/* Work item scheduled whenever a deferred operation is enqueued. */
static DECLARE_WORK(deferred_process_work, switchdev_deferred_process_work);
156
157static int switchdev_deferred_enqueue(struct net_device *dev,
158 const void *data, size_t data_len,
159 switchdev_deferred_func_t *func)
160{
161 struct switchdev_deferred_item *dfitem;
162
163 dfitem = kmalloc(sizeof(*dfitem) + data_len, GFP_ATOMIC);
164 if (!dfitem)
165 return -ENOMEM;
166 dfitem->dev = dev;
167 dfitem->func = func;
168 memcpy(dfitem->data, data, data_len);
169 dev_hold(dev);
170 spin_lock_bh(&deferred_lock);
171 list_add_tail(&dfitem->list, &deferred);
172 spin_unlock_bh(&deferred_lock);
173 schedule_work(&deferred_process_work);
174 return 0;
175}
176
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200177/**
Scott Feldman30943332015-05-10 09:47:48 -0700178 * switchdev_port_attr_get - Get port attribute
179 *
180 * @dev: port device
181 * @attr: attribute to get
182 */
183int switchdev_port_attr_get(struct net_device *dev, struct switchdev_attr *attr)
184{
185 const struct switchdev_ops *ops = dev->switchdev_ops;
186 struct net_device *lower_dev;
187 struct list_head *iter;
188 struct switchdev_attr first = {
Jiri Pirko1f868392015-10-01 11:03:42 +0200189 .id = SWITCHDEV_ATTR_ID_UNDEFINED
Scott Feldman30943332015-05-10 09:47:48 -0700190 };
191 int err = -EOPNOTSUPP;
192
193 if (ops && ops->switchdev_port_attr_get)
194 return ops->switchdev_port_attr_get(dev, attr);
195
196 if (attr->flags & SWITCHDEV_F_NO_RECURSE)
197 return err;
198
199 /* Switch device port(s) may be stacked under
200 * bond/team/vlan dev, so recurse down to get attr on
201 * each port. Return -ENODATA if attr values don't
202 * compare across ports.
203 */
204
205 netdev_for_each_lower_dev(dev, lower_dev, iter) {
206 err = switchdev_port_attr_get(lower_dev, attr);
207 if (err)
208 break;
Jiri Pirko1f868392015-10-01 11:03:42 +0200209 if (first.id == SWITCHDEV_ATTR_ID_UNDEFINED)
Scott Feldman30943332015-05-10 09:47:48 -0700210 first = *attr;
211 else if (memcmp(&first, attr, sizeof(*attr)))
212 return -ENODATA;
213 }
214
215 return err;
216}
217EXPORT_SYMBOL_GPL(switchdev_port_attr_get);
218
219static int __switchdev_port_attr_set(struct net_device *dev,
Jiri Pirkof7fadf32015-10-14 19:40:49 +0200220 const struct switchdev_attr *attr,
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200221 struct switchdev_trans *trans)
Scott Feldman30943332015-05-10 09:47:48 -0700222{
223 const struct switchdev_ops *ops = dev->switchdev_ops;
224 struct net_device *lower_dev;
225 struct list_head *iter;
226 int err = -EOPNOTSUPP;
227
228 if (ops && ops->switchdev_port_attr_set)
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200229 return ops->switchdev_port_attr_set(dev, attr, trans);
Scott Feldman30943332015-05-10 09:47:48 -0700230
231 if (attr->flags & SWITCHDEV_F_NO_RECURSE)
Scott Feldman464314e2015-10-08 19:23:18 -0700232 goto done;
Scott Feldman30943332015-05-10 09:47:48 -0700233
234 /* Switch device port(s) may be stacked under
235 * bond/team/vlan dev, so recurse down to set attr on
236 * each port.
237 */
238
239 netdev_for_each_lower_dev(dev, lower_dev, iter) {
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200240 err = __switchdev_port_attr_set(lower_dev, attr, trans);
Scott Feldman464314e2015-10-08 19:23:18 -0700241 if (err == -EOPNOTSUPP &&
242 attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
243 continue;
Scott Feldman30943332015-05-10 09:47:48 -0700244 if (err)
245 break;
246 }
247
Scott Feldman464314e2015-10-08 19:23:18 -0700248done:
249 if (err == -EOPNOTSUPP && attr->flags & SWITCHDEV_F_SKIP_EOPNOTSUPP)
250 err = 0;
251
Scott Feldman30943332015-05-10 09:47:48 -0700252 return err;
253}
254
Jiri Pirko0bc05d52015-10-14 19:40:50 +0200255static int switchdev_port_attr_set_now(struct net_device *dev,
256 const struct switchdev_attr *attr)
Scott Feldman30943332015-05-10 09:47:48 -0700257{
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200258 struct switchdev_trans trans;
Scott Feldman30943332015-05-10 09:47:48 -0700259 int err;
260
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200261 switchdev_trans_init(&trans);
262
Scott Feldman30943332015-05-10 09:47:48 -0700263 /* Phase I: prepare for attr set. Driver/device should fail
264 * here if there are going to be issues in the commit phase,
265 * such as lack of resources or support. The driver/device
266 * should reserve resources needed for the commit phase here,
267 * but should not commit the attr.
268 */
269
Jiri Pirkof623ab72015-09-24 10:02:49 +0200270 trans.ph_prepare = true;
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200271 err = __switchdev_port_attr_set(dev, attr, &trans);
Scott Feldman30943332015-05-10 09:47:48 -0700272 if (err) {
273 /* Prepare phase failed: abort the transaction. Any
274 * resources reserved in the prepare phase are
275 * released.
276 */
277
Jiri Pirko9f6467c2015-09-24 10:02:47 +0200278 if (err != -EOPNOTSUPP)
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200279 switchdev_trans_items_destroy(&trans);
Scott Feldman30943332015-05-10 09:47:48 -0700280
281 return err;
282 }
283
284 /* Phase II: commit attr set. This cannot fail as a fault
285 * of driver/device. If it does, it's a bug in the driver/device
286 * because the driver said everythings was OK in phase I.
287 */
288
Jiri Pirkof623ab72015-09-24 10:02:49 +0200289 trans.ph_prepare = false;
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200290 err = __switchdev_port_attr_set(dev, attr, &trans);
Scott Feldmane9fdaec2015-06-11 11:20:42 -0700291 WARN(err, "%s: Commit of attribute (id=%d) failed.\n",
292 dev->name, attr->id);
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200293 switchdev_trans_items_warn_destroy(dev, &trans);
Scott Feldman30943332015-05-10 09:47:48 -0700294
295 return err;
296}
Jiri Pirko0bc05d52015-10-14 19:40:50 +0200297
298static void switchdev_port_attr_set_deferred(struct net_device *dev,
299 const void *data)
300{
301 const struct switchdev_attr *attr = data;
302 int err;
303
304 err = switchdev_port_attr_set_now(dev, attr);
305 if (err && err != -EOPNOTSUPP)
306 netdev_err(dev, "failed (err=%d) to set attribute (id=%d)\n",
307 err, attr->id);
308}
309
310static int switchdev_port_attr_set_defer(struct net_device *dev,
311 const struct switchdev_attr *attr)
312{
313 return switchdev_deferred_enqueue(dev, attr, sizeof(*attr),
314 switchdev_port_attr_set_deferred);
315}
316
317/**
318 * switchdev_port_attr_set - Set port attribute
319 *
320 * @dev: port device
321 * @attr: attribute to set
322 *
323 * Use a 2-phase prepare-commit transaction model to ensure
324 * system is not left in a partially updated state due to
325 * failure from driver/device.
326 *
327 * rtnl_lock must be held and must not be in atomic section,
328 * in case SWITCHDEV_F_DEFER flag is not set.
329 */
330int switchdev_port_attr_set(struct net_device *dev,
331 const struct switchdev_attr *attr)
332{
333 if (attr->flags & SWITCHDEV_F_DEFER)
334 return switchdev_port_attr_set_defer(dev, attr);
335 ASSERT_RTNL();
336 return switchdev_port_attr_set_now(dev, attr);
337}
Scott Feldman30943332015-05-10 09:47:48 -0700338EXPORT_SYMBOL_GPL(switchdev_port_attr_set);
339
Scott Feldman22c1f672015-05-12 23:03:51 -0700340static int __switchdev_port_obj_add(struct net_device *dev,
Jiri Pirko648b4a92015-10-01 11:03:45 +0200341 const struct switchdev_obj *obj,
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200342 struct switchdev_trans *trans)
Scott Feldman491d0f12015-05-10 09:47:52 -0700343{
344 const struct switchdev_ops *ops = dev->switchdev_ops;
345 struct net_device *lower_dev;
346 struct list_head *iter;
347 int err = -EOPNOTSUPP;
348
349 if (ops && ops->switchdev_port_obj_add)
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200350 return ops->switchdev_port_obj_add(dev, obj, trans);
Scott Feldman491d0f12015-05-10 09:47:52 -0700351
352 /* Switch device port(s) may be stacked under
353 * bond/team/vlan dev, so recurse down to add object on
354 * each port.
355 */
356
357 netdev_for_each_lower_dev(dev, lower_dev, iter) {
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200358 err = __switchdev_port_obj_add(lower_dev, obj, trans);
Scott Feldman491d0f12015-05-10 09:47:52 -0700359 if (err)
360 break;
361 }
362
363 return err;
364}
365
Jiri Pirko4d429c52015-10-14 19:40:52 +0200366static int switchdev_port_obj_add_now(struct net_device *dev,
367 const struct switchdev_obj *obj)
Scott Feldman491d0f12015-05-10 09:47:52 -0700368{
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200369 struct switchdev_trans trans;
Scott Feldman491d0f12015-05-10 09:47:52 -0700370 int err;
371
372 ASSERT_RTNL();
373
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200374 switchdev_trans_init(&trans);
375
Scott Feldman491d0f12015-05-10 09:47:52 -0700376 /* Phase I: prepare for obj add. Driver/device should fail
377 * here if there are going to be issues in the commit phase,
378 * such as lack of resources or support. The driver/device
379 * should reserve resources needed for the commit phase here,
380 * but should not commit the obj.
381 */
382
Jiri Pirkof623ab72015-09-24 10:02:49 +0200383 trans.ph_prepare = true;
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200384 err = __switchdev_port_obj_add(dev, obj, &trans);
Scott Feldman491d0f12015-05-10 09:47:52 -0700385 if (err) {
386 /* Prepare phase failed: abort the transaction. Any
387 * resources reserved in the prepare phase are
388 * released.
389 */
390
Jiri Pirko9f6467c2015-09-24 10:02:47 +0200391 if (err != -EOPNOTSUPP)
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200392 switchdev_trans_items_destroy(&trans);
Scott Feldman491d0f12015-05-10 09:47:52 -0700393
394 return err;
395 }
396
397 /* Phase II: commit obj add. This cannot fail as a fault
398 * of driver/device. If it does, it's a bug in the driver/device
399 * because the driver said everythings was OK in phase I.
400 */
401
Jiri Pirkof623ab72015-09-24 10:02:49 +0200402 trans.ph_prepare = false;
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200403 err = __switchdev_port_obj_add(dev, obj, &trans);
404 WARN(err, "%s: Commit of object (id=%d) failed.\n", dev->name, obj->id);
Jiri Pirko7ea6eb32015-09-24 10:02:41 +0200405 switchdev_trans_items_warn_destroy(dev, &trans);
Scott Feldman491d0f12015-05-10 09:47:52 -0700406
407 return err;
408}
Jiri Pirko4d429c52015-10-14 19:40:52 +0200409
410static void switchdev_port_obj_add_deferred(struct net_device *dev,
411 const void *data)
412{
413 const struct switchdev_obj *obj = data;
414 int err;
415
416 err = switchdev_port_obj_add_now(dev, obj);
417 if (err && err != -EOPNOTSUPP)
418 netdev_err(dev, "failed (err=%d) to add object (id=%d)\n",
419 err, obj->id);
420}
421
422static int switchdev_port_obj_add_defer(struct net_device *dev,
423 const struct switchdev_obj *obj)
424{
425 return switchdev_deferred_enqueue(dev, obj, sizeof(*obj),
426 switchdev_port_obj_add_deferred);
427}
Scott Feldman491d0f12015-05-10 09:47:52 -0700428
429/**
Jiri Pirko4d429c52015-10-14 19:40:52 +0200430 * switchdev_port_obj_add - Add port object
Scott Feldman491d0f12015-05-10 09:47:52 -0700431 *
432 * @dev: port device
Vivien Didelotab069002015-09-29 12:07:17 -0400433 * @id: object ID
Jiri Pirko4d429c52015-10-14 19:40:52 +0200434 * @obj: object to add
435 *
436 * Use a 2-phase prepare-commit transaction model to ensure
437 * system is not left in a partially updated state due to
438 * failure from driver/device.
439 *
440 * rtnl_lock must be held and must not be in atomic section,
441 * in case SWITCHDEV_F_DEFER flag is not set.
Scott Feldman491d0f12015-05-10 09:47:52 -0700442 */
Jiri Pirko4d429c52015-10-14 19:40:52 +0200443int switchdev_port_obj_add(struct net_device *dev,
Jiri Pirko648b4a92015-10-01 11:03:45 +0200444 const struct switchdev_obj *obj)
Scott Feldman491d0f12015-05-10 09:47:52 -0700445{
Jiri Pirko4d429c52015-10-14 19:40:52 +0200446 if (obj->flags & SWITCHDEV_F_DEFER)
447 return switchdev_port_obj_add_defer(dev, obj);
448 ASSERT_RTNL();
449 return switchdev_port_obj_add_now(dev, obj);
450}
451EXPORT_SYMBOL_GPL(switchdev_port_obj_add);
452
453static int switchdev_port_obj_del_now(struct net_device *dev,
454 const struct switchdev_obj *obj)
455{
Scott Feldman491d0f12015-05-10 09:47:52 -0700456 const struct switchdev_ops *ops = dev->switchdev_ops;
457 struct net_device *lower_dev;
458 struct list_head *iter;
459 int err = -EOPNOTSUPP;
460
461 if (ops && ops->switchdev_port_obj_del)
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200462 return ops->switchdev_port_obj_del(dev, obj);
Scott Feldman491d0f12015-05-10 09:47:52 -0700463
464 /* Switch device port(s) may be stacked under
465 * bond/team/vlan dev, so recurse down to delete object on
466 * each port.
467 */
468
469 netdev_for_each_lower_dev(dev, lower_dev, iter) {
Jiri Pirko4d429c52015-10-14 19:40:52 +0200470 err = switchdev_port_obj_del_now(lower_dev, obj);
Scott Feldman491d0f12015-05-10 09:47:52 -0700471 if (err)
472 break;
473 }
474
475 return err;
476}
Jiri Pirko4d429c52015-10-14 19:40:52 +0200477
478static void switchdev_port_obj_del_deferred(struct net_device *dev,
479 const void *data)
480{
481 const struct switchdev_obj *obj = data;
482 int err;
483
484 err = switchdev_port_obj_del_now(dev, obj);
485 if (err && err != -EOPNOTSUPP)
486 netdev_err(dev, "failed (err=%d) to del object (id=%d)\n",
487 err, obj->id);
488}
489
490static int switchdev_port_obj_del_defer(struct net_device *dev,
491 const struct switchdev_obj *obj)
492{
493 return switchdev_deferred_enqueue(dev, obj, sizeof(*obj),
494 switchdev_port_obj_del_deferred);
495}
496
497/**
498 * switchdev_port_obj_del - Delete port object
499 *
500 * @dev: port device
501 * @id: object ID
502 * @obj: object to delete
503 *
504 * rtnl_lock must be held and must not be in atomic section,
505 * in case SWITCHDEV_F_DEFER flag is not set.
506 */
507int switchdev_port_obj_del(struct net_device *dev,
508 const struct switchdev_obj *obj)
509{
510 if (obj->flags & SWITCHDEV_F_DEFER)
511 return switchdev_port_obj_del_defer(dev, obj);
512 ASSERT_RTNL();
513 return switchdev_port_obj_del_now(dev, obj);
514}
Scott Feldman491d0f12015-05-10 09:47:52 -0700515EXPORT_SYMBOL_GPL(switchdev_port_obj_del);
516
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700517/**
518 * switchdev_port_obj_dump - Dump port objects
519 *
520 * @dev: port device
Vivien Didelot25f07ad2015-09-29 12:07:16 -0400521 * @id: object ID
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700522 * @obj: object to dump
Vivien Didelot25f07ad2015-09-29 12:07:16 -0400523 * @cb: function to call with a filled object
Jiri Pirko771acac2015-10-14 19:40:55 +0200524 *
525 * rtnl_lock must be held.
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700526 */
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200527int switchdev_port_obj_dump(struct net_device *dev, struct switchdev_obj *obj,
Jiri Pirko648b4a92015-10-01 11:03:45 +0200528 switchdev_obj_dump_cb_t *cb)
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700529{
530 const struct switchdev_ops *ops = dev->switchdev_ops;
531 struct net_device *lower_dev;
532 struct list_head *iter;
533 int err = -EOPNOTSUPP;
534
Jiri Pirko771acac2015-10-14 19:40:55 +0200535 ASSERT_RTNL();
536
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700537 if (ops && ops->switchdev_port_obj_dump)
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200538 return ops->switchdev_port_obj_dump(dev, obj, cb);
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700539
540 /* Switch device port(s) may be stacked under
541 * bond/team/vlan dev, so recurse down to dump objects on
542 * first port at bottom of stack.
543 */
544
545 netdev_for_each_lower_dev(dev, lower_dev, iter) {
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200546 err = switchdev_port_obj_dump(lower_dev, obj, cb);
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700547 break;
548 }
549
550 return err;
551}
552EXPORT_SYMBOL_GPL(switchdev_port_obj_dump);
553
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700554static DEFINE_MUTEX(switchdev_mutex);
555static RAW_NOTIFIER_HEAD(switchdev_notif_chain);
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100556
557/**
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700558 * register_switchdev_notifier - Register notifier
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100559 * @nb: notifier_block
560 *
561 * Register switch device notifier. This should be used by code
562 * which needs to monitor events happening in particular device.
563 * Return values are same as for atomic_notifier_chain_register().
564 */
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700565int register_switchdev_notifier(struct notifier_block *nb)
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100566{
567 int err;
568
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700569 mutex_lock(&switchdev_mutex);
570 err = raw_notifier_chain_register(&switchdev_notif_chain, nb);
571 mutex_unlock(&switchdev_mutex);
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100572 return err;
573}
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700574EXPORT_SYMBOL_GPL(register_switchdev_notifier);
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100575
576/**
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700577 * unregister_switchdev_notifier - Unregister notifier
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100578 * @nb: notifier_block
579 *
580 * Unregister switch device notifier.
581 * Return values are same as for atomic_notifier_chain_unregister().
582 */
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700583int unregister_switchdev_notifier(struct notifier_block *nb)
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100584{
585 int err;
586
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700587 mutex_lock(&switchdev_mutex);
588 err = raw_notifier_chain_unregister(&switchdev_notif_chain, nb);
589 mutex_unlock(&switchdev_mutex);
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100590 return err;
591}
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700592EXPORT_SYMBOL_GPL(unregister_switchdev_notifier);
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100593
594/**
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700595 * call_switchdev_notifiers - Call notifiers
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100596 * @val: value passed unmodified to notifier function
597 * @dev: port device
598 * @info: notifier information data
599 *
600 * Call all network notifier blocks. This should be called by driver
601 * when it needs to propagate hardware event.
602 * Return values are same as for atomic_notifier_call_chain().
603 */
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700604int call_switchdev_notifiers(unsigned long val, struct net_device *dev,
605 struct switchdev_notifier_info *info)
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100606{
607 int err;
608
609 info->dev = dev;
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700610 mutex_lock(&switchdev_mutex);
611 err = raw_notifier_call_chain(&switchdev_notif_chain, val, info);
612 mutex_unlock(&switchdev_mutex);
Jiri Pirko03bf0c22015-01-15 23:49:36 +0100613 return err;
614}
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700615EXPORT_SYMBOL_GPL(call_switchdev_notifiers);
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800616
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700617struct switchdev_vlan_dump {
Jiri Pirko8f24f302015-10-01 11:03:43 +0200618 struct switchdev_obj_port_vlan vlan;
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700619 struct sk_buff *skb;
620 u32 filter_mask;
621 u16 flags;
622 u16 begin;
623 u16 end;
624};
625
Vivien Didelote23b0022015-09-29 12:07:13 -0400626static int switchdev_port_vlan_dump_put(struct switchdev_vlan_dump *dump)
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700627{
628 struct bridge_vlan_info vinfo;
629
630 vinfo.flags = dump->flags;
631
632 if (dump->begin == 0 && dump->end == 0) {
633 return 0;
634 } else if (dump->begin == dump->end) {
635 vinfo.vid = dump->begin;
636 if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
637 sizeof(vinfo), &vinfo))
638 return -EMSGSIZE;
639 } else {
640 vinfo.vid = dump->begin;
641 vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_BEGIN;
642 if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
643 sizeof(vinfo), &vinfo))
644 return -EMSGSIZE;
645 vinfo.vid = dump->end;
646 vinfo.flags &= ~BRIDGE_VLAN_INFO_RANGE_BEGIN;
647 vinfo.flags |= BRIDGE_VLAN_INFO_RANGE_END;
648 if (nla_put(dump->skb, IFLA_BRIDGE_VLAN_INFO,
649 sizeof(vinfo), &vinfo))
650 return -EMSGSIZE;
651 }
652
653 return 0;
654}
655
Jiri Pirko648b4a92015-10-01 11:03:45 +0200656static int switchdev_port_vlan_dump_cb(struct switchdev_obj *obj)
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700657{
Jiri Pirko648b4a92015-10-01 11:03:45 +0200658 struct switchdev_obj_port_vlan *vlan = SWITCHDEV_OBJ_PORT_VLAN(obj);
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700659 struct switchdev_vlan_dump *dump =
Vivien Didelot25f07ad2015-09-29 12:07:16 -0400660 container_of(vlan, struct switchdev_vlan_dump, vlan);
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700661 int err = 0;
662
663 if (vlan->vid_begin > vlan->vid_end)
664 return -EINVAL;
665
666 if (dump->filter_mask & RTEXT_FILTER_BRVLAN) {
667 dump->flags = vlan->flags;
668 for (dump->begin = dump->end = vlan->vid_begin;
669 dump->begin <= vlan->vid_end;
670 dump->begin++, dump->end++) {
Vivien Didelote23b0022015-09-29 12:07:13 -0400671 err = switchdev_port_vlan_dump_put(dump);
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700672 if (err)
673 return err;
674 }
675 } else if (dump->filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED) {
676 if (dump->begin > vlan->vid_begin &&
677 dump->begin >= vlan->vid_end) {
678 if ((dump->begin - 1) == vlan->vid_end &&
679 dump->flags == vlan->flags) {
680 /* prepend */
681 dump->begin = vlan->vid_begin;
682 } else {
Vivien Didelote23b0022015-09-29 12:07:13 -0400683 err = switchdev_port_vlan_dump_put(dump);
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700684 dump->flags = vlan->flags;
685 dump->begin = vlan->vid_begin;
686 dump->end = vlan->vid_end;
687 }
688 } else if (dump->end <= vlan->vid_begin &&
689 dump->end < vlan->vid_end) {
690 if ((dump->end + 1) == vlan->vid_begin &&
691 dump->flags == vlan->flags) {
692 /* append */
693 dump->end = vlan->vid_end;
694 } else {
Vivien Didelote23b0022015-09-29 12:07:13 -0400695 err = switchdev_port_vlan_dump_put(dump);
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700696 dump->flags = vlan->flags;
697 dump->begin = vlan->vid_begin;
698 dump->end = vlan->vid_end;
699 }
700 } else {
701 err = -EINVAL;
702 }
703 }
704
705 return err;
706}
707
708static int switchdev_port_vlan_fill(struct sk_buff *skb, struct net_device *dev,
709 u32 filter_mask)
710{
711 struct switchdev_vlan_dump dump = {
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200712 .vlan.obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700713 .skb = skb,
714 .filter_mask = filter_mask,
715 };
716 int err = 0;
717
718 if ((filter_mask & RTEXT_FILTER_BRVLAN) ||
719 (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)) {
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200720 err = switchdev_port_obj_dump(dev, &dump.vlan.obj,
Vivien Didelot25f07ad2015-09-29 12:07:16 -0400721 switchdev_port_vlan_dump_cb);
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700722 if (err)
723 goto err_out;
724 if (filter_mask & RTEXT_FILTER_BRVLAN_COMPRESSED)
725 /* last one */
Vivien Didelote23b0022015-09-29 12:07:13 -0400726 err = switchdev_port_vlan_dump_put(&dump);
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700727 }
728
729err_out:
730 return err == -EOPNOTSUPP ? 0 : err;
731}
732
Scott Feldman8793d0a2015-05-10 09:48:04 -0700733/**
734 * switchdev_port_bridge_getlink - Get bridge port attributes
735 *
736 * @dev: port device
737 *
738 * Called for SELF on rtnl_bridge_getlink to get bridge port
739 * attributes.
740 */
741int switchdev_port_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
742 struct net_device *dev, u32 filter_mask,
743 int nlflags)
744{
745 struct switchdev_attr attr = {
Jiri Pirko1f868392015-10-01 11:03:42 +0200746 .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
Scott Feldman8793d0a2015-05-10 09:48:04 -0700747 };
748 u16 mode = BRIDGE_MODE_UNDEF;
749 u32 mask = BR_LEARNING | BR_LEARNING_SYNC;
750 int err;
751
752 err = switchdev_port_attr_get(dev, &attr);
Vivien Didelot5c8079d2015-06-23 10:26:04 -0400753 if (err && err != -EOPNOTSUPP)
Scott Feldman8793d0a2015-05-10 09:48:04 -0700754 return err;
755
756 return ndo_dflt_bridge_getlink(skb, pid, seq, dev, mode,
Scott Feldman7d4f8d82015-06-22 00:27:17 -0700757 attr.u.brport_flags, mask, nlflags,
758 filter_mask, switchdev_port_vlan_fill);
Scott Feldman8793d0a2015-05-10 09:48:04 -0700759}
760EXPORT_SYMBOL_GPL(switchdev_port_bridge_getlink);
761
Scott Feldman47f83282015-05-10 09:47:56 -0700762static int switchdev_port_br_setflag(struct net_device *dev,
763 struct nlattr *nlattr,
764 unsigned long brport_flag)
765{
766 struct switchdev_attr attr = {
Jiri Pirko1f868392015-10-01 11:03:42 +0200767 .id = SWITCHDEV_ATTR_ID_PORT_BRIDGE_FLAGS,
Scott Feldman47f83282015-05-10 09:47:56 -0700768 };
769 u8 flag = nla_get_u8(nlattr);
770 int err;
771
772 err = switchdev_port_attr_get(dev, &attr);
773 if (err)
774 return err;
775
776 if (flag)
Scott Feldman42275bd2015-05-13 11:16:50 -0700777 attr.u.brport_flags |= brport_flag;
Scott Feldman47f83282015-05-10 09:47:56 -0700778 else
Scott Feldman42275bd2015-05-13 11:16:50 -0700779 attr.u.brport_flags &= ~brport_flag;
Scott Feldman47f83282015-05-10 09:47:56 -0700780
781 return switchdev_port_attr_set(dev, &attr);
782}
783
784static const struct nla_policy
785switchdev_port_bridge_policy[IFLA_BRPORT_MAX + 1] = {
786 [IFLA_BRPORT_STATE] = { .type = NLA_U8 },
787 [IFLA_BRPORT_COST] = { .type = NLA_U32 },
788 [IFLA_BRPORT_PRIORITY] = { .type = NLA_U16 },
789 [IFLA_BRPORT_MODE] = { .type = NLA_U8 },
790 [IFLA_BRPORT_GUARD] = { .type = NLA_U8 },
791 [IFLA_BRPORT_PROTECT] = { .type = NLA_U8 },
792 [IFLA_BRPORT_FAST_LEAVE] = { .type = NLA_U8 },
793 [IFLA_BRPORT_LEARNING] = { .type = NLA_U8 },
794 [IFLA_BRPORT_LEARNING_SYNC] = { .type = NLA_U8 },
795 [IFLA_BRPORT_UNICAST_FLOOD] = { .type = NLA_U8 },
796};
797
798static int switchdev_port_br_setlink_protinfo(struct net_device *dev,
799 struct nlattr *protinfo)
800{
801 struct nlattr *attr;
802 int rem;
803 int err;
804
805 err = nla_validate_nested(protinfo, IFLA_BRPORT_MAX,
806 switchdev_port_bridge_policy);
807 if (err)
808 return err;
809
810 nla_for_each_nested(attr, protinfo, rem) {
811 switch (nla_type(attr)) {
812 case IFLA_BRPORT_LEARNING:
813 err = switchdev_port_br_setflag(dev, attr,
814 BR_LEARNING);
815 break;
816 case IFLA_BRPORT_LEARNING_SYNC:
817 err = switchdev_port_br_setflag(dev, attr,
818 BR_LEARNING_SYNC);
819 break;
820 default:
821 err = -EOPNOTSUPP;
822 break;
823 }
824 if (err)
825 return err;
826 }
827
828 return 0;
829}
830
831static int switchdev_port_br_afspec(struct net_device *dev,
832 struct nlattr *afspec,
833 int (*f)(struct net_device *dev,
Jiri Pirko648b4a92015-10-01 11:03:45 +0200834 const struct switchdev_obj *obj))
Scott Feldman47f83282015-05-10 09:47:56 -0700835{
836 struct nlattr *attr;
837 struct bridge_vlan_info *vinfo;
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200838 struct switchdev_obj_port_vlan vlan = {
839 .obj.id = SWITCHDEV_OBJ_ID_PORT_VLAN,
840 };
Scott Feldman47f83282015-05-10 09:47:56 -0700841 int rem;
842 int err;
843
844 nla_for_each_nested(attr, afspec, rem) {
845 if (nla_type(attr) != IFLA_BRIDGE_VLAN_INFO)
846 continue;
847 if (nla_len(attr) != sizeof(struct bridge_vlan_info))
848 return -EINVAL;
849 vinfo = nla_data(attr);
Nikolay Aleksandrov87aaf2c2015-10-12 14:31:01 +0200850 if (!vinfo->vid || vinfo->vid >= VLAN_VID_MASK)
851 return -EINVAL;
Vivien Didelotab069002015-09-29 12:07:17 -0400852 vlan.flags = vinfo->flags;
Scott Feldman47f83282015-05-10 09:47:56 -0700853 if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_BEGIN) {
Vivien Didelotab069002015-09-29 12:07:17 -0400854 if (vlan.vid_begin)
Scott Feldman47f83282015-05-10 09:47:56 -0700855 return -EINVAL;
Vivien Didelotab069002015-09-29 12:07:17 -0400856 vlan.vid_begin = vinfo->vid;
Nikolay Aleksandrovcc02aa82015-10-12 14:01:39 +0200857 /* don't allow range of pvids */
858 if (vlan.flags & BRIDGE_VLAN_INFO_PVID)
859 return -EINVAL;
Scott Feldman47f83282015-05-10 09:47:56 -0700860 } else if (vinfo->flags & BRIDGE_VLAN_INFO_RANGE_END) {
Vivien Didelotab069002015-09-29 12:07:17 -0400861 if (!vlan.vid_begin)
Scott Feldman47f83282015-05-10 09:47:56 -0700862 return -EINVAL;
Vivien Didelotab069002015-09-29 12:07:17 -0400863 vlan.vid_end = vinfo->vid;
864 if (vlan.vid_end <= vlan.vid_begin)
Scott Feldman47f83282015-05-10 09:47:56 -0700865 return -EINVAL;
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200866 err = f(dev, &vlan.obj);
Scott Feldman47f83282015-05-10 09:47:56 -0700867 if (err)
868 return err;
Vivien Didelotab069002015-09-29 12:07:17 -0400869 memset(&vlan, 0, sizeof(vlan));
Scott Feldman47f83282015-05-10 09:47:56 -0700870 } else {
Vivien Didelotab069002015-09-29 12:07:17 -0400871 if (vlan.vid_begin)
Scott Feldman47f83282015-05-10 09:47:56 -0700872 return -EINVAL;
Vivien Didelotab069002015-09-29 12:07:17 -0400873 vlan.vid_begin = vinfo->vid;
874 vlan.vid_end = vinfo->vid;
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200875 err = f(dev, &vlan.obj);
Scott Feldman47f83282015-05-10 09:47:56 -0700876 if (err)
877 return err;
Vivien Didelotab069002015-09-29 12:07:17 -0400878 memset(&vlan, 0, sizeof(vlan));
Scott Feldman47f83282015-05-10 09:47:56 -0700879 }
880 }
881
882 return 0;
883}
884
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800885/**
Scott Feldman47f83282015-05-10 09:47:56 -0700886 * switchdev_port_bridge_setlink - Set bridge port attributes
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800887 *
888 * @dev: port device
Scott Feldman47f83282015-05-10 09:47:56 -0700889 * @nlh: netlink header
890 * @flags: netlink flags
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800891 *
Scott Feldman47f83282015-05-10 09:47:56 -0700892 * Called for SELF on rtnl_bridge_setlink to set bridge port
893 * attributes.
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800894 */
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700895int switchdev_port_bridge_setlink(struct net_device *dev,
896 struct nlmsghdr *nlh, u16 flags)
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800897{
Scott Feldman47f83282015-05-10 09:47:56 -0700898 struct nlattr *protinfo;
899 struct nlattr *afspec;
900 int err = 0;
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800901
Scott Feldman47f83282015-05-10 09:47:56 -0700902 protinfo = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
903 IFLA_PROTINFO);
904 if (protinfo) {
905 err = switchdev_port_br_setlink_protinfo(dev, protinfo);
906 if (err)
907 return err;
908 }
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800909
Scott Feldman47f83282015-05-10 09:47:56 -0700910 afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
911 IFLA_AF_SPEC);
912 if (afspec)
913 err = switchdev_port_br_afspec(dev, afspec,
914 switchdev_port_obj_add);
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800915
Scott Feldman47f83282015-05-10 09:47:56 -0700916 return err;
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800917}
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700918EXPORT_SYMBOL_GPL(switchdev_port_bridge_setlink);
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800919
920/**
Scott Feldman5c34e022015-05-10 09:48:00 -0700921 * switchdev_port_bridge_dellink - Set bridge port attributes
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800922 *
923 * @dev: port device
Scott Feldman5c34e022015-05-10 09:48:00 -0700924 * @nlh: netlink header
925 * @flags: netlink flags
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800926 *
Scott Feldman5c34e022015-05-10 09:48:00 -0700927 * Called for SELF on rtnl_bridge_dellink to set bridge port
928 * attributes.
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800929 */
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700930int switchdev_port_bridge_dellink(struct net_device *dev,
931 struct nlmsghdr *nlh, u16 flags)
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800932{
Scott Feldman5c34e022015-05-10 09:48:00 -0700933 struct nlattr *afspec;
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800934
Scott Feldman5c34e022015-05-10 09:48:00 -0700935 afspec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg),
936 IFLA_AF_SPEC);
937 if (afspec)
938 return switchdev_port_br_afspec(dev, afspec,
939 switchdev_port_obj_del);
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800940
Scott Feldman5c34e022015-05-10 09:48:00 -0700941 return 0;
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800942}
Jiri Pirkoebb9a032015-05-10 09:47:46 -0700943EXPORT_SYMBOL_GPL(switchdev_port_bridge_dellink);
Roopa Prabhu8a44dbb2015-01-29 22:40:13 -0800944
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700945/**
946 * switchdev_port_fdb_add - Add FDB (MAC/VLAN) entry to port
947 *
948 * @ndmsg: netlink hdr
949 * @nlattr: netlink attributes
950 * @dev: port device
951 * @addr: MAC address to add
952 * @vid: VLAN to add
953 *
954 * Add FDB entry to switch device.
955 */
956int switchdev_port_fdb_add(struct ndmsg *ndm, struct nlattr *tb[],
957 struct net_device *dev, const unsigned char *addr,
958 u16 vid, u16 nlm_flags)
959{
Jiri Pirko52ba57c2015-10-01 11:03:44 +0200960 struct switchdev_obj_port_fdb fdb = {
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200961 .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
Vivien Didelotab069002015-09-29 12:07:17 -0400962 .vid = vid,
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700963 };
964
Jiri Pirko850d0cb2015-10-14 19:40:51 +0200965 ether_addr_copy(fdb.addr, addr);
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200966 return switchdev_port_obj_add(dev, &fdb.obj);
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700967}
968EXPORT_SYMBOL_GPL(switchdev_port_fdb_add);
969
970/**
971 * switchdev_port_fdb_del - Delete FDB (MAC/VLAN) entry from port
972 *
973 * @ndmsg: netlink hdr
974 * @nlattr: netlink attributes
975 * @dev: port device
976 * @addr: MAC address to delete
977 * @vid: VLAN to delete
978 *
979 * Delete FDB entry from switch device.
980 */
981int switchdev_port_fdb_del(struct ndmsg *ndm, struct nlattr *tb[],
982 struct net_device *dev, const unsigned char *addr,
983 u16 vid)
984{
Jiri Pirko52ba57c2015-10-01 11:03:44 +0200985 struct switchdev_obj_port_fdb fdb = {
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200986 .obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
Vivien Didelotab069002015-09-29 12:07:17 -0400987 .vid = vid,
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700988 };
989
Jiri Pirko850d0cb2015-10-14 19:40:51 +0200990 ether_addr_copy(fdb.addr, addr);
Jiri Pirko9e8f4a52015-10-01 11:03:46 +0200991 return switchdev_port_obj_del(dev, &fdb.obj);
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700992}
993EXPORT_SYMBOL_GPL(switchdev_port_fdb_del);
994
995struct switchdev_fdb_dump {
Jiri Pirko52ba57c2015-10-01 11:03:44 +0200996 struct switchdev_obj_port_fdb fdb;
Vivien Didelote02a06b2015-09-29 12:07:14 -0400997 struct net_device *dev;
Samudrala, Sridhar45d41222015-05-13 21:55:43 -0700998 struct sk_buff *skb;
999 struct netlink_callback *cb;
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001000 int idx;
1001};
1002
Jiri Pirko648b4a92015-10-01 11:03:45 +02001003static int switchdev_port_fdb_dump_cb(struct switchdev_obj *obj)
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001004{
Jiri Pirko648b4a92015-10-01 11:03:45 +02001005 struct switchdev_obj_port_fdb *fdb = SWITCHDEV_OBJ_PORT_FDB(obj);
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001006 struct switchdev_fdb_dump *dump =
Vivien Didelot25f07ad2015-09-29 12:07:16 -04001007 container_of(fdb, struct switchdev_fdb_dump, fdb);
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001008 u32 portid = NETLINK_CB(dump->cb->skb).portid;
1009 u32 seq = dump->cb->nlh->nlmsg_seq;
1010 struct nlmsghdr *nlh;
1011 struct ndmsg *ndm;
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001012
1013 if (dump->idx < dump->cb->args[0])
1014 goto skip;
1015
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001016 nlh = nlmsg_put(dump->skb, portid, seq, RTM_NEWNEIGH,
1017 sizeof(*ndm), NLM_F_MULTI);
1018 if (!nlh)
1019 return -EMSGSIZE;
1020
1021 ndm = nlmsg_data(nlh);
1022 ndm->ndm_family = AF_BRIDGE;
1023 ndm->ndm_pad1 = 0;
1024 ndm->ndm_pad2 = 0;
1025 ndm->ndm_flags = NTF_SELF;
1026 ndm->ndm_type = 0;
Vivien Didelote02a06b2015-09-29 12:07:14 -04001027 ndm->ndm_ifindex = dump->dev->ifindex;
Vivien Didelot25f07ad2015-09-29 12:07:16 -04001028 ndm->ndm_state = fdb->ndm_state;
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001029
Vivien Didelot25f07ad2015-09-29 12:07:16 -04001030 if (nla_put(dump->skb, NDA_LLADDR, ETH_ALEN, fdb->addr))
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001031 goto nla_put_failure;
1032
Vivien Didelot25f07ad2015-09-29 12:07:16 -04001033 if (fdb->vid && nla_put_u16(dump->skb, NDA_VLAN, fdb->vid))
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001034 goto nla_put_failure;
1035
1036 nlmsg_end(dump->skb, nlh);
1037
1038skip:
1039 dump->idx++;
1040 return 0;
1041
1042nla_put_failure:
1043 nlmsg_cancel(dump->skb, nlh);
1044 return -EMSGSIZE;
1045}
1046
1047/**
1048 * switchdev_port_fdb_dump - Dump port FDB (MAC/VLAN) entries
1049 *
1050 * @skb: netlink skb
1051 * @cb: netlink callback
1052 * @dev: port device
1053 * @filter_dev: filter device
1054 * @idx:
1055 *
1056 * Delete FDB entry from switch device.
1057 */
1058int switchdev_port_fdb_dump(struct sk_buff *skb, struct netlink_callback *cb,
1059 struct net_device *dev,
1060 struct net_device *filter_dev, int idx)
1061{
1062 struct switchdev_fdb_dump dump = {
Jiri Pirko9e8f4a52015-10-01 11:03:46 +02001063 .fdb.obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
Vivien Didelote02a06b2015-09-29 12:07:14 -04001064 .dev = dev,
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001065 .skb = skb,
1066 .cb = cb,
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001067 .idx = idx,
1068 };
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001069
Jiri Pirko9e8f4a52015-10-01 11:03:46 +02001070 switchdev_port_obj_dump(dev, &dump.fdb.obj, switchdev_port_fdb_dump_cb);
Samudrala, Sridhar45d41222015-05-13 21:55:43 -07001071 return dump.idx;
1072}
1073EXPORT_SYMBOL_GPL(switchdev_port_fdb_dump);
1074
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001075static struct net_device *switchdev_get_lowest_dev(struct net_device *dev)
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001076{
Jiri Pirko9d47c0a2015-05-10 09:47:47 -07001077 const struct switchdev_ops *ops = dev->switchdev_ops;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001078 struct net_device *lower_dev;
1079 struct net_device *port_dev;
1080 struct list_head *iter;
1081
1082 /* Recusively search down until we find a sw port dev.
Scott Feldmanf8e20a92015-05-10 09:47:49 -07001083 * (A sw port dev supports switchdev_port_attr_get).
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001084 */
1085
Scott Feldmanf8e20a92015-05-10 09:47:49 -07001086 if (ops && ops->switchdev_port_attr_get)
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001087 return dev;
1088
1089 netdev_for_each_lower_dev(dev, lower_dev, iter) {
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001090 port_dev = switchdev_get_lowest_dev(lower_dev);
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001091 if (port_dev)
1092 return port_dev;
1093 }
1094
1095 return NULL;
1096}
1097
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001098static struct net_device *switchdev_get_dev_by_nhs(struct fib_info *fi)
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001099{
Scott Feldmanf8e20a92015-05-10 09:47:49 -07001100 struct switchdev_attr attr = {
Jiri Pirko1f868392015-10-01 11:03:42 +02001101 .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
Scott Feldmanf8e20a92015-05-10 09:47:49 -07001102 };
1103 struct switchdev_attr prev_attr;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001104 struct net_device *dev = NULL;
1105 int nhsel;
1106
Jiri Pirko771acac2015-10-14 19:40:55 +02001107 ASSERT_RTNL();
1108
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001109 /* For this route, all nexthop devs must be on the same switch. */
1110
1111 for (nhsel = 0; nhsel < fi->fib_nhs; nhsel++) {
1112 const struct fib_nh *nh = &fi->fib_nh[nhsel];
1113
1114 if (!nh->nh_dev)
1115 return NULL;
1116
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001117 dev = switchdev_get_lowest_dev(nh->nh_dev);
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001118 if (!dev)
1119 return NULL;
1120
Scott Feldmanf8e20a92015-05-10 09:47:49 -07001121 if (switchdev_port_attr_get(dev, &attr))
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001122 return NULL;
1123
Scott Feldmand754f982015-07-18 18:24:49 -07001124 if (nhsel > 0 &&
1125 !netdev_phys_item_id_same(&prev_attr.u.ppid, &attr.u.ppid))
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001126 return NULL;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001127
Scott Feldmanf8e20a92015-05-10 09:47:49 -07001128 prev_attr = attr;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001129 }
1130
1131 return dev;
1132}
1133
Scott Feldman5e8d9042015-03-05 21:21:15 -08001134/**
Scott Feldman7616dcb2015-06-03 20:43:43 -07001135 * switchdev_fib_ipv4_add - Add/modify switch IPv4 route entry
Scott Feldman5e8d9042015-03-05 21:21:15 -08001136 *
1137 * @dst: route's IPv4 destination address
1138 * @dst_len: destination address length (prefix length)
1139 * @fi: route FIB info structure
1140 * @tos: route TOS
1141 * @type: route type
Scott Feldmanf8f21472015-03-09 13:59:09 -07001142 * @nlflags: netlink flags passed in (NLM_F_*)
Scott Feldman5e8d9042015-03-05 21:21:15 -08001143 * @tb_id: route table ID
1144 *
Scott Feldman7616dcb2015-06-03 20:43:43 -07001145 * Add/modify switch IPv4 route entry.
Scott Feldman5e8d9042015-03-05 21:21:15 -08001146 */
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001147int switchdev_fib_ipv4_add(u32 dst, int dst_len, struct fib_info *fi,
1148 u8 tos, u8 type, u32 nlflags, u32 tb_id)
Scott Feldman5e8d9042015-03-05 21:21:15 -08001149{
Vivien Didelotab069002015-09-29 12:07:17 -04001150 struct switchdev_obj_ipv4_fib ipv4_fib = {
Jiri Pirko9e8f4a52015-10-01 11:03:46 +02001151 .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
Vivien Didelotab069002015-09-29 12:07:17 -04001152 .dst = dst,
1153 .dst_len = dst_len,
Vivien Didelotab069002015-09-29 12:07:17 -04001154 .tos = tos,
1155 .type = type,
1156 .nlflags = nlflags,
1157 .tb_id = tb_id,
Scott Feldman58c2cb12015-05-10 09:48:06 -07001158 };
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001159 struct net_device *dev;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001160 int err = 0;
1161
Jiri Pirko850d0cb2015-10-14 19:40:51 +02001162 memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
1163
Scott Feldman8e05fd72015-03-05 21:21:19 -08001164 /* Don't offload route if using custom ip rules or if
1165 * IPv4 FIB offloading has been disabled completely.
1166 */
1167
Scott Feldmane1315db2015-03-06 01:14:36 -08001168#ifdef CONFIG_IP_MULTIPLE_TABLES
1169 if (fi->fib_net->ipv4.fib_has_custom_rules)
1170 return 0;
1171#endif
1172
1173 if (fi->fib_net->ipv4.fib_offload_disabled)
Scott Feldman104616e2015-03-05 21:21:16 -08001174 return 0;
1175
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001176 dev = switchdev_get_dev_by_nhs(fi);
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001177 if (!dev)
1178 return 0;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001179
Jiri Pirko9e8f4a52015-10-01 11:03:46 +02001180 err = switchdev_port_obj_add(dev, &ipv4_fib.obj);
Scott Feldman58c2cb12015-05-10 09:48:06 -07001181 if (!err)
David S. Miller36583eb2015-05-23 01:22:35 -04001182 fi->fib_flags |= RTNH_F_OFFLOAD;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001183
Scott Feldmanaf201f72015-06-10 17:04:49 -07001184 return err == -EOPNOTSUPP ? 0 : err;
Scott Feldman5e8d9042015-03-05 21:21:15 -08001185}
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001186EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_add);
Scott Feldman5e8d9042015-03-05 21:21:15 -08001187
1188/**
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001189 * switchdev_fib_ipv4_del - Delete IPv4 route entry from switch
Scott Feldman5e8d9042015-03-05 21:21:15 -08001190 *
1191 * @dst: route's IPv4 destination address
1192 * @dst_len: destination address length (prefix length)
1193 * @fi: route FIB info structure
1194 * @tos: route TOS
1195 * @type: route type
1196 * @tb_id: route table ID
1197 *
1198 * Delete IPv4 route entry from switch device.
1199 */
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001200int switchdev_fib_ipv4_del(u32 dst, int dst_len, struct fib_info *fi,
1201 u8 tos, u8 type, u32 tb_id)
Scott Feldman5e8d9042015-03-05 21:21:15 -08001202{
Vivien Didelotab069002015-09-29 12:07:17 -04001203 struct switchdev_obj_ipv4_fib ipv4_fib = {
Jiri Pirko9e8f4a52015-10-01 11:03:46 +02001204 .obj.id = SWITCHDEV_OBJ_ID_IPV4_FIB,
Vivien Didelotab069002015-09-29 12:07:17 -04001205 .dst = dst,
1206 .dst_len = dst_len,
Vivien Didelotab069002015-09-29 12:07:17 -04001207 .tos = tos,
1208 .type = type,
1209 .nlflags = 0,
1210 .tb_id = tb_id,
Scott Feldman58c2cb12015-05-10 09:48:06 -07001211 };
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001212 struct net_device *dev;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001213 int err = 0;
1214
Jiri Pirko850d0cb2015-10-14 19:40:51 +02001215 memcpy(&ipv4_fib.fi, fi, sizeof(ipv4_fib.fi));
1216
Roopa Prabhueea39942015-05-13 21:17:41 -07001217 if (!(fi->fib_flags & RTNH_F_OFFLOAD))
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001218 return 0;
1219
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001220 dev = switchdev_get_dev_by_nhs(fi);
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001221 if (!dev)
1222 return 0;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001223
Jiri Pirko9e8f4a52015-10-01 11:03:46 +02001224 err = switchdev_port_obj_del(dev, &ipv4_fib.obj);
Scott Feldman58c2cb12015-05-10 09:48:06 -07001225 if (!err)
David S. Miller36583eb2015-05-23 01:22:35 -04001226 fi->fib_flags &= ~RTNH_F_OFFLOAD;
Scott Feldmanb5d6fbd2015-03-05 21:21:17 -08001227
Scott Feldmanaf201f72015-06-10 17:04:49 -07001228 return err == -EOPNOTSUPP ? 0 : err;
Scott Feldman5e8d9042015-03-05 21:21:15 -08001229}
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001230EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_del);
Scott Feldman8e05fd72015-03-05 21:21:19 -08001231
1232/**
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001233 * switchdev_fib_ipv4_abort - Abort an IPv4 FIB operation
Scott Feldman8e05fd72015-03-05 21:21:19 -08001234 *
1235 * @fi: route FIB info structure
1236 */
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001237void switchdev_fib_ipv4_abort(struct fib_info *fi)
Scott Feldman8e05fd72015-03-05 21:21:19 -08001238{
1239 /* There was a problem installing this route to the offload
1240 * device. For now, until we come up with more refined
1241 * policy handling, abruptly end IPv4 fib offloading for
1242 * for entire net by flushing offload device(s) of all
1243 * IPv4 routes, and mark IPv4 fib offloading broken from
1244 * this point forward.
1245 */
1246
1247 fib_flush_external(fi->fib_net);
1248 fi->fib_net->ipv4.fib_offload_disabled = true;
1249}
Jiri Pirkoebb9a032015-05-10 09:47:46 -07001250EXPORT_SYMBOL_GPL(switchdev_fib_ipv4_abort);
Scott Feldman1a3b2ec2015-07-18 18:24:50 -07001251
1252static bool switchdev_port_same_parent_id(struct net_device *a,
1253 struct net_device *b)
1254{
1255 struct switchdev_attr a_attr = {
Jiri Pirko1f868392015-10-01 11:03:42 +02001256 .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
Scott Feldman1a3b2ec2015-07-18 18:24:50 -07001257 .flags = SWITCHDEV_F_NO_RECURSE,
1258 };
1259 struct switchdev_attr b_attr = {
Jiri Pirko1f868392015-10-01 11:03:42 +02001260 .id = SWITCHDEV_ATTR_ID_PORT_PARENT_ID,
Scott Feldman1a3b2ec2015-07-18 18:24:50 -07001261 .flags = SWITCHDEV_F_NO_RECURSE,
1262 };
1263
1264 if (switchdev_port_attr_get(a, &a_attr) ||
1265 switchdev_port_attr_get(b, &b_attr))
1266 return false;
1267
1268 return netdev_phys_item_id_same(&a_attr.u.ppid, &b_attr.u.ppid);
1269}
1270
1271static u32 switchdev_port_fwd_mark_get(struct net_device *dev,
1272 struct net_device *group_dev)
1273{
1274 struct net_device *lower_dev;
1275 struct list_head *iter;
1276
1277 netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
1278 if (lower_dev == dev)
1279 continue;
1280 if (switchdev_port_same_parent_id(dev, lower_dev))
1281 return lower_dev->offload_fwd_mark;
1282 return switchdev_port_fwd_mark_get(dev, lower_dev);
1283 }
1284
1285 return dev->ifindex;
1286}
1287
1288static void switchdev_port_fwd_mark_reset(struct net_device *group_dev,
1289 u32 old_mark, u32 *reset_mark)
1290{
1291 struct net_device *lower_dev;
1292 struct list_head *iter;
1293
1294 netdev_for_each_lower_dev(group_dev, lower_dev, iter) {
1295 if (lower_dev->offload_fwd_mark == old_mark) {
1296 if (!*reset_mark)
1297 *reset_mark = lower_dev->ifindex;
1298 lower_dev->offload_fwd_mark = *reset_mark;
1299 }
1300 switchdev_port_fwd_mark_reset(lower_dev, old_mark, reset_mark);
1301 }
1302}
1303
1304/**
1305 * switchdev_port_fwd_mark_set - Set port offload forwarding mark
1306 *
1307 * @dev: port device
1308 * @group_dev: containing device
1309 * @joining: true if dev is joining group; false if leaving group
1310 *
1311 * An ungrouped port's offload mark is just its ifindex. A grouped
1312 * port's (member of a bridge, for example) offload mark is the ifindex
1313 * of one of the ports in the group with the same parent (switch) ID.
1314 * Ports on the same device in the same group will have the same mark.
1315 *
1316 * Example:
1317 *
1318 * br0 ifindex=9
1319 * sw1p1 ifindex=2 mark=2
1320 * sw1p2 ifindex=3 mark=2
1321 * sw2p1 ifindex=4 mark=5
1322 * sw2p2 ifindex=5 mark=5
1323 *
1324 * If sw2p2 leaves the bridge, we'll have:
1325 *
1326 * br0 ifindex=9
1327 * sw1p1 ifindex=2 mark=2
1328 * sw1p2 ifindex=3 mark=2
1329 * sw2p1 ifindex=4 mark=4
1330 * sw2p2 ifindex=5 mark=5
1331 */
1332void switchdev_port_fwd_mark_set(struct net_device *dev,
1333 struct net_device *group_dev,
1334 bool joining)
1335{
1336 u32 mark = dev->ifindex;
1337 u32 reset_mark = 0;
1338
Jiri Pirko771acac2015-10-14 19:40:55 +02001339 if (group_dev) {
1340 ASSERT_RTNL();
1341 if (joining)
1342 mark = switchdev_port_fwd_mark_get(dev, group_dev);
1343 else if (dev->offload_fwd_mark == mark)
Scott Feldman1a3b2ec2015-07-18 18:24:50 -07001344 /* Ohoh, this port was the mark reference port,
1345 * but it's leaving the group, so reset the
1346 * mark for the remaining ports in the group.
1347 */
1348 switchdev_port_fwd_mark_reset(group_dev, mark,
1349 &reset_mark);
1350 }
1351
1352 dev->offload_fwd_mark = mark;
1353}
1354EXPORT_SYMBOL_GPL(switchdev_port_fwd_mark_set);