]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blame - drivers/net/ethernet/mellanox/mlxsw/spectrum_router.c
mlxsw: spectrum_router: Generalize __mlxsw_sp_ipip_entry_update_tunnel()
[mirror_ubuntu-jammy-kernel.git] / drivers / net / ethernet / mellanox / mlxsw / spectrum_router.c
CommitLineData
464dce18
IS
1/*
2 * drivers/net/ethernet/mellanox/mlxsw/spectrum_router.c
6ddb7426 3 * Copyright (c) 2016-2017 Mellanox Technologies. All rights reserved.
464dce18
IS
4 * Copyright (c) 2016 Jiri Pirko <jiri@mellanox.com>
5 * Copyright (c) 2016 Ido Schimmel <idosch@mellanox.com>
c723c735 6 * Copyright (c) 2016 Yotam Gigi <yotamg@mellanox.com>
6ddb7426 7 * Copyright (c) 2017 Petr Machata <petrm@mellanox.com>
464dce18
IS
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions are met:
11 *
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 * 3. Neither the names of the copyright holders nor the names of its
18 * contributors may be used to endorse or promote products derived from
19 * this software without specific prior written permission.
20 *
21 * Alternatively, this software may be distributed under the terms of the
22 * GNU General Public License ("GPL") version 2 as published by the Free
23 * Software Foundation.
24 *
25 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
26 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
28 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
29 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
31 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
32 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
33 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
34 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
35 * POSSIBILITY OF SUCH DAMAGE.
36 */
37
38#include <linux/kernel.h>
39#include <linux/types.h>
5e9c16cc
JP
40#include <linux/rhashtable.h>
41#include <linux/bitops.h>
42#include <linux/in6.h>
c723c735 43#include <linux/notifier.h>
df6dd79b 44#include <linux/inetdevice.h>
9db032bb 45#include <linux/netdevice.h>
03ea01e9 46#include <linux/if_bridge.h>
b5f3e0d4 47#include <linux/socket.h>
428b851f 48#include <linux/route.h>
eb789980 49#include <linux/gcd.h>
af658b6a 50#include <linux/random.h>
c723c735 51#include <net/netevent.h>
6cf3c971
JP
52#include <net/neighbour.h>
53#include <net/arp.h>
b45f64d1 54#include <net/ip_fib.h>
583419fd 55#include <net/ip6_fib.h>
5d7bfd14 56#include <net/fib_rules.h>
6ddb7426 57#include <net/ip_tunnels.h>
57837885 58#include <net/l3mdev.h>
5ea1237f 59#include <net/addrconf.h>
d5eb89cf
AS
60#include <net/ndisc.h>
61#include <net/ipv6.h>
04b1d4e5 62#include <net/fib_notifier.h>
464dce18
IS
63
64#include "spectrum.h"
65#include "core.h"
66#include "reg.h"
e0c0afd8
AS
67#include "spectrum_cnt.h"
68#include "spectrum_dpipe.h"
38ebc0f4 69#include "spectrum_ipip.h"
d42b0965
YG
70#include "spectrum_mr.h"
71#include "spectrum_mr_tcam.h"
e0c0afd8 72#include "spectrum_router.h"
464dce18 73
9011b677
IS
74struct mlxsw_sp_vr;
75struct mlxsw_sp_lpm_tree;
e4f3c1c1 76struct mlxsw_sp_rif_ops;
9011b677
IS
77
78struct mlxsw_sp_router {
79 struct mlxsw_sp *mlxsw_sp;
5f9efffb 80 struct mlxsw_sp_rif **rifs;
9011b677
IS
81 struct mlxsw_sp_vr *vrs;
82 struct rhashtable neigh_ht;
83 struct rhashtable nexthop_group_ht;
84 struct rhashtable nexthop_ht;
dbe4598c 85 struct list_head nexthop_list;
9011b677
IS
86 struct {
87 struct mlxsw_sp_lpm_tree *trees;
88 unsigned int tree_count;
89 } lpm;
90 struct {
91 struct delayed_work dw;
92 unsigned long interval; /* ms */
93 } neighs_update;
94 struct delayed_work nexthop_probe_dw;
95#define MLXSW_SP_UNRESOLVED_NH_PROBE_INTERVAL 5000 /* ms */
96 struct list_head nexthop_neighs_list;
1012b9ac 97 struct list_head ipip_list;
9011b677 98 bool aborted;
7e39d115 99 struct notifier_block fib_nb;
48fac885 100 struct notifier_block netevent_nb;
e4f3c1c1 101 const struct mlxsw_sp_rif_ops **rif_ops_arr;
38ebc0f4 102 const struct mlxsw_sp_ipip_ops **ipip_ops_arr;
9011b677
IS
103};
104
4724ba56
IS
105struct mlxsw_sp_rif {
106 struct list_head nexthop_list;
107 struct list_head neigh_list;
108 struct net_device *dev;
a1107487 109 struct mlxsw_sp_fid *fid;
4724ba56
IS
110 unsigned char addr[ETH_ALEN];
111 int mtu;
bf95233e 112 u16 rif_index;
6913229e 113 u16 vr_id;
e4f3c1c1
IS
114 const struct mlxsw_sp_rif_ops *ops;
115 struct mlxsw_sp *mlxsw_sp;
116
e0c0afd8
AS
117 unsigned int counter_ingress;
118 bool counter_ingress_valid;
119 unsigned int counter_egress;
120 bool counter_egress_valid;
4724ba56
IS
121};
122
e4f3c1c1
IS
123struct mlxsw_sp_rif_params {
124 struct net_device *dev;
125 union {
126 u16 system_port;
127 u16 lag_id;
128 };
129 u16 vid;
130 bool lag;
131};
132
4d93ceeb
IS
133struct mlxsw_sp_rif_subport {
134 struct mlxsw_sp_rif common;
135 union {
136 u16 system_port;
137 u16 lag_id;
138 };
139 u16 vid;
140 bool lag;
141};
142
6ddb7426
PM
143struct mlxsw_sp_rif_ipip_lb {
144 struct mlxsw_sp_rif common;
145 struct mlxsw_sp_rif_ipip_lb_config lb_config;
146 u16 ul_vr_id; /* Reserved for Spectrum-2. */
147};
148
149struct mlxsw_sp_rif_params_ipip_lb {
150 struct mlxsw_sp_rif_params common;
151 struct mlxsw_sp_rif_ipip_lb_config lb_config;
152};
153
e4f3c1c1
IS
154struct mlxsw_sp_rif_ops {
155 enum mlxsw_sp_rif_type type;
156 size_t rif_size;
157
158 void (*setup)(struct mlxsw_sp_rif *rif,
159 const struct mlxsw_sp_rif_params *params);
160 int (*configure)(struct mlxsw_sp_rif *rif);
161 void (*deconfigure)(struct mlxsw_sp_rif *rif);
162 struct mlxsw_sp_fid * (*fid_get)(struct mlxsw_sp_rif *rif);
163};
164
e0c0afd8
AS
165static unsigned int *
166mlxsw_sp_rif_p_counter_get(struct mlxsw_sp_rif *rif,
167 enum mlxsw_sp_rif_counter_dir dir)
168{
169 switch (dir) {
170 case MLXSW_SP_RIF_COUNTER_EGRESS:
171 return &rif->counter_egress;
172 case MLXSW_SP_RIF_COUNTER_INGRESS:
173 return &rif->counter_ingress;
174 }
175 return NULL;
176}
177
178static bool
179mlxsw_sp_rif_counter_valid_get(struct mlxsw_sp_rif *rif,
180 enum mlxsw_sp_rif_counter_dir dir)
181{
182 switch (dir) {
183 case MLXSW_SP_RIF_COUNTER_EGRESS:
184 return rif->counter_egress_valid;
185 case MLXSW_SP_RIF_COUNTER_INGRESS:
186 return rif->counter_ingress_valid;
187 }
188 return false;
189}
190
191static void
192mlxsw_sp_rif_counter_valid_set(struct mlxsw_sp_rif *rif,
193 enum mlxsw_sp_rif_counter_dir dir,
194 bool valid)
195{
196 switch (dir) {
197 case MLXSW_SP_RIF_COUNTER_EGRESS:
198 rif->counter_egress_valid = valid;
199 break;
200 case MLXSW_SP_RIF_COUNTER_INGRESS:
201 rif->counter_ingress_valid = valid;
202 break;
203 }
204}
205
206static int mlxsw_sp_rif_counter_edit(struct mlxsw_sp *mlxsw_sp, u16 rif_index,
207 unsigned int counter_index, bool enable,
208 enum mlxsw_sp_rif_counter_dir dir)
209{
210 char ritr_pl[MLXSW_REG_RITR_LEN];
211 bool is_egress = false;
212 int err;
213
214 if (dir == MLXSW_SP_RIF_COUNTER_EGRESS)
215 is_egress = true;
216 mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index);
217 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
218 if (err)
219 return err;
220
221 mlxsw_reg_ritr_counter_pack(ritr_pl, counter_index, enable,
222 is_egress);
223 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
224}
225
226int mlxsw_sp_rif_counter_value_get(struct mlxsw_sp *mlxsw_sp,
227 struct mlxsw_sp_rif *rif,
228 enum mlxsw_sp_rif_counter_dir dir, u64 *cnt)
229{
230 char ricnt_pl[MLXSW_REG_RICNT_LEN];
231 unsigned int *p_counter_index;
232 bool valid;
233 int err;
234
235 valid = mlxsw_sp_rif_counter_valid_get(rif, dir);
236 if (!valid)
237 return -EINVAL;
238
239 p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
240 if (!p_counter_index)
241 return -EINVAL;
242 mlxsw_reg_ricnt_pack(ricnt_pl, *p_counter_index,
243 MLXSW_REG_RICNT_OPCODE_NOP);
244 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ricnt), ricnt_pl);
245 if (err)
246 return err;
247 *cnt = mlxsw_reg_ricnt_good_unicast_packets_get(ricnt_pl);
248 return 0;
249}
250
251static int mlxsw_sp_rif_counter_clear(struct mlxsw_sp *mlxsw_sp,
252 unsigned int counter_index)
253{
254 char ricnt_pl[MLXSW_REG_RICNT_LEN];
255
256 mlxsw_reg_ricnt_pack(ricnt_pl, counter_index,
257 MLXSW_REG_RICNT_OPCODE_CLEAR);
258 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ricnt), ricnt_pl);
259}
260
261int mlxsw_sp_rif_counter_alloc(struct mlxsw_sp *mlxsw_sp,
262 struct mlxsw_sp_rif *rif,
263 enum mlxsw_sp_rif_counter_dir dir)
264{
265 unsigned int *p_counter_index;
266 int err;
267
268 p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
269 if (!p_counter_index)
270 return -EINVAL;
271 err = mlxsw_sp_counter_alloc(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
272 p_counter_index);
273 if (err)
274 return err;
275
276 err = mlxsw_sp_rif_counter_clear(mlxsw_sp, *p_counter_index);
277 if (err)
278 goto err_counter_clear;
279
280 err = mlxsw_sp_rif_counter_edit(mlxsw_sp, rif->rif_index,
281 *p_counter_index, true, dir);
282 if (err)
283 goto err_counter_edit;
284 mlxsw_sp_rif_counter_valid_set(rif, dir, true);
285 return 0;
286
287err_counter_edit:
288err_counter_clear:
289 mlxsw_sp_counter_free(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
290 *p_counter_index);
291 return err;
292}
293
294void mlxsw_sp_rif_counter_free(struct mlxsw_sp *mlxsw_sp,
295 struct mlxsw_sp_rif *rif,
296 enum mlxsw_sp_rif_counter_dir dir)
297{
298 unsigned int *p_counter_index;
299
6b1206bb
AS
300 if (!mlxsw_sp_rif_counter_valid_get(rif, dir))
301 return;
302
e0c0afd8
AS
303 p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
304 if (WARN_ON(!p_counter_index))
305 return;
306 mlxsw_sp_rif_counter_edit(mlxsw_sp, rif->rif_index,
307 *p_counter_index, false, dir);
308 mlxsw_sp_counter_free(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
309 *p_counter_index);
310 mlxsw_sp_rif_counter_valid_set(rif, dir, false);
311}
312
e4f3c1c1
IS
313static void mlxsw_sp_rif_counters_alloc(struct mlxsw_sp_rif *rif)
314{
315 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
316 struct devlink *devlink;
317
318 devlink = priv_to_devlink(mlxsw_sp->core);
319 if (!devlink_dpipe_table_counter_enabled(devlink,
320 MLXSW_SP_DPIPE_TABLE_NAME_ERIF))
321 return;
322 mlxsw_sp_rif_counter_alloc(mlxsw_sp, rif, MLXSW_SP_RIF_COUNTER_EGRESS);
323}
324
325static void mlxsw_sp_rif_counters_free(struct mlxsw_sp_rif *rif)
326{
327 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
328
329 mlxsw_sp_rif_counter_free(mlxsw_sp, rif, MLXSW_SP_RIF_COUNTER_EGRESS);
330}
331
4724ba56
IS
332static struct mlxsw_sp_rif *
333mlxsw_sp_rif_find_by_dev(const struct mlxsw_sp *mlxsw_sp,
334 const struct net_device *dev);
335
7dcc18ad 336#define MLXSW_SP_PREFIX_COUNT (sizeof(struct in6_addr) * BITS_PER_BYTE + 1)
9011b677
IS
337
338struct mlxsw_sp_prefix_usage {
339 DECLARE_BITMAP(b, MLXSW_SP_PREFIX_COUNT);
340};
341
53342023
JP
342#define mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage) \
343 for_each_set_bit(prefix, (prefix_usage)->b, MLXSW_SP_PREFIX_COUNT)
344
345static bool
346mlxsw_sp_prefix_usage_eq(struct mlxsw_sp_prefix_usage *prefix_usage1,
347 struct mlxsw_sp_prefix_usage *prefix_usage2)
348{
349 return !memcmp(prefix_usage1, prefix_usage2, sizeof(*prefix_usage1));
350}
351
6b75c480
JP
352static bool
353mlxsw_sp_prefix_usage_none(struct mlxsw_sp_prefix_usage *prefix_usage)
354{
355 struct mlxsw_sp_prefix_usage prefix_usage_none = {{ 0 } };
356
357 return mlxsw_sp_prefix_usage_eq(prefix_usage, &prefix_usage_none);
358}
359
360static void
361mlxsw_sp_prefix_usage_cpy(struct mlxsw_sp_prefix_usage *prefix_usage1,
362 struct mlxsw_sp_prefix_usage *prefix_usage2)
363{
364 memcpy(prefix_usage1, prefix_usage2, sizeof(*prefix_usage1));
365}
366
5e9c16cc
JP
367static void
368mlxsw_sp_prefix_usage_set(struct mlxsw_sp_prefix_usage *prefix_usage,
369 unsigned char prefix_len)
370{
371 set_bit(prefix_len, prefix_usage->b);
372}
373
374static void
375mlxsw_sp_prefix_usage_clear(struct mlxsw_sp_prefix_usage *prefix_usage,
376 unsigned char prefix_len)
377{
378 clear_bit(prefix_len, prefix_usage->b);
379}
380
381struct mlxsw_sp_fib_key {
382 unsigned char addr[sizeof(struct in6_addr)];
383 unsigned char prefix_len;
384};
385
61c503f9
JP
/* Kinds of FIB entry. */
enum mlxsw_sp_fib_entry_type {
	MLXSW_SP_FIB_ENTRY_TYPE_REMOTE,
	MLXSW_SP_FIB_ENTRY_TYPE_LOCAL,
	MLXSW_SP_FIB_ENTRY_TYPE_TRAP,

	/* Special case of local delivery: the packet is decapsulated on
	 * reception. There is deliberately no matching ENCAP type, since
	 * encapsulation is a property of a next hop rather than of a FIB
	 * entry. (A REMOTE entry may have several next hops, some of which
	 * may be encapsulating.)
	 */
	MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP,
};
399
a7ff87ac 400struct mlxsw_sp_nexthop_group;
9011b677 401struct mlxsw_sp_fib;
a7ff87ac 402
9aecce1c
IS
403struct mlxsw_sp_fib_node {
404 struct list_head entry_list;
b45f64d1 405 struct list_head list;
9aecce1c 406 struct rhash_head ht_node;
76610ebb 407 struct mlxsw_sp_fib *fib;
5e9c16cc 408 struct mlxsw_sp_fib_key key;
9aecce1c
IS
409};
410
4607f6d2
PM
411struct mlxsw_sp_fib_entry_decap {
412 struct mlxsw_sp_ipip_entry *ipip_entry;
413 u32 tunnel_index;
414};
415
9aecce1c
IS
416struct mlxsw_sp_fib_entry {
417 struct list_head list;
418 struct mlxsw_sp_fib_node *fib_node;
61c503f9 419 enum mlxsw_sp_fib_entry_type type;
a7ff87ac
JP
420 struct list_head nexthop_group_node;
421 struct mlxsw_sp_nexthop_group *nh_group;
4607f6d2 422 struct mlxsw_sp_fib_entry_decap decap; /* Valid for decap entries. */
5e9c16cc
JP
423};
424
4f1c7f1f
IS
425struct mlxsw_sp_fib4_entry {
426 struct mlxsw_sp_fib_entry common;
427 u32 tb_id;
428 u32 prio;
429 u8 tos;
430 u8 type;
431};
432
428b851f
IS
433struct mlxsw_sp_fib6_entry {
434 struct mlxsw_sp_fib_entry common;
435 struct list_head rt6_list;
436 unsigned int nrt6;
437};
438
439struct mlxsw_sp_rt6 {
440 struct list_head list;
441 struct rt6_info *rt;
442};
443
9011b677
IS
444struct mlxsw_sp_lpm_tree {
445 u8 id; /* tree ID */
446 unsigned int ref_count;
447 enum mlxsw_sp_l3proto proto;
448 struct mlxsw_sp_prefix_usage prefix_usage;
449};
450
5e9c16cc
JP
451struct mlxsw_sp_fib {
452 struct rhashtable ht;
9aecce1c 453 struct list_head node_list;
76610ebb
IS
454 struct mlxsw_sp_vr *vr;
455 struct mlxsw_sp_lpm_tree *lpm_tree;
5e9c16cc
JP
456 unsigned long prefix_ref_count[MLXSW_SP_PREFIX_COUNT];
457 struct mlxsw_sp_prefix_usage prefix_usage;
76610ebb 458 enum mlxsw_sp_l3proto proto;
5e9c16cc
JP
459};
460
9011b677
IS
461struct mlxsw_sp_vr {
462 u16 id; /* virtual router ID */
463 u32 tb_id; /* kernel fib table id */
464 unsigned int rif_count;
465 struct mlxsw_sp_fib *fib4;
a3d9bc50 466 struct mlxsw_sp_fib *fib6;
d42b0965 467 struct mlxsw_sp_mr_table *mr4_table;
9011b677
IS
468};
469
9aecce1c 470static const struct rhashtable_params mlxsw_sp_fib_ht_params;
5e9c16cc 471
76610ebb
IS
472static struct mlxsw_sp_fib *mlxsw_sp_fib_create(struct mlxsw_sp_vr *vr,
473 enum mlxsw_sp_l3proto proto)
5e9c16cc
JP
474{
475 struct mlxsw_sp_fib *fib;
476 int err;
477
478 fib = kzalloc(sizeof(*fib), GFP_KERNEL);
479 if (!fib)
480 return ERR_PTR(-ENOMEM);
481 err = rhashtable_init(&fib->ht, &mlxsw_sp_fib_ht_params);
482 if (err)
483 goto err_rhashtable_init;
9aecce1c 484 INIT_LIST_HEAD(&fib->node_list);
76610ebb
IS
485 fib->proto = proto;
486 fib->vr = vr;
5e9c16cc
JP
487 return fib;
488
489err_rhashtable_init:
490 kfree(fib);
491 return ERR_PTR(err);
492}
493
494static void mlxsw_sp_fib_destroy(struct mlxsw_sp_fib *fib)
495{
9aecce1c 496 WARN_ON(!list_empty(&fib->node_list));
76610ebb 497 WARN_ON(fib->lpm_tree);
5e9c16cc
JP
498 rhashtable_destroy(&fib->ht);
499 kfree(fib);
500}
501
53342023 502static struct mlxsw_sp_lpm_tree *
382dbb40 503mlxsw_sp_lpm_tree_find_unused(struct mlxsw_sp *mlxsw_sp)
53342023
JP
504{
505 static struct mlxsw_sp_lpm_tree *lpm_tree;
506 int i;
507
9011b677
IS
508 for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
509 lpm_tree = &mlxsw_sp->router->lpm.trees[i];
382dbb40
IS
510 if (lpm_tree->ref_count == 0)
511 return lpm_tree;
53342023
JP
512 }
513 return NULL;
514}
515
516static int mlxsw_sp_lpm_tree_alloc(struct mlxsw_sp *mlxsw_sp,
517 struct mlxsw_sp_lpm_tree *lpm_tree)
518{
519 char ralta_pl[MLXSW_REG_RALTA_LEN];
520
1a9234e6
IS
521 mlxsw_reg_ralta_pack(ralta_pl, true,
522 (enum mlxsw_reg_ralxx_protocol) lpm_tree->proto,
523 lpm_tree->id);
53342023
JP
524 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
525}
526
cc702670
IS
527static void mlxsw_sp_lpm_tree_free(struct mlxsw_sp *mlxsw_sp,
528 struct mlxsw_sp_lpm_tree *lpm_tree)
53342023
JP
529{
530 char ralta_pl[MLXSW_REG_RALTA_LEN];
531
1a9234e6
IS
532 mlxsw_reg_ralta_pack(ralta_pl, false,
533 (enum mlxsw_reg_ralxx_protocol) lpm_tree->proto,
534 lpm_tree->id);
cc702670 535 mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
53342023
JP
536}
537
538static int
539mlxsw_sp_lpm_tree_left_struct_set(struct mlxsw_sp *mlxsw_sp,
540 struct mlxsw_sp_prefix_usage *prefix_usage,
541 struct mlxsw_sp_lpm_tree *lpm_tree)
542{
543 char ralst_pl[MLXSW_REG_RALST_LEN];
544 u8 root_bin = 0;
545 u8 prefix;
546 u8 last_prefix = MLXSW_REG_RALST_BIN_NO_CHILD;
547
548 mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage)
549 root_bin = prefix;
550
551 mlxsw_reg_ralst_pack(ralst_pl, root_bin, lpm_tree->id);
552 mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage) {
553 if (prefix == 0)
554 continue;
555 mlxsw_reg_ralst_bin_pack(ralst_pl, prefix, last_prefix,
556 MLXSW_REG_RALST_BIN_NO_CHILD);
557 last_prefix = prefix;
558 }
559 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralst), ralst_pl);
560}
561
562static struct mlxsw_sp_lpm_tree *
563mlxsw_sp_lpm_tree_create(struct mlxsw_sp *mlxsw_sp,
564 struct mlxsw_sp_prefix_usage *prefix_usage,
382dbb40 565 enum mlxsw_sp_l3proto proto)
53342023
JP
566{
567 struct mlxsw_sp_lpm_tree *lpm_tree;
568 int err;
569
382dbb40 570 lpm_tree = mlxsw_sp_lpm_tree_find_unused(mlxsw_sp);
53342023
JP
571 if (!lpm_tree)
572 return ERR_PTR(-EBUSY);
573 lpm_tree->proto = proto;
574 err = mlxsw_sp_lpm_tree_alloc(mlxsw_sp, lpm_tree);
575 if (err)
576 return ERR_PTR(err);
577
578 err = mlxsw_sp_lpm_tree_left_struct_set(mlxsw_sp, prefix_usage,
579 lpm_tree);
580 if (err)
581 goto err_left_struct_set;
2083d367
JP
582 memcpy(&lpm_tree->prefix_usage, prefix_usage,
583 sizeof(lpm_tree->prefix_usage));
53342023
JP
584 return lpm_tree;
585
586err_left_struct_set:
587 mlxsw_sp_lpm_tree_free(mlxsw_sp, lpm_tree);
588 return ERR_PTR(err);
589}
590
cc702670
IS
/* Counterpart of mlxsw_sp_lpm_tree_create(): release the tree in the
 * device.
 */
static void mlxsw_sp_lpm_tree_destroy(struct mlxsw_sp *mlxsw_sp,
				      struct mlxsw_sp_lpm_tree *lpm_tree)
{
	mlxsw_sp_lpm_tree_free(mlxsw_sp, lpm_tree);
}
596
597static struct mlxsw_sp_lpm_tree *
598mlxsw_sp_lpm_tree_get(struct mlxsw_sp *mlxsw_sp,
599 struct mlxsw_sp_prefix_usage *prefix_usage,
382dbb40 600 enum mlxsw_sp_l3proto proto)
53342023
JP
601{
602 struct mlxsw_sp_lpm_tree *lpm_tree;
603 int i;
604
9011b677
IS
605 for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
606 lpm_tree = &mlxsw_sp->router->lpm.trees[i];
8b99becd
JP
607 if (lpm_tree->ref_count != 0 &&
608 lpm_tree->proto == proto &&
53342023
JP
609 mlxsw_sp_prefix_usage_eq(&lpm_tree->prefix_usage,
610 prefix_usage))
fc922bb0 611 return lpm_tree;
53342023 612 }
fc922bb0
IS
613 return mlxsw_sp_lpm_tree_create(mlxsw_sp, prefix_usage, proto);
614}
53342023 615
fc922bb0
IS
616static void mlxsw_sp_lpm_tree_hold(struct mlxsw_sp_lpm_tree *lpm_tree)
617{
53342023 618 lpm_tree->ref_count++;
53342023
JP
619}
620
cc702670
IS
621static void mlxsw_sp_lpm_tree_put(struct mlxsw_sp *mlxsw_sp,
622 struct mlxsw_sp_lpm_tree *lpm_tree)
53342023
JP
623{
624 if (--lpm_tree->ref_count == 0)
cc702670 625 mlxsw_sp_lpm_tree_destroy(mlxsw_sp, lpm_tree);
53342023
JP
626}
627
d7a60306 628#define MLXSW_SP_LPM_TREE_MIN 1 /* tree 0 is reserved */
8494ab06
IS
629
630static int mlxsw_sp_lpm_init(struct mlxsw_sp *mlxsw_sp)
53342023
JP
631{
632 struct mlxsw_sp_lpm_tree *lpm_tree;
8494ab06 633 u64 max_trees;
53342023
JP
634 int i;
635
8494ab06
IS
636 if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_LPM_TREES))
637 return -EIO;
638
639 max_trees = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_LPM_TREES);
9011b677
IS
640 mlxsw_sp->router->lpm.tree_count = max_trees - MLXSW_SP_LPM_TREE_MIN;
641 mlxsw_sp->router->lpm.trees = kcalloc(mlxsw_sp->router->lpm.tree_count,
8494ab06
IS
642 sizeof(struct mlxsw_sp_lpm_tree),
643 GFP_KERNEL);
9011b677 644 if (!mlxsw_sp->router->lpm.trees)
8494ab06
IS
645 return -ENOMEM;
646
9011b677
IS
647 for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
648 lpm_tree = &mlxsw_sp->router->lpm.trees[i];
53342023
JP
649 lpm_tree->id = i + MLXSW_SP_LPM_TREE_MIN;
650 }
8494ab06
IS
651
652 return 0;
653}
654
655static void mlxsw_sp_lpm_fini(struct mlxsw_sp *mlxsw_sp)
656{
9011b677 657 kfree(mlxsw_sp->router->lpm.trees);
53342023
JP
658}
659
76610ebb
IS
660static bool mlxsw_sp_vr_is_used(const struct mlxsw_sp_vr *vr)
661{
d42b0965 662 return !!vr->fib4 || !!vr->fib6 || !!vr->mr4_table;
76610ebb
IS
663}
664
6b75c480
JP
665static struct mlxsw_sp_vr *mlxsw_sp_vr_find_unused(struct mlxsw_sp *mlxsw_sp)
666{
667 struct mlxsw_sp_vr *vr;
668 int i;
669
c1a38311 670 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
9011b677 671 vr = &mlxsw_sp->router->vrs[i];
76610ebb 672 if (!mlxsw_sp_vr_is_used(vr))
6b75c480
JP
673 return vr;
674 }
675 return NULL;
676}
677
678static int mlxsw_sp_vr_lpm_tree_bind(struct mlxsw_sp *mlxsw_sp,
0adb214b 679 const struct mlxsw_sp_fib *fib, u8 tree_id)
6b75c480
JP
680{
681 char raltb_pl[MLXSW_REG_RALTB_LEN];
682
76610ebb
IS
683 mlxsw_reg_raltb_pack(raltb_pl, fib->vr->id,
684 (enum mlxsw_reg_ralxx_protocol) fib->proto,
0adb214b 685 tree_id);
6b75c480
JP
686 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb), raltb_pl);
687}
688
689static int mlxsw_sp_vr_lpm_tree_unbind(struct mlxsw_sp *mlxsw_sp,
76610ebb 690 const struct mlxsw_sp_fib *fib)
6b75c480
JP
691{
692 char raltb_pl[MLXSW_REG_RALTB_LEN];
693
694 /* Bind to tree 0 which is default */
76610ebb
IS
695 mlxsw_reg_raltb_pack(raltb_pl, fib->vr->id,
696 (enum mlxsw_reg_ralxx_protocol) fib->proto, 0);
6b75c480
JP
697 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb), raltb_pl);
698}
699
700static u32 mlxsw_sp_fix_tb_id(u32 tb_id)
701{
7e50d435
YG
702 /* For our purpose, squash main, default and local tables into one */
703 if (tb_id == RT_TABLE_LOCAL || tb_id == RT_TABLE_DEFAULT)
6b75c480
JP
704 tb_id = RT_TABLE_MAIN;
705 return tb_id;
706}
707
708static struct mlxsw_sp_vr *mlxsw_sp_vr_find(struct mlxsw_sp *mlxsw_sp,
76610ebb 709 u32 tb_id)
6b75c480
JP
710{
711 struct mlxsw_sp_vr *vr;
712 int i;
713
714 tb_id = mlxsw_sp_fix_tb_id(tb_id);
9497c042 715
c1a38311 716 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
9011b677 717 vr = &mlxsw_sp->router->vrs[i];
76610ebb 718 if (mlxsw_sp_vr_is_used(vr) && vr->tb_id == tb_id)
6b75c480
JP
719 return vr;
720 }
721 return NULL;
722}
723
76610ebb
IS
724static struct mlxsw_sp_fib *mlxsw_sp_vr_fib(const struct mlxsw_sp_vr *vr,
725 enum mlxsw_sp_l3proto proto)
726{
727 switch (proto) {
728 case MLXSW_SP_L3_PROTO_IPV4:
729 return vr->fib4;
730 case MLXSW_SP_L3_PROTO_IPV6:
a3d9bc50 731 return vr->fib6;
76610ebb
IS
732 }
733 return NULL;
734}
735
6b75c480 736static struct mlxsw_sp_vr *mlxsw_sp_vr_create(struct mlxsw_sp *mlxsw_sp,
f8fa9b4e
DA
737 u32 tb_id,
738 struct netlink_ext_ack *extack)
6b75c480 739{
6b75c480 740 struct mlxsw_sp_vr *vr;
a3d9bc50 741 int err;
6b75c480
JP
742
743 vr = mlxsw_sp_vr_find_unused(mlxsw_sp);
f8fa9b4e
DA
744 if (!vr) {
745 NL_SET_ERR_MSG(extack, "spectrum: Exceeded number of supported virtual routers");
6b75c480 746 return ERR_PTR(-EBUSY);
f8fa9b4e 747 }
76610ebb
IS
748 vr->fib4 = mlxsw_sp_fib_create(vr, MLXSW_SP_L3_PROTO_IPV4);
749 if (IS_ERR(vr->fib4))
750 return ERR_CAST(vr->fib4);
a3d9bc50
IS
751 vr->fib6 = mlxsw_sp_fib_create(vr, MLXSW_SP_L3_PROTO_IPV6);
752 if (IS_ERR(vr->fib6)) {
753 err = PTR_ERR(vr->fib6);
754 goto err_fib6_create;
755 }
d42b0965
YG
756 vr->mr4_table = mlxsw_sp_mr_table_create(mlxsw_sp, vr->id,
757 MLXSW_SP_L3_PROTO_IPV4);
758 if (IS_ERR(vr->mr4_table)) {
759 err = PTR_ERR(vr->mr4_table);
760 goto err_mr_table_create;
761 }
6b75c480 762 vr->tb_id = tb_id;
6b75c480 763 return vr;
a3d9bc50 764
d42b0965
YG
765err_mr_table_create:
766 mlxsw_sp_fib_destroy(vr->fib6);
767 vr->fib6 = NULL;
a3d9bc50
IS
768err_fib6_create:
769 mlxsw_sp_fib_destroy(vr->fib4);
770 vr->fib4 = NULL;
771 return ERR_PTR(err);
6b75c480
JP
772}
773
76610ebb 774static void mlxsw_sp_vr_destroy(struct mlxsw_sp_vr *vr)
6b75c480 775{
d42b0965
YG
776 mlxsw_sp_mr_table_destroy(vr->mr4_table);
777 vr->mr4_table = NULL;
a3d9bc50
IS
778 mlxsw_sp_fib_destroy(vr->fib6);
779 vr->fib6 = NULL;
76610ebb
IS
780 mlxsw_sp_fib_destroy(vr->fib4);
781 vr->fib4 = NULL;
6b75c480
JP
782}
783
f8fa9b4e
DA
784static struct mlxsw_sp_vr *mlxsw_sp_vr_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
785 struct netlink_ext_ack *extack)
6b75c480
JP
786{
787 struct mlxsw_sp_vr *vr;
6b75c480
JP
788
789 tb_id = mlxsw_sp_fix_tb_id(tb_id);
76610ebb
IS
790 vr = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
791 if (!vr)
f8fa9b4e 792 vr = mlxsw_sp_vr_create(mlxsw_sp, tb_id, extack);
6b75c480
JP
793 return vr;
794}
795
76610ebb 796static void mlxsw_sp_vr_put(struct mlxsw_sp_vr *vr)
6b75c480 797{
a3d9bc50 798 if (!vr->rif_count && list_empty(&vr->fib4->node_list) &&
d42b0965
YG
799 list_empty(&vr->fib6->node_list) &&
800 mlxsw_sp_mr_table_empty(vr->mr4_table))
76610ebb 801 mlxsw_sp_vr_destroy(vr);
6b75c480
JP
802}
803
fc922bb0
IS
804static bool
805mlxsw_sp_vr_lpm_tree_should_replace(struct mlxsw_sp_vr *vr,
806 enum mlxsw_sp_l3proto proto, u8 tree_id)
807{
808 struct mlxsw_sp_fib *fib = mlxsw_sp_vr_fib(vr, proto);
809
810 if (!mlxsw_sp_vr_is_used(vr))
811 return false;
812 if (fib->lpm_tree && fib->lpm_tree->id == tree_id)
813 return true;
814 return false;
815}
816
817static int mlxsw_sp_vr_lpm_tree_replace(struct mlxsw_sp *mlxsw_sp,
818 struct mlxsw_sp_fib *fib,
819 struct mlxsw_sp_lpm_tree *new_tree)
820{
821 struct mlxsw_sp_lpm_tree *old_tree = fib->lpm_tree;
822 int err;
823
824 err = mlxsw_sp_vr_lpm_tree_bind(mlxsw_sp, fib, new_tree->id);
825 if (err)
826 return err;
827 fib->lpm_tree = new_tree;
828 mlxsw_sp_lpm_tree_hold(new_tree);
829 mlxsw_sp_lpm_tree_put(mlxsw_sp, old_tree);
830 return 0;
831}
832
833static int mlxsw_sp_vrs_lpm_tree_replace(struct mlxsw_sp *mlxsw_sp,
834 struct mlxsw_sp_fib *fib,
835 struct mlxsw_sp_lpm_tree *new_tree)
836{
837 struct mlxsw_sp_lpm_tree *old_tree = fib->lpm_tree;
838 enum mlxsw_sp_l3proto proto = fib->proto;
839 u8 old_id, new_id = new_tree->id;
840 struct mlxsw_sp_vr *vr;
841 int i, err;
842
843 if (!old_tree)
844 goto no_replace;
845 old_id = old_tree->id;
846
847 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
848 vr = &mlxsw_sp->router->vrs[i];
849 if (!mlxsw_sp_vr_lpm_tree_should_replace(vr, proto, old_id))
850 continue;
851 err = mlxsw_sp_vr_lpm_tree_replace(mlxsw_sp,
852 mlxsw_sp_vr_fib(vr, proto),
853 new_tree);
854 if (err)
855 goto err_tree_replace;
856 }
857
858 return 0;
859
860err_tree_replace:
861 for (i--; i >= 0; i--) {
862 if (!mlxsw_sp_vr_lpm_tree_should_replace(vr, proto, new_id))
863 continue;
864 mlxsw_sp_vr_lpm_tree_replace(mlxsw_sp,
865 mlxsw_sp_vr_fib(vr, proto),
866 old_tree);
867 }
868 return err;
869
870no_replace:
871 err = mlxsw_sp_vr_lpm_tree_bind(mlxsw_sp, fib, new_tree->id);
872 if (err)
873 return err;
874 fib->lpm_tree = new_tree;
875 mlxsw_sp_lpm_tree_hold(new_tree);
876 return 0;
877}
878
879static void
880mlxsw_sp_vrs_prefixes(struct mlxsw_sp *mlxsw_sp,
881 enum mlxsw_sp_l3proto proto,
882 struct mlxsw_sp_prefix_usage *req_prefix_usage)
883{
884 int i;
885
886 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
887 struct mlxsw_sp_vr *vr = &mlxsw_sp->router->vrs[i];
888 struct mlxsw_sp_fib *fib = mlxsw_sp_vr_fib(vr, proto);
889 unsigned char prefix;
890
891 if (!mlxsw_sp_vr_is_used(vr))
892 continue;
893 mlxsw_sp_prefix_usage_for_each(prefix, &fib->prefix_usage)
894 mlxsw_sp_prefix_usage_set(req_prefix_usage, prefix);
895 }
896}
897
9497c042 898static int mlxsw_sp_vrs_init(struct mlxsw_sp *mlxsw_sp)
6b75c480
JP
899{
900 struct mlxsw_sp_vr *vr;
c1a38311 901 u64 max_vrs;
6b75c480
JP
902 int i;
903
c1a38311 904 if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_VRS))
9497c042
NF
905 return -EIO;
906
c1a38311 907 max_vrs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS);
9011b677
IS
908 mlxsw_sp->router->vrs = kcalloc(max_vrs, sizeof(struct mlxsw_sp_vr),
909 GFP_KERNEL);
910 if (!mlxsw_sp->router->vrs)
9497c042
NF
911 return -ENOMEM;
912
c1a38311 913 for (i = 0; i < max_vrs; i++) {
9011b677 914 vr = &mlxsw_sp->router->vrs[i];
6b75c480
JP
915 vr->id = i;
916 }
9497c042
NF
917
918 return 0;
919}
920
ac571de9
IS
921static void mlxsw_sp_router_fib_flush(struct mlxsw_sp *mlxsw_sp);
922
9497c042
NF
923static void mlxsw_sp_vrs_fini(struct mlxsw_sp *mlxsw_sp)
924{
3057224e
IS
925 /* At this stage we're guaranteed not to have new incoming
926 * FIB notifications and the work queue is free from FIBs
927 * sitting on top of mlxsw netdevs. However, we can still
928 * have other FIBs queued. Flush the queue before flushing
929 * the device's tables. No need for locks, as we're the only
930 * writer.
931 */
932 mlxsw_core_flush_owq();
ac571de9 933 mlxsw_sp_router_fib_flush(mlxsw_sp);
9011b677 934 kfree(mlxsw_sp->router->vrs);
6b75c480
JP
935}
936
6ddb7426
PM
937static struct net_device *
938__mlxsw_sp_ipip_netdev_ul_dev_get(const struct net_device *ol_dev)
939{
940 struct ip_tunnel *tun = netdev_priv(ol_dev);
941 struct net *net = dev_net(ol_dev);
942
943 return __dev_get_by_index(net, tun->parms.link);
944}
945
946static u32 mlxsw_sp_ipip_dev_ul_tb_id(const struct net_device *ol_dev)
947{
948 struct net_device *d = __mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
949
950 if (d)
951 return l3mdev_fib_table(d) ? : RT_TABLE_MAIN;
952 else
953 return l3mdev_fib_table(ol_dev) ? : RT_TABLE_MAIN;
954}
955
1012b9ac
PM
956static struct mlxsw_sp_rif *
957mlxsw_sp_rif_create(struct mlxsw_sp *mlxsw_sp,
f8fa9b4e
DA
958 const struct mlxsw_sp_rif_params *params,
959 struct netlink_ext_ack *extack);
1012b9ac
PM
960
961static struct mlxsw_sp_rif_ipip_lb *
962mlxsw_sp_ipip_ol_ipip_lb_create(struct mlxsw_sp *mlxsw_sp,
963 enum mlxsw_sp_ipip_type ipipt,
7e75af63
PM
964 struct net_device *ol_dev,
965 struct netlink_ext_ack *extack)
1012b9ac
PM
966{
967 struct mlxsw_sp_rif_params_ipip_lb lb_params;
968 const struct mlxsw_sp_ipip_ops *ipip_ops;
969 struct mlxsw_sp_rif *rif;
970
971 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipipt];
972 lb_params = (struct mlxsw_sp_rif_params_ipip_lb) {
973 .common.dev = ol_dev,
974 .common.lag = false,
975 .lb_config = ipip_ops->ol_loopback_config(mlxsw_sp, ol_dev),
976 };
977
7e75af63 978 rif = mlxsw_sp_rif_create(mlxsw_sp, &lb_params.common, extack);
1012b9ac
PM
979 if (IS_ERR(rif))
980 return ERR_CAST(rif);
981 return container_of(rif, struct mlxsw_sp_rif_ipip_lb, common);
982}
983
984static struct mlxsw_sp_ipip_entry *
985mlxsw_sp_ipip_entry_alloc(struct mlxsw_sp *mlxsw_sp,
986 enum mlxsw_sp_ipip_type ipipt,
987 struct net_device *ol_dev)
988{
989 struct mlxsw_sp_ipip_entry *ipip_entry;
990 struct mlxsw_sp_ipip_entry *ret = NULL;
991
992 ipip_entry = kzalloc(sizeof(*ipip_entry), GFP_KERNEL);
993 if (!ipip_entry)
994 return ERR_PTR(-ENOMEM);
995
996 ipip_entry->ol_lb = mlxsw_sp_ipip_ol_ipip_lb_create(mlxsw_sp, ipipt,
7e75af63 997 ol_dev, NULL);
1012b9ac
PM
998 if (IS_ERR(ipip_entry->ol_lb)) {
999 ret = ERR_CAST(ipip_entry->ol_lb);
1000 goto err_ol_ipip_lb_create;
1001 }
1002
1003 ipip_entry->ipipt = ipipt;
1004 ipip_entry->ol_dev = ol_dev;
1005
1006 return ipip_entry;
1007
1008err_ol_ipip_lb_create:
1009 kfree(ipip_entry);
1010 return ret;
1011}
1012
1013static void
4cccb737 1014mlxsw_sp_ipip_entry_dealloc(struct mlxsw_sp_ipip_entry *ipip_entry)
1012b9ac 1015{
1012b9ac
PM
1016 mlxsw_sp_rif_destroy(&ipip_entry->ol_lb->common);
1017 kfree(ipip_entry);
1018}
1019
1012b9ac
PM
1020static bool mlxsw_sp_l3addr_eq(const union mlxsw_sp_l3addr *addr1,
1021 const union mlxsw_sp_l3addr *addr2)
1022{
1023 return !memcmp(addr1, addr2, sizeof(*addr1));
1024}
1025
1026static bool
1027mlxsw_sp_ipip_entry_saddr_matches(struct mlxsw_sp *mlxsw_sp,
1028 const enum mlxsw_sp_l3proto ul_proto,
1029 union mlxsw_sp_l3addr saddr,
1030 u32 ul_tb_id,
1031 struct mlxsw_sp_ipip_entry *ipip_entry)
1032{
1033 u32 tun_ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
1034 enum mlxsw_sp_ipip_type ipipt = ipip_entry->ipipt;
1035 union mlxsw_sp_l3addr tun_saddr;
1036
1037 if (mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto != ul_proto)
1038 return false;
1039
1040 tun_saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ipip_entry->ol_dev);
1041 return tun_ul_tb_id == ul_tb_id &&
1042 mlxsw_sp_l3addr_eq(&tun_saddr, &saddr);
1043}
1044
4607f6d2
PM
1045static int
1046mlxsw_sp_fib_entry_decap_init(struct mlxsw_sp *mlxsw_sp,
1047 struct mlxsw_sp_fib_entry *fib_entry,
1048 struct mlxsw_sp_ipip_entry *ipip_entry)
1049{
1050 u32 tunnel_index;
1051 int err;
1052
1053 err = mlxsw_sp_kvdl_alloc(mlxsw_sp, 1, &tunnel_index);
1054 if (err)
1055 return err;
1056
1057 ipip_entry->decap_fib_entry = fib_entry;
1058 fib_entry->decap.ipip_entry = ipip_entry;
1059 fib_entry->decap.tunnel_index = tunnel_index;
1060 return 0;
1061}
1062
1063static void mlxsw_sp_fib_entry_decap_fini(struct mlxsw_sp *mlxsw_sp,
1064 struct mlxsw_sp_fib_entry *fib_entry)
1065{
1066 /* Unlink this node from the IPIP entry that it's the decap entry of. */
1067 fib_entry->decap.ipip_entry->decap_fib_entry = NULL;
1068 fib_entry->decap.ipip_entry = NULL;
1069 mlxsw_sp_kvdl_free(mlxsw_sp, fib_entry->decap.tunnel_index);
1070}
1071
1cc38fb1
PM
1072static struct mlxsw_sp_fib_node *
1073mlxsw_sp_fib_node_lookup(struct mlxsw_sp_fib *fib, const void *addr,
1074 size_t addr_len, unsigned char prefix_len);
4607f6d2
PM
1075static int mlxsw_sp_fib_entry_update(struct mlxsw_sp *mlxsw_sp,
1076 struct mlxsw_sp_fib_entry *fib_entry);
1077
1078static void
1079mlxsw_sp_ipip_entry_demote_decap(struct mlxsw_sp *mlxsw_sp,
1080 struct mlxsw_sp_ipip_entry *ipip_entry)
1081{
1082 struct mlxsw_sp_fib_entry *fib_entry = ipip_entry->decap_fib_entry;
1083
1084 mlxsw_sp_fib_entry_decap_fini(mlxsw_sp, fib_entry);
1085 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
1086
1087 mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
1088}
1089
1cc38fb1
PM
1090static void
1091mlxsw_sp_ipip_entry_promote_decap(struct mlxsw_sp *mlxsw_sp,
1092 struct mlxsw_sp_ipip_entry *ipip_entry,
1093 struct mlxsw_sp_fib_entry *decap_fib_entry)
1094{
1095 if (mlxsw_sp_fib_entry_decap_init(mlxsw_sp, decap_fib_entry,
1096 ipip_entry))
1097 return;
1098 decap_fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP;
1099
1100 if (mlxsw_sp_fib_entry_update(mlxsw_sp, decap_fib_entry))
1101 mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
1102}
1103
1104/* Given an IPIP entry, find the corresponding decap route. */
1105static struct mlxsw_sp_fib_entry *
1106mlxsw_sp_ipip_entry_find_decap(struct mlxsw_sp *mlxsw_sp,
1107 struct mlxsw_sp_ipip_entry *ipip_entry)
1108{
1109 static struct mlxsw_sp_fib_node *fib_node;
1110 const struct mlxsw_sp_ipip_ops *ipip_ops;
1111 struct mlxsw_sp_fib_entry *fib_entry;
1112 unsigned char saddr_prefix_len;
1113 union mlxsw_sp_l3addr saddr;
1114 struct mlxsw_sp_fib *ul_fib;
1115 struct mlxsw_sp_vr *ul_vr;
1116 const void *saddrp;
1117 size_t saddr_len;
1118 u32 ul_tb_id;
1119 u32 saddr4;
1120
1121 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
1122
1123 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
1124 ul_vr = mlxsw_sp_vr_find(mlxsw_sp, ul_tb_id);
1125 if (!ul_vr)
1126 return NULL;
1127
1128 ul_fib = mlxsw_sp_vr_fib(ul_vr, ipip_ops->ul_proto);
1129 saddr = mlxsw_sp_ipip_netdev_saddr(ipip_ops->ul_proto,
1130 ipip_entry->ol_dev);
1131
1132 switch (ipip_ops->ul_proto) {
1133 case MLXSW_SP_L3_PROTO_IPV4:
1134 saddr4 = be32_to_cpu(saddr.addr4);
1135 saddrp = &saddr4;
1136 saddr_len = 4;
1137 saddr_prefix_len = 32;
1138 break;
1139 case MLXSW_SP_L3_PROTO_IPV6:
1140 WARN_ON(1);
1141 return NULL;
1142 }
1143
1144 fib_node = mlxsw_sp_fib_node_lookup(ul_fib, saddrp, saddr_len,
1145 saddr_prefix_len);
1146 if (!fib_node || list_empty(&fib_node->entry_list))
1147 return NULL;
1148
1149 fib_entry = list_first_entry(&fib_node->entry_list,
1150 struct mlxsw_sp_fib_entry, list);
1151 if (fib_entry->type != MLXSW_SP_FIB_ENTRY_TYPE_TRAP)
1152 return NULL;
1153
1154 return fib_entry;
1155}
1156
1012b9ac 1157static struct mlxsw_sp_ipip_entry *
4cccb737
PM
1158mlxsw_sp_ipip_entry_create(struct mlxsw_sp *mlxsw_sp,
1159 enum mlxsw_sp_ipip_type ipipt,
1160 struct net_device *ol_dev)
1012b9ac
PM
1161{
1162 u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ol_dev);
1163 struct mlxsw_sp_router *router = mlxsw_sp->router;
1164 struct mlxsw_sp_ipip_entry *ipip_entry;
1165 enum mlxsw_sp_l3proto ul_proto;
1166 union mlxsw_sp_l3addr saddr;
1167
4cccb737
PM
1168 /* The configuration where several tunnels have the same local address
1169 * in the same underlay table needs special treatment in the HW. That is
1170 * currently not implemented in the driver.
1171 */
1012b9ac
PM
1172 list_for_each_entry(ipip_entry, &mlxsw_sp->router->ipip_list,
1173 ipip_list_node) {
1012b9ac
PM
1174 ul_proto = router->ipip_ops_arr[ipip_entry->ipipt]->ul_proto;
1175 saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ol_dev);
1176 if (mlxsw_sp_ipip_entry_saddr_matches(mlxsw_sp, ul_proto, saddr,
1177 ul_tb_id, ipip_entry))
1178 return ERR_PTR(-EEXIST);
1179 }
1180
1181 ipip_entry = mlxsw_sp_ipip_entry_alloc(mlxsw_sp, ipipt, ol_dev);
1182 if (IS_ERR(ipip_entry))
1183 return ipip_entry;
1184
1185 list_add_tail(&ipip_entry->ipip_list_node,
1186 &mlxsw_sp->router->ipip_list);
1187
1012b9ac
PM
1188 return ipip_entry;
1189}
1190
1191static void
4cccb737
PM
1192mlxsw_sp_ipip_entry_destroy(struct mlxsw_sp *mlxsw_sp,
1193 struct mlxsw_sp_ipip_entry *ipip_entry)
1012b9ac 1194{
4cccb737
PM
1195 list_del(&ipip_entry->ipip_list_node);
1196 mlxsw_sp_ipip_entry_dealloc(ipip_entry);
1012b9ac
PM
1197}
1198
4607f6d2
PM
1199static bool
1200mlxsw_sp_ipip_entry_matches_decap(struct mlxsw_sp *mlxsw_sp,
1201 const struct net_device *ul_dev,
1202 enum mlxsw_sp_l3proto ul_proto,
1203 union mlxsw_sp_l3addr ul_dip,
1204 struct mlxsw_sp_ipip_entry *ipip_entry)
1205{
1206 u32 ul_tb_id = l3mdev_fib_table(ul_dev) ? : RT_TABLE_MAIN;
1207 enum mlxsw_sp_ipip_type ipipt = ipip_entry->ipipt;
1208 struct net_device *ipip_ul_dev;
1209
1210 if (mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto != ul_proto)
1211 return false;
1212
1213 ipip_ul_dev = __mlxsw_sp_ipip_netdev_ul_dev_get(ipip_entry->ol_dev);
1214 return mlxsw_sp_ipip_entry_saddr_matches(mlxsw_sp, ul_proto, ul_dip,
1215 ul_tb_id, ipip_entry) &&
1216 (!ipip_ul_dev || ipip_ul_dev == ul_dev);
1217}
1218
1219/* Given decap parameters, find the corresponding IPIP entry. */
1220static struct mlxsw_sp_ipip_entry *
1221mlxsw_sp_ipip_entry_find_by_decap(struct mlxsw_sp *mlxsw_sp,
1222 const struct net_device *ul_dev,
1223 enum mlxsw_sp_l3proto ul_proto,
1224 union mlxsw_sp_l3addr ul_dip)
1225{
1226 struct mlxsw_sp_ipip_entry *ipip_entry;
1227
1228 list_for_each_entry(ipip_entry, &mlxsw_sp->router->ipip_list,
1229 ipip_list_node)
1230 if (mlxsw_sp_ipip_entry_matches_decap(mlxsw_sp, ul_dev,
1231 ul_proto, ul_dip,
1232 ipip_entry))
1233 return ipip_entry;
1234
1235 return NULL;
1236}
1237
6698c168
PM
1238static bool mlxsw_sp_netdev_ipip_type(const struct mlxsw_sp *mlxsw_sp,
1239 const struct net_device *dev,
1240 enum mlxsw_sp_ipip_type *p_type)
1241{
1242 struct mlxsw_sp_router *router = mlxsw_sp->router;
1243 const struct mlxsw_sp_ipip_ops *ipip_ops;
1244 enum mlxsw_sp_ipip_type ipipt;
1245
1246 for (ipipt = 0; ipipt < MLXSW_SP_IPIP_TYPE_MAX; ++ipipt) {
1247 ipip_ops = router->ipip_ops_arr[ipipt];
1248 if (dev->type == ipip_ops->dev_type) {
1249 if (p_type)
1250 *p_type = ipipt;
1251 return true;
1252 }
1253 }
1254 return false;
1255}
1256
796ec776
PM
1257bool mlxsw_sp_netdev_is_ipip_ol(const struct mlxsw_sp *mlxsw_sp,
1258 const struct net_device *dev)
0063587d
PM
1259{
1260 return mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, NULL);
1261}
1262
1263static struct mlxsw_sp_ipip_entry *
1264mlxsw_sp_ipip_entry_find_by_ol_dev(struct mlxsw_sp *mlxsw_sp,
1265 const struct net_device *ol_dev)
1266{
1267 struct mlxsw_sp_ipip_entry *ipip_entry;
1268
1269 list_for_each_entry(ipip_entry, &mlxsw_sp->router->ipip_list,
1270 ipip_list_node)
1271 if (ipip_entry->ol_dev == ol_dev)
1272 return ipip_entry;
1273
1274 return NULL;
1275}
1276
cafdb2a0
PM
1277static bool mlxsw_sp_netdevice_ipip_can_offload(struct mlxsw_sp *mlxsw_sp,
1278 const struct net_device *ol_dev,
1279 enum mlxsw_sp_ipip_type ipipt)
1280{
1281 const struct mlxsw_sp_ipip_ops *ops
1282 = mlxsw_sp->router->ipip_ops_arr[ipipt];
1283
1284 /* For deciding whether decap should be offloaded, we don't care about
1285 * overlay protocol, so ask whether either one is supported.
1286 */
1287 return ops->can_offload(mlxsw_sp, ol_dev, MLXSW_SP_L3_PROTO_IPV4) ||
1288 ops->can_offload(mlxsw_sp, ol_dev, MLXSW_SP_L3_PROTO_IPV6);
1289}
1290
796ec776
PM
1291static int mlxsw_sp_netdevice_ipip_ol_reg_event(struct mlxsw_sp *mlxsw_sp,
1292 struct net_device *ol_dev)
0063587d 1293{
0063587d
PM
1294 struct mlxsw_sp_ipip_entry *ipip_entry;
1295 enum mlxsw_sp_ipip_type ipipt;
1296
1297 mlxsw_sp_netdev_ipip_type(mlxsw_sp, ol_dev, &ipipt);
cafdb2a0 1298 if (mlxsw_sp_netdevice_ipip_can_offload(mlxsw_sp, ol_dev, ipipt)) {
4cccb737
PM
1299 ipip_entry = mlxsw_sp_ipip_entry_create(mlxsw_sp, ipipt,
1300 ol_dev);
0063587d
PM
1301 if (IS_ERR(ipip_entry))
1302 return PTR_ERR(ipip_entry);
1303 }
1304
1305 return 0;
1306}
1307
796ec776
PM
/* Handle unregistration of tunnel overlay device @ol_dev: destroy its IPIP
 * entry, if it has one.
 */
static void mlxsw_sp_netdevice_ipip_ol_unreg_event(struct mlxsw_sp *mlxsw_sp,
						   struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *entry;

	entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!entry)
		return;

	mlxsw_sp_ipip_entry_destroy(mlxsw_sp, entry);
}
1317
47518ca5
PM
/* The overlay device of @ipip_entry went up: if a suitable decap route
 * exists, promote it to an IPIP decap route.
 */
static void
mlxsw_sp_ipip_entry_ol_up_event(struct mlxsw_sp *mlxsw_sp,
				struct mlxsw_sp_ipip_entry *ipip_entry)
{
	struct mlxsw_sp_fib_entry *decap;

	decap = mlxsw_sp_ipip_entry_find_decap(mlxsw_sp, ipip_entry);
	if (!decap)
		return;

	mlxsw_sp_ipip_entry_promote_decap(mlxsw_sp, ipip_entry, decap);
}
1329
6d4de445
PM
/* Handle NETDEV_UP of tunnel overlay device @ol_dev. Devices without an IPIP
 * entry are ignored.
 */
static void mlxsw_sp_netdevice_ipip_ol_up_event(struct mlxsw_sp *mlxsw_sp,
						struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *entry;

	entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!entry)
		return;

	mlxsw_sp_ipip_entry_ol_up_event(mlxsw_sp, entry);
}
1339
a3fe198e
PM
1340static void
1341mlxsw_sp_ipip_entry_ol_down_event(struct mlxsw_sp *mlxsw_sp,
1342 struct mlxsw_sp_ipip_entry *ipip_entry)
1343{
1344 if (ipip_entry->decap_fib_entry)
1345 mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
1346}
1347
796ec776
PM
/* Handle NETDEV_DOWN of tunnel overlay device @ol_dev. Devices without an
 * IPIP entry are ignored.
 */
static void mlxsw_sp_netdevice_ipip_ol_down_event(struct mlxsw_sp *mlxsw_sp,
						  struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *entry;

	entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!entry)
		return;

	mlxsw_sp_ipip_entry_ol_down_event(mlxsw_sp, entry);
}
1357
0c5f1cd5
PM
1358static void mlxsw_sp_nexthop_rif_update(struct mlxsw_sp *mlxsw_sp,
1359 struct mlxsw_sp_rif *rif);
65a6121b
PM
1360static int
1361mlxsw_sp_ipip_entry_ol_lb_update(struct mlxsw_sp *mlxsw_sp,
1362 struct mlxsw_sp_ipip_entry *ipip_entry,
0c5f1cd5 1363 bool keep_encap,
65a6121b
PM
1364 struct netlink_ext_ack *extack)
1365{
1366 struct mlxsw_sp_rif_ipip_lb *old_lb_rif = ipip_entry->ol_lb;
1367 struct mlxsw_sp_rif_ipip_lb *new_lb_rif;
1368
1369 new_lb_rif = mlxsw_sp_ipip_ol_ipip_lb_create(mlxsw_sp,
1370 ipip_entry->ipipt,
1371 ipip_entry->ol_dev,
1372 extack);
1373 if (IS_ERR(new_lb_rif))
1374 return PTR_ERR(new_lb_rif);
1375 ipip_entry->ol_lb = new_lb_rif;
0c5f1cd5
PM
1376
1377 if (keep_encap) {
1378 list_splice_init(&old_lb_rif->common.nexthop_list,
1379 &new_lb_rif->common.nexthop_list);
1380 mlxsw_sp_nexthop_rif_update(mlxsw_sp, &new_lb_rif->common);
1381 }
1382
65a6121b 1383 mlxsw_sp_rif_destroy(&old_lb_rif->common);
f63ce4e5 1384
65a6121b
PM
1385 return 0;
1386}
1387
0c5f1cd5
PM
1388/**
1389 * Update the offload related to an IPIP entry. This always updates decap, and
1390 * in addition to that it also:
1391 * @recreate_loopback: recreates the associated loopback RIF
1392 * @keep_encap: updates next hops that use the tunnel netdevice. This is only
1393 * relevant when recreate_loopback is true.
1394 * @update_nexthops: updates next hops, keeping the current loopback RIF. This
1395 * is only relevant when recreate_loopback is false.
1396 */
65a6121b
PM
1397int __mlxsw_sp_ipip_entry_update_tunnel(struct mlxsw_sp *mlxsw_sp,
1398 struct mlxsw_sp_ipip_entry *ipip_entry,
0c5f1cd5
PM
1399 bool recreate_loopback,
1400 bool keep_encap,
1401 bool update_nexthops,
65a6121b
PM
1402 struct netlink_ext_ack *extack)
1403{
1404 int err;
f63ce4e5 1405
65a6121b
PM
1406 /* RIFs can't be edited, so to update loopback, we need to destroy and
1407 * recreate it. That creates a window of opportunity where RALUE and
1408 * RATR registers end up referencing a RIF that's already gone. RATRs
1409 * are handled in mlxsw_sp_ipip_entry_ol_lb_update(), and to take care
f63ce4e5
PM
1410 * of RALUE, demote the decap route back.
1411 */
1412 if (ipip_entry->decap_fib_entry)
1413 mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
1414
0c5f1cd5
PM
1415 if (recreate_loopback) {
1416 err = mlxsw_sp_ipip_entry_ol_lb_update(mlxsw_sp, ipip_entry,
1417 keep_encap, extack);
1418 if (err)
1419 return err;
1420 } else if (update_nexthops) {
1421 mlxsw_sp_nexthop_rif_update(mlxsw_sp,
1422 &ipip_entry->ol_lb->common);
1423 }
65a6121b
PM
1424
1425 if (ipip_entry->ol_dev->flags & IFF_UP)
1426 mlxsw_sp_ipip_entry_ol_up_event(mlxsw_sp, ipip_entry);
f63ce4e5
PM
1427
1428 return 0;
1429}
1430
65a6121b
PM
1431static int mlxsw_sp_netdevice_ipip_ol_vrf_event(struct mlxsw_sp *mlxsw_sp,
1432 struct net_device *ol_dev,
1433 struct netlink_ext_ack *extack)
1434{
1435 struct mlxsw_sp_ipip_entry *ipip_entry =
1436 mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
1437
1438 if (!ipip_entry)
1439 return 0;
1440 return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
0c5f1cd5 1441 true, false, false, extack);
65a6121b
PM
1442}
1443
7e75af63
PM
1444int mlxsw_sp_netdevice_ipip_ol_event(struct mlxsw_sp *mlxsw_sp,
1445 struct net_device *ol_dev,
1446 unsigned long event,
1447 struct netdev_notifier_info *info)
0063587d 1448{
7e75af63
PM
1449 struct netdev_notifier_changeupper_info *chup;
1450 struct netlink_ext_ack *extack;
1451
0063587d
PM
1452 switch (event) {
1453 case NETDEV_REGISTER:
796ec776 1454 return mlxsw_sp_netdevice_ipip_ol_reg_event(mlxsw_sp, ol_dev);
0063587d 1455 case NETDEV_UNREGISTER:
796ec776 1456 mlxsw_sp_netdevice_ipip_ol_unreg_event(mlxsw_sp, ol_dev);
0063587d
PM
1457 return 0;
1458 case NETDEV_UP:
6d4de445
PM
1459 mlxsw_sp_netdevice_ipip_ol_up_event(mlxsw_sp, ol_dev);
1460 return 0;
0063587d 1461 case NETDEV_DOWN:
796ec776 1462 mlxsw_sp_netdevice_ipip_ol_down_event(mlxsw_sp, ol_dev);
0063587d 1463 return 0;
f63ce4e5 1464 case NETDEV_CHANGEUPPER:
7e75af63
PM
1465 chup = container_of(info, typeof(*chup), info);
1466 extack = info->extack;
1467 if (netif_is_l3_master(chup->upper_dev))
796ec776 1468 return mlxsw_sp_netdevice_ipip_ol_vrf_event(mlxsw_sp,
7e75af63
PM
1469 ol_dev,
1470 extack);
f63ce4e5 1471 return 0;
0063587d
PM
1472 }
1473 return 0;
1474}
1475
/* Key of the neighbour hash table: the kernel neighbour pointer itself. */
struct mlxsw_sp_neigh_key {
	struct neighbour *n;
};
1479
1480struct mlxsw_sp_neigh_entry {
9665b745 1481 struct list_head rif_list_node;
6cf3c971
JP
1482 struct rhash_head ht_node;
1483 struct mlxsw_sp_neigh_key key;
1484 u16 rif;
5c8802f1 1485 bool connected;
a6bf9e93 1486 unsigned char ha[ETH_ALEN];
a7ff87ac
JP
1487 struct list_head nexthop_list; /* list of nexthops using
1488 * this neigh entry
1489 */
b2157149 1490 struct list_head nexthop_neighs_list_node;
7cfcbc75
AS
1491 unsigned int counter_index;
1492 bool counter_valid;
6cf3c971
JP
1493};
1494
1495static const struct rhashtable_params mlxsw_sp_neigh_ht_params = {
1496 .key_offset = offsetof(struct mlxsw_sp_neigh_entry, key),
1497 .head_offset = offsetof(struct mlxsw_sp_neigh_entry, ht_node),
1498 .key_len = sizeof(struct mlxsw_sp_neigh_key),
1499};
1500
f17cc84d
AS
1501struct mlxsw_sp_neigh_entry *
1502mlxsw_sp_rif_neigh_next(struct mlxsw_sp_rif *rif,
1503 struct mlxsw_sp_neigh_entry *neigh_entry)
1504{
1505 if (!neigh_entry) {
1506 if (list_empty(&rif->neigh_list))
1507 return NULL;
1508 else
1509 return list_first_entry(&rif->neigh_list,
1510 typeof(*neigh_entry),
1511 rif_list_node);
1512 }
ec2437f4 1513 if (list_is_last(&neigh_entry->rif_list_node, &rif->neigh_list))
f17cc84d
AS
1514 return NULL;
1515 return list_next_entry(neigh_entry, rif_list_node);
1516}
1517
1518int mlxsw_sp_neigh_entry_type(struct mlxsw_sp_neigh_entry *neigh_entry)
1519{
1520 return neigh_entry->key.n->tbl->family;
1521}
1522
1523unsigned char *
1524mlxsw_sp_neigh_entry_ha(struct mlxsw_sp_neigh_entry *neigh_entry)
1525{
1526 return neigh_entry->ha;
1527}
1528
1529u32 mlxsw_sp_neigh4_entry_dip(struct mlxsw_sp_neigh_entry *neigh_entry)
1530{
1531 struct neighbour *n;
1532
1533 n = neigh_entry->key.n;
1534 return ntohl(*((__be32 *) n->primary_key));
1535}
1536
0250768c
AS
1537struct in6_addr *
1538mlxsw_sp_neigh6_entry_dip(struct mlxsw_sp_neigh_entry *neigh_entry)
1539{
1540 struct neighbour *n;
1541
1542 n = neigh_entry->key.n;
1543 return (struct in6_addr *) &n->primary_key;
1544}
1545
7cfcbc75
AS
1546int mlxsw_sp_neigh_counter_get(struct mlxsw_sp *mlxsw_sp,
1547 struct mlxsw_sp_neigh_entry *neigh_entry,
1548 u64 *p_counter)
1549{
1550 if (!neigh_entry->counter_valid)
1551 return -EINVAL;
1552
1553 return mlxsw_sp_flow_counter_get(mlxsw_sp, neigh_entry->counter_index,
1554 p_counter, NULL);
1555}
1556
6cf3c971 1557static struct mlxsw_sp_neigh_entry *
5c8802f1
IS
1558mlxsw_sp_neigh_entry_alloc(struct mlxsw_sp *mlxsw_sp, struct neighbour *n,
1559 u16 rif)
6cf3c971
JP
1560{
1561 struct mlxsw_sp_neigh_entry *neigh_entry;
1562
5c8802f1 1563 neigh_entry = kzalloc(sizeof(*neigh_entry), GFP_KERNEL);
6cf3c971
JP
1564 if (!neigh_entry)
1565 return NULL;
5c8802f1 1566
33b1341c 1567 neigh_entry->key.n = n;
6cf3c971 1568 neigh_entry->rif = rif;
a7ff87ac 1569 INIT_LIST_HEAD(&neigh_entry->nexthop_list);
5c8802f1 1570
6cf3c971
JP
1571 return neigh_entry;
1572}
1573
/* Release the memory of a neighbour entry obtained from
 * mlxsw_sp_neigh_entry_alloc().
 */
static void mlxsw_sp_neigh_entry_free(struct mlxsw_sp_neigh_entry *neigh_entry)
{
	kfree(neigh_entry);
}
1578
5c8802f1
IS
1579static int
1580mlxsw_sp_neigh_entry_insert(struct mlxsw_sp *mlxsw_sp,
1581 struct mlxsw_sp_neigh_entry *neigh_entry)
6cf3c971 1582{
9011b677 1583 return rhashtable_insert_fast(&mlxsw_sp->router->neigh_ht,
5c8802f1
IS
1584 &neigh_entry->ht_node,
1585 mlxsw_sp_neigh_ht_params);
1586}
6cf3c971 1587
5c8802f1
IS
1588static void
1589mlxsw_sp_neigh_entry_remove(struct mlxsw_sp *mlxsw_sp,
1590 struct mlxsw_sp_neigh_entry *neigh_entry)
1591{
9011b677 1592 rhashtable_remove_fast(&mlxsw_sp->router->neigh_ht,
5c8802f1
IS
1593 &neigh_entry->ht_node,
1594 mlxsw_sp_neigh_ht_params);
6cf3c971
JP
1595}
1596
7cfcbc75 1597static bool
1ed5574c
AS
1598mlxsw_sp_neigh_counter_should_alloc(struct mlxsw_sp *mlxsw_sp,
1599 struct mlxsw_sp_neigh_entry *neigh_entry)
7cfcbc75
AS
1600{
1601 struct devlink *devlink;
1ed5574c
AS
1602 const char *table_name;
1603
1604 switch (mlxsw_sp_neigh_entry_type(neigh_entry)) {
1605 case AF_INET:
1606 table_name = MLXSW_SP_DPIPE_TABLE_NAME_HOST4;
1607 break;
1608 case AF_INET6:
1609 table_name = MLXSW_SP_DPIPE_TABLE_NAME_HOST6;
1610 break;
1611 default:
1612 WARN_ON(1);
1613 return false;
1614 }
7cfcbc75
AS
1615
1616 devlink = priv_to_devlink(mlxsw_sp->core);
1ed5574c 1617 return devlink_dpipe_table_counter_enabled(devlink, table_name);
7cfcbc75
AS
1618}
1619
1620static void
1621mlxsw_sp_neigh_counter_alloc(struct mlxsw_sp *mlxsw_sp,
1622 struct mlxsw_sp_neigh_entry *neigh_entry)
1623{
1ed5574c 1624 if (!mlxsw_sp_neigh_counter_should_alloc(mlxsw_sp, neigh_entry))
7cfcbc75
AS
1625 return;
1626
1627 if (mlxsw_sp_flow_counter_alloc(mlxsw_sp, &neigh_entry->counter_index))
1628 return;
1629
1630 neigh_entry->counter_valid = true;
1631}
1632
1633static void
1634mlxsw_sp_neigh_counter_free(struct mlxsw_sp *mlxsw_sp,
1635 struct mlxsw_sp_neigh_entry *neigh_entry)
1636{
1637 if (!neigh_entry->counter_valid)
1638 return;
1639 mlxsw_sp_flow_counter_free(mlxsw_sp,
1640 neigh_entry->counter_index);
1641 neigh_entry->counter_valid = false;
1642}
1643
5c8802f1
IS
1644static struct mlxsw_sp_neigh_entry *
1645mlxsw_sp_neigh_entry_create(struct mlxsw_sp *mlxsw_sp, struct neighbour *n)
6cf3c971 1646{
6cf3c971 1647 struct mlxsw_sp_neigh_entry *neigh_entry;
bf95233e 1648 struct mlxsw_sp_rif *rif;
6cf3c971
JP
1649 int err;
1650
bf95233e
AS
1651 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, n->dev);
1652 if (!rif)
5c8802f1 1653 return ERR_PTR(-EINVAL);
6cf3c971 1654
bf95233e 1655 neigh_entry = mlxsw_sp_neigh_entry_alloc(mlxsw_sp, n, rif->rif_index);
6cf3c971 1656 if (!neigh_entry)
5c8802f1
IS
1657 return ERR_PTR(-ENOMEM);
1658
6cf3c971
JP
1659 err = mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry);
1660 if (err)
1661 goto err_neigh_entry_insert;
5c8802f1 1662
7cfcbc75 1663 mlxsw_sp_neigh_counter_alloc(mlxsw_sp, neigh_entry);
bf95233e 1664 list_add(&neigh_entry->rif_list_node, &rif->neigh_list);
9665b745 1665
5c8802f1 1666 return neigh_entry;
6cf3c971
JP
1667
1668err_neigh_entry_insert:
5c8802f1
IS
1669 mlxsw_sp_neigh_entry_free(neigh_entry);
1670 return ERR_PTR(err);
6cf3c971
JP
1671}
1672
5c8802f1
IS
1673static void
1674mlxsw_sp_neigh_entry_destroy(struct mlxsw_sp *mlxsw_sp,
1675 struct mlxsw_sp_neigh_entry *neigh_entry)
6cf3c971 1676{
9665b745 1677 list_del(&neigh_entry->rif_list_node);
7cfcbc75 1678 mlxsw_sp_neigh_counter_free(mlxsw_sp, neigh_entry);
5c8802f1
IS
1679 mlxsw_sp_neigh_entry_remove(mlxsw_sp, neigh_entry);
1680 mlxsw_sp_neigh_entry_free(neigh_entry);
1681}
6cf3c971 1682
5c8802f1
IS
1683static struct mlxsw_sp_neigh_entry *
1684mlxsw_sp_neigh_entry_lookup(struct mlxsw_sp *mlxsw_sp, struct neighbour *n)
1685{
1686 struct mlxsw_sp_neigh_key key;
6cf3c971 1687
5c8802f1 1688 key.n = n;
9011b677 1689 return rhashtable_lookup_fast(&mlxsw_sp->router->neigh_ht,
5c8802f1 1690 &key, mlxsw_sp_neigh_ht_params);
6cf3c971
JP
1691}
1692
c723c735
YG
1693static void
1694mlxsw_sp_router_neighs_update_interval_init(struct mlxsw_sp *mlxsw_sp)
1695{
a6c9b5d1 1696 unsigned long interval;
c723c735 1697
b5f3e0d4 1698#if IS_ENABLED(CONFIG_IPV6)
a6c9b5d1
AS
1699 interval = min_t(unsigned long,
1700 NEIGH_VAR(&arp_tbl.parms, DELAY_PROBE_TIME),
1701 NEIGH_VAR(&nd_tbl.parms, DELAY_PROBE_TIME));
b5f3e0d4
IS
1702#else
1703 interval = NEIGH_VAR(&arp_tbl.parms, DELAY_PROBE_TIME);
1704#endif
9011b677 1705 mlxsw_sp->router->neighs_update.interval = jiffies_to_msecs(interval);
c723c735
YG
1706}
1707
1708static void mlxsw_sp_router_neigh_ent_ipv4_process(struct mlxsw_sp *mlxsw_sp,
1709 char *rauhtd_pl,
1710 int ent_index)
1711{
1712 struct net_device *dev;
1713 struct neighbour *n;
1714 __be32 dipn;
1715 u32 dip;
1716 u16 rif;
1717
1718 mlxsw_reg_rauhtd_ent_ipv4_unpack(rauhtd_pl, ent_index, &rif, &dip);
1719
5f9efffb 1720 if (!mlxsw_sp->router->rifs[rif]) {
c723c735
YG
1721 dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Incorrect RIF in neighbour entry\n");
1722 return;
1723 }
1724
1725 dipn = htonl(dip);
5f9efffb 1726 dev = mlxsw_sp->router->rifs[rif]->dev;
c723c735
YG
1727 n = neigh_lookup(&arp_tbl, &dipn, dev);
1728 if (!n) {
1729 netdev_err(dev, "Failed to find matching neighbour for IP=%pI4h\n",
1730 &dip);
1731 return;
1732 }
1733
1734 netdev_dbg(dev, "Updating neighbour with IP=%pI4h\n", &dip);
1735 neigh_event_send(n, NULL);
1736 neigh_release(n);
1737}
1738
df9a21f1 1739#if IS_ENABLED(CONFIG_IPV6)
60f040ca
AS
1740static void mlxsw_sp_router_neigh_ent_ipv6_process(struct mlxsw_sp *mlxsw_sp,
1741 char *rauhtd_pl,
1742 int rec_index)
1743{
1744 struct net_device *dev;
1745 struct neighbour *n;
1746 struct in6_addr dip;
1747 u16 rif;
1748
1749 mlxsw_reg_rauhtd_ent_ipv6_unpack(rauhtd_pl, rec_index, &rif,
1750 (char *) &dip);
1751
1752 if (!mlxsw_sp->router->rifs[rif]) {
1753 dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Incorrect RIF in neighbour entry\n");
1754 return;
1755 }
1756
1757 dev = mlxsw_sp->router->rifs[rif]->dev;
1758 n = neigh_lookup(&nd_tbl, &dip, dev);
1759 if (!n) {
1760 netdev_err(dev, "Failed to find matching neighbour for IP=%pI6c\n",
1761 &dip);
1762 return;
1763 }
1764
1765 netdev_dbg(dev, "Updating neighbour with IP=%pI6c\n", &dip);
1766 neigh_event_send(n, NULL);
1767 neigh_release(n);
1768}
b5f3e0d4
IS
1769#else
1770static void mlxsw_sp_router_neigh_ent_ipv6_process(struct mlxsw_sp *mlxsw_sp,
1771 char *rauhtd_pl,
1772 int rec_index)
1773{
1774}
1775#endif
60f040ca 1776
c723c735
YG
1777static void mlxsw_sp_router_neigh_rec_ipv4_process(struct mlxsw_sp *mlxsw_sp,
1778 char *rauhtd_pl,
1779 int rec_index)
1780{
1781 u8 num_entries;
1782 int i;
1783
1784 num_entries = mlxsw_reg_rauhtd_ipv4_rec_num_entries_get(rauhtd_pl,
1785 rec_index);
1786 /* Hardware starts counting at 0, so add 1. */
1787 num_entries++;
1788
1789 /* Each record consists of several neighbour entries. */
1790 for (i = 0; i < num_entries; i++) {
1791 int ent_index;
1792
1793 ent_index = rec_index * MLXSW_REG_RAUHTD_IPV4_ENT_PER_REC + i;
1794 mlxsw_sp_router_neigh_ent_ipv4_process(mlxsw_sp, rauhtd_pl,
1795 ent_index);
1796 }
1797
1798}
1799
60f040ca
AS
/* Process IPv6 record @rec_index of a RAUHTD dump. */
static void mlxsw_sp_router_neigh_rec_ipv6_process(struct mlxsw_sp *mlxsw_sp,
						   char *rauhtd_pl,
						   int rec_index)
{
	/* One record contains one entry, so the record index is passed on. */
	mlxsw_sp_router_neigh_ent_ipv6_process(mlxsw_sp, rauhtd_pl, rec_index);
}
1808
c723c735
YG
1809static void mlxsw_sp_router_neigh_rec_process(struct mlxsw_sp *mlxsw_sp,
1810 char *rauhtd_pl, int rec_index)
1811{
1812 switch (mlxsw_reg_rauhtd_rec_type_get(rauhtd_pl, rec_index)) {
1813 case MLXSW_REG_RAUHTD_TYPE_IPV4:
1814 mlxsw_sp_router_neigh_rec_ipv4_process(mlxsw_sp, rauhtd_pl,
1815 rec_index);
1816 break;
1817 case MLXSW_REG_RAUHTD_TYPE_IPV6:
60f040ca
AS
1818 mlxsw_sp_router_neigh_rec_ipv6_process(mlxsw_sp, rauhtd_pl,
1819 rec_index);
c723c735
YG
1820 break;
1821 }
1822}
1823
42cdb338
AS
1824static bool mlxsw_sp_router_rauhtd_is_full(char *rauhtd_pl)
1825{
1826 u8 num_rec, last_rec_index, num_entries;
1827
1828 num_rec = mlxsw_reg_rauhtd_num_rec_get(rauhtd_pl);
1829 last_rec_index = num_rec - 1;
1830
1831 if (num_rec < MLXSW_REG_RAUHTD_REC_MAX_NUM)
1832 return false;
1833 if (mlxsw_reg_rauhtd_rec_type_get(rauhtd_pl, last_rec_index) ==
1834 MLXSW_REG_RAUHTD_TYPE_IPV6)
1835 return true;
1836
1837 num_entries = mlxsw_reg_rauhtd_ipv4_rec_num_entries_get(rauhtd_pl,
1838 last_rec_index);
1839 if (++num_entries == MLXSW_REG_RAUHTD_IPV4_ENT_PER_REC)
1840 return true;
1841 return false;
1842}
1843
60f040ca
AS
1844static int
1845__mlxsw_sp_router_neighs_update_rauhtd(struct mlxsw_sp *mlxsw_sp,
1846 char *rauhtd_pl,
1847 enum mlxsw_reg_rauhtd_type type)
c723c735 1848{
60f040ca
AS
1849 int i, num_rec;
1850 int err;
c723c735
YG
1851
1852 /* Make sure the neighbour's netdev isn't removed in the
1853 * process.
1854 */
1855 rtnl_lock();
1856 do {
60f040ca 1857 mlxsw_reg_rauhtd_pack(rauhtd_pl, type);
c723c735
YG
1858 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(rauhtd),
1859 rauhtd_pl);
1860 if (err) {
7ff176f8 1861 dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Failed to dump neighbour table\n");
c723c735
YG
1862 break;
1863 }
1864 num_rec = mlxsw_reg_rauhtd_num_rec_get(rauhtd_pl);
1865 for (i = 0; i < num_rec; i++)
1866 mlxsw_sp_router_neigh_rec_process(mlxsw_sp, rauhtd_pl,
1867 i);
42cdb338 1868 } while (mlxsw_sp_router_rauhtd_is_full(rauhtd_pl));
c723c735
YG
1869 rtnl_unlock();
1870
60f040ca
AS
1871 return err;
1872}
1873
1874static int mlxsw_sp_router_neighs_update_rauhtd(struct mlxsw_sp *mlxsw_sp)
1875{
1876 enum mlxsw_reg_rauhtd_type type;
1877 char *rauhtd_pl;
1878 int err;
1879
1880 rauhtd_pl = kmalloc(MLXSW_REG_RAUHTD_LEN, GFP_KERNEL);
1881 if (!rauhtd_pl)
1882 return -ENOMEM;
1883
1884 type = MLXSW_REG_RAUHTD_TYPE_IPV4;
1885 err = __mlxsw_sp_router_neighs_update_rauhtd(mlxsw_sp, rauhtd_pl, type);
1886 if (err)
1887 goto out;
1888
1889 type = MLXSW_REG_RAUHTD_TYPE_IPV6;
1890 err = __mlxsw_sp_router_neighs_update_rauhtd(mlxsw_sp, rauhtd_pl, type);
1891out:
c723c735 1892 kfree(rauhtd_pl);
b2157149
YG
1893 return err;
1894}
1895
1896static void mlxsw_sp_router_neighs_update_nh(struct mlxsw_sp *mlxsw_sp)
1897{
1898 struct mlxsw_sp_neigh_entry *neigh_entry;
1899
1900 /* Take RTNL mutex here to prevent lists from changes */
1901 rtnl_lock();
9011b677 1902 list_for_each_entry(neigh_entry, &mlxsw_sp->router->nexthop_neighs_list,
8a0b7275 1903 nexthop_neighs_list_node)
b2157149
YG
1904 /* If this neigh have nexthops, make the kernel think this neigh
1905 * is active regardless of the traffic.
1906 */
8a0b7275 1907 neigh_event_send(neigh_entry->key.n, NULL);
b2157149
YG
1908 rtnl_unlock();
1909}
1910
1911static void
1912mlxsw_sp_router_neighs_update_work_schedule(struct mlxsw_sp *mlxsw_sp)
1913{
9011b677 1914 unsigned long interval = mlxsw_sp->router->neighs_update.interval;
b2157149 1915
9011b677 1916 mlxsw_core_schedule_dw(&mlxsw_sp->router->neighs_update.dw,
b2157149
YG
1917 msecs_to_jiffies(interval));
1918}
1919
1920static void mlxsw_sp_router_neighs_update_work(struct work_struct *work)
1921{
9011b677 1922 struct mlxsw_sp_router *router;
b2157149
YG
1923 int err;
1924
9011b677
IS
1925 router = container_of(work, struct mlxsw_sp_router,
1926 neighs_update.dw.work);
1927 err = mlxsw_sp_router_neighs_update_rauhtd(router->mlxsw_sp);
b2157149 1928 if (err)
9011b677 1929 dev_err(router->mlxsw_sp->bus_info->dev, "Could not update kernel for neigh activity");
b2157149 1930
9011b677 1931 mlxsw_sp_router_neighs_update_nh(router->mlxsw_sp);
b2157149 1932
9011b677 1933 mlxsw_sp_router_neighs_update_work_schedule(router->mlxsw_sp);
c723c735
YG
1934}
1935
0b2361d9
YG
1936static void mlxsw_sp_router_probe_unresolved_nexthops(struct work_struct *work)
1937{
1938 struct mlxsw_sp_neigh_entry *neigh_entry;
9011b677 1939 struct mlxsw_sp_router *router;
0b2361d9 1940
9011b677
IS
1941 router = container_of(work, struct mlxsw_sp_router,
1942 nexthop_probe_dw.work);
0b2361d9
YG
1943 /* Iterate over nexthop neighbours, find those who are unresolved and
1944 * send arp on them. This solves the chicken-egg problem when
1945 * the nexthop wouldn't get offloaded until the neighbor is resolved
1946 * but it wouldn't get resolved ever in case traffic is flowing in HW
1947 * using different nexthop.
1948 *
1949 * Take RTNL mutex here to prevent lists from changes.
1950 */
1951 rtnl_lock();
9011b677 1952 list_for_each_entry(neigh_entry, &router->nexthop_neighs_list,
8a0b7275 1953 nexthop_neighs_list_node)
01b1aa35 1954 if (!neigh_entry->connected)
33b1341c 1955 neigh_event_send(neigh_entry->key.n, NULL);
0b2361d9
YG
1956 rtnl_unlock();
1957
9011b677 1958 mlxsw_core_schedule_dw(&router->nexthop_probe_dw,
0b2361d9
YG
1959 MLXSW_SP_UNRESOLVED_NH_PROBE_INTERVAL);
1960}
1961
a7ff87ac
JP
1962static void
1963mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp,
1964 struct mlxsw_sp_neigh_entry *neigh_entry,
1965 bool removing);
1966
5c8802f1
IS
1967static enum mlxsw_reg_rauht_op mlxsw_sp_rauht_op(bool adding)
1968{
1969 return adding ? MLXSW_REG_RAUHT_OP_WRITE_ADD :
1970 MLXSW_REG_RAUHT_OP_WRITE_DELETE;
1971}
1972
1973static void
1974mlxsw_sp_router_neigh_entry_op4(struct mlxsw_sp *mlxsw_sp,
1975 struct mlxsw_sp_neigh_entry *neigh_entry,
1976 enum mlxsw_reg_rauht_op op)
a6bf9e93 1977{
33b1341c 1978 struct neighbour *n = neigh_entry->key.n;
5c8802f1 1979 u32 dip = ntohl(*((__be32 *) n->primary_key));
a6bf9e93 1980 char rauht_pl[MLXSW_REG_RAUHT_LEN];
5c8802f1
IS
1981
1982 mlxsw_reg_rauht_pack4(rauht_pl, op, neigh_entry->rif, neigh_entry->ha,
1983 dip);
7cfcbc75
AS
1984 if (neigh_entry->counter_valid)
1985 mlxsw_reg_rauht_pack_counter(rauht_pl,
1986 neigh_entry->counter_index);
5c8802f1
IS
1987 mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rauht), rauht_pl);
1988}
1989
d5eb89cf
AS
1990static void
1991mlxsw_sp_router_neigh_entry_op6(struct mlxsw_sp *mlxsw_sp,
1992 struct mlxsw_sp_neigh_entry *neigh_entry,
1993 enum mlxsw_reg_rauht_op op)
1994{
1995 struct neighbour *n = neigh_entry->key.n;
1996 char rauht_pl[MLXSW_REG_RAUHT_LEN];
1997 const char *dip = n->primary_key;
1998
1999 mlxsw_reg_rauht_pack6(rauht_pl, op, neigh_entry->rif, neigh_entry->ha,
2000 dip);
7cfcbc75
AS
2001 if (neigh_entry->counter_valid)
2002 mlxsw_reg_rauht_pack_counter(rauht_pl,
2003 neigh_entry->counter_index);
d5eb89cf
AS
2004 mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rauht), rauht_pl);
2005}
2006
1d1056d8 2007bool mlxsw_sp_neigh_ipv6_ignore(struct mlxsw_sp_neigh_entry *neigh_entry)
d5eb89cf 2008{
1d1056d8
AS
2009 struct neighbour *n = neigh_entry->key.n;
2010
d5eb89cf
AS
2011 /* Packets with a link-local destination address are trapped
2012 * after LPM lookup and never reach the neighbour table, so
2013 * there is no need to program such neighbours to the device.
2014 */
2015 if (ipv6_addr_type((struct in6_addr *) &n->primary_key) &
2016 IPV6_ADDR_LINKLOCAL)
2017 return true;
2018 return false;
2019}
2020
5c8802f1
IS
2021static void
2022mlxsw_sp_neigh_entry_update(struct mlxsw_sp *mlxsw_sp,
2023 struct mlxsw_sp_neigh_entry *neigh_entry,
2024 bool adding)
2025{
2026 if (!adding && !neigh_entry->connected)
2027 return;
2028 neigh_entry->connected = adding;
b5f3e0d4 2029 if (neigh_entry->key.n->tbl->family == AF_INET) {
5c8802f1
IS
2030 mlxsw_sp_router_neigh_entry_op4(mlxsw_sp, neigh_entry,
2031 mlxsw_sp_rauht_op(adding));
b5f3e0d4 2032 } else if (neigh_entry->key.n->tbl->family == AF_INET6) {
1d1056d8 2033 if (mlxsw_sp_neigh_ipv6_ignore(neigh_entry))
d5eb89cf
AS
2034 return;
2035 mlxsw_sp_router_neigh_entry_op6(mlxsw_sp, neigh_entry,
2036 mlxsw_sp_rauht_op(adding));
2037 } else {
5c8802f1 2038 WARN_ON_ONCE(1);
d5eb89cf 2039 }
5c8802f1
IS
2040}
2041
a481d713
AS
2042void
2043mlxsw_sp_neigh_entry_counter_update(struct mlxsw_sp *mlxsw_sp,
2044 struct mlxsw_sp_neigh_entry *neigh_entry,
2045 bool adding)
2046{
2047 if (adding)
2048 mlxsw_sp_neigh_counter_alloc(mlxsw_sp, neigh_entry);
2049 else
2050 mlxsw_sp_neigh_counter_free(mlxsw_sp, neigh_entry);
2051 mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, true);
2052}
2053
ceb8881d 2054struct mlxsw_sp_netevent_work {
5c8802f1
IS
2055 struct work_struct work;
2056 struct mlxsw_sp *mlxsw_sp;
2057 struct neighbour *n;
2058};
2059
2060static void mlxsw_sp_router_neigh_event_work(struct work_struct *work)
2061{
ceb8881d
IS
2062 struct mlxsw_sp_netevent_work *net_work =
2063 container_of(work, struct mlxsw_sp_netevent_work, work);
2064 struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp;
5c8802f1 2065 struct mlxsw_sp_neigh_entry *neigh_entry;
ceb8881d 2066 struct neighbour *n = net_work->n;
5c8802f1 2067 unsigned char ha[ETH_ALEN];
a6bf9e93 2068 bool entry_connected;
93a87e5e 2069 u8 nud_state, dead;
a6bf9e93 2070
5c8802f1
IS
2071 /* If these parameters are changed after we release the lock,
2072 * then we are guaranteed to receive another event letting us
2073 * know about it.
2074 */
a6bf9e93 2075 read_lock_bh(&n->lock);
5c8802f1 2076 memcpy(ha, n->ha, ETH_ALEN);
a6bf9e93 2077 nud_state = n->nud_state;
93a87e5e 2078 dead = n->dead;
a6bf9e93
YG
2079 read_unlock_bh(&n->lock);
2080
5c8802f1 2081 rtnl_lock();
93a87e5e 2082 entry_connected = nud_state & NUD_VALID && !dead;
5c8802f1
IS
2083 neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, n);
2084 if (!entry_connected && !neigh_entry)
2085 goto out;
2086 if (!neigh_entry) {
2087 neigh_entry = mlxsw_sp_neigh_entry_create(mlxsw_sp, n);
2088 if (IS_ERR(neigh_entry))
2089 goto out;
a6bf9e93
YG
2090 }
2091
5c8802f1
IS
2092 memcpy(neigh_entry->ha, ha, ETH_ALEN);
2093 mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, entry_connected);
2094 mlxsw_sp_nexthop_neigh_update(mlxsw_sp, neigh_entry, !entry_connected);
2095
2096 if (!neigh_entry->connected && list_empty(&neigh_entry->nexthop_list))
2097 mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry);
2098
2099out:
2100 rtnl_unlock();
a6bf9e93 2101 neigh_release(n);
ceb8881d 2102 kfree(net_work);
a6bf9e93
YG
2103}
2104
28678f07
IS
2105static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp);
2106
2107static void mlxsw_sp_router_mp_hash_event_work(struct work_struct *work)
2108{
2109 struct mlxsw_sp_netevent_work *net_work =
2110 container_of(work, struct mlxsw_sp_netevent_work, work);
2111 struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp;
2112
2113 mlxsw_sp_mp_hash_init(mlxsw_sp);
2114 kfree(net_work);
2115}
2116
2117static int mlxsw_sp_router_netevent_event(struct notifier_block *nb,
48fac885 2118 unsigned long event, void *ptr)
c723c735 2119{
ceb8881d 2120 struct mlxsw_sp_netevent_work *net_work;
c723c735 2121 struct mlxsw_sp_port *mlxsw_sp_port;
28678f07 2122 struct mlxsw_sp_router *router;
c723c735
YG
2123 struct mlxsw_sp *mlxsw_sp;
2124 unsigned long interval;
2125 struct neigh_parms *p;
a6bf9e93 2126 struct neighbour *n;
28678f07 2127 struct net *net;
c723c735
YG
2128
2129 switch (event) {
2130 case NETEVENT_DELAY_PROBE_TIME_UPDATE:
2131 p = ptr;
2132
2133 /* We don't care about changes in the default table. */
b5f3e0d4
IS
2134 if (!p->dev || (p->tbl->family != AF_INET &&
2135 p->tbl->family != AF_INET6))
c723c735
YG
2136 return NOTIFY_DONE;
2137
2138 /* We are in atomic context and can't take RTNL mutex,
2139 * so use RCU variant to walk the device chain.
2140 */
2141 mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(p->dev);
2142 if (!mlxsw_sp_port)
2143 return NOTIFY_DONE;
2144
2145 mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
2146 interval = jiffies_to_msecs(NEIGH_VAR(p, DELAY_PROBE_TIME));
9011b677 2147 mlxsw_sp->router->neighs_update.interval = interval;
c723c735
YG
2148
2149 mlxsw_sp_port_dev_put(mlxsw_sp_port);
2150 break;
a6bf9e93
YG
2151 case NETEVENT_NEIGH_UPDATE:
2152 n = ptr;
a6bf9e93 2153
b5f3e0d4 2154 if (n->tbl->family != AF_INET && n->tbl->family != AF_INET6)
a6bf9e93
YG
2155 return NOTIFY_DONE;
2156
5c8802f1 2157 mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(n->dev);
a6bf9e93
YG
2158 if (!mlxsw_sp_port)
2159 return NOTIFY_DONE;
2160
ceb8881d
IS
2161 net_work = kzalloc(sizeof(*net_work), GFP_ATOMIC);
2162 if (!net_work) {
a6bf9e93 2163 mlxsw_sp_port_dev_put(mlxsw_sp_port);
5c8802f1 2164 return NOTIFY_BAD;
a6bf9e93 2165 }
5c8802f1 2166
ceb8881d
IS
2167 INIT_WORK(&net_work->work, mlxsw_sp_router_neigh_event_work);
2168 net_work->mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
2169 net_work->n = n;
a6bf9e93
YG
2170
2171 /* Take a reference to ensure the neighbour won't be
2172 * destructed until we drop the reference in delayed
2173 * work.
2174 */
2175 neigh_clone(n);
ceb8881d 2176 mlxsw_core_schedule_work(&net_work->work);
5c8802f1 2177 mlxsw_sp_port_dev_put(mlxsw_sp_port);
a6bf9e93 2178 break;
28678f07
IS
2179 case NETEVENT_MULTIPATH_HASH_UPDATE:
2180 net = ptr;
2181
2182 if (!net_eq(net, &init_net))
2183 return NOTIFY_DONE;
2184
2185 net_work = kzalloc(sizeof(*net_work), GFP_ATOMIC);
2186 if (!net_work)
2187 return NOTIFY_BAD;
2188
2189 router = container_of(nb, struct mlxsw_sp_router, netevent_nb);
2190 INIT_WORK(&net_work->work, mlxsw_sp_router_mp_hash_event_work);
2191 net_work->mlxsw_sp = router->mlxsw_sp;
2192 mlxsw_core_schedule_work(&net_work->work);
2193 break;
c723c735
YG
2194 }
2195
2196 return NOTIFY_DONE;
2197}
2198
6cf3c971
JP
2199static int mlxsw_sp_neigh_init(struct mlxsw_sp *mlxsw_sp)
2200{
c723c735
YG
2201 int err;
2202
9011b677 2203 err = rhashtable_init(&mlxsw_sp->router->neigh_ht,
c723c735
YG
2204 &mlxsw_sp_neigh_ht_params);
2205 if (err)
2206 return err;
2207
2208 /* Initialize the polling interval according to the default
2209 * table.
2210 */
2211 mlxsw_sp_router_neighs_update_interval_init(mlxsw_sp);
2212
0b2361d9 2213 /* Create the delayed works for the activity_update */
9011b677 2214 INIT_DELAYED_WORK(&mlxsw_sp->router->neighs_update.dw,
c723c735 2215 mlxsw_sp_router_neighs_update_work);
9011b677 2216 INIT_DELAYED_WORK(&mlxsw_sp->router->nexthop_probe_dw,
0b2361d9 2217 mlxsw_sp_router_probe_unresolved_nexthops);
9011b677
IS
2218 mlxsw_core_schedule_dw(&mlxsw_sp->router->neighs_update.dw, 0);
2219 mlxsw_core_schedule_dw(&mlxsw_sp->router->nexthop_probe_dw, 0);
c723c735 2220 return 0;
6cf3c971
JP
2221}
2222
2223static void mlxsw_sp_neigh_fini(struct mlxsw_sp *mlxsw_sp)
2224{
9011b677
IS
2225 cancel_delayed_work_sync(&mlxsw_sp->router->neighs_update.dw);
2226 cancel_delayed_work_sync(&mlxsw_sp->router->nexthop_probe_dw);
2227 rhashtable_destroy(&mlxsw_sp->router->neigh_ht);
6cf3c971
JP
2228}
2229
9665b745 2230static void mlxsw_sp_neigh_rif_gone_sync(struct mlxsw_sp *mlxsw_sp,
bf95233e 2231 struct mlxsw_sp_rif *rif)
9665b745
IS
2232{
2233 struct mlxsw_sp_neigh_entry *neigh_entry, *tmp;
2234
bf95233e 2235 list_for_each_entry_safe(neigh_entry, tmp, &rif->neigh_list,
4a3c67a6
IS
2236 rif_list_node) {
2237 mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, false);
9665b745 2238 mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry);
4a3c67a6 2239 }
9665b745
IS
2240}
2241
35225e47
PM
/* Kind of a nexthop; selects which member of the anonymous union in
 * struct mlxsw_sp_nexthop is in use.
 */
enum mlxsw_sp_nexthop_type {
	/* Ethernet nexthop, backed by a neigh entry. */
	MLXSW_SP_NEXTHOP_TYPE_ETH,
	/* IP-in-IP tunnel nexthop, backed by an ipip entry. */
	MLXSW_SP_NEXTHOP_TYPE_IPIP,
};
2246
c53b8e1b
IS
/* Lookup key of a nexthop in the router's nexthop hash table. */
struct mlxsw_sp_nexthop_key {
	/* Kernel FIB nexthop this key identifies. */
	struct fib_nh *fib_nh;
};
2250
a7ff87ac
JP
2251struct mlxsw_sp_nexthop {
2252 struct list_head neigh_list_node; /* member of neigh entry list */
9665b745 2253 struct list_head rif_list_node;
dbe4598c 2254 struct list_head router_list_node;
a7ff87ac
JP
2255 struct mlxsw_sp_nexthop_group *nh_grp; /* pointer back to the group
2256 * this belongs to
2257 */
c53b8e1b
IS
2258 struct rhash_head ht_node;
2259 struct mlxsw_sp_nexthop_key key;
58adf2c4 2260 unsigned char gw_addr[sizeof(struct in6_addr)];
e6f3b379 2261 int ifindex;
408bd946 2262 int nh_weight;
eb789980
IS
2263 int norm_nh_weight;
2264 int num_adj_entries;
bf95233e 2265 struct mlxsw_sp_rif *rif;
a7ff87ac
JP
2266 u8 should_offload:1, /* set indicates this neigh is connected and
2267 * should be put to KVD linear area of this group.
2268 */
2269 offloaded:1, /* set in case the neigh is actually put into
2270 * KVD linear area of this group.
2271 */
2272 update:1; /* set indicates that MAC of this neigh should be
2273 * updated in HW
2274 */
35225e47
PM
2275 enum mlxsw_sp_nexthop_type type;
2276 union {
2277 struct mlxsw_sp_neigh_entry *neigh_entry;
1012b9ac 2278 struct mlxsw_sp_ipip_entry *ipip_entry;
35225e47 2279 };
a5390278
AS
2280 unsigned int counter_index;
2281 bool counter_valid;
a7ff87ac
JP
2282};
2283
2284struct mlxsw_sp_nexthop_group {
ba31d366 2285 void *priv;
e9ad5e7d 2286 struct rhash_head ht_node;
a7ff87ac 2287 struct list_head fib_list; /* list of fib entries that use this group */
58adf2c4 2288 struct neigh_table *neigh_tbl;
b3e8d1eb
IS
2289 u8 adj_index_valid:1,
2290 gateway:1; /* routes using the group use a gateway */
a7ff87ac
JP
2291 u32 adj_index;
2292 u16 ecmp_size;
2293 u16 count;
eb789980 2294 int sum_norm_weight;
a7ff87ac 2295 struct mlxsw_sp_nexthop nexthops[0];
bf95233e 2296#define nh_rif nexthops[0].rif
a7ff87ac
JP
2297};
2298
427e652a
AS
2299void mlxsw_sp_nexthop_counter_alloc(struct mlxsw_sp *mlxsw_sp,
2300 struct mlxsw_sp_nexthop *nh)
a5390278
AS
2301{
2302 struct devlink *devlink;
2303
2304 devlink = priv_to_devlink(mlxsw_sp->core);
2305 if (!devlink_dpipe_table_counter_enabled(devlink,
2306 MLXSW_SP_DPIPE_TABLE_NAME_ADJ))
2307 return;
2308
2309 if (mlxsw_sp_flow_counter_alloc(mlxsw_sp, &nh->counter_index))
2310 return;
2311
2312 nh->counter_valid = true;
2313}
2314
427e652a
AS
2315void mlxsw_sp_nexthop_counter_free(struct mlxsw_sp *mlxsw_sp,
2316 struct mlxsw_sp_nexthop *nh)
a5390278
AS
2317{
2318 if (!nh->counter_valid)
2319 return;
2320 mlxsw_sp_flow_counter_free(mlxsw_sp, nh->counter_index);
2321 nh->counter_valid = false;
2322}
2323
2324int mlxsw_sp_nexthop_counter_get(struct mlxsw_sp *mlxsw_sp,
2325 struct mlxsw_sp_nexthop *nh, u64 *p_counter)
2326{
2327 if (!nh->counter_valid)
2328 return -EINVAL;
2329
2330 return mlxsw_sp_flow_counter_get(mlxsw_sp, nh->counter_index,
2331 p_counter, NULL);
2332}
2333
c556cd28
AS
2334struct mlxsw_sp_nexthop *mlxsw_sp_nexthop_next(struct mlxsw_sp_router *router,
2335 struct mlxsw_sp_nexthop *nh)
2336{
2337 if (!nh) {
2338 if (list_empty(&router->nexthop_list))
2339 return NULL;
2340 else
2341 return list_first_entry(&router->nexthop_list,
2342 typeof(*nh), router_list_node);
2343 }
2344 if (list_is_last(&nh->router_list_node, &router->nexthop_list))
2345 return NULL;
2346 return list_next_entry(nh, router_list_node);
2347}
2348
2349bool mlxsw_sp_nexthop_offload(struct mlxsw_sp_nexthop *nh)
2350{
2351 return nh->offloaded;
2352}
2353
2354unsigned char *mlxsw_sp_nexthop_ha(struct mlxsw_sp_nexthop *nh)
2355{
2356 if (!nh->offloaded)
2357 return NULL;
2358 return nh->neigh_entry->ha;
2359}
2360
2361int mlxsw_sp_nexthop_indexes(struct mlxsw_sp_nexthop *nh, u32 *p_adj_index,
e69cd9d7 2362 u32 *p_adj_size, u32 *p_adj_hash_index)
c556cd28
AS
2363{
2364 struct mlxsw_sp_nexthop_group *nh_grp = nh->nh_grp;
2365 u32 adj_hash_index = 0;
2366 int i;
2367
2368 if (!nh->offloaded || !nh_grp->adj_index_valid)
2369 return -EINVAL;
2370
2371 *p_adj_index = nh_grp->adj_index;
e69cd9d7 2372 *p_adj_size = nh_grp->ecmp_size;
c556cd28
AS
2373
2374 for (i = 0; i < nh_grp->count; i++) {
2375 struct mlxsw_sp_nexthop *nh_iter = &nh_grp->nexthops[i];
2376
2377 if (nh_iter == nh)
2378 break;
2379 if (nh_iter->offloaded)
eb789980 2380 adj_hash_index += nh_iter->num_adj_entries;
c556cd28
AS
2381 }
2382
2383 *p_adj_hash_index = adj_hash_index;
2384 return 0;
2385}
2386
2387struct mlxsw_sp_rif *mlxsw_sp_nexthop_rif(struct mlxsw_sp_nexthop *nh)
2388{
2389 return nh->rif;
2390}
2391
2392bool mlxsw_sp_nexthop_group_has_ipip(struct mlxsw_sp_nexthop *nh)
2393{
2394 struct mlxsw_sp_nexthop_group *nh_grp = nh->nh_grp;
2395 int i;
2396
2397 for (i = 0; i < nh_grp->count; i++) {
2398 struct mlxsw_sp_nexthop *nh_iter = &nh_grp->nexthops[i];
2399
2400 if (nh_iter->type == MLXSW_SP_NEXTHOP_TYPE_IPIP)
2401 return true;
2402 }
2403 return false;
2404}
2405
ba31d366
AS
2406static struct fib_info *
2407mlxsw_sp_nexthop4_group_fi(const struct mlxsw_sp_nexthop_group *nh_grp)
2408{
2409 return nh_grp->priv;
2410}
2411
2412struct mlxsw_sp_nexthop_group_cmp_arg {
e6f3b379
AS
2413 enum mlxsw_sp_l3proto proto;
2414 union {
2415 struct fib_info *fi;
2416 struct mlxsw_sp_fib6_entry *fib6_entry;
2417 };
ba31d366
AS
2418};
2419
e6f3b379
AS
2420static bool
2421mlxsw_sp_nexthop6_group_has_nexthop(const struct mlxsw_sp_nexthop_group *nh_grp,
2422 const struct in6_addr *gw, int ifindex)
2423{
2424 int i;
2425
2426 for (i = 0; i < nh_grp->count; i++) {
2427 const struct mlxsw_sp_nexthop *nh;
2428
2429 nh = &nh_grp->nexthops[i];
2430 if (nh->ifindex == ifindex &&
2431 ipv6_addr_equal(gw, (struct in6_addr *) nh->gw_addr))
2432 return true;
2433 }
2434
2435 return false;
2436}
2437
2438static bool
2439mlxsw_sp_nexthop6_group_cmp(const struct mlxsw_sp_nexthop_group *nh_grp,
2440 const struct mlxsw_sp_fib6_entry *fib6_entry)
2441{
2442 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
2443
2444 if (nh_grp->count != fib6_entry->nrt6)
2445 return false;
2446
2447 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
2448 struct in6_addr *gw;
2449 int ifindex;
2450
2451 ifindex = mlxsw_sp_rt6->rt->dst.dev->ifindex;
2452 gw = &mlxsw_sp_rt6->rt->rt6i_gateway;
2453 if (!mlxsw_sp_nexthop6_group_has_nexthop(nh_grp, gw, ifindex))
2454 return false;
2455 }
2456
2457 return true;
2458}
2459
ba31d366
AS
2460static int
2461mlxsw_sp_nexthop_group_cmp(struct rhashtable_compare_arg *arg, const void *ptr)
2462{
2463 const struct mlxsw_sp_nexthop_group_cmp_arg *cmp_arg = arg->key;
2464 const struct mlxsw_sp_nexthop_group *nh_grp = ptr;
2465
e6f3b379
AS
2466 switch (cmp_arg->proto) {
2467 case MLXSW_SP_L3_PROTO_IPV4:
2468 return cmp_arg->fi != mlxsw_sp_nexthop4_group_fi(nh_grp);
2469 case MLXSW_SP_L3_PROTO_IPV6:
2470 return !mlxsw_sp_nexthop6_group_cmp(nh_grp,
2471 cmp_arg->fib6_entry);
2472 default:
2473 WARN_ON(1);
2474 return 1;
2475 }
2476}
2477
2478static int
2479mlxsw_sp_nexthop_group_type(const struct mlxsw_sp_nexthop_group *nh_grp)
2480{
2481 return nh_grp->neigh_tbl->family;
ba31d366
AS
2482}
2483
2484static u32 mlxsw_sp_nexthop_group_hash_obj(const void *data, u32 len, u32 seed)
2485{
2486 const struct mlxsw_sp_nexthop_group *nh_grp = data;
e6f3b379
AS
2487 const struct mlxsw_sp_nexthop *nh;
2488 struct fib_info *fi;
2489 unsigned int val;
2490 int i;
ba31d366 2491
e6f3b379
AS
2492 switch (mlxsw_sp_nexthop_group_type(nh_grp)) {
2493 case AF_INET:
2494 fi = mlxsw_sp_nexthop4_group_fi(nh_grp);
2495 return jhash(&fi, sizeof(fi), seed);
2496 case AF_INET6:
2497 val = nh_grp->count;
2498 for (i = 0; i < nh_grp->count; i++) {
2499 nh = &nh_grp->nexthops[i];
2500 val ^= nh->ifindex;
2501 }
2502 return jhash(&val, sizeof(val), seed);
2503 default:
2504 WARN_ON(1);
2505 return 0;
2506 }
2507}
2508
2509static u32
2510mlxsw_sp_nexthop6_group_hash(struct mlxsw_sp_fib6_entry *fib6_entry, u32 seed)
2511{
2512 unsigned int val = fib6_entry->nrt6;
2513 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
2514 struct net_device *dev;
2515
2516 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
2517 dev = mlxsw_sp_rt6->rt->dst.dev;
2518 val ^= dev->ifindex;
2519 }
2520
2521 return jhash(&val, sizeof(val), seed);
ba31d366
AS
2522}
2523
2524static u32
2525mlxsw_sp_nexthop_group_hash(const void *data, u32 len, u32 seed)
2526{
2527 const struct mlxsw_sp_nexthop_group_cmp_arg *cmp_arg = data;
2528
e6f3b379
AS
2529 switch (cmp_arg->proto) {
2530 case MLXSW_SP_L3_PROTO_IPV4:
2531 return jhash(&cmp_arg->fi, sizeof(cmp_arg->fi), seed);
2532 case MLXSW_SP_L3_PROTO_IPV6:
2533 return mlxsw_sp_nexthop6_group_hash(cmp_arg->fib6_entry, seed);
2534 default:
2535 WARN_ON(1);
2536 return 0;
2537 }
ba31d366
AS
2538}
2539
e9ad5e7d 2540static const struct rhashtable_params mlxsw_sp_nexthop_group_ht_params = {
e9ad5e7d 2541 .head_offset = offsetof(struct mlxsw_sp_nexthop_group, ht_node),
ba31d366
AS
2542 .hashfn = mlxsw_sp_nexthop_group_hash,
2543 .obj_hashfn = mlxsw_sp_nexthop_group_hash_obj,
2544 .obj_cmpfn = mlxsw_sp_nexthop_group_cmp,
e9ad5e7d
IS
2545};
2546
2547static int mlxsw_sp_nexthop_group_insert(struct mlxsw_sp *mlxsw_sp,
2548 struct mlxsw_sp_nexthop_group *nh_grp)
2549{
e6f3b379
AS
2550 if (mlxsw_sp_nexthop_group_type(nh_grp) == AF_INET6 &&
2551 !nh_grp->gateway)
2552 return 0;
2553
9011b677 2554 return rhashtable_insert_fast(&mlxsw_sp->router->nexthop_group_ht,
e9ad5e7d
IS
2555 &nh_grp->ht_node,
2556 mlxsw_sp_nexthop_group_ht_params);
2557}
2558
2559static void mlxsw_sp_nexthop_group_remove(struct mlxsw_sp *mlxsw_sp,
2560 struct mlxsw_sp_nexthop_group *nh_grp)
2561{
e6f3b379
AS
2562 if (mlxsw_sp_nexthop_group_type(nh_grp) == AF_INET6 &&
2563 !nh_grp->gateway)
2564 return;
2565
9011b677 2566 rhashtable_remove_fast(&mlxsw_sp->router->nexthop_group_ht,
e9ad5e7d
IS
2567 &nh_grp->ht_node,
2568 mlxsw_sp_nexthop_group_ht_params);
2569}
2570
2571static struct mlxsw_sp_nexthop_group *
ba31d366
AS
2572mlxsw_sp_nexthop4_group_lookup(struct mlxsw_sp *mlxsw_sp,
2573 struct fib_info *fi)
e9ad5e7d 2574{
ba31d366
AS
2575 struct mlxsw_sp_nexthop_group_cmp_arg cmp_arg;
2576
e6f3b379 2577 cmp_arg.proto = MLXSW_SP_L3_PROTO_IPV4;
ba31d366
AS
2578 cmp_arg.fi = fi;
2579 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_group_ht,
2580 &cmp_arg,
e9ad5e7d
IS
2581 mlxsw_sp_nexthop_group_ht_params);
2582}
2583
e6f3b379
AS
2584static struct mlxsw_sp_nexthop_group *
2585mlxsw_sp_nexthop6_group_lookup(struct mlxsw_sp *mlxsw_sp,
2586 struct mlxsw_sp_fib6_entry *fib6_entry)
2587{
2588 struct mlxsw_sp_nexthop_group_cmp_arg cmp_arg;
2589
2590 cmp_arg.proto = MLXSW_SP_L3_PROTO_IPV6;
2591 cmp_arg.fib6_entry = fib6_entry;
2592 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_group_ht,
2593 &cmp_arg,
2594 mlxsw_sp_nexthop_group_ht_params);
2595}
2596
c53b8e1b
IS
2597static const struct rhashtable_params mlxsw_sp_nexthop_ht_params = {
2598 .key_offset = offsetof(struct mlxsw_sp_nexthop, key),
2599 .head_offset = offsetof(struct mlxsw_sp_nexthop, ht_node),
2600 .key_len = sizeof(struct mlxsw_sp_nexthop_key),
2601};
2602
2603static int mlxsw_sp_nexthop_insert(struct mlxsw_sp *mlxsw_sp,
2604 struct mlxsw_sp_nexthop *nh)
2605{
9011b677 2606 return rhashtable_insert_fast(&mlxsw_sp->router->nexthop_ht,
c53b8e1b
IS
2607 &nh->ht_node, mlxsw_sp_nexthop_ht_params);
2608}
2609
2610static void mlxsw_sp_nexthop_remove(struct mlxsw_sp *mlxsw_sp,
2611 struct mlxsw_sp_nexthop *nh)
2612{
9011b677 2613 rhashtable_remove_fast(&mlxsw_sp->router->nexthop_ht, &nh->ht_node,
c53b8e1b
IS
2614 mlxsw_sp_nexthop_ht_params);
2615}
2616
ad178c8e
IS
2617static struct mlxsw_sp_nexthop *
2618mlxsw_sp_nexthop_lookup(struct mlxsw_sp *mlxsw_sp,
2619 struct mlxsw_sp_nexthop_key key)
2620{
9011b677 2621 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_ht, &key,
ad178c8e
IS
2622 mlxsw_sp_nexthop_ht_params);
2623}
2624
a7ff87ac 2625static int mlxsw_sp_adj_index_mass_update_vr(struct mlxsw_sp *mlxsw_sp,
76610ebb 2626 const struct mlxsw_sp_fib *fib,
a7ff87ac
JP
2627 u32 adj_index, u16 ecmp_size,
2628 u32 new_adj_index,
2629 u16 new_ecmp_size)
2630{
2631 char raleu_pl[MLXSW_REG_RALEU_LEN];
2632
1a9234e6 2633 mlxsw_reg_raleu_pack(raleu_pl,
76610ebb
IS
2634 (enum mlxsw_reg_ralxx_protocol) fib->proto,
2635 fib->vr->id, adj_index, ecmp_size, new_adj_index,
1a9234e6 2636 new_ecmp_size);
a7ff87ac
JP
2637 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raleu), raleu_pl);
2638}
2639
2640static int mlxsw_sp_adj_index_mass_update(struct mlxsw_sp *mlxsw_sp,
2641 struct mlxsw_sp_nexthop_group *nh_grp,
2642 u32 old_adj_index, u16 old_ecmp_size)
2643{
2644 struct mlxsw_sp_fib_entry *fib_entry;
76610ebb 2645 struct mlxsw_sp_fib *fib = NULL;
a7ff87ac
JP
2646 int err;
2647
2648 list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) {
76610ebb 2649 if (fib == fib_entry->fib_node->fib)
a7ff87ac 2650 continue;
76610ebb
IS
2651 fib = fib_entry->fib_node->fib;
2652 err = mlxsw_sp_adj_index_mass_update_vr(mlxsw_sp, fib,
a7ff87ac
JP
2653 old_adj_index,
2654 old_ecmp_size,
2655 nh_grp->adj_index,
2656 nh_grp->ecmp_size);
2657 if (err)
2658 return err;
2659 }
2660 return 0;
2661}
2662
eb789980
IS
2663static int __mlxsw_sp_nexthop_update(struct mlxsw_sp *mlxsw_sp, u32 adj_index,
2664 struct mlxsw_sp_nexthop *nh)
a7ff87ac
JP
2665{
2666 struct mlxsw_sp_neigh_entry *neigh_entry = nh->neigh_entry;
2667 char ratr_pl[MLXSW_REG_RATR_LEN];
2668
2669 mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY,
89e41982
PM
2670 true, MLXSW_REG_RATR_TYPE_ETHERNET,
2671 adj_index, neigh_entry->rif);
a7ff87ac 2672 mlxsw_reg_ratr_eth_entry_pack(ratr_pl, neigh_entry->ha);
a5390278
AS
2673 if (nh->counter_valid)
2674 mlxsw_reg_ratr_counter_pack(ratr_pl, nh->counter_index, true);
2675 else
2676 mlxsw_reg_ratr_counter_pack(ratr_pl, 0, false);
2677
a7ff87ac
JP
2678 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl);
2679}
2680
eb789980
IS
2681int mlxsw_sp_nexthop_update(struct mlxsw_sp *mlxsw_sp, u32 adj_index,
2682 struct mlxsw_sp_nexthop *nh)
2683{
2684 int i;
2685
2686 for (i = 0; i < nh->num_adj_entries; i++) {
2687 int err;
2688
2689 err = __mlxsw_sp_nexthop_update(mlxsw_sp, adj_index + i, nh);
2690 if (err)
2691 return err;
2692 }
2693
2694 return 0;
2695}
2696
2697static int __mlxsw_sp_nexthop_ipip_update(struct mlxsw_sp *mlxsw_sp,
2698 u32 adj_index,
2699 struct mlxsw_sp_nexthop *nh)
1012b9ac
PM
2700{
2701 const struct mlxsw_sp_ipip_ops *ipip_ops;
2702
2703 ipip_ops = mlxsw_sp->router->ipip_ops_arr[nh->ipip_entry->ipipt];
2704 return ipip_ops->nexthop_update(mlxsw_sp, adj_index, nh->ipip_entry);
2705}
2706
eb789980
IS
2707static int mlxsw_sp_nexthop_ipip_update(struct mlxsw_sp *mlxsw_sp,
2708 u32 adj_index,
2709 struct mlxsw_sp_nexthop *nh)
2710{
2711 int i;
2712
2713 for (i = 0; i < nh->num_adj_entries; i++) {
2714 int err;
2715
2716 err = __mlxsw_sp_nexthop_ipip_update(mlxsw_sp, adj_index + i,
2717 nh);
2718 if (err)
2719 return err;
2720 }
2721
2722 return 0;
2723}
2724
a7ff87ac 2725static int
35225e47
PM
2726mlxsw_sp_nexthop_group_update(struct mlxsw_sp *mlxsw_sp,
2727 struct mlxsw_sp_nexthop_group *nh_grp,
2728 bool reallocate)
a7ff87ac
JP
2729{
2730 u32 adj_index = nh_grp->adj_index; /* base */
2731 struct mlxsw_sp_nexthop *nh;
2732 int i;
2733 int err;
2734
2735 for (i = 0; i < nh_grp->count; i++) {
2736 nh = &nh_grp->nexthops[i];
2737
2738 if (!nh->should_offload) {
2739 nh->offloaded = 0;
2740 continue;
2741 }
2742
a59b7e02 2743 if (nh->update || reallocate) {
35225e47
PM
2744 switch (nh->type) {
2745 case MLXSW_SP_NEXTHOP_TYPE_ETH:
a5390278 2746 err = mlxsw_sp_nexthop_update
35225e47
PM
2747 (mlxsw_sp, adj_index, nh);
2748 break;
1012b9ac
PM
2749 case MLXSW_SP_NEXTHOP_TYPE_IPIP:
2750 err = mlxsw_sp_nexthop_ipip_update
2751 (mlxsw_sp, adj_index, nh);
2752 break;
35225e47 2753 }
a7ff87ac
JP
2754 if (err)
2755 return err;
2756 nh->update = 0;
2757 nh->offloaded = 1;
2758 }
eb789980 2759 adj_index += nh->num_adj_entries;
a7ff87ac
JP
2760 }
2761 return 0;
2762}
2763
1819ae3d
IS
2764static bool
2765mlxsw_sp_fib_node_entry_is_first(const struct mlxsw_sp_fib_node *fib_node,
2766 const struct mlxsw_sp_fib_entry *fib_entry);
2767
a7ff87ac
JP
2768static int
2769mlxsw_sp_nexthop_fib_entries_update(struct mlxsw_sp *mlxsw_sp,
2770 struct mlxsw_sp_nexthop_group *nh_grp)
2771{
2772 struct mlxsw_sp_fib_entry *fib_entry;
2773 int err;
2774
2775 list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) {
1819ae3d
IS
2776 if (!mlxsw_sp_fib_node_entry_is_first(fib_entry->fib_node,
2777 fib_entry))
2778 continue;
a7ff87ac
JP
2779 err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
2780 if (err)
2781 return err;
2782 }
2783 return 0;
2784}
2785
77d964e6
IS
2786static void
2787mlxsw_sp_fib_entry_offload_refresh(struct mlxsw_sp_fib_entry *fib_entry,
2788 enum mlxsw_reg_ralue_op op, int err);
2789
2790static void
2791mlxsw_sp_nexthop_fib_entries_refresh(struct mlxsw_sp_nexthop_group *nh_grp)
2792{
2793 enum mlxsw_reg_ralue_op op = MLXSW_REG_RALUE_OP_WRITE_WRITE;
2794 struct mlxsw_sp_fib_entry *fib_entry;
2795
2796 list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) {
2797 if (!mlxsw_sp_fib_node_entry_is_first(fib_entry->fib_node,
2798 fib_entry))
2799 continue;
2800 mlxsw_sp_fib_entry_offload_refresh(fib_entry, op, 0);
2801 }
2802}
2803
425a08c6
IS
2804static void mlxsw_sp_adj_grp_size_round_up(u16 *p_adj_grp_size)
2805{
2806 /* Valid sizes for an adjacency group are:
2807 * 1-64, 512, 1024, 2048 and 4096.
2808 */
2809 if (*p_adj_grp_size <= 64)
2810 return;
2811 else if (*p_adj_grp_size <= 512)
2812 *p_adj_grp_size = 512;
2813 else if (*p_adj_grp_size <= 1024)
2814 *p_adj_grp_size = 1024;
2815 else if (*p_adj_grp_size <= 2048)
2816 *p_adj_grp_size = 2048;
2817 else
2818 *p_adj_grp_size = 4096;
2819}
2820
2821static void mlxsw_sp_adj_grp_size_round_down(u16 *p_adj_grp_size,
2822 unsigned int alloc_size)
2823{
2824 if (alloc_size >= 4096)
2825 *p_adj_grp_size = 4096;
2826 else if (alloc_size >= 2048)
2827 *p_adj_grp_size = 2048;
2828 else if (alloc_size >= 1024)
2829 *p_adj_grp_size = 1024;
2830 else if (alloc_size >= 512)
2831 *p_adj_grp_size = 512;
2832}
2833
2834static int mlxsw_sp_fix_adj_grp_size(struct mlxsw_sp *mlxsw_sp,
2835 u16 *p_adj_grp_size)
2836{
2837 unsigned int alloc_size;
2838 int err;
2839
2840 /* Round up the requested group size to the next size supported
2841 * by the device and make sure the request can be satisfied.
2842 */
2843 mlxsw_sp_adj_grp_size_round_up(p_adj_grp_size);
2844 err = mlxsw_sp_kvdl_alloc_size_query(mlxsw_sp, *p_adj_grp_size,
2845 &alloc_size);
2846 if (err)
2847 return err;
2848 /* It is possible the allocation results in more allocated
2849 * entries than requested. Try to use as much of them as
2850 * possible.
2851 */
2852 mlxsw_sp_adj_grp_size_round_down(p_adj_grp_size, alloc_size);
2853
2854 return 0;
2855}
2856
eb789980
IS
2857static void
2858mlxsw_sp_nexthop_group_normalize(struct mlxsw_sp_nexthop_group *nh_grp)
2859{
2860 int i, g = 0, sum_norm_weight = 0;
2861 struct mlxsw_sp_nexthop *nh;
2862
2863 for (i = 0; i < nh_grp->count; i++) {
2864 nh = &nh_grp->nexthops[i];
2865
2866 if (!nh->should_offload)
2867 continue;
2868 if (g > 0)
2869 g = gcd(nh->nh_weight, g);
2870 else
2871 g = nh->nh_weight;
2872 }
2873
2874 for (i = 0; i < nh_grp->count; i++) {
2875 nh = &nh_grp->nexthops[i];
2876
2877 if (!nh->should_offload)
2878 continue;
2879 nh->norm_nh_weight = nh->nh_weight / g;
2880 sum_norm_weight += nh->norm_nh_weight;
2881 }
2882
2883 nh_grp->sum_norm_weight = sum_norm_weight;
2884}
2885
2886static void
2887mlxsw_sp_nexthop_group_rebalance(struct mlxsw_sp_nexthop_group *nh_grp)
2888{
2889 int total = nh_grp->sum_norm_weight;
2890 u16 ecmp_size = nh_grp->ecmp_size;
2891 int i, weight = 0, lower_bound = 0;
2892
2893 for (i = 0; i < nh_grp->count; i++) {
2894 struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
2895 int upper_bound;
2896
2897 if (!nh->should_offload)
2898 continue;
2899 weight += nh->norm_nh_weight;
2900 upper_bound = DIV_ROUND_CLOSEST(ecmp_size * weight, total);
2901 nh->num_adj_entries = upper_bound - lower_bound;
2902 lower_bound = upper_bound;
2903 }
2904}
2905
a7ff87ac
JP
2906static void
2907mlxsw_sp_nexthop_group_refresh(struct mlxsw_sp *mlxsw_sp,
2908 struct mlxsw_sp_nexthop_group *nh_grp)
2909{
eb789980 2910 u16 ecmp_size, old_ecmp_size;
a7ff87ac
JP
2911 struct mlxsw_sp_nexthop *nh;
2912 bool offload_change = false;
2913 u32 adj_index;
a7ff87ac
JP
2914 bool old_adj_index_valid;
2915 u32 old_adj_index;
a7ff87ac
JP
2916 int i;
2917 int err;
2918
b3e8d1eb
IS
2919 if (!nh_grp->gateway) {
2920 mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp);
2921 return;
2922 }
2923
a7ff87ac
JP
2924 for (i = 0; i < nh_grp->count; i++) {
2925 nh = &nh_grp->nexthops[i];
2926
56b8a9ed 2927 if (nh->should_offload != nh->offloaded) {
a7ff87ac
JP
2928 offload_change = true;
2929 if (nh->should_offload)
2930 nh->update = 1;
2931 }
a7ff87ac
JP
2932 }
2933 if (!offload_change) {
2934 /* Nothing was added or removed, so no need to reallocate. Just
2935 * update MAC on existing adjacency indexes.
2936 */
35225e47 2937 err = mlxsw_sp_nexthop_group_update(mlxsw_sp, nh_grp, false);
a7ff87ac
JP
2938 if (err) {
2939 dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n");
2940 goto set_trap;
2941 }
2942 return;
2943 }
eb789980
IS
2944 mlxsw_sp_nexthop_group_normalize(nh_grp);
2945 if (!nh_grp->sum_norm_weight)
a7ff87ac
JP
2946 /* No neigh of this group is connected so we just set
2947 * the trap and let everthing flow through kernel.
2948 */
2949 goto set_trap;
2950
eb789980 2951 ecmp_size = nh_grp->sum_norm_weight;
425a08c6
IS
2952 err = mlxsw_sp_fix_adj_grp_size(mlxsw_sp, &ecmp_size);
2953 if (err)
2954 /* No valid allocation size available. */
2955 goto set_trap;
2956
13124443
AS
2957 err = mlxsw_sp_kvdl_alloc(mlxsw_sp, ecmp_size, &adj_index);
2958 if (err) {
a7ff87ac
JP
2959 /* We ran out of KVD linear space, just set the
2960 * trap and let everything flow through kernel.
2961 */
2962 dev_warn(mlxsw_sp->bus_info->dev, "Failed to allocate KVD linear area for nexthop group.\n");
2963 goto set_trap;
2964 }
a7ff87ac
JP
2965 old_adj_index_valid = nh_grp->adj_index_valid;
2966 old_adj_index = nh_grp->adj_index;
2967 old_ecmp_size = nh_grp->ecmp_size;
2968 nh_grp->adj_index_valid = 1;
2969 nh_grp->adj_index = adj_index;
2970 nh_grp->ecmp_size = ecmp_size;
eb789980 2971 mlxsw_sp_nexthop_group_rebalance(nh_grp);
35225e47 2972 err = mlxsw_sp_nexthop_group_update(mlxsw_sp, nh_grp, true);
a7ff87ac
JP
2973 if (err) {
2974 dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n");
2975 goto set_trap;
2976 }
2977
2978 if (!old_adj_index_valid) {
2979 /* The trap was set for fib entries, so we have to call
2980 * fib entry update to unset it and use adjacency index.
2981 */
2982 err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp);
2983 if (err) {
2984 dev_warn(mlxsw_sp->bus_info->dev, "Failed to add adjacency index to fib entries.\n");
2985 goto set_trap;
2986 }
2987 return;
2988 }
2989
2990 err = mlxsw_sp_adj_index_mass_update(mlxsw_sp, nh_grp,
2991 old_adj_index, old_ecmp_size);
2992 mlxsw_sp_kvdl_free(mlxsw_sp, old_adj_index);
2993 if (err) {
2994 dev_warn(mlxsw_sp->bus_info->dev, "Failed to mass-update adjacency index for nexthop group.\n");
2995 goto set_trap;
2996 }
77d964e6
IS
2997
2998 /* Offload state within the group changed, so update the flags. */
2999 mlxsw_sp_nexthop_fib_entries_refresh(nh_grp);
3000
a7ff87ac
JP
3001 return;
3002
3003set_trap:
3004 old_adj_index_valid = nh_grp->adj_index_valid;
3005 nh_grp->adj_index_valid = 0;
3006 for (i = 0; i < nh_grp->count; i++) {
3007 nh = &nh_grp->nexthops[i];
3008 nh->offloaded = 0;
3009 }
3010 err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp);
3011 if (err)
3012 dev_warn(mlxsw_sp->bus_info->dev, "Failed to set traps for fib entries.\n");
3013 if (old_adj_index_valid)
3014 mlxsw_sp_kvdl_free(mlxsw_sp, nh_grp->adj_index);
3015}
3016
3017static void __mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp_nexthop *nh,
3018 bool removing)
3019{
213666a3 3020 if (!removing)
a7ff87ac 3021 nh->should_offload = 1;
213666a3 3022 else if (nh->offloaded)
a7ff87ac
JP
3023 nh->should_offload = 0;
3024 nh->update = 1;
3025}
3026
3027static void
3028mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp,
3029 struct mlxsw_sp_neigh_entry *neigh_entry,
3030 bool removing)
3031{
3032 struct mlxsw_sp_nexthop *nh;
3033
a7ff87ac
JP
3034 list_for_each_entry(nh, &neigh_entry->nexthop_list,
3035 neigh_list_node) {
3036 __mlxsw_sp_nexthop_neigh_update(nh, removing);
3037 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
3038 }
a7ff87ac
JP
3039}
3040
9665b745 3041static void mlxsw_sp_nexthop_rif_init(struct mlxsw_sp_nexthop *nh,
bf95233e 3042 struct mlxsw_sp_rif *rif)
9665b745 3043{
bf95233e 3044 if (nh->rif)
9665b745
IS
3045 return;
3046
bf95233e
AS
3047 nh->rif = rif;
3048 list_add(&nh->rif_list_node, &rif->nexthop_list);
9665b745
IS
3049}
3050
3051static void mlxsw_sp_nexthop_rif_fini(struct mlxsw_sp_nexthop *nh)
3052{
bf95233e 3053 if (!nh->rif)
9665b745
IS
3054 return;
3055
3056 list_del(&nh->rif_list_node);
bf95233e 3057 nh->rif = NULL;
9665b745
IS
3058}
3059
a8c97014
IS
3060static int mlxsw_sp_nexthop_neigh_init(struct mlxsw_sp *mlxsw_sp,
3061 struct mlxsw_sp_nexthop *nh)
a7ff87ac
JP
3062{
3063 struct mlxsw_sp_neigh_entry *neigh_entry;
a7ff87ac 3064 struct neighbour *n;
93a87e5e 3065 u8 nud_state, dead;
c53b8e1b
IS
3066 int err;
3067
ad178c8e 3068 if (!nh->nh_grp->gateway || nh->neigh_entry)
b8399a1e
IS
3069 return 0;
3070
33b1341c 3071 /* Take a reference of neigh here ensuring that neigh would
8de3c178 3072 * not be destructed before the nexthop entry is finished.
33b1341c 3073 * The reference is taken either in neigh_lookup() or
fd76d910 3074 * in neigh_create() in case n is not found.
33b1341c 3075 */
58adf2c4 3076 n = neigh_lookup(nh->nh_grp->neigh_tbl, &nh->gw_addr, nh->rif->dev);
33b1341c 3077 if (!n) {
58adf2c4
IS
3078 n = neigh_create(nh->nh_grp->neigh_tbl, &nh->gw_addr,
3079 nh->rif->dev);
a8c97014
IS
3080 if (IS_ERR(n))
3081 return PTR_ERR(n);
a7ff87ac 3082 neigh_event_send(n, NULL);
33b1341c
JP
3083 }
3084 neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, n);
3085 if (!neigh_entry) {
5c8802f1
IS
3086 neigh_entry = mlxsw_sp_neigh_entry_create(mlxsw_sp, n);
3087 if (IS_ERR(neigh_entry)) {
c53b8e1b
IS
3088 err = -EINVAL;
3089 goto err_neigh_entry_create;
5c8802f1 3090 }
a7ff87ac 3091 }
b2157149
YG
3092
3093 /* If that is the first nexthop connected to that neigh, add to
3094 * nexthop_neighs_list
3095 */
3096 if (list_empty(&neigh_entry->nexthop_list))
3097 list_add_tail(&neigh_entry->nexthop_neighs_list_node,
9011b677 3098 &mlxsw_sp->router->nexthop_neighs_list);
b2157149 3099
a7ff87ac
JP
3100 nh->neigh_entry = neigh_entry;
3101 list_add_tail(&nh->neigh_list_node, &neigh_entry->nexthop_list);
3102 read_lock_bh(&n->lock);
3103 nud_state = n->nud_state;
93a87e5e 3104 dead = n->dead;
a7ff87ac 3105 read_unlock_bh(&n->lock);
93a87e5e 3106 __mlxsw_sp_nexthop_neigh_update(nh, !(nud_state & NUD_VALID && !dead));
a7ff87ac
JP
3107
3108 return 0;
c53b8e1b
IS
3109
3110err_neigh_entry_create:
3111 neigh_release(n);
c53b8e1b 3112 return err;
a7ff87ac
JP
3113}
3114
a8c97014
IS
3115static void mlxsw_sp_nexthop_neigh_fini(struct mlxsw_sp *mlxsw_sp,
3116 struct mlxsw_sp_nexthop *nh)
a7ff87ac
JP
3117{
3118 struct mlxsw_sp_neigh_entry *neigh_entry = nh->neigh_entry;
a8c97014 3119 struct neighbour *n;
a7ff87ac 3120
b8399a1e 3121 if (!neigh_entry)
a8c97014
IS
3122 return;
3123 n = neigh_entry->key.n;
b8399a1e 3124
58312125 3125 __mlxsw_sp_nexthop_neigh_update(nh, true);
a7ff87ac 3126 list_del(&nh->neigh_list_node);
e58be79e 3127 nh->neigh_entry = NULL;
b2157149
YG
3128
3129 /* If that is the last nexthop connected to that neigh, remove from
3130 * nexthop_neighs_list
3131 */
e58be79e
IS
3132 if (list_empty(&neigh_entry->nexthop_list))
3133 list_del(&neigh_entry->nexthop_neighs_list_node);
b2157149 3134
5c8802f1
IS
3135 if (!neigh_entry->connected && list_empty(&neigh_entry->nexthop_list))
3136 mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry);
3137
3138 neigh_release(n);
a8c97014 3139}
c53b8e1b 3140
1012b9ac 3141static int mlxsw_sp_nexthop_ipip_init(struct mlxsw_sp *mlxsw_sp,
1012b9ac
PM
3142 struct mlxsw_sp_nexthop *nh,
3143 struct net_device *ol_dev)
3144{
3145 if (!nh->nh_grp->gateway || nh->ipip_entry)
3146 return 0;
3147
4cccb737
PM
3148 nh->ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
3149 if (!nh->ipip_entry)
3150 return -ENOENT;
1012b9ac
PM
3151
3152 __mlxsw_sp_nexthop_neigh_update(nh, false);
3153 return 0;
3154}
3155
3156static void mlxsw_sp_nexthop_ipip_fini(struct mlxsw_sp *mlxsw_sp,
3157 struct mlxsw_sp_nexthop *nh)
3158{
3159 struct mlxsw_sp_ipip_entry *ipip_entry = nh->ipip_entry;
3160
3161 if (!ipip_entry)
3162 return;
3163
3164 __mlxsw_sp_nexthop_neigh_update(nh, true);
1012b9ac
PM
3165 nh->ipip_entry = NULL;
3166}
3167
3168static bool mlxsw_sp_nexthop4_ipip_type(const struct mlxsw_sp *mlxsw_sp,
3169 const struct fib_nh *fib_nh,
3170 enum mlxsw_sp_ipip_type *p_ipipt)
3171{
3172 struct net_device *dev = fib_nh->nh_dev;
3173
3174 return dev &&
3175 fib_nh->nh_parent->fib_type == RTN_UNICAST &&
3176 mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, p_ipipt);
3177}
3178
35225e47
PM
3179static void mlxsw_sp_nexthop_type_fini(struct mlxsw_sp *mlxsw_sp,
3180 struct mlxsw_sp_nexthop *nh)
3181{
3182 switch (nh->type) {
3183 case MLXSW_SP_NEXTHOP_TYPE_ETH:
3184 mlxsw_sp_nexthop_neigh_fini(mlxsw_sp, nh);
3185 mlxsw_sp_nexthop_rif_fini(nh);
3186 break;
1012b9ac 3187 case MLXSW_SP_NEXTHOP_TYPE_IPIP:
de0f43c0 3188 mlxsw_sp_nexthop_rif_fini(nh);
1012b9ac
PM
3189 mlxsw_sp_nexthop_ipip_fini(mlxsw_sp, nh);
3190 break;
35225e47
PM
3191 }
3192}
3193
3194static int mlxsw_sp_nexthop4_type_init(struct mlxsw_sp *mlxsw_sp,
3195 struct mlxsw_sp_nexthop *nh,
3196 struct fib_nh *fib_nh)
3197{
1012b9ac 3198 struct mlxsw_sp_router *router = mlxsw_sp->router;
35225e47 3199 struct net_device *dev = fib_nh->nh_dev;
1012b9ac 3200 enum mlxsw_sp_ipip_type ipipt;
35225e47
PM
3201 struct mlxsw_sp_rif *rif;
3202 int err;
3203
1012b9ac
PM
3204 if (mlxsw_sp_nexthop4_ipip_type(mlxsw_sp, fib_nh, &ipipt) &&
3205 router->ipip_ops_arr[ipipt]->can_offload(mlxsw_sp, dev,
3206 MLXSW_SP_L3_PROTO_IPV4)) {
3207 nh->type = MLXSW_SP_NEXTHOP_TYPE_IPIP;
4cccb737 3208 err = mlxsw_sp_nexthop_ipip_init(mlxsw_sp, nh, dev);
de0f43c0
PM
3209 if (err)
3210 return err;
3211 mlxsw_sp_nexthop_rif_init(nh, &nh->ipip_entry->ol_lb->common);
3212 return 0;
1012b9ac
PM
3213 }
3214
35225e47
PM
3215 nh->type = MLXSW_SP_NEXTHOP_TYPE_ETH;
3216 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
3217 if (!rif)
3218 return 0;
3219
3220 mlxsw_sp_nexthop_rif_init(nh, rif);
3221 err = mlxsw_sp_nexthop_neigh_init(mlxsw_sp, nh);
3222 if (err)
3223 goto err_neigh_init;
3224
3225 return 0;
3226
3227err_neigh_init:
3228 mlxsw_sp_nexthop_rif_fini(nh);
3229 return err;
3230}
3231
/* IPv4 counterpart of mlxsw_sp_nexthop4_type_init(); simply delegates to
 * the protocol-independent type teardown.
 */
static void mlxsw_sp_nexthop4_type_fini(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_nexthop *nh)
{
	mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh);
}
3237
0e6ea2a4
IS
3238static int mlxsw_sp_nexthop4_init(struct mlxsw_sp *mlxsw_sp,
3239 struct mlxsw_sp_nexthop_group *nh_grp,
3240 struct mlxsw_sp_nexthop *nh,
3241 struct fib_nh *fib_nh)
a8c97014
IS
3242{
3243 struct net_device *dev = fib_nh->nh_dev;
df6dd79b 3244 struct in_device *in_dev;
a8c97014
IS
3245 int err;
3246
3247 nh->nh_grp = nh_grp;
3248 nh->key.fib_nh = fib_nh;
408bd946
IS
3249#ifdef CONFIG_IP_ROUTE_MULTIPATH
3250 nh->nh_weight = fib_nh->nh_weight;
3251#else
3252 nh->nh_weight = 1;
3253#endif
58adf2c4 3254 memcpy(&nh->gw_addr, &fib_nh->nh_gw, sizeof(fib_nh->nh_gw));
a8c97014
IS
3255 err = mlxsw_sp_nexthop_insert(mlxsw_sp, nh);
3256 if (err)
3257 return err;
3258
a5390278 3259 mlxsw_sp_nexthop_counter_alloc(mlxsw_sp, nh);
dbe4598c
AS
3260 list_add_tail(&nh->router_list_node, &mlxsw_sp->router->nexthop_list);
3261
97989ee0
IS
3262 if (!dev)
3263 return 0;
3264
df6dd79b
IS
3265 in_dev = __in_dev_get_rtnl(dev);
3266 if (in_dev && IN_DEV_IGNORE_ROUTES_WITH_LINKDOWN(in_dev) &&
3267 fib_nh->nh_flags & RTNH_F_LINKDOWN)
3268 return 0;
3269
35225e47 3270 err = mlxsw_sp_nexthop4_type_init(mlxsw_sp, nh, fib_nh);
a8c97014
IS
3271 if (err)
3272 goto err_nexthop_neigh_init;
3273
3274 return 0;
3275
3276err_nexthop_neigh_init:
3277 mlxsw_sp_nexthop_remove(mlxsw_sp, nh);
3278 return err;
3279}
3280
0e6ea2a4
IS
3281static void mlxsw_sp_nexthop4_fini(struct mlxsw_sp *mlxsw_sp,
3282 struct mlxsw_sp_nexthop *nh)
a8c97014 3283{
35225e47 3284 mlxsw_sp_nexthop4_type_fini(mlxsw_sp, nh);
dbe4598c 3285 list_del(&nh->router_list_node);
a5390278 3286 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh);
c53b8e1b 3287 mlxsw_sp_nexthop_remove(mlxsw_sp, nh);
a7ff87ac
JP
3288}
3289
0e6ea2a4
IS
3290static void mlxsw_sp_nexthop4_event(struct mlxsw_sp *mlxsw_sp,
3291 unsigned long event, struct fib_nh *fib_nh)
ad178c8e
IS
3292{
3293 struct mlxsw_sp_nexthop_key key;
3294 struct mlxsw_sp_nexthop *nh;
ad178c8e 3295
9011b677 3296 if (mlxsw_sp->router->aborted)
ad178c8e
IS
3297 return;
3298
3299 key.fib_nh = fib_nh;
3300 nh = mlxsw_sp_nexthop_lookup(mlxsw_sp, key);
3301 if (WARN_ON_ONCE(!nh))
3302 return;
3303
ad178c8e
IS
3304 switch (event) {
3305 case FIB_EVENT_NH_ADD:
35225e47 3306 mlxsw_sp_nexthop4_type_init(mlxsw_sp, nh, fib_nh);
ad178c8e
IS
3307 break;
3308 case FIB_EVENT_NH_DEL:
35225e47 3309 mlxsw_sp_nexthop4_type_fini(mlxsw_sp, nh);
ad178c8e
IS
3310 break;
3311 }
3312
3313 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
3314}
3315
0c5f1cd5
PM
3316static void mlxsw_sp_nexthop_rif_update(struct mlxsw_sp *mlxsw_sp,
3317 struct mlxsw_sp_rif *rif)
3318{
3319 struct mlxsw_sp_nexthop *nh;
3320
3321 list_for_each_entry(nh, &rif->nexthop_list, rif_list_node) {
3322 __mlxsw_sp_nexthop_neigh_update(nh, false);
3323 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
3324 }
3325}
3326
9665b745 3327static void mlxsw_sp_nexthop_rif_gone_sync(struct mlxsw_sp *mlxsw_sp,
bf95233e 3328 struct mlxsw_sp_rif *rif)
9665b745
IS
3329{
3330 struct mlxsw_sp_nexthop *nh, *tmp;
3331
bf95233e 3332 list_for_each_entry_safe(nh, tmp, &rif->nexthop_list, rif_list_node) {
35225e47 3333 mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh);
9665b745
IS
3334 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
3335 }
3336}
3337
9b01451a
PM
3338static bool mlxsw_sp_fi_is_gateway(const struct mlxsw_sp *mlxsw_sp,
3339 const struct fib_info *fi)
3340{
1012b9ac
PM
3341 return fi->fib_nh->nh_scope == RT_SCOPE_LINK ||
3342 mlxsw_sp_nexthop4_ipip_type(mlxsw_sp, fi->fib_nh, NULL);
9b01451a
PM
3343}
3344
a7ff87ac 3345static struct mlxsw_sp_nexthop_group *
0e6ea2a4 3346mlxsw_sp_nexthop4_group_create(struct mlxsw_sp *mlxsw_sp, struct fib_info *fi)
a7ff87ac
JP
3347{
3348 struct mlxsw_sp_nexthop_group *nh_grp;
3349 struct mlxsw_sp_nexthop *nh;
3350 struct fib_nh *fib_nh;
3351 size_t alloc_size;
3352 int i;
3353 int err;
3354
3355 alloc_size = sizeof(*nh_grp) +
3356 fi->fib_nhs * sizeof(struct mlxsw_sp_nexthop);
3357 nh_grp = kzalloc(alloc_size, GFP_KERNEL);
3358 if (!nh_grp)
3359 return ERR_PTR(-ENOMEM);
ba31d366 3360 nh_grp->priv = fi;
a7ff87ac 3361 INIT_LIST_HEAD(&nh_grp->fib_list);
58adf2c4
IS
3362 nh_grp->neigh_tbl = &arp_tbl;
3363
9b01451a 3364 nh_grp->gateway = mlxsw_sp_fi_is_gateway(mlxsw_sp, fi);
a7ff87ac 3365 nh_grp->count = fi->fib_nhs;
7387dbbc 3366 fib_info_hold(fi);
a7ff87ac
JP
3367 for (i = 0; i < nh_grp->count; i++) {
3368 nh = &nh_grp->nexthops[i];
3369 fib_nh = &fi->fib_nh[i];
0e6ea2a4 3370 err = mlxsw_sp_nexthop4_init(mlxsw_sp, nh_grp, nh, fib_nh);
a7ff87ac 3371 if (err)
0e6ea2a4 3372 goto err_nexthop4_init;
a7ff87ac 3373 }
e9ad5e7d
IS
3374 err = mlxsw_sp_nexthop_group_insert(mlxsw_sp, nh_grp);
3375 if (err)
3376 goto err_nexthop_group_insert;
a7ff87ac
JP
3377 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
3378 return nh_grp;
3379
e9ad5e7d 3380err_nexthop_group_insert:
0e6ea2a4 3381err_nexthop4_init:
df6dd79b
IS
3382 for (i--; i >= 0; i--) {
3383 nh = &nh_grp->nexthops[i];
0e6ea2a4 3384 mlxsw_sp_nexthop4_fini(mlxsw_sp, nh);
df6dd79b 3385 }
ba31d366 3386 fib_info_put(fi);
a7ff87ac
JP
3387 kfree(nh_grp);
3388 return ERR_PTR(err);
3389}
3390
3391static void
0e6ea2a4
IS
3392mlxsw_sp_nexthop4_group_destroy(struct mlxsw_sp *mlxsw_sp,
3393 struct mlxsw_sp_nexthop_group *nh_grp)
a7ff87ac
JP
3394{
3395 struct mlxsw_sp_nexthop *nh;
3396 int i;
3397
e9ad5e7d 3398 mlxsw_sp_nexthop_group_remove(mlxsw_sp, nh_grp);
a7ff87ac
JP
3399 for (i = 0; i < nh_grp->count; i++) {
3400 nh = &nh_grp->nexthops[i];
0e6ea2a4 3401 mlxsw_sp_nexthop4_fini(mlxsw_sp, nh);
a7ff87ac 3402 }
58312125
IS
3403 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
3404 WARN_ON_ONCE(nh_grp->adj_index_valid);
ba31d366 3405 fib_info_put(mlxsw_sp_nexthop4_group_fi(nh_grp));
a7ff87ac
JP
3406 kfree(nh_grp);
3407}
3408
0e6ea2a4
IS
3409static int mlxsw_sp_nexthop4_group_get(struct mlxsw_sp *mlxsw_sp,
3410 struct mlxsw_sp_fib_entry *fib_entry,
3411 struct fib_info *fi)
a7ff87ac
JP
3412{
3413 struct mlxsw_sp_nexthop_group *nh_grp;
3414
ba31d366 3415 nh_grp = mlxsw_sp_nexthop4_group_lookup(mlxsw_sp, fi);
a7ff87ac 3416 if (!nh_grp) {
0e6ea2a4 3417 nh_grp = mlxsw_sp_nexthop4_group_create(mlxsw_sp, fi);
a7ff87ac
JP
3418 if (IS_ERR(nh_grp))
3419 return PTR_ERR(nh_grp);
3420 }
3421 list_add_tail(&fib_entry->nexthop_group_node, &nh_grp->fib_list);
3422 fib_entry->nh_group = nh_grp;
3423 return 0;
3424}
3425
0e6ea2a4
IS
3426static void mlxsw_sp_nexthop4_group_put(struct mlxsw_sp *mlxsw_sp,
3427 struct mlxsw_sp_fib_entry *fib_entry)
a7ff87ac
JP
3428{
3429 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
3430
3431 list_del(&fib_entry->nexthop_group_node);
3432 if (!list_empty(&nh_grp->fib_list))
3433 return;
0e6ea2a4 3434 mlxsw_sp_nexthop4_group_destroy(mlxsw_sp, nh_grp);
a7ff87ac
JP
3435}
3436
4f1c7f1f
IS
3437static bool
3438mlxsw_sp_fib4_entry_should_offload(const struct mlxsw_sp_fib_entry *fib_entry)
3439{
3440 struct mlxsw_sp_fib4_entry *fib4_entry;
3441
3442 fib4_entry = container_of(fib_entry, struct mlxsw_sp_fib4_entry,
3443 common);
3444 return !fib4_entry->tos;
3445}
3446
013b20f9
IS
3447static bool
3448mlxsw_sp_fib_entry_should_offload(const struct mlxsw_sp_fib_entry *fib_entry)
3449{
3450 struct mlxsw_sp_nexthop_group *nh_group = fib_entry->nh_group;
3451
4f1c7f1f
IS
3452 switch (fib_entry->fib_node->fib->proto) {
3453 case MLXSW_SP_L3_PROTO_IPV4:
3454 if (!mlxsw_sp_fib4_entry_should_offload(fib_entry))
3455 return false;
3456 break;
3457 case MLXSW_SP_L3_PROTO_IPV6:
3458 break;
3459 }
9aecce1c 3460
013b20f9
IS
3461 switch (fib_entry->type) {
3462 case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE:
3463 return !!nh_group->adj_index_valid;
3464 case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL:
70ad3506 3465 return !!nh_group->nh_rif;
4607f6d2
PM
3466 case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP:
3467 return true;
013b20f9
IS
3468 default:
3469 return false;
3470 }
3471}
3472
428b851f
IS
3473static struct mlxsw_sp_nexthop *
3474mlxsw_sp_rt6_nexthop(struct mlxsw_sp_nexthop_group *nh_grp,
3475 const struct mlxsw_sp_rt6 *mlxsw_sp_rt6)
3476{
3477 int i;
3478
3479 for (i = 0; i < nh_grp->count; i++) {
3480 struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
3481 struct rt6_info *rt = mlxsw_sp_rt6->rt;
3482
3483 if (nh->rif && nh->rif->dev == rt->dst.dev &&
3484 ipv6_addr_equal((const struct in6_addr *) &nh->gw_addr,
3485 &rt->rt6i_gateway))
3486 return nh;
3487 continue;
3488 }
3489
3490 return NULL;
3491}
3492
3984d1a8
IS
3493static void
3494mlxsw_sp_fib4_entry_offload_set(struct mlxsw_sp_fib_entry *fib_entry)
3495{
3496 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
3497 int i;
3498
4607f6d2
PM
3499 if (fib_entry->type == MLXSW_SP_FIB_ENTRY_TYPE_LOCAL ||
3500 fib_entry->type == MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP) {
3984d1a8
IS
3501 nh_grp->nexthops->key.fib_nh->nh_flags |= RTNH_F_OFFLOAD;
3502 return;
3503 }
3504
3505 for (i = 0; i < nh_grp->count; i++) {
3506 struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
3507
3508 if (nh->offloaded)
3509 nh->key.fib_nh->nh_flags |= RTNH_F_OFFLOAD;
3510 else
3511 nh->key.fib_nh->nh_flags &= ~RTNH_F_OFFLOAD;
3512 }
3513}
3514
3515static void
3516mlxsw_sp_fib4_entry_offload_unset(struct mlxsw_sp_fib_entry *fib_entry)
3517{
3518 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
3519 int i;
3520
3521 for (i = 0; i < nh_grp->count; i++) {
3522 struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
3523
3524 nh->key.fib_nh->nh_flags &= ~RTNH_F_OFFLOAD;
3525 }
3526}
3527
428b851f
IS
3528static void
3529mlxsw_sp_fib6_entry_offload_set(struct mlxsw_sp_fib_entry *fib_entry)
3530{
3531 struct mlxsw_sp_fib6_entry *fib6_entry;
3532 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
3533
3534 fib6_entry = container_of(fib_entry, struct mlxsw_sp_fib6_entry,
3535 common);
3536
3537 if (fib_entry->type == MLXSW_SP_FIB_ENTRY_TYPE_LOCAL) {
3538 list_first_entry(&fib6_entry->rt6_list, struct mlxsw_sp_rt6,
fe400799 3539 list)->rt->rt6i_nh_flags |= RTNH_F_OFFLOAD;
428b851f
IS
3540 return;
3541 }
3542
3543 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
3544 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
3545 struct mlxsw_sp_nexthop *nh;
3546
3547 nh = mlxsw_sp_rt6_nexthop(nh_grp, mlxsw_sp_rt6);
3548 if (nh && nh->offloaded)
fe400799 3549 mlxsw_sp_rt6->rt->rt6i_nh_flags |= RTNH_F_OFFLOAD;
428b851f 3550 else
fe400799 3551 mlxsw_sp_rt6->rt->rt6i_nh_flags &= ~RTNH_F_OFFLOAD;
428b851f
IS
3552 }
3553}
3554
3555static void
3556mlxsw_sp_fib6_entry_offload_unset(struct mlxsw_sp_fib_entry *fib_entry)
3557{
3558 struct mlxsw_sp_fib6_entry *fib6_entry;
3559 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
3560
3561 fib6_entry = container_of(fib_entry, struct mlxsw_sp_fib6_entry,
3562 common);
3563 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
3564 struct rt6_info *rt = mlxsw_sp_rt6->rt;
3565
fe400799 3566 rt->rt6i_nh_flags &= ~RTNH_F_OFFLOAD;
428b851f
IS
3567 }
3568}
3569
013b20f9
IS
3570static void mlxsw_sp_fib_entry_offload_set(struct mlxsw_sp_fib_entry *fib_entry)
3571{
76610ebb 3572 switch (fib_entry->fib_node->fib->proto) {
013b20f9 3573 case MLXSW_SP_L3_PROTO_IPV4:
3984d1a8 3574 mlxsw_sp_fib4_entry_offload_set(fib_entry);
013b20f9
IS
3575 break;
3576 case MLXSW_SP_L3_PROTO_IPV6:
428b851f
IS
3577 mlxsw_sp_fib6_entry_offload_set(fib_entry);
3578 break;
013b20f9
IS
3579 }
3580}
3581
3582static void
3583mlxsw_sp_fib_entry_offload_unset(struct mlxsw_sp_fib_entry *fib_entry)
3584{
76610ebb 3585 switch (fib_entry->fib_node->fib->proto) {
013b20f9 3586 case MLXSW_SP_L3_PROTO_IPV4:
3984d1a8 3587 mlxsw_sp_fib4_entry_offload_unset(fib_entry);
013b20f9
IS
3588 break;
3589 case MLXSW_SP_L3_PROTO_IPV6:
428b851f
IS
3590 mlxsw_sp_fib6_entry_offload_unset(fib_entry);
3591 break;
013b20f9 3592 }
013b20f9
IS
3593}
3594
3595static void
3596mlxsw_sp_fib_entry_offload_refresh(struct mlxsw_sp_fib_entry *fib_entry,
3597 enum mlxsw_reg_ralue_op op, int err)
3598{
3599 switch (op) {
3600 case MLXSW_REG_RALUE_OP_WRITE_DELETE:
013b20f9
IS
3601 return mlxsw_sp_fib_entry_offload_unset(fib_entry);
3602 case MLXSW_REG_RALUE_OP_WRITE_WRITE:
3603 if (err)
3604 return;
1353ee70 3605 if (mlxsw_sp_fib_entry_should_offload(fib_entry))
013b20f9 3606 mlxsw_sp_fib_entry_offload_set(fib_entry);
85f44a15 3607 else
013b20f9
IS
3608 mlxsw_sp_fib_entry_offload_unset(fib_entry);
3609 return;
3610 default:
3611 return;
3612 }
3613}
3614
9dbf4d76
IS
3615static void
3616mlxsw_sp_fib_entry_ralue_pack(char *ralue_pl,
3617 const struct mlxsw_sp_fib_entry *fib_entry,
3618 enum mlxsw_reg_ralue_op op)
a7ff87ac 3619{
76610ebb 3620 struct mlxsw_sp_fib *fib = fib_entry->fib_node->fib;
9dbf4d76
IS
3621 enum mlxsw_reg_ralxx_protocol proto;
3622 u32 *p_dip;
3623
3624 proto = (enum mlxsw_reg_ralxx_protocol) fib->proto;
3625
3626 switch (fib->proto) {
3627 case MLXSW_SP_L3_PROTO_IPV4:
3628 p_dip = (u32 *) fib_entry->fib_node->key.addr;
3629 mlxsw_reg_ralue_pack4(ralue_pl, proto, op, fib->vr->id,
3630 fib_entry->fib_node->key.prefix_len,
3631 *p_dip);
3632 break;
3633 case MLXSW_SP_L3_PROTO_IPV6:
3634 mlxsw_reg_ralue_pack6(ralue_pl, proto, op, fib->vr->id,
3635 fib_entry->fib_node->key.prefix_len,
3636 fib_entry->fib_node->key.addr);
3637 break;
3638 }
3639}
3640
3641static int mlxsw_sp_fib_entry_op_remote(struct mlxsw_sp *mlxsw_sp,
3642 struct mlxsw_sp_fib_entry *fib_entry,
3643 enum mlxsw_reg_ralue_op op)
3644{
3645 char ralue_pl[MLXSW_REG_RALUE_LEN];
a7ff87ac
JP
3646 enum mlxsw_reg_ralue_trap_action trap_action;
3647 u16 trap_id = 0;
3648 u32 adjacency_index = 0;
3649 u16 ecmp_size = 0;
3650
3651 /* In case the nexthop group adjacency index is valid, use it
3652 * with provided ECMP size. Otherwise, setup trap and pass
3653 * traffic to kernel.
3654 */
4b411477 3655 if (mlxsw_sp_fib_entry_should_offload(fib_entry)) {
a7ff87ac
JP
3656 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP;
3657 adjacency_index = fib_entry->nh_group->adj_index;
3658 ecmp_size = fib_entry->nh_group->ecmp_size;
3659 } else {
3660 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP;
3661 trap_id = MLXSW_TRAP_ID_RTR_INGRESS0;
3662 }
3663
9dbf4d76 3664 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
a7ff87ac
JP
3665 mlxsw_reg_ralue_act_remote_pack(ralue_pl, trap_action, trap_id,
3666 adjacency_index, ecmp_size);
3667 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
3668}
3669
9dbf4d76
IS
3670static int mlxsw_sp_fib_entry_op_local(struct mlxsw_sp *mlxsw_sp,
3671 struct mlxsw_sp_fib_entry *fib_entry,
3672 enum mlxsw_reg_ralue_op op)
61c503f9 3673{
bf95233e 3674 struct mlxsw_sp_rif *rif = fib_entry->nh_group->nh_rif;
70ad3506 3675 enum mlxsw_reg_ralue_trap_action trap_action;
61c503f9 3676 char ralue_pl[MLXSW_REG_RALUE_LEN];
70ad3506 3677 u16 trap_id = 0;
bf95233e 3678 u16 rif_index = 0;
70ad3506
IS
3679
3680 if (mlxsw_sp_fib_entry_should_offload(fib_entry)) {
3681 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP;
bf95233e 3682 rif_index = rif->rif_index;
70ad3506
IS
3683 } else {
3684 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP;
3685 trap_id = MLXSW_TRAP_ID_RTR_INGRESS0;
3686 }
61c503f9 3687
9dbf4d76 3688 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
bf95233e
AS
3689 mlxsw_reg_ralue_act_local_pack(ralue_pl, trap_action, trap_id,
3690 rif_index);
61c503f9
JP
3691 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
3692}
3693
9dbf4d76
IS
3694static int mlxsw_sp_fib_entry_op_trap(struct mlxsw_sp *mlxsw_sp,
3695 struct mlxsw_sp_fib_entry *fib_entry,
3696 enum mlxsw_reg_ralue_op op)
61c503f9
JP
3697{
3698 char ralue_pl[MLXSW_REG_RALUE_LEN];
61c503f9 3699
9dbf4d76 3700 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
61c503f9
JP
3701 mlxsw_reg_ralue_act_ip2me_pack(ralue_pl);
3702 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
3703}
3704
4607f6d2
PM
3705static int
3706mlxsw_sp_fib_entry_op_ipip_decap(struct mlxsw_sp *mlxsw_sp,
3707 struct mlxsw_sp_fib_entry *fib_entry,
3708 enum mlxsw_reg_ralue_op op)
3709{
3710 struct mlxsw_sp_ipip_entry *ipip_entry = fib_entry->decap.ipip_entry;
3711 const struct mlxsw_sp_ipip_ops *ipip_ops;
3712
3713 if (WARN_ON(!ipip_entry))
3714 return -EINVAL;
3715
3716 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
3717 return ipip_ops->fib_entry_op(mlxsw_sp, ipip_entry, op,
3718 fib_entry->decap.tunnel_index);
3719}
3720
9dbf4d76
IS
3721static int __mlxsw_sp_fib_entry_op(struct mlxsw_sp *mlxsw_sp,
3722 struct mlxsw_sp_fib_entry *fib_entry,
3723 enum mlxsw_reg_ralue_op op)
61c503f9
JP
3724{
3725 switch (fib_entry->type) {
3726 case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE:
9dbf4d76 3727 return mlxsw_sp_fib_entry_op_remote(mlxsw_sp, fib_entry, op);
61c503f9 3728 case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL:
9dbf4d76 3729 return mlxsw_sp_fib_entry_op_local(mlxsw_sp, fib_entry, op);
61c503f9 3730 case MLXSW_SP_FIB_ENTRY_TYPE_TRAP:
9dbf4d76 3731 return mlxsw_sp_fib_entry_op_trap(mlxsw_sp, fib_entry, op);
4607f6d2
PM
3732 case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP:
3733 return mlxsw_sp_fib_entry_op_ipip_decap(mlxsw_sp,
3734 fib_entry, op);
61c503f9
JP
3735 }
3736 return -EINVAL;
3737}
3738
3739static int mlxsw_sp_fib_entry_op(struct mlxsw_sp *mlxsw_sp,
3740 struct mlxsw_sp_fib_entry *fib_entry,
3741 enum mlxsw_reg_ralue_op op)
3742{
9dbf4d76 3743 int err = __mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry, op);
013b20f9 3744
013b20f9 3745 mlxsw_sp_fib_entry_offload_refresh(fib_entry, op, err);
9dbf4d76 3746
013b20f9 3747 return err;
61c503f9
JP
3748}
3749
3750static int mlxsw_sp_fib_entry_update(struct mlxsw_sp *mlxsw_sp,
3751 struct mlxsw_sp_fib_entry *fib_entry)
3752{
7146da31
JP
3753 return mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry,
3754 MLXSW_REG_RALUE_OP_WRITE_WRITE);
61c503f9
JP
3755}
3756
3757static int mlxsw_sp_fib_entry_del(struct mlxsw_sp *mlxsw_sp,
3758 struct mlxsw_sp_fib_entry *fib_entry)
3759{
3760 return mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry,
3761 MLXSW_REG_RALUE_OP_WRITE_DELETE);
3762}
3763
61c503f9 3764static int
013b20f9
IS
3765mlxsw_sp_fib4_entry_type_set(struct mlxsw_sp *mlxsw_sp,
3766 const struct fib_entry_notifier_info *fen_info,
3767 struct mlxsw_sp_fib_entry *fib_entry)
61c503f9 3768{
4607f6d2
PM
3769 union mlxsw_sp_l3addr dip = { .addr4 = htonl(fen_info->dst) };
3770 struct net_device *dev = fen_info->fi->fib_dev;
3771 struct mlxsw_sp_ipip_entry *ipip_entry;
b45f64d1 3772 struct fib_info *fi = fen_info->fi;
61c503f9 3773
97989ee0 3774 switch (fen_info->type) {
97989ee0 3775 case RTN_LOCAL:
4607f6d2
PM
3776 ipip_entry = mlxsw_sp_ipip_entry_find_by_decap(mlxsw_sp, dev,
3777 MLXSW_SP_L3_PROTO_IPV4, dip);
3778 if (ipip_entry) {
3779 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP;
3780 return mlxsw_sp_fib_entry_decap_init(mlxsw_sp,
3781 fib_entry,
3782 ipip_entry);
3783 }
3784 /* fall through */
3785 case RTN_BROADCAST:
61c503f9
JP
3786 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
3787 return 0;
97989ee0
IS
3788 case RTN_UNREACHABLE: /* fall through */
3789 case RTN_BLACKHOLE: /* fall through */
3790 case RTN_PROHIBIT:
3791 /* Packets hitting these routes need to be trapped, but
3792 * can do so with a lower priority than packets directed
3793 * at the host, so use action type local instead of trap.
3794 */
61c503f9 3795 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
97989ee0
IS
3796 return 0;
3797 case RTN_UNICAST:
9b01451a 3798 if (mlxsw_sp_fi_is_gateway(mlxsw_sp, fi))
97989ee0 3799 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_REMOTE;
9b01451a
PM
3800 else
3801 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
97989ee0
IS
3802 return 0;
3803 default:
3804 return -EINVAL;
3805 }
a7ff87ac
JP
3806}
3807
4f1c7f1f 3808static struct mlxsw_sp_fib4_entry *
9aecce1c
IS
3809mlxsw_sp_fib4_entry_create(struct mlxsw_sp *mlxsw_sp,
3810 struct mlxsw_sp_fib_node *fib_node,
3811 const struct fib_entry_notifier_info *fen_info)
61c503f9 3812{
4f1c7f1f 3813 struct mlxsw_sp_fib4_entry *fib4_entry;
61c503f9 3814 struct mlxsw_sp_fib_entry *fib_entry;
61c503f9
JP
3815 int err;
3816
4f1c7f1f
IS
3817 fib4_entry = kzalloc(sizeof(*fib4_entry), GFP_KERNEL);
3818 if (!fib4_entry)
3819 return ERR_PTR(-ENOMEM);
3820 fib_entry = &fib4_entry->common;
61c503f9 3821
013b20f9 3822 err = mlxsw_sp_fib4_entry_type_set(mlxsw_sp, fen_info, fib_entry);
61c503f9 3823 if (err)
013b20f9 3824 goto err_fib4_entry_type_set;
61c503f9 3825
0e6ea2a4 3826 err = mlxsw_sp_nexthop4_group_get(mlxsw_sp, fib_entry, fen_info->fi);
b8399a1e 3827 if (err)
0e6ea2a4 3828 goto err_nexthop4_group_get;
b8399a1e 3829
4f1c7f1f
IS
3830 fib4_entry->prio = fen_info->fi->fib_priority;
3831 fib4_entry->tb_id = fen_info->tb_id;
3832 fib4_entry->type = fen_info->type;
3833 fib4_entry->tos = fen_info->tos;
9aecce1c
IS
3834
3835 fib_entry->fib_node = fib_node;
3836
4f1c7f1f 3837 return fib4_entry;
5b004412 3838
0e6ea2a4 3839err_nexthop4_group_get:
013b20f9 3840err_fib4_entry_type_set:
4f1c7f1f 3841 kfree(fib4_entry);
5b004412
JP
3842 return ERR_PTR(err);
3843}
3844
9aecce1c 3845static void mlxsw_sp_fib4_entry_destroy(struct mlxsw_sp *mlxsw_sp,
4f1c7f1f 3846 struct mlxsw_sp_fib4_entry *fib4_entry)
9aecce1c 3847{
0e6ea2a4 3848 mlxsw_sp_nexthop4_group_put(mlxsw_sp, &fib4_entry->common);
4f1c7f1f 3849 kfree(fib4_entry);
9aecce1c
IS
3850}
3851
4f1c7f1f 3852static struct mlxsw_sp_fib4_entry *
9aecce1c
IS
3853mlxsw_sp_fib4_entry_lookup(struct mlxsw_sp *mlxsw_sp,
3854 const struct fib_entry_notifier_info *fen_info)
5b004412 3855{
4f1c7f1f 3856 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 3857 struct mlxsw_sp_fib_node *fib_node;
160e22aa
IS
3858 struct mlxsw_sp_fib *fib;
3859 struct mlxsw_sp_vr *vr;
3860
3861 vr = mlxsw_sp_vr_find(mlxsw_sp, fen_info->tb_id);
3862 if (!vr)
3863 return NULL;
3864 fib = mlxsw_sp_vr_fib(vr, MLXSW_SP_L3_PROTO_IPV4);
5b004412 3865
160e22aa
IS
3866 fib_node = mlxsw_sp_fib_node_lookup(fib, &fen_info->dst,
3867 sizeof(fen_info->dst),
3868 fen_info->dst_len);
3869 if (!fib_node)
9aecce1c
IS
3870 return NULL;
3871
4f1c7f1f
IS
3872 list_for_each_entry(fib4_entry, &fib_node->entry_list, common.list) {
3873 if (fib4_entry->tb_id == fen_info->tb_id &&
3874 fib4_entry->tos == fen_info->tos &&
3875 fib4_entry->type == fen_info->type &&
ba31d366
AS
3876 mlxsw_sp_nexthop4_group_fi(fib4_entry->common.nh_group) ==
3877 fen_info->fi) {
4f1c7f1f 3878 return fib4_entry;
9aecce1c
IS
3879 }
3880 }
3881
3882 return NULL;
3883}
3884
3885static const struct rhashtable_params mlxsw_sp_fib_ht_params = {
3886 .key_offset = offsetof(struct mlxsw_sp_fib_node, key),
3887 .head_offset = offsetof(struct mlxsw_sp_fib_node, ht_node),
3888 .key_len = sizeof(struct mlxsw_sp_fib_key),
3889 .automatic_shrinking = true,
3890};
3891
3892static int mlxsw_sp_fib_node_insert(struct mlxsw_sp_fib *fib,
3893 struct mlxsw_sp_fib_node *fib_node)
3894{
3895 return rhashtable_insert_fast(&fib->ht, &fib_node->ht_node,
3896 mlxsw_sp_fib_ht_params);
3897}
3898
3899static void mlxsw_sp_fib_node_remove(struct mlxsw_sp_fib *fib,
3900 struct mlxsw_sp_fib_node *fib_node)
3901{
3902 rhashtable_remove_fast(&fib->ht, &fib_node->ht_node,
3903 mlxsw_sp_fib_ht_params);
3904}
3905
3906static struct mlxsw_sp_fib_node *
3907mlxsw_sp_fib_node_lookup(struct mlxsw_sp_fib *fib, const void *addr,
3908 size_t addr_len, unsigned char prefix_len)
3909{
3910 struct mlxsw_sp_fib_key key;
3911
3912 memset(&key, 0, sizeof(key));
3913 memcpy(key.addr, addr, addr_len);
3914 key.prefix_len = prefix_len;
3915 return rhashtable_lookup_fast(&fib->ht, &key, mlxsw_sp_fib_ht_params);
3916}
3917
3918static struct mlxsw_sp_fib_node *
76610ebb 3919mlxsw_sp_fib_node_create(struct mlxsw_sp_fib *fib, const void *addr,
9aecce1c
IS
3920 size_t addr_len, unsigned char prefix_len)
3921{
3922 struct mlxsw_sp_fib_node *fib_node;
3923
3924 fib_node = kzalloc(sizeof(*fib_node), GFP_KERNEL);
3925 if (!fib_node)
5b004412
JP
3926 return NULL;
3927
9aecce1c 3928 INIT_LIST_HEAD(&fib_node->entry_list);
76610ebb 3929 list_add(&fib_node->list, &fib->node_list);
9aecce1c
IS
3930 memcpy(fib_node->key.addr, addr, addr_len);
3931 fib_node->key.prefix_len = prefix_len;
9aecce1c
IS
3932
3933 return fib_node;
3934}
3935
3936static void mlxsw_sp_fib_node_destroy(struct mlxsw_sp_fib_node *fib_node)
3937{
9aecce1c
IS
3938 list_del(&fib_node->list);
3939 WARN_ON(!list_empty(&fib_node->entry_list));
3940 kfree(fib_node);
3941}
3942
3943static bool
3944mlxsw_sp_fib_node_entry_is_first(const struct mlxsw_sp_fib_node *fib_node,
3945 const struct mlxsw_sp_fib_entry *fib_entry)
3946{
3947 return list_first_entry(&fib_node->entry_list,
3948 struct mlxsw_sp_fib_entry, list) == fib_entry;
3949}
3950
fc922bb0
IS
3951static int mlxsw_sp_fib_lpm_tree_link(struct mlxsw_sp *mlxsw_sp,
3952 struct mlxsw_sp_fib *fib,
3953 struct mlxsw_sp_fib_node *fib_node)
3954{
3955 struct mlxsw_sp_prefix_usage req_prefix_usage = {{ 0 } };
3956 struct mlxsw_sp_lpm_tree *lpm_tree;
3957 int err;
3958
3959 /* Since the tree is shared between all virtual routers we must
3960 * make sure it contains all the required prefix lengths. This
3961 * can be computed by either adding the new prefix length to the
3962 * existing prefix usage of a bound tree, or by aggregating the
3963 * prefix lengths across all virtual routers and adding the new
3964 * one as well.
3965 */
3966 if (fib->lpm_tree)
3967 mlxsw_sp_prefix_usage_cpy(&req_prefix_usage,
3968 &fib->lpm_tree->prefix_usage);
3969 else
3970 mlxsw_sp_vrs_prefixes(mlxsw_sp, fib->proto, &req_prefix_usage);
3971 mlxsw_sp_prefix_usage_set(&req_prefix_usage, fib_node->key.prefix_len);
3972
3973 lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
3974 fib->proto);
3975 if (IS_ERR(lpm_tree))
3976 return PTR_ERR(lpm_tree);
3977
3978 if (fib->lpm_tree && fib->lpm_tree->id == lpm_tree->id)
3979 return 0;
3980
3981 err = mlxsw_sp_vrs_lpm_tree_replace(mlxsw_sp, fib, lpm_tree);
3982 if (err)
3983 return err;
3984
3985 return 0;
3986}
3987
3988static void mlxsw_sp_fib_lpm_tree_unlink(struct mlxsw_sp *mlxsw_sp,
3989 struct mlxsw_sp_fib *fib)
3990{
fc922bb0
IS
3991 if (!mlxsw_sp_prefix_usage_none(&fib->prefix_usage))
3992 return;
3993 mlxsw_sp_vr_lpm_tree_unbind(mlxsw_sp, fib);
3994 mlxsw_sp_lpm_tree_put(mlxsw_sp, fib->lpm_tree);
3995 fib->lpm_tree = NULL;
3996}
3997
9aecce1c
IS
3998static void mlxsw_sp_fib_node_prefix_inc(struct mlxsw_sp_fib_node *fib_node)
3999{
4000 unsigned char prefix_len = fib_node->key.prefix_len;
76610ebb 4001 struct mlxsw_sp_fib *fib = fib_node->fib;
9aecce1c
IS
4002
4003 if (fib->prefix_ref_count[prefix_len]++ == 0)
4004 mlxsw_sp_prefix_usage_set(&fib->prefix_usage, prefix_len);
4005}
4006
4007static void mlxsw_sp_fib_node_prefix_dec(struct mlxsw_sp_fib_node *fib_node)
4008{
4009 unsigned char prefix_len = fib_node->key.prefix_len;
76610ebb 4010 struct mlxsw_sp_fib *fib = fib_node->fib;
9aecce1c
IS
4011
4012 if (--fib->prefix_ref_count[prefix_len] == 0)
4013 mlxsw_sp_prefix_usage_clear(&fib->prefix_usage, prefix_len);
5b004412
JP
4014}
4015
76610ebb
IS
4016static int mlxsw_sp_fib_node_init(struct mlxsw_sp *mlxsw_sp,
4017 struct mlxsw_sp_fib_node *fib_node,
4018 struct mlxsw_sp_fib *fib)
4019{
76610ebb
IS
4020 int err;
4021
4022 err = mlxsw_sp_fib_node_insert(fib, fib_node);
4023 if (err)
4024 return err;
4025 fib_node->fib = fib;
4026
fc922bb0
IS
4027 err = mlxsw_sp_fib_lpm_tree_link(mlxsw_sp, fib, fib_node);
4028 if (err)
4029 goto err_fib_lpm_tree_link;
76610ebb
IS
4030
4031 mlxsw_sp_fib_node_prefix_inc(fib_node);
4032
4033 return 0;
4034
fc922bb0 4035err_fib_lpm_tree_link:
76610ebb
IS
4036 fib_node->fib = NULL;
4037 mlxsw_sp_fib_node_remove(fib, fib_node);
4038 return err;
4039}
4040
4041static void mlxsw_sp_fib_node_fini(struct mlxsw_sp *mlxsw_sp,
4042 struct mlxsw_sp_fib_node *fib_node)
4043{
76610ebb
IS
4044 struct mlxsw_sp_fib *fib = fib_node->fib;
4045
4046 mlxsw_sp_fib_node_prefix_dec(fib_node);
fc922bb0 4047 mlxsw_sp_fib_lpm_tree_unlink(mlxsw_sp, fib);
76610ebb
IS
4048 fib_node->fib = NULL;
4049 mlxsw_sp_fib_node_remove(fib, fib_node);
4050}
4051
9aecce1c 4052static struct mlxsw_sp_fib_node *
731ea1ca
IS
4053mlxsw_sp_fib_node_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id, const void *addr,
4054 size_t addr_len, unsigned char prefix_len,
4055 enum mlxsw_sp_l3proto proto)
5b004412 4056{
9aecce1c 4057 struct mlxsw_sp_fib_node *fib_node;
76610ebb 4058 struct mlxsw_sp_fib *fib;
9aecce1c
IS
4059 struct mlxsw_sp_vr *vr;
4060 int err;
4061
f8fa9b4e 4062 vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id, NULL);
9aecce1c
IS
4063 if (IS_ERR(vr))
4064 return ERR_CAST(vr);
731ea1ca 4065 fib = mlxsw_sp_vr_fib(vr, proto);
9aecce1c 4066
731ea1ca 4067 fib_node = mlxsw_sp_fib_node_lookup(fib, addr, addr_len, prefix_len);
9aecce1c
IS
4068 if (fib_node)
4069 return fib_node;
5b004412 4070
731ea1ca 4071 fib_node = mlxsw_sp_fib_node_create(fib, addr, addr_len, prefix_len);
9aecce1c
IS
4072 if (!fib_node) {
4073 err = -ENOMEM;
4074 goto err_fib_node_create;
5b004412 4075 }
9aecce1c 4076
76610ebb
IS
4077 err = mlxsw_sp_fib_node_init(mlxsw_sp, fib_node, fib);
4078 if (err)
4079 goto err_fib_node_init;
4080
9aecce1c
IS
4081 return fib_node;
4082
76610ebb
IS
4083err_fib_node_init:
4084 mlxsw_sp_fib_node_destroy(fib_node);
9aecce1c 4085err_fib_node_create:
76610ebb 4086 mlxsw_sp_vr_put(vr);
9aecce1c 4087 return ERR_PTR(err);
5b004412
JP
4088}
4089
731ea1ca
IS
4090static void mlxsw_sp_fib_node_put(struct mlxsw_sp *mlxsw_sp,
4091 struct mlxsw_sp_fib_node *fib_node)
5b004412 4092{
76610ebb 4093 struct mlxsw_sp_vr *vr = fib_node->fib->vr;
5b004412 4094
9aecce1c
IS
4095 if (!list_empty(&fib_node->entry_list))
4096 return;
76610ebb 4097 mlxsw_sp_fib_node_fini(mlxsw_sp, fib_node);
9aecce1c 4098 mlxsw_sp_fib_node_destroy(fib_node);
76610ebb 4099 mlxsw_sp_vr_put(vr);
61c503f9
JP
4100}
4101
4f1c7f1f 4102static struct mlxsw_sp_fib4_entry *
9aecce1c 4103mlxsw_sp_fib4_node_entry_find(const struct mlxsw_sp_fib_node *fib_node,
4f1c7f1f 4104 const struct mlxsw_sp_fib4_entry *new4_entry)
61c503f9 4105{
4f1c7f1f 4106 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 4107
4f1c7f1f
IS
4108 list_for_each_entry(fib4_entry, &fib_node->entry_list, common.list) {
4109 if (fib4_entry->tb_id > new4_entry->tb_id)
9aecce1c 4110 continue;
4f1c7f1f 4111 if (fib4_entry->tb_id != new4_entry->tb_id)
9aecce1c 4112 break;
4f1c7f1f 4113 if (fib4_entry->tos > new4_entry->tos)
9aecce1c 4114 continue;
4f1c7f1f
IS
4115 if (fib4_entry->prio >= new4_entry->prio ||
4116 fib4_entry->tos < new4_entry->tos)
4117 return fib4_entry;
9aecce1c
IS
4118 }
4119
4120 return NULL;
4121}
4122
4f1c7f1f
IS
4123static int
4124mlxsw_sp_fib4_node_list_append(struct mlxsw_sp_fib4_entry *fib4_entry,
4125 struct mlxsw_sp_fib4_entry *new4_entry)
4283bce5
IS
4126{
4127 struct mlxsw_sp_fib_node *fib_node;
4128
4f1c7f1f 4129 if (WARN_ON(!fib4_entry))
4283bce5
IS
4130 return -EINVAL;
4131
4f1c7f1f
IS
4132 fib_node = fib4_entry->common.fib_node;
4133 list_for_each_entry_from(fib4_entry, &fib_node->entry_list,
4134 common.list) {
4135 if (fib4_entry->tb_id != new4_entry->tb_id ||
4136 fib4_entry->tos != new4_entry->tos ||
4137 fib4_entry->prio != new4_entry->prio)
4283bce5
IS
4138 break;
4139 }
4140
4f1c7f1f 4141 list_add_tail(&new4_entry->common.list, &fib4_entry->common.list);
4283bce5
IS
4142 return 0;
4143}
4144
9aecce1c 4145static int
9efbee6f 4146mlxsw_sp_fib4_node_list_insert(struct mlxsw_sp_fib4_entry *new4_entry,
599cf8f9 4147 bool replace, bool append)
9aecce1c 4148{
9efbee6f 4149 struct mlxsw_sp_fib_node *fib_node = new4_entry->common.fib_node;
4f1c7f1f 4150 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 4151
4f1c7f1f 4152 fib4_entry = mlxsw_sp_fib4_node_entry_find(fib_node, new4_entry);
9aecce1c 4153
4283bce5 4154 if (append)
4f1c7f1f
IS
4155 return mlxsw_sp_fib4_node_list_append(fib4_entry, new4_entry);
4156 if (replace && WARN_ON(!fib4_entry))
599cf8f9 4157 return -EINVAL;
4283bce5 4158
599cf8f9
IS
4159 /* Insert new entry before replaced one, so that we can later
4160 * remove the second.
4161 */
4f1c7f1f
IS
4162 if (fib4_entry) {
4163 list_add_tail(&new4_entry->common.list,
4164 &fib4_entry->common.list);
9aecce1c 4165 } else {
4f1c7f1f 4166 struct mlxsw_sp_fib4_entry *last;
9aecce1c 4167
4f1c7f1f
IS
4168 list_for_each_entry(last, &fib_node->entry_list, common.list) {
4169 if (new4_entry->tb_id > last->tb_id)
9aecce1c 4170 break;
4f1c7f1f 4171 fib4_entry = last;
9aecce1c
IS
4172 }
4173
4f1c7f1f
IS
4174 if (fib4_entry)
4175 list_add(&new4_entry->common.list,
4176 &fib4_entry->common.list);
9aecce1c 4177 else
4f1c7f1f
IS
4178 list_add(&new4_entry->common.list,
4179 &fib_node->entry_list);
9aecce1c
IS
4180 }
4181
4182 return 0;
4183}
4184
4185static void
4f1c7f1f 4186mlxsw_sp_fib4_node_list_remove(struct mlxsw_sp_fib4_entry *fib4_entry)
9aecce1c 4187{
4f1c7f1f 4188 list_del(&fib4_entry->common.list);
9aecce1c
IS
4189}
4190
80c238f9
IS
4191static int mlxsw_sp_fib_node_entry_add(struct mlxsw_sp *mlxsw_sp,
4192 struct mlxsw_sp_fib_entry *fib_entry)
9aecce1c 4193{
9efbee6f
IS
4194 struct mlxsw_sp_fib_node *fib_node = fib_entry->fib_node;
4195
9aecce1c
IS
4196 if (!mlxsw_sp_fib_node_entry_is_first(fib_node, fib_entry))
4197 return 0;
4198
4199 /* To prevent packet loss, overwrite the previously offloaded
4200 * entry.
4201 */
4202 if (!list_is_singular(&fib_node->entry_list)) {
4203 enum mlxsw_reg_ralue_op op = MLXSW_REG_RALUE_OP_WRITE_DELETE;
4204 struct mlxsw_sp_fib_entry *n = list_next_entry(fib_entry, list);
4205
4206 mlxsw_sp_fib_entry_offload_refresh(n, op, 0);
4207 }
4208
4209 return mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
4210}
4211
80c238f9
IS
4212static void mlxsw_sp_fib_node_entry_del(struct mlxsw_sp *mlxsw_sp,
4213 struct mlxsw_sp_fib_entry *fib_entry)
9aecce1c 4214{
9efbee6f
IS
4215 struct mlxsw_sp_fib_node *fib_node = fib_entry->fib_node;
4216
9aecce1c
IS
4217 if (!mlxsw_sp_fib_node_entry_is_first(fib_node, fib_entry))
4218 return;
4219
4220 /* Promote the next entry by overwriting the deleted entry */
4221 if (!list_is_singular(&fib_node->entry_list)) {
4222 struct mlxsw_sp_fib_entry *n = list_next_entry(fib_entry, list);
4223 enum mlxsw_reg_ralue_op op = MLXSW_REG_RALUE_OP_WRITE_DELETE;
4224
4225 mlxsw_sp_fib_entry_update(mlxsw_sp, n);
4226 mlxsw_sp_fib_entry_offload_refresh(fib_entry, op, 0);
4227 return;
4228 }
4229
4230 mlxsw_sp_fib_entry_del(mlxsw_sp, fib_entry);
4231}
4232
4233static int mlxsw_sp_fib4_node_entry_link(struct mlxsw_sp *mlxsw_sp,
4f1c7f1f 4234 struct mlxsw_sp_fib4_entry *fib4_entry,
599cf8f9 4235 bool replace, bool append)
9aecce1c 4236{
9aecce1c
IS
4237 int err;
4238
9efbee6f 4239 err = mlxsw_sp_fib4_node_list_insert(fib4_entry, replace, append);
9aecce1c
IS
4240 if (err)
4241 return err;
4242
80c238f9 4243 err = mlxsw_sp_fib_node_entry_add(mlxsw_sp, &fib4_entry->common);
9aecce1c 4244 if (err)
80c238f9 4245 goto err_fib_node_entry_add;
9aecce1c 4246
9aecce1c
IS
4247 return 0;
4248
80c238f9 4249err_fib_node_entry_add:
4f1c7f1f 4250 mlxsw_sp_fib4_node_list_remove(fib4_entry);
9aecce1c
IS
4251 return err;
4252}
4253
4254static void
4255mlxsw_sp_fib4_node_entry_unlink(struct mlxsw_sp *mlxsw_sp,
4f1c7f1f 4256 struct mlxsw_sp_fib4_entry *fib4_entry)
9aecce1c 4257{
80c238f9 4258 mlxsw_sp_fib_node_entry_del(mlxsw_sp, &fib4_entry->common);
4f1c7f1f 4259 mlxsw_sp_fib4_node_list_remove(fib4_entry);
4607f6d2
PM
4260
4261 if (fib4_entry->common.type == MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP)
4262 mlxsw_sp_fib_entry_decap_fini(mlxsw_sp, &fib4_entry->common);
9aecce1c
IS
4263}
4264
599cf8f9 4265static void mlxsw_sp_fib4_entry_replace(struct mlxsw_sp *mlxsw_sp,
4f1c7f1f 4266 struct mlxsw_sp_fib4_entry *fib4_entry,
599cf8f9
IS
4267 bool replace)
4268{
4f1c7f1f
IS
4269 struct mlxsw_sp_fib_node *fib_node = fib4_entry->common.fib_node;
4270 struct mlxsw_sp_fib4_entry *replaced;
599cf8f9
IS
4271
4272 if (!replace)
4273 return;
4274
4275 /* We inserted the new entry before replaced one */
4f1c7f1f 4276 replaced = list_next_entry(fib4_entry, common.list);
599cf8f9
IS
4277
4278 mlxsw_sp_fib4_node_entry_unlink(mlxsw_sp, replaced);
4279 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, replaced);
731ea1ca 4280 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
599cf8f9
IS
4281}
4282
9aecce1c
IS
4283static int
4284mlxsw_sp_router_fib4_add(struct mlxsw_sp *mlxsw_sp,
4283bce5 4285 const struct fib_entry_notifier_info *fen_info,
599cf8f9 4286 bool replace, bool append)
9aecce1c 4287{
4f1c7f1f 4288 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 4289 struct mlxsw_sp_fib_node *fib_node;
61c503f9
JP
4290 int err;
4291
9011b677 4292 if (mlxsw_sp->router->aborted)
b45f64d1
JP
4293 return 0;
4294
731ea1ca
IS
4295 fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, fen_info->tb_id,
4296 &fen_info->dst, sizeof(fen_info->dst),
4297 fen_info->dst_len,
4298 MLXSW_SP_L3_PROTO_IPV4);
9aecce1c
IS
4299 if (IS_ERR(fib_node)) {
4300 dev_warn(mlxsw_sp->bus_info->dev, "Failed to get FIB node\n");
4301 return PTR_ERR(fib_node);
b45f64d1 4302 }
61c503f9 4303
4f1c7f1f
IS
4304 fib4_entry = mlxsw_sp_fib4_entry_create(mlxsw_sp, fib_node, fen_info);
4305 if (IS_ERR(fib4_entry)) {
9aecce1c 4306 dev_warn(mlxsw_sp->bus_info->dev, "Failed to create FIB entry\n");
4f1c7f1f 4307 err = PTR_ERR(fib4_entry);
9aecce1c
IS
4308 goto err_fib4_entry_create;
4309 }
5b004412 4310
4f1c7f1f 4311 err = mlxsw_sp_fib4_node_entry_link(mlxsw_sp, fib4_entry, replace,
599cf8f9 4312 append);
b45f64d1 4313 if (err) {
9aecce1c
IS
4314 dev_warn(mlxsw_sp->bus_info->dev, "Failed to link FIB entry to node\n");
4315 goto err_fib4_node_entry_link;
b45f64d1 4316 }
9aecce1c 4317
4f1c7f1f 4318 mlxsw_sp_fib4_entry_replace(mlxsw_sp, fib4_entry, replace);
599cf8f9 4319
61c503f9
JP
4320 return 0;
4321
9aecce1c 4322err_fib4_node_entry_link:
4f1c7f1f 4323 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
9aecce1c 4324err_fib4_entry_create:
731ea1ca 4325 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
61c503f9
JP
4326 return err;
4327}
4328
37956d78
JP
4329static void mlxsw_sp_router_fib4_del(struct mlxsw_sp *mlxsw_sp,
4330 struct fib_entry_notifier_info *fen_info)
61c503f9 4331{
4f1c7f1f 4332 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 4333 struct mlxsw_sp_fib_node *fib_node;
61c503f9 4334
9011b677 4335 if (mlxsw_sp->router->aborted)
37956d78 4336 return;
b45f64d1 4337
4f1c7f1f
IS
4338 fib4_entry = mlxsw_sp_fib4_entry_lookup(mlxsw_sp, fen_info);
4339 if (WARN_ON(!fib4_entry))
37956d78 4340 return;
4f1c7f1f 4341 fib_node = fib4_entry->common.fib_node;
5b004412 4342
4f1c7f1f
IS
4343 mlxsw_sp_fib4_node_entry_unlink(mlxsw_sp, fib4_entry);
4344 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
731ea1ca 4345 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
61c503f9 4346}
b45f64d1 4347
428b851f
IS
4348static bool mlxsw_sp_fib6_rt_should_ignore(const struct rt6_info *rt)
4349{
4350 /* Packets with link-local destination IP arriving to the router
4351 * are trapped to the CPU, so no need to program specific routes
4352 * for them.
4353 */
4354 if (ipv6_addr_type(&rt->rt6i_dst.addr) & IPV6_ADDR_LINKLOCAL)
4355 return true;
4356
4357 /* Multicast routes aren't supported, so ignore them. Neighbour
4358 * Discovery packets are specifically trapped.
4359 */
4360 if (ipv6_addr_type(&rt->rt6i_dst.addr) & IPV6_ADDR_MULTICAST)
4361 return true;
4362
4363 /* Cloned routes are irrelevant in the forwarding path. */
4364 if (rt->rt6i_flags & RTF_CACHE)
4365 return true;
4366
4367 return false;
4368}
4369
4370static struct mlxsw_sp_rt6 *mlxsw_sp_rt6_create(struct rt6_info *rt)
4371{
4372 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
4373
4374 mlxsw_sp_rt6 = kzalloc(sizeof(*mlxsw_sp_rt6), GFP_KERNEL);
4375 if (!mlxsw_sp_rt6)
4376 return ERR_PTR(-ENOMEM);
4377
4378 /* In case of route replace, replaced route is deleted with
4379 * no notification. Take reference to prevent accessing freed
4380 * memory.
4381 */
4382 mlxsw_sp_rt6->rt = rt;
4383 rt6_hold(rt);
4384
4385 return mlxsw_sp_rt6;
4386}
4387
4388#if IS_ENABLED(CONFIG_IPV6)
4389static void mlxsw_sp_rt6_release(struct rt6_info *rt)
4390{
4391 rt6_release(rt);
4392}
4393#else
4394static void mlxsw_sp_rt6_release(struct rt6_info *rt)
4395{
4396}
4397#endif
4398
4399static void mlxsw_sp_rt6_destroy(struct mlxsw_sp_rt6 *mlxsw_sp_rt6)
4400{
4401 mlxsw_sp_rt6_release(mlxsw_sp_rt6->rt);
4402 kfree(mlxsw_sp_rt6);
4403}
4404
4405static bool mlxsw_sp_fib6_rt_can_mp(const struct rt6_info *rt)
4406{
4407 /* RTF_CACHE routes are ignored */
4408 return (rt->rt6i_flags & (RTF_GATEWAY | RTF_ADDRCONF)) == RTF_GATEWAY;
4409}
4410
4411static struct rt6_info *
4412mlxsw_sp_fib6_entry_rt(const struct mlxsw_sp_fib6_entry *fib6_entry)
4413{
4414 return list_first_entry(&fib6_entry->rt6_list, struct mlxsw_sp_rt6,
4415 list)->rt;
4416}
4417
4418static struct mlxsw_sp_fib6_entry *
4419mlxsw_sp_fib6_node_mp_entry_find(const struct mlxsw_sp_fib_node *fib_node,
0a7fd1ac 4420 const struct rt6_info *nrt, bool replace)
428b851f
IS
4421{
4422 struct mlxsw_sp_fib6_entry *fib6_entry;
4423
0a7fd1ac 4424 if (!mlxsw_sp_fib6_rt_can_mp(nrt) || replace)
428b851f
IS
4425 return NULL;
4426
4427 list_for_each_entry(fib6_entry, &fib_node->entry_list, common.list) {
4428 struct rt6_info *rt = mlxsw_sp_fib6_entry_rt(fib6_entry);
4429
4430 /* RT6_TABLE_LOCAL and RT6_TABLE_MAIN share the same
4431 * virtual router.
4432 */
4433 if (rt->rt6i_table->tb6_id > nrt->rt6i_table->tb6_id)
4434 continue;
4435 if (rt->rt6i_table->tb6_id != nrt->rt6i_table->tb6_id)
4436 break;
4437 if (rt->rt6i_metric < nrt->rt6i_metric)
4438 continue;
4439 if (rt->rt6i_metric == nrt->rt6i_metric &&
4440 mlxsw_sp_fib6_rt_can_mp(rt))
4441 return fib6_entry;
4442 if (rt->rt6i_metric > nrt->rt6i_metric)
4443 break;
4444 }
4445
4446 return NULL;
4447}
4448
4449static struct mlxsw_sp_rt6 *
4450mlxsw_sp_fib6_entry_rt_find(const struct mlxsw_sp_fib6_entry *fib6_entry,
4451 const struct rt6_info *rt)
4452{
4453 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
4454
4455 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
4456 if (mlxsw_sp_rt6->rt == rt)
4457 return mlxsw_sp_rt6;
4458 }
4459
4460 return NULL;
4461}
4462
8f28a309
PM
4463static bool mlxsw_sp_nexthop6_ipip_type(const struct mlxsw_sp *mlxsw_sp,
4464 const struct rt6_info *rt,
4465 enum mlxsw_sp_ipip_type *ret)
4466{
4467 return rt->dst.dev &&
4468 mlxsw_sp_netdev_ipip_type(mlxsw_sp, rt->dst.dev, ret);
4469}
4470
35225e47
PM
4471static int mlxsw_sp_nexthop6_type_init(struct mlxsw_sp *mlxsw_sp,
4472 struct mlxsw_sp_nexthop_group *nh_grp,
4473 struct mlxsw_sp_nexthop *nh,
4474 const struct rt6_info *rt)
428b851f 4475{
8f28a309 4476 struct mlxsw_sp_router *router = mlxsw_sp->router;
428b851f 4477 struct net_device *dev = rt->dst.dev;
8f28a309 4478 enum mlxsw_sp_ipip_type ipipt;
428b851f
IS
4479 struct mlxsw_sp_rif *rif;
4480 int err;
4481
8f28a309
PM
4482 if (mlxsw_sp_nexthop6_ipip_type(mlxsw_sp, rt, &ipipt) &&
4483 router->ipip_ops_arr[ipipt]->can_offload(mlxsw_sp, dev,
4484 MLXSW_SP_L3_PROTO_IPV6)) {
4485 nh->type = MLXSW_SP_NEXTHOP_TYPE_IPIP;
4cccb737 4486 err = mlxsw_sp_nexthop_ipip_init(mlxsw_sp, nh, dev);
de0f43c0
PM
4487 if (err)
4488 return err;
4489 mlxsw_sp_nexthop_rif_init(nh, &nh->ipip_entry->ol_lb->common);
4490 return 0;
8f28a309
PM
4491 }
4492
35225e47 4493 nh->type = MLXSW_SP_NEXTHOP_TYPE_ETH;
428b851f
IS
4494 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
4495 if (!rif)
4496 return 0;
4497 mlxsw_sp_nexthop_rif_init(nh, rif);
4498
4499 err = mlxsw_sp_nexthop_neigh_init(mlxsw_sp, nh);
4500 if (err)
4501 goto err_nexthop_neigh_init;
4502
4503 return 0;
4504
4505err_nexthop_neigh_init:
4506 mlxsw_sp_nexthop_rif_fini(nh);
4507 return err;
4508}
4509
35225e47
PM
/* Tear down the type-specific part of IPv6 nexthop @nh by delegating to
 * mlxsw_sp_nexthop_type_fini().
 */
static void mlxsw_sp_nexthop6_type_fini(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_nexthop *nh)
{
	mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh);
}
4515
4516static int mlxsw_sp_nexthop6_init(struct mlxsw_sp *mlxsw_sp,
4517 struct mlxsw_sp_nexthop_group *nh_grp,
4518 struct mlxsw_sp_nexthop *nh,
4519 const struct rt6_info *rt)
4520{
4521 struct net_device *dev = rt->dst.dev;
4522
4523 nh->nh_grp = nh_grp;
408bd946 4524 nh->nh_weight = 1;
35225e47 4525 memcpy(&nh->gw_addr, &rt->rt6i_gateway, sizeof(nh->gw_addr));
a5390278 4526 mlxsw_sp_nexthop_counter_alloc(mlxsw_sp, nh);
35225e47 4527
dbe4598c
AS
4528 list_add_tail(&nh->router_list_node, &mlxsw_sp->router->nexthop_list);
4529
35225e47
PM
4530 if (!dev)
4531 return 0;
4532 nh->ifindex = dev->ifindex;
4533
4534 return mlxsw_sp_nexthop6_type_init(mlxsw_sp, nh_grp, nh, rt);
4535}
4536
428b851f
IS
4537static void mlxsw_sp_nexthop6_fini(struct mlxsw_sp *mlxsw_sp,
4538 struct mlxsw_sp_nexthop *nh)
4539{
35225e47 4540 mlxsw_sp_nexthop6_type_fini(mlxsw_sp, nh);
dbe4598c 4541 list_del(&nh->router_list_node);
a5390278 4542 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh);
428b851f
IS
4543}
4544
f6050ee6
PM
4545static bool mlxsw_sp_rt6_is_gateway(const struct mlxsw_sp *mlxsw_sp,
4546 const struct rt6_info *rt)
4547{
8f28a309
PM
4548 return rt->rt6i_flags & RTF_GATEWAY ||
4549 mlxsw_sp_nexthop6_ipip_type(mlxsw_sp, rt, NULL);
f6050ee6
PM
4550}
4551
428b851f
IS
4552static struct mlxsw_sp_nexthop_group *
4553mlxsw_sp_nexthop6_group_create(struct mlxsw_sp *mlxsw_sp,
4554 struct mlxsw_sp_fib6_entry *fib6_entry)
4555{
4556 struct mlxsw_sp_nexthop_group *nh_grp;
4557 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
4558 struct mlxsw_sp_nexthop *nh;
4559 size_t alloc_size;
4560 int i = 0;
4561 int err;
4562
4563 alloc_size = sizeof(*nh_grp) +
4564 fib6_entry->nrt6 * sizeof(struct mlxsw_sp_nexthop);
4565 nh_grp = kzalloc(alloc_size, GFP_KERNEL);
4566 if (!nh_grp)
4567 return ERR_PTR(-ENOMEM);
4568 INIT_LIST_HEAD(&nh_grp->fib_list);
4569#if IS_ENABLED(CONFIG_IPV6)
4570 nh_grp->neigh_tbl = &nd_tbl;
4571#endif
4572 mlxsw_sp_rt6 = list_first_entry(&fib6_entry->rt6_list,
4573 struct mlxsw_sp_rt6, list);
f6050ee6 4574 nh_grp->gateway = mlxsw_sp_rt6_is_gateway(mlxsw_sp, mlxsw_sp_rt6->rt);
428b851f
IS
4575 nh_grp->count = fib6_entry->nrt6;
4576 for (i = 0; i < nh_grp->count; i++) {
4577 struct rt6_info *rt = mlxsw_sp_rt6->rt;
4578
4579 nh = &nh_grp->nexthops[i];
4580 err = mlxsw_sp_nexthop6_init(mlxsw_sp, nh_grp, nh, rt);
4581 if (err)
4582 goto err_nexthop6_init;
4583 mlxsw_sp_rt6 = list_next_entry(mlxsw_sp_rt6, list);
4584 }
e6f3b379
AS
4585
4586 err = mlxsw_sp_nexthop_group_insert(mlxsw_sp, nh_grp);
4587 if (err)
4588 goto err_nexthop_group_insert;
4589
428b851f
IS
4590 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
4591 return nh_grp;
4592
e6f3b379 4593err_nexthop_group_insert:
428b851f
IS
4594err_nexthop6_init:
4595 for (i--; i >= 0; i--) {
4596 nh = &nh_grp->nexthops[i];
4597 mlxsw_sp_nexthop6_fini(mlxsw_sp, nh);
4598 }
4599 kfree(nh_grp);
4600 return ERR_PTR(err);
4601}
4602
4603static void
4604mlxsw_sp_nexthop6_group_destroy(struct mlxsw_sp *mlxsw_sp,
4605 struct mlxsw_sp_nexthop_group *nh_grp)
4606{
4607 struct mlxsw_sp_nexthop *nh;
4608 int i = nh_grp->count;
4609
e6f3b379 4610 mlxsw_sp_nexthop_group_remove(mlxsw_sp, nh_grp);
428b851f
IS
4611 for (i--; i >= 0; i--) {
4612 nh = &nh_grp->nexthops[i];
4613 mlxsw_sp_nexthop6_fini(mlxsw_sp, nh);
4614 }
4615 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
4616 WARN_ON(nh_grp->adj_index_valid);
4617 kfree(nh_grp);
4618}
4619
4620static int mlxsw_sp_nexthop6_group_get(struct mlxsw_sp *mlxsw_sp,
4621 struct mlxsw_sp_fib6_entry *fib6_entry)
4622{
4623 struct mlxsw_sp_nexthop_group *nh_grp;
4624
e6f3b379
AS
4625 nh_grp = mlxsw_sp_nexthop6_group_lookup(mlxsw_sp, fib6_entry);
4626 if (!nh_grp) {
4627 nh_grp = mlxsw_sp_nexthop6_group_create(mlxsw_sp, fib6_entry);
4628 if (IS_ERR(nh_grp))
4629 return PTR_ERR(nh_grp);
4630 }
428b851f
IS
4631
4632 list_add_tail(&fib6_entry->common.nexthop_group_node,
4633 &nh_grp->fib_list);
4634 fib6_entry->common.nh_group = nh_grp;
4635
4636 return 0;
4637}
4638
4639static void mlxsw_sp_nexthop6_group_put(struct mlxsw_sp *mlxsw_sp,
4640 struct mlxsw_sp_fib_entry *fib_entry)
4641{
4642 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
4643
4644 list_del(&fib_entry->nexthop_group_node);
4645 if (!list_empty(&nh_grp->fib_list))
4646 return;
4647 mlxsw_sp_nexthop6_group_destroy(mlxsw_sp, nh_grp);
4648}
4649
4650static int
4651mlxsw_sp_nexthop6_group_update(struct mlxsw_sp *mlxsw_sp,
4652 struct mlxsw_sp_fib6_entry *fib6_entry)
4653{
4654 struct mlxsw_sp_nexthop_group *old_nh_grp = fib6_entry->common.nh_group;
4655 int err;
4656
4657 fib6_entry->common.nh_group = NULL;
4658 list_del(&fib6_entry->common.nexthop_group_node);
4659
4660 err = mlxsw_sp_nexthop6_group_get(mlxsw_sp, fib6_entry);
4661 if (err)
4662 goto err_nexthop6_group_get;
4663
4664 /* In case this entry is offloaded, then the adjacency index
4665 * currently associated with it in the device's table is that
4666 * of the old group. Start using the new one instead.
4667 */
4668 err = mlxsw_sp_fib_node_entry_add(mlxsw_sp, &fib6_entry->common);
4669 if (err)
4670 goto err_fib_node_entry_add;
4671
4672 if (list_empty(&old_nh_grp->fib_list))
4673 mlxsw_sp_nexthop6_group_destroy(mlxsw_sp, old_nh_grp);
4674
4675 return 0;
4676
4677err_fib_node_entry_add:
4678 mlxsw_sp_nexthop6_group_put(mlxsw_sp, &fib6_entry->common);
4679err_nexthop6_group_get:
4680 list_add_tail(&fib6_entry->common.nexthop_group_node,
4681 &old_nh_grp->fib_list);
4682 fib6_entry->common.nh_group = old_nh_grp;
4683 return err;
4684}
4685
4686static int
4687mlxsw_sp_fib6_entry_nexthop_add(struct mlxsw_sp *mlxsw_sp,
4688 struct mlxsw_sp_fib6_entry *fib6_entry,
4689 struct rt6_info *rt)
4690{
4691 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
4692 int err;
4693
4694 mlxsw_sp_rt6 = mlxsw_sp_rt6_create(rt);
4695 if (IS_ERR(mlxsw_sp_rt6))
4696 return PTR_ERR(mlxsw_sp_rt6);
4697
4698 list_add_tail(&mlxsw_sp_rt6->list, &fib6_entry->rt6_list);
4699 fib6_entry->nrt6++;
4700
4701 err = mlxsw_sp_nexthop6_group_update(mlxsw_sp, fib6_entry);
4702 if (err)
4703 goto err_nexthop6_group_update;
4704
4705 return 0;
4706
4707err_nexthop6_group_update:
4708 fib6_entry->nrt6--;
4709 list_del(&mlxsw_sp_rt6->list);
4710 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
4711 return err;
4712}
4713
4714static void
4715mlxsw_sp_fib6_entry_nexthop_del(struct mlxsw_sp *mlxsw_sp,
4716 struct mlxsw_sp_fib6_entry *fib6_entry,
4717 struct rt6_info *rt)
4718{
4719 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
4720
4721 mlxsw_sp_rt6 = mlxsw_sp_fib6_entry_rt_find(fib6_entry, rt);
4722 if (WARN_ON(!mlxsw_sp_rt6))
4723 return;
4724
4725 fib6_entry->nrt6--;
4726 list_del(&mlxsw_sp_rt6->list);
4727 mlxsw_sp_nexthop6_group_update(mlxsw_sp, fib6_entry);
4728 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
4729}
4730
f6050ee6
PM
4731static void mlxsw_sp_fib6_entry_type_set(struct mlxsw_sp *mlxsw_sp,
4732 struct mlxsw_sp_fib_entry *fib_entry,
428b851f
IS
4733 const struct rt6_info *rt)
4734{
4735 /* Packets hitting RTF_REJECT routes need to be discarded by the
4736 * stack. We can rely on their destination device not having a
4737 * RIF (it's the loopback device) and can thus use action type
4738 * local, which will cause them to be trapped with a lower
4739 * priority than packets that need to be locally received.
4740 */
d3b6d377 4741 if (rt->rt6i_flags & (RTF_LOCAL | RTF_ANYCAST))
428b851f
IS
4742 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
4743 else if (rt->rt6i_flags & RTF_REJECT)
4744 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
f6050ee6 4745 else if (mlxsw_sp_rt6_is_gateway(mlxsw_sp, rt))
428b851f
IS
4746 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_REMOTE;
4747 else
4748 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
4749}
4750
4751static void
4752mlxsw_sp_fib6_entry_rt_destroy_all(struct mlxsw_sp_fib6_entry *fib6_entry)
4753{
4754 struct mlxsw_sp_rt6 *mlxsw_sp_rt6, *tmp;
4755
4756 list_for_each_entry_safe(mlxsw_sp_rt6, tmp, &fib6_entry->rt6_list,
4757 list) {
4758 fib6_entry->nrt6--;
4759 list_del(&mlxsw_sp_rt6->list);
4760 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
4761 }
4762}
4763
4764static struct mlxsw_sp_fib6_entry *
4765mlxsw_sp_fib6_entry_create(struct mlxsw_sp *mlxsw_sp,
4766 struct mlxsw_sp_fib_node *fib_node,
4767 struct rt6_info *rt)
4768{
4769 struct mlxsw_sp_fib6_entry *fib6_entry;
4770 struct mlxsw_sp_fib_entry *fib_entry;
4771 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
4772 int err;
4773
4774 fib6_entry = kzalloc(sizeof(*fib6_entry), GFP_KERNEL);
4775 if (!fib6_entry)
4776 return ERR_PTR(-ENOMEM);
4777 fib_entry = &fib6_entry->common;
4778
4779 mlxsw_sp_rt6 = mlxsw_sp_rt6_create(rt);
4780 if (IS_ERR(mlxsw_sp_rt6)) {
4781 err = PTR_ERR(mlxsw_sp_rt6);
4782 goto err_rt6_create;
4783 }
4784
f6050ee6 4785 mlxsw_sp_fib6_entry_type_set(mlxsw_sp, fib_entry, mlxsw_sp_rt6->rt);
428b851f
IS
4786
4787 INIT_LIST_HEAD(&fib6_entry->rt6_list);
4788 list_add_tail(&mlxsw_sp_rt6->list, &fib6_entry->rt6_list);
4789 fib6_entry->nrt6 = 1;
4790 err = mlxsw_sp_nexthop6_group_get(mlxsw_sp, fib6_entry);
4791 if (err)
4792 goto err_nexthop6_group_get;
4793
4794 fib_entry->fib_node = fib_node;
4795
4796 return fib6_entry;
4797
4798err_nexthop6_group_get:
4799 list_del(&mlxsw_sp_rt6->list);
4800 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
4801err_rt6_create:
4802 kfree(fib6_entry);
4803 return ERR_PTR(err);
4804}
4805
4806static void mlxsw_sp_fib6_entry_destroy(struct mlxsw_sp *mlxsw_sp,
4807 struct mlxsw_sp_fib6_entry *fib6_entry)
4808{
4809 mlxsw_sp_nexthop6_group_put(mlxsw_sp, &fib6_entry->common);
4810 mlxsw_sp_fib6_entry_rt_destroy_all(fib6_entry);
4811 WARN_ON(fib6_entry->nrt6);
4812 kfree(fib6_entry);
4813}
4814
4815static struct mlxsw_sp_fib6_entry *
4816mlxsw_sp_fib6_node_entry_find(const struct mlxsw_sp_fib_node *fib_node,
0a7fd1ac 4817 const struct rt6_info *nrt, bool replace)
428b851f 4818{
0a7fd1ac 4819 struct mlxsw_sp_fib6_entry *fib6_entry, *fallback = NULL;
428b851f
IS
4820
4821 list_for_each_entry(fib6_entry, &fib_node->entry_list, common.list) {
4822 struct rt6_info *rt = mlxsw_sp_fib6_entry_rt(fib6_entry);
4823
4824 if (rt->rt6i_table->tb6_id > nrt->rt6i_table->tb6_id)
4825 continue;
4826 if (rt->rt6i_table->tb6_id != nrt->rt6i_table->tb6_id)
4827 break;
0a7fd1ac
IS
4828 if (replace && rt->rt6i_metric == nrt->rt6i_metric) {
4829 if (mlxsw_sp_fib6_rt_can_mp(rt) ==
4830 mlxsw_sp_fib6_rt_can_mp(nrt))
4831 return fib6_entry;
4832 if (mlxsw_sp_fib6_rt_can_mp(nrt))
4833 fallback = fallback ?: fib6_entry;
4834 }
428b851f 4835 if (rt->rt6i_metric > nrt->rt6i_metric)
0a7fd1ac 4836 return fallback ?: fib6_entry;
428b851f
IS
4837 }
4838
0a7fd1ac 4839 return fallback;
428b851f
IS
4840}
4841
4842static int
0a7fd1ac
IS
4843mlxsw_sp_fib6_node_list_insert(struct mlxsw_sp_fib6_entry *new6_entry,
4844 bool replace)
428b851f
IS
4845{
4846 struct mlxsw_sp_fib_node *fib_node = new6_entry->common.fib_node;
4847 struct rt6_info *nrt = mlxsw_sp_fib6_entry_rt(new6_entry);
4848 struct mlxsw_sp_fib6_entry *fib6_entry;
4849
0a7fd1ac
IS
4850 fib6_entry = mlxsw_sp_fib6_node_entry_find(fib_node, nrt, replace);
4851
4852 if (replace && WARN_ON(!fib6_entry))
4853 return -EINVAL;
428b851f
IS
4854
4855 if (fib6_entry) {
4856 list_add_tail(&new6_entry->common.list,
4857 &fib6_entry->common.list);
4858 } else {
4859 struct mlxsw_sp_fib6_entry *last;
4860
4861 list_for_each_entry(last, &fib_node->entry_list, common.list) {
4862 struct rt6_info *rt = mlxsw_sp_fib6_entry_rt(last);
4863
4864 if (nrt->rt6i_table->tb6_id > rt->rt6i_table->tb6_id)
4865 break;
4866 fib6_entry = last;
4867 }
4868
4869 if (fib6_entry)
4870 list_add(&new6_entry->common.list,
4871 &fib6_entry->common.list);
4872 else
4873 list_add(&new6_entry->common.list,
4874 &fib_node->entry_list);
4875 }
4876
4877 return 0;
4878}
4879
4880static void
4881mlxsw_sp_fib6_node_list_remove(struct mlxsw_sp_fib6_entry *fib6_entry)
4882{
4883 list_del(&fib6_entry->common.list);
4884}
4885
4886static int mlxsw_sp_fib6_node_entry_link(struct mlxsw_sp *mlxsw_sp,
0a7fd1ac
IS
4887 struct mlxsw_sp_fib6_entry *fib6_entry,
4888 bool replace)
428b851f
IS
4889{
4890 int err;
4891
0a7fd1ac 4892 err = mlxsw_sp_fib6_node_list_insert(fib6_entry, replace);
428b851f
IS
4893 if (err)
4894 return err;
4895
4896 err = mlxsw_sp_fib_node_entry_add(mlxsw_sp, &fib6_entry->common);
4897 if (err)
4898 goto err_fib_node_entry_add;
4899
4900 return 0;
4901
4902err_fib_node_entry_add:
4903 mlxsw_sp_fib6_node_list_remove(fib6_entry);
4904 return err;
4905}
4906
4907static void
4908mlxsw_sp_fib6_node_entry_unlink(struct mlxsw_sp *mlxsw_sp,
4909 struct mlxsw_sp_fib6_entry *fib6_entry)
4910{
4911 mlxsw_sp_fib_node_entry_del(mlxsw_sp, &fib6_entry->common);
4912 mlxsw_sp_fib6_node_list_remove(fib6_entry);
4913}
4914
4915static struct mlxsw_sp_fib6_entry *
4916mlxsw_sp_fib6_entry_lookup(struct mlxsw_sp *mlxsw_sp,
4917 const struct rt6_info *rt)
4918{
4919 struct mlxsw_sp_fib6_entry *fib6_entry;
4920 struct mlxsw_sp_fib_node *fib_node;
4921 struct mlxsw_sp_fib *fib;
4922 struct mlxsw_sp_vr *vr;
4923
4924 vr = mlxsw_sp_vr_find(mlxsw_sp, rt->rt6i_table->tb6_id);
4925 if (!vr)
4926 return NULL;
4927 fib = mlxsw_sp_vr_fib(vr, MLXSW_SP_L3_PROTO_IPV6);
4928
4929 fib_node = mlxsw_sp_fib_node_lookup(fib, &rt->rt6i_dst.addr,
4930 sizeof(rt->rt6i_dst.addr),
4931 rt->rt6i_dst.plen);
4932 if (!fib_node)
4933 return NULL;
4934
4935 list_for_each_entry(fib6_entry, &fib_node->entry_list, common.list) {
4936 struct rt6_info *iter_rt = mlxsw_sp_fib6_entry_rt(fib6_entry);
4937
4938 if (rt->rt6i_table->tb6_id == iter_rt->rt6i_table->tb6_id &&
4939 rt->rt6i_metric == iter_rt->rt6i_metric &&
4940 mlxsw_sp_fib6_entry_rt_find(fib6_entry, rt))
4941 return fib6_entry;
4942 }
4943
4944 return NULL;
4945}
4946
0a7fd1ac
IS
4947static void mlxsw_sp_fib6_entry_replace(struct mlxsw_sp *mlxsw_sp,
4948 struct mlxsw_sp_fib6_entry *fib6_entry,
4949 bool replace)
4950{
4951 struct mlxsw_sp_fib_node *fib_node = fib6_entry->common.fib_node;
4952 struct mlxsw_sp_fib6_entry *replaced;
4953
4954 if (!replace)
4955 return;
4956
4957 replaced = list_next_entry(fib6_entry, common.list);
4958
4959 mlxsw_sp_fib6_node_entry_unlink(mlxsw_sp, replaced);
4960 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, replaced);
4961 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
4962}
4963
428b851f 4964static int mlxsw_sp_router_fib6_add(struct mlxsw_sp *mlxsw_sp,
0a7fd1ac 4965 struct rt6_info *rt, bool replace)
428b851f
IS
4966{
4967 struct mlxsw_sp_fib6_entry *fib6_entry;
4968 struct mlxsw_sp_fib_node *fib_node;
4969 int err;
4970
4971 if (mlxsw_sp->router->aborted)
4972 return 0;
4973
f36f5ac6
IS
4974 if (rt->rt6i_src.plen)
4975 return -EINVAL;
4976
428b851f
IS
4977 if (mlxsw_sp_fib6_rt_should_ignore(rt))
4978 return 0;
4979
4980 fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, rt->rt6i_table->tb6_id,
4981 &rt->rt6i_dst.addr,
4982 sizeof(rt->rt6i_dst.addr),
4983 rt->rt6i_dst.plen,
4984 MLXSW_SP_L3_PROTO_IPV6);
4985 if (IS_ERR(fib_node))
4986 return PTR_ERR(fib_node);
4987
4988 /* Before creating a new entry, try to append route to an existing
4989 * multipath entry.
4990 */
0a7fd1ac 4991 fib6_entry = mlxsw_sp_fib6_node_mp_entry_find(fib_node, rt, replace);
428b851f
IS
4992 if (fib6_entry) {
4993 err = mlxsw_sp_fib6_entry_nexthop_add(mlxsw_sp, fib6_entry, rt);
4994 if (err)
4995 goto err_fib6_entry_nexthop_add;
4996 return 0;
4997 }
4998
4999 fib6_entry = mlxsw_sp_fib6_entry_create(mlxsw_sp, fib_node, rt);
5000 if (IS_ERR(fib6_entry)) {
5001 err = PTR_ERR(fib6_entry);
5002 goto err_fib6_entry_create;
5003 }
5004
0a7fd1ac 5005 err = mlxsw_sp_fib6_node_entry_link(mlxsw_sp, fib6_entry, replace);
428b851f
IS
5006 if (err)
5007 goto err_fib6_node_entry_link;
5008
0a7fd1ac
IS
5009 mlxsw_sp_fib6_entry_replace(mlxsw_sp, fib6_entry, replace);
5010
428b851f
IS
5011 return 0;
5012
5013err_fib6_node_entry_link:
5014 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
5015err_fib6_entry_create:
5016err_fib6_entry_nexthop_add:
5017 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
5018 return err;
5019}
5020
5021static void mlxsw_sp_router_fib6_del(struct mlxsw_sp *mlxsw_sp,
5022 struct rt6_info *rt)
5023{
5024 struct mlxsw_sp_fib6_entry *fib6_entry;
5025 struct mlxsw_sp_fib_node *fib_node;
5026
5027 if (mlxsw_sp->router->aborted)
5028 return;
5029
5030 if (mlxsw_sp_fib6_rt_should_ignore(rt))
5031 return;
5032
5033 fib6_entry = mlxsw_sp_fib6_entry_lookup(mlxsw_sp, rt);
5034 if (WARN_ON(!fib6_entry))
5035 return;
5036
5037 /* If route is part of a multipath entry, but not the last one
5038 * removed, then only reduce its nexthop group.
5039 */
5040 if (!list_is_singular(&fib6_entry->rt6_list)) {
5041 mlxsw_sp_fib6_entry_nexthop_del(mlxsw_sp, fib6_entry, rt);
5042 return;
5043 }
5044
5045 fib_node = fib6_entry->common.fib_node;
5046
5047 mlxsw_sp_fib6_node_entry_unlink(mlxsw_sp, fib6_entry);
5048 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
5049 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
5050}
5051
bc65a8a4
IS
5052static int __mlxsw_sp_router_set_abort_trap(struct mlxsw_sp *mlxsw_sp,
5053 enum mlxsw_reg_ralxx_protocol proto,
5054 u8 tree_id)
b45f64d1
JP
5055{
5056 char ralta_pl[MLXSW_REG_RALTA_LEN];
5057 char ralst_pl[MLXSW_REG_RALST_LEN];
b5d90e6d 5058 int i, err;
b45f64d1 5059
bc65a8a4 5060 mlxsw_reg_ralta_pack(ralta_pl, true, proto, tree_id);
b45f64d1
JP
5061 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
5062 if (err)
5063 return err;
5064
bc65a8a4 5065 mlxsw_reg_ralst_pack(ralst_pl, 0xff, tree_id);
b45f64d1
JP
5066 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralst), ralst_pl);
5067 if (err)
5068 return err;
5069
b5d90e6d 5070 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
9011b677 5071 struct mlxsw_sp_vr *vr = &mlxsw_sp->router->vrs[i];
b5d90e6d
IS
5072 char raltb_pl[MLXSW_REG_RALTB_LEN];
5073 char ralue_pl[MLXSW_REG_RALUE_LEN];
b45f64d1 5074
bc65a8a4 5075 mlxsw_reg_raltb_pack(raltb_pl, vr->id, proto, tree_id);
b5d90e6d
IS
5076 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb),
5077 raltb_pl);
5078 if (err)
5079 return err;
5080
bc65a8a4
IS
5081 mlxsw_reg_ralue_pack(ralue_pl, proto,
5082 MLXSW_REG_RALUE_OP_WRITE_WRITE, vr->id, 0);
b5d90e6d
IS
5083 mlxsw_reg_ralue_act_ip2me_pack(ralue_pl);
5084 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue),
5085 ralue_pl);
5086 if (err)
5087 return err;
5088 }
5089
5090 return 0;
b45f64d1
JP
5091}
5092
d42b0965
YG
5093static int mlxsw_sp_router_fibmr_add(struct mlxsw_sp *mlxsw_sp,
5094 struct mfc_entry_notifier_info *men_info,
5095 bool replace)
5096{
5097 struct mlxsw_sp_vr *vr;
5098
5099 if (mlxsw_sp->router->aborted)
5100 return 0;
5101
f8fa9b4e 5102 vr = mlxsw_sp_vr_get(mlxsw_sp, men_info->tb_id, NULL);
d42b0965
YG
5103 if (IS_ERR(vr))
5104 return PTR_ERR(vr);
5105
5106 return mlxsw_sp_mr_route4_add(vr->mr4_table, men_info->mfc, replace);
5107}
5108
5109static void mlxsw_sp_router_fibmr_del(struct mlxsw_sp *mlxsw_sp,
5110 struct mfc_entry_notifier_info *men_info)
5111{
5112 struct mlxsw_sp_vr *vr;
5113
5114 if (mlxsw_sp->router->aborted)
5115 return;
5116
5117 vr = mlxsw_sp_vr_find(mlxsw_sp, men_info->tb_id);
5118 if (WARN_ON(!vr))
5119 return;
5120
5121 mlxsw_sp_mr_route4_del(vr->mr4_table, men_info->mfc);
5122 mlxsw_sp_vr_put(vr);
5123}
5124
5125static int
5126mlxsw_sp_router_fibmr_vif_add(struct mlxsw_sp *mlxsw_sp,
5127 struct vif_entry_notifier_info *ven_info)
5128{
5129 struct mlxsw_sp_rif *rif;
5130 struct mlxsw_sp_vr *vr;
5131
5132 if (mlxsw_sp->router->aborted)
5133 return 0;
5134
f8fa9b4e 5135 vr = mlxsw_sp_vr_get(mlxsw_sp, ven_info->tb_id, NULL);
d42b0965
YG
5136 if (IS_ERR(vr))
5137 return PTR_ERR(vr);
5138
5139 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, ven_info->dev);
5140 return mlxsw_sp_mr_vif_add(vr->mr4_table, ven_info->dev,
5141 ven_info->vif_index,
5142 ven_info->vif_flags, rif);
5143}
5144
5145static void
5146mlxsw_sp_router_fibmr_vif_del(struct mlxsw_sp *mlxsw_sp,
5147 struct vif_entry_notifier_info *ven_info)
5148{
5149 struct mlxsw_sp_vr *vr;
5150
5151 if (mlxsw_sp->router->aborted)
5152 return;
5153
5154 vr = mlxsw_sp_vr_find(mlxsw_sp, ven_info->tb_id);
5155 if (WARN_ON(!vr))
5156 return;
5157
5158 mlxsw_sp_mr_vif_del(vr->mr4_table, ven_info->vif_index);
5159 mlxsw_sp_vr_put(vr);
5160}
5161
bc65a8a4
IS
5162static int mlxsw_sp_router_set_abort_trap(struct mlxsw_sp *mlxsw_sp)
5163{
5164 enum mlxsw_reg_ralxx_protocol proto = MLXSW_REG_RALXX_PROTOCOL_IPV4;
5165 int err;
5166
5167 err = __mlxsw_sp_router_set_abort_trap(mlxsw_sp, proto,
5168 MLXSW_SP_LPM_TREE_MIN);
5169 if (err)
5170 return err;
5171
d42b0965
YG
5172 /* The multicast router code does not need an abort trap as by default,
5173 * packets that don't match any routes are trapped to the CPU.
5174 */
5175
bc65a8a4
IS
5176 proto = MLXSW_REG_RALXX_PROTOCOL_IPV6;
5177 return __mlxsw_sp_router_set_abort_trap(mlxsw_sp, proto,
5178 MLXSW_SP_LPM_TREE_MIN + 1);
5179}
5180
9aecce1c
IS
5181static void mlxsw_sp_fib4_node_flush(struct mlxsw_sp *mlxsw_sp,
5182 struct mlxsw_sp_fib_node *fib_node)
5183{
4f1c7f1f 5184 struct mlxsw_sp_fib4_entry *fib4_entry, *tmp;
9aecce1c 5185
4f1c7f1f
IS
5186 list_for_each_entry_safe(fib4_entry, tmp, &fib_node->entry_list,
5187 common.list) {
5188 bool do_break = &tmp->common.list == &fib_node->entry_list;
9aecce1c 5189
4f1c7f1f
IS
5190 mlxsw_sp_fib4_node_entry_unlink(mlxsw_sp, fib4_entry);
5191 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
731ea1ca 5192 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
9aecce1c
IS
5193 /* Break when entry list is empty and node was freed.
5194 * Otherwise, we'll access freed memory in the next
5195 * iteration.
5196 */
5197 if (do_break)
5198 break;
5199 }
5200}
5201
428b851f
IS
5202static void mlxsw_sp_fib6_node_flush(struct mlxsw_sp *mlxsw_sp,
5203 struct mlxsw_sp_fib_node *fib_node)
5204{
5205 struct mlxsw_sp_fib6_entry *fib6_entry, *tmp;
5206
5207 list_for_each_entry_safe(fib6_entry, tmp, &fib_node->entry_list,
5208 common.list) {
5209 bool do_break = &tmp->common.list == &fib_node->entry_list;
5210
5211 mlxsw_sp_fib6_node_entry_unlink(mlxsw_sp, fib6_entry);
5212 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
5213 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
5214 if (do_break)
5215 break;
5216 }
5217}
5218
9aecce1c
IS
5219static void mlxsw_sp_fib_node_flush(struct mlxsw_sp *mlxsw_sp,
5220 struct mlxsw_sp_fib_node *fib_node)
5221{
76610ebb 5222 switch (fib_node->fib->proto) {
9aecce1c
IS
5223 case MLXSW_SP_L3_PROTO_IPV4:
5224 mlxsw_sp_fib4_node_flush(mlxsw_sp, fib_node);
5225 break;
5226 case MLXSW_SP_L3_PROTO_IPV6:
428b851f 5227 mlxsw_sp_fib6_node_flush(mlxsw_sp, fib_node);
9aecce1c
IS
5228 break;
5229 }
5230}
5231
76610ebb
IS
5232static void mlxsw_sp_vr_fib_flush(struct mlxsw_sp *mlxsw_sp,
5233 struct mlxsw_sp_vr *vr,
5234 enum mlxsw_sp_l3proto proto)
b45f64d1 5235{
76610ebb 5236 struct mlxsw_sp_fib *fib = mlxsw_sp_vr_fib(vr, proto);
9aecce1c 5237 struct mlxsw_sp_fib_node *fib_node, *tmp;
76610ebb
IS
5238
5239 list_for_each_entry_safe(fib_node, tmp, &fib->node_list, list) {
5240 bool do_break = &tmp->list == &fib->node_list;
5241
5242 mlxsw_sp_fib_node_flush(mlxsw_sp, fib_node);
5243 if (do_break)
5244 break;
5245 }
5246}
5247
5248static void mlxsw_sp_router_fib_flush(struct mlxsw_sp *mlxsw_sp)
5249{
b45f64d1 5250 int i;
b45f64d1 5251
c1a38311 5252 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
9011b677 5253 struct mlxsw_sp_vr *vr = &mlxsw_sp->router->vrs[i];
ac571de9 5254
76610ebb 5255 if (!mlxsw_sp_vr_is_used(vr))
b45f64d1 5256 continue;
d42b0965
YG
5257
5258 mlxsw_sp_mr_table_flush(vr->mr4_table);
76610ebb 5259 mlxsw_sp_vr_fib_flush(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV4);
a3d9bc50
IS
5260
5261 /* If virtual router was only used for IPv4, then it's no
5262 * longer used.
5263 */
5264 if (!mlxsw_sp_vr_is_used(vr))
5265 continue;
5266 mlxsw_sp_vr_fib_flush(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV6);
b45f64d1 5267 }
ac571de9
IS
5268}
5269
bc65a8a4 5270static void mlxsw_sp_router_fib_abort(struct mlxsw_sp *mlxsw_sp)
ac571de9
IS
5271{
5272 int err;
5273
9011b677 5274 if (mlxsw_sp->router->aborted)
d331d303
IS
5275 return;
5276 dev_warn(mlxsw_sp->bus_info->dev, "FIB abort triggered. Note that FIB entries are no longer being offloaded to this device.\n");
ac571de9 5277 mlxsw_sp_router_fib_flush(mlxsw_sp);
9011b677 5278 mlxsw_sp->router->aborted = true;
b45f64d1
JP
5279 err = mlxsw_sp_router_set_abort_trap(mlxsw_sp);
5280 if (err)
5281 dev_warn(mlxsw_sp->bus_info->dev, "Failed to set abort trap.\n");
5282}
5283
3057224e 5284struct mlxsw_sp_fib_event_work {
a0e4761d 5285 struct work_struct work;
ad178c8e 5286 union {
428b851f 5287 struct fib6_entry_notifier_info fen6_info;
ad178c8e 5288 struct fib_entry_notifier_info fen_info;
5d7bfd14 5289 struct fib_rule_notifier_info fr_info;
ad178c8e 5290 struct fib_nh_notifier_info fnh_info;
d42b0965
YG
5291 struct mfc_entry_notifier_info men_info;
5292 struct vif_entry_notifier_info ven_info;
ad178c8e 5293 };
3057224e
IS
5294 struct mlxsw_sp *mlxsw_sp;
5295 unsigned long event;
5296};
5297
66a5763a 5298static void mlxsw_sp_router_fib4_event_work(struct work_struct *work)
b45f64d1 5299{
3057224e 5300 struct mlxsw_sp_fib_event_work *fib_work =
a0e4761d 5301 container_of(work, struct mlxsw_sp_fib_event_work, work);
3057224e 5302 struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp;
599cf8f9 5303 bool replace, append;
b45f64d1
JP
5304 int err;
5305
3057224e
IS
5306 /* Protect internal structures from changes */
5307 rtnl_lock();
5308 switch (fib_work->event) {
599cf8f9 5309 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
4283bce5 5310 case FIB_EVENT_ENTRY_APPEND: /* fall through */
b45f64d1 5311 case FIB_EVENT_ENTRY_ADD:
599cf8f9 5312 replace = fib_work->event == FIB_EVENT_ENTRY_REPLACE;
4283bce5
IS
5313 append = fib_work->event == FIB_EVENT_ENTRY_APPEND;
5314 err = mlxsw_sp_router_fib4_add(mlxsw_sp, &fib_work->fen_info,
599cf8f9 5315 replace, append);
b45f64d1 5316 if (err)
bc65a8a4 5317 mlxsw_sp_router_fib_abort(mlxsw_sp);
3057224e 5318 fib_info_put(fib_work->fen_info.fi);
b45f64d1
JP
5319 break;
5320 case FIB_EVENT_ENTRY_DEL:
3057224e
IS
5321 mlxsw_sp_router_fib4_del(mlxsw_sp, &fib_work->fen_info);
5322 fib_info_put(fib_work->fen_info.fi);
b45f64d1 5323 break;
1f279233
DA
5324 case FIB_EVENT_RULE_ADD:
5325 /* if we get here, a rule was added that we do not support.
5326 * just do the fib_abort
5327 */
5328 mlxsw_sp_router_fib_abort(mlxsw_sp);
b45f64d1 5329 break;
ad178c8e
IS
5330 case FIB_EVENT_NH_ADD: /* fall through */
5331 case FIB_EVENT_NH_DEL:
0e6ea2a4
IS
5332 mlxsw_sp_nexthop4_event(mlxsw_sp, fib_work->event,
5333 fib_work->fnh_info.fib_nh);
ad178c8e
IS
5334 fib_info_put(fib_work->fnh_info.fib_nh->nh_parent);
5335 break;
b45f64d1 5336 }
3057224e
IS
5337 rtnl_unlock();
5338 kfree(fib_work);
5339}
5340
66a5763a
IS
5341static void mlxsw_sp_router_fib6_event_work(struct work_struct *work)
5342{
583419fd
IS
5343 struct mlxsw_sp_fib_event_work *fib_work =
5344 container_of(work, struct mlxsw_sp_fib_event_work, work);
5345 struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp;
0a7fd1ac 5346 bool replace;
428b851f 5347 int err;
583419fd
IS
5348
5349 rtnl_lock();
5350 switch (fib_work->event) {
0a7fd1ac 5351 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
428b851f 5352 case FIB_EVENT_ENTRY_ADD:
0a7fd1ac 5353 replace = fib_work->event == FIB_EVENT_ENTRY_REPLACE;
428b851f 5354 err = mlxsw_sp_router_fib6_add(mlxsw_sp,
0a7fd1ac 5355 fib_work->fen6_info.rt, replace);
428b851f
IS
5356 if (err)
5357 mlxsw_sp_router_fib_abort(mlxsw_sp);
5358 mlxsw_sp_rt6_release(fib_work->fen6_info.rt);
5359 break;
5360 case FIB_EVENT_ENTRY_DEL:
5361 mlxsw_sp_router_fib6_del(mlxsw_sp, fib_work->fen6_info.rt);
5362 mlxsw_sp_rt6_release(fib_work->fen6_info.rt);
5363 break;
1f279233
DA
5364 case FIB_EVENT_RULE_ADD:
5365 /* if we get here, a rule was added that we do not support.
5366 * just do the fib_abort
5367 */
5368 mlxsw_sp_router_fib_abort(mlxsw_sp);
583419fd
IS
5369 break;
5370 }
5371 rtnl_unlock();
5372 kfree(fib_work);
66a5763a
IS
5373}
5374
d42b0965
YG
5375static void mlxsw_sp_router_fibmr_event_work(struct work_struct *work)
5376{
5377 struct mlxsw_sp_fib_event_work *fib_work =
5378 container_of(work, struct mlxsw_sp_fib_event_work, work);
5379 struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp;
d42b0965
YG
5380 bool replace;
5381 int err;
5382
5383 rtnl_lock();
5384 switch (fib_work->event) {
5385 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
5386 case FIB_EVENT_ENTRY_ADD:
5387 replace = fib_work->event == FIB_EVENT_ENTRY_REPLACE;
5388
5389 err = mlxsw_sp_router_fibmr_add(mlxsw_sp, &fib_work->men_info,
5390 replace);
5391 if (err)
5392 mlxsw_sp_router_fib_abort(mlxsw_sp);
5393 ipmr_cache_put(fib_work->men_info.mfc);
5394 break;
5395 case FIB_EVENT_ENTRY_DEL:
5396 mlxsw_sp_router_fibmr_del(mlxsw_sp, &fib_work->men_info);
5397 ipmr_cache_put(fib_work->men_info.mfc);
5398 break;
5399 case FIB_EVENT_VIF_ADD:
5400 err = mlxsw_sp_router_fibmr_vif_add(mlxsw_sp,
5401 &fib_work->ven_info);
5402 if (err)
5403 mlxsw_sp_router_fib_abort(mlxsw_sp);
5404 dev_put(fib_work->ven_info.dev);
5405 break;
5406 case FIB_EVENT_VIF_DEL:
5407 mlxsw_sp_router_fibmr_vif_del(mlxsw_sp,
5408 &fib_work->ven_info);
5409 dev_put(fib_work->ven_info.dev);
5410 break;
1f279233
DA
5411 case FIB_EVENT_RULE_ADD:
5412 /* if we get here, a rule was added that we do not support.
5413 * just do the fib_abort
5414 */
5415 mlxsw_sp_router_fib_abort(mlxsw_sp);
d42b0965
YG
5416 break;
5417 }
5418 rtnl_unlock();
5419 kfree(fib_work);
5420}
5421
66a5763a
IS
5422static void mlxsw_sp_router_fib4_event(struct mlxsw_sp_fib_event_work *fib_work,
5423 struct fib_notifier_info *info)
5424{
3c75f9b1 5425 struct fib_entry_notifier_info *fen_info;
3c75f9b1
DA
5426 struct fib_nh_notifier_info *fnh_info;
5427
66a5763a
IS
5428 switch (fib_work->event) {
5429 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
5430 case FIB_EVENT_ENTRY_APPEND: /* fall through */
5431 case FIB_EVENT_ENTRY_ADD: /* fall through */
5432 case FIB_EVENT_ENTRY_DEL:
3c75f9b1
DA
5433 fen_info = container_of(info, struct fib_entry_notifier_info,
5434 info);
5435 fib_work->fen_info = *fen_info;
5436 /* Take reference on fib_info to prevent it from being
66a5763a
IS
5437 * freed while work is queued. Release it afterwards.
5438 */
5439 fib_info_hold(fib_work->fen_info.fi);
5440 break;
66a5763a
IS
5441 case FIB_EVENT_NH_ADD: /* fall through */
5442 case FIB_EVENT_NH_DEL:
3c75f9b1
DA
5443 fnh_info = container_of(info, struct fib_nh_notifier_info,
5444 info);
5445 fib_work->fnh_info = *fnh_info;
66a5763a
IS
5446 fib_info_hold(fib_work->fnh_info.fib_nh->nh_parent);
5447 break;
5448 }
5449}
5450
5451static void mlxsw_sp_router_fib6_event(struct mlxsw_sp_fib_event_work *fib_work,
5452 struct fib_notifier_info *info)
5453{
3c75f9b1 5454 struct fib6_entry_notifier_info *fen6_info;
3c75f9b1 5455
583419fd 5456 switch (fib_work->event) {
0a7fd1ac 5457 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
428b851f
IS
5458 case FIB_EVENT_ENTRY_ADD: /* fall through */
5459 case FIB_EVENT_ENTRY_DEL:
3c75f9b1
DA
5460 fen6_info = container_of(info, struct fib6_entry_notifier_info,
5461 info);
5462 fib_work->fen6_info = *fen6_info;
428b851f
IS
5463 rt6_hold(fib_work->fen6_info.rt);
5464 break;
583419fd 5465 }
66a5763a
IS
5466}
5467
d42b0965
YG
5468static void
5469mlxsw_sp_router_fibmr_event(struct mlxsw_sp_fib_event_work *fib_work,
5470 struct fib_notifier_info *info)
5471{
5472 switch (fib_work->event) {
5473 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
5474 case FIB_EVENT_ENTRY_ADD: /* fall through */
5475 case FIB_EVENT_ENTRY_DEL:
5476 memcpy(&fib_work->men_info, info, sizeof(fib_work->men_info));
5477 ipmr_cache_hold(fib_work->men_info.mfc);
5478 break;
5479 case FIB_EVENT_VIF_ADD: /* fall through */
5480 case FIB_EVENT_VIF_DEL:
5481 memcpy(&fib_work->ven_info, info, sizeof(fib_work->ven_info));
5482 dev_hold(fib_work->ven_info.dev);
5483 break;
1f279233
DA
5484 }
5485}
5486
5487static int mlxsw_sp_router_fib_rule_event(unsigned long event,
5488 struct fib_notifier_info *info,
5489 struct mlxsw_sp *mlxsw_sp)
5490{
5491 struct netlink_ext_ack *extack = info->extack;
5492 struct fib_rule_notifier_info *fr_info;
5493 struct fib_rule *rule;
5494 int err = 0;
5495
5496 /* nothing to do at the moment */
5497 if (event == FIB_EVENT_RULE_DEL)
5498 return 0;
5499
5500 if (mlxsw_sp->router->aborted)
5501 return 0;
5502
5503 fr_info = container_of(info, struct fib_rule_notifier_info, info);
5504 rule = fr_info->rule;
5505
5506 switch (info->family) {
5507 case AF_INET:
5508 if (!fib4_rule_default(rule) && !rule->l3mdev)
5509 err = -1;
5510 break;
5511 case AF_INET6:
5512 if (!fib6_rule_default(rule) && !rule->l3mdev)
5513 err = -1;
5514 break;
5515 case RTNL_FAMILY_IPMR:
5516 if (!ipmr_rule_default(rule) && !rule->l3mdev)
5517 err = -1;
d42b0965
YG
5518 break;
5519 }
1f279233
DA
5520
5521 if (err < 0)
5522 NL_SET_ERR_MSG(extack, "spectrum: FIB rules not supported. Aborting offload");
5523
5524 return err;
d42b0965
YG
5525}
5526
3057224e
IS
5527/* Called with rcu_read_lock() */
5528static int mlxsw_sp_router_fib_event(struct notifier_block *nb,
5529 unsigned long event, void *ptr)
5530{
3057224e
IS
5531 struct mlxsw_sp_fib_event_work *fib_work;
5532 struct fib_notifier_info *info = ptr;
7e39d115 5533 struct mlxsw_sp_router *router;
1f279233 5534 int err;
3057224e 5535
8e29f979 5536 if (!net_eq(info->net, &init_net) ||
664375e9
YG
5537 (info->family != AF_INET && info->family != AF_INET6 &&
5538 info->family != RTNL_FAMILY_IPMR))
3057224e
IS
5539 return NOTIFY_DONE;
5540
1f279233
DA
5541 router = container_of(nb, struct mlxsw_sp_router, fib_nb);
5542
5543 switch (event) {
5544 case FIB_EVENT_RULE_ADD: /* fall through */
5545 case FIB_EVENT_RULE_DEL:
5546 err = mlxsw_sp_router_fib_rule_event(event, info,
5547 router->mlxsw_sp);
5548 if (!err)
5549 return NOTIFY_DONE;
5550 }
5551
3057224e
IS
5552 fib_work = kzalloc(sizeof(*fib_work), GFP_ATOMIC);
5553 if (WARN_ON(!fib_work))
5554 return NOTIFY_BAD;
5555
7e39d115 5556 fib_work->mlxsw_sp = router->mlxsw_sp;
3057224e
IS
5557 fib_work->event = event;
5558
66a5763a
IS
5559 switch (info->family) {
5560 case AF_INET:
5561 INIT_WORK(&fib_work->work, mlxsw_sp_router_fib4_event_work);
5562 mlxsw_sp_router_fib4_event(fib_work, info);
3057224e 5563 break;
66a5763a
IS
5564 case AF_INET6:
5565 INIT_WORK(&fib_work->work, mlxsw_sp_router_fib6_event_work);
5566 mlxsw_sp_router_fib6_event(fib_work, info);
ad178c8e 5567 break;
d42b0965
YG
5568 case RTNL_FAMILY_IPMR:
5569 INIT_WORK(&fib_work->work, mlxsw_sp_router_fibmr_event_work);
5570 mlxsw_sp_router_fibmr_event(fib_work, info);
5571 break;
3057224e
IS
5572 }
5573
a0e4761d 5574 mlxsw_core_schedule_work(&fib_work->work);
3057224e 5575
b45f64d1
JP
5576 return NOTIFY_DONE;
5577}
5578
4724ba56
IS
5579static struct mlxsw_sp_rif *
5580mlxsw_sp_rif_find_by_dev(const struct mlxsw_sp *mlxsw_sp,
5581 const struct net_device *dev)
5582{
5583 int i;
5584
5585 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++)
5f9efffb
IS
5586 if (mlxsw_sp->router->rifs[i] &&
5587 mlxsw_sp->router->rifs[i]->dev == dev)
5588 return mlxsw_sp->router->rifs[i];
4724ba56
IS
5589
5590 return NULL;
5591}
5592
5593static int mlxsw_sp_router_rif_disable(struct mlxsw_sp *mlxsw_sp, u16 rif)
5594{
5595 char ritr_pl[MLXSW_REG_RITR_LEN];
5596 int err;
5597
5598 mlxsw_reg_ritr_rif_pack(ritr_pl, rif);
5599 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
5600 if (WARN_ON_ONCE(err))
5601 return err;
5602
5603 mlxsw_reg_ritr_enable_set(ritr_pl, false);
5604 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
5605}
5606
5607static void mlxsw_sp_router_rif_gone_sync(struct mlxsw_sp *mlxsw_sp,
bf95233e 5608 struct mlxsw_sp_rif *rif)
4724ba56 5609{
bf95233e
AS
5610 mlxsw_sp_router_rif_disable(mlxsw_sp, rif->rif_index);
5611 mlxsw_sp_nexthop_rif_gone_sync(mlxsw_sp, rif);
5612 mlxsw_sp_neigh_rif_gone_sync(mlxsw_sp, rif);
4724ba56
IS
5613}
5614
5ea1237f
AS
5615static bool
5616mlxsw_sp_rif_should_config(struct mlxsw_sp_rif *rif, struct net_device *dev,
5617 unsigned long event)
4724ba56 5618{
5ea1237f
AS
5619 struct inet6_dev *inet6_dev;
5620 bool addr_list_empty = true;
5621 struct in_device *idev;
5622
4724ba56
IS
5623 switch (event) {
5624 case NETDEV_UP:
f1b1f273 5625 return rif == NULL;
4724ba56 5626 case NETDEV_DOWN:
5ea1237f
AS
5627 idev = __in_dev_get_rtnl(dev);
5628 if (idev && idev->ifa_list)
5629 addr_list_empty = false;
5630
5631 inet6_dev = __in6_dev_get(dev);
5632 if (addr_list_empty && inet6_dev &&
5633 !list_empty(&inet6_dev->addr_list))
5634 addr_list_empty = false;
5635
5636 if (rif && addr_list_empty &&
bf95233e 5637 !netif_is_l3_slave(rif->dev))
4724ba56
IS
5638 return true;
5639 /* It is possible we already removed the RIF ourselves
5640 * if it was assigned to a netdev that is now a bridge
5641 * or LAG slave.
5642 */
5643 return false;
5644 }
5645
5646 return false;
5647}
5648
e4f3c1c1
IS
5649static enum mlxsw_sp_rif_type
5650mlxsw_sp_dev_rif_type(const struct mlxsw_sp *mlxsw_sp,
5651 const struct net_device *dev)
5652{
5653 enum mlxsw_sp_fid_type type;
5654
6ddb7426
PM
5655 if (mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, NULL))
5656 return MLXSW_SP_RIF_TYPE_IPIP_LB;
5657
5658 /* Otherwise RIF type is derived from the type of the underlying FID. */
e4f3c1c1
IS
5659 if (is_vlan_dev(dev) && netif_is_bridge_master(vlan_dev_real_dev(dev)))
5660 type = MLXSW_SP_FID_TYPE_8021Q;
5661 else if (netif_is_bridge_master(dev) && br_vlan_enabled(dev))
5662 type = MLXSW_SP_FID_TYPE_8021Q;
5663 else if (netif_is_bridge_master(dev))
5664 type = MLXSW_SP_FID_TYPE_8021D;
5665 else
5666 type = MLXSW_SP_FID_TYPE_RFID;
5667
5668 return mlxsw_sp_fid_type_rif_type(mlxsw_sp, type);
5669}
5670
de5ed99e 5671static int mlxsw_sp_rif_index_alloc(struct mlxsw_sp *mlxsw_sp, u16 *p_rif_index)
4724ba56
IS
5672{
5673 int i;
5674
de5ed99e
IS
5675 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++) {
5676 if (!mlxsw_sp->router->rifs[i]) {
5677 *p_rif_index = i;
5678 return 0;
5679 }
5680 }
4724ba56 5681
de5ed99e 5682 return -ENOBUFS;
4724ba56
IS
5683}
5684
e4f3c1c1
IS
5685static struct mlxsw_sp_rif *mlxsw_sp_rif_alloc(size_t rif_size, u16 rif_index,
5686 u16 vr_id,
5687 struct net_device *l3_dev)
4724ba56 5688{
bf95233e 5689 struct mlxsw_sp_rif *rif;
4724ba56 5690
e4f3c1c1 5691 rif = kzalloc(rif_size, GFP_KERNEL);
bf95233e 5692 if (!rif)
4724ba56
IS
5693 return NULL;
5694
bf95233e
AS
5695 INIT_LIST_HEAD(&rif->nexthop_list);
5696 INIT_LIST_HEAD(&rif->neigh_list);
5697 ether_addr_copy(rif->addr, l3_dev->dev_addr);
5698 rif->mtu = l3_dev->mtu;
5699 rif->vr_id = vr_id;
5700 rif->dev = l3_dev;
5701 rif->rif_index = rif_index;
4724ba56 5702
bf95233e 5703 return rif;
4724ba56
IS
5704}
5705
5f9efffb
IS
5706struct mlxsw_sp_rif *mlxsw_sp_rif_by_index(const struct mlxsw_sp *mlxsw_sp,
5707 u16 rif_index)
5708{
5709 return mlxsw_sp->router->rifs[rif_index];
5710}
5711
fd1b9d41
AS
5712u16 mlxsw_sp_rif_index(const struct mlxsw_sp_rif *rif)
5713{
5714 return rif->rif_index;
5715}
5716
92107cfb
PM
5717u16 mlxsw_sp_ipip_lb_rif_index(const struct mlxsw_sp_rif_ipip_lb *lb_rif)
5718{
5719 return lb_rif->common.rif_index;
5720}
5721
5722u16 mlxsw_sp_ipip_lb_ul_vr_id(const struct mlxsw_sp_rif_ipip_lb *lb_rif)
5723{
5724 return lb_rif->ul_vr_id;
5725}
5726
fd1b9d41
AS
5727int mlxsw_sp_rif_dev_ifindex(const struct mlxsw_sp_rif *rif)
5728{
5729 return rif->dev->ifindex;
5730}
5731
91e4d59a
YG
5732const struct net_device *mlxsw_sp_rif_dev(const struct mlxsw_sp_rif *rif)
5733{
5734 return rif->dev;
5735}
5736
4724ba56 5737static struct mlxsw_sp_rif *
e4f3c1c1 5738mlxsw_sp_rif_create(struct mlxsw_sp *mlxsw_sp,
f8fa9b4e
DA
5739 const struct mlxsw_sp_rif_params *params,
5740 struct netlink_ext_ack *extack)
4724ba56 5741{
e4f3c1c1
IS
5742 u32 tb_id = l3mdev_fib_table(params->dev);
5743 const struct mlxsw_sp_rif_ops *ops;
010cadf9 5744 struct mlxsw_sp_fid *fid = NULL;
e4f3c1c1 5745 enum mlxsw_sp_rif_type type;
bf95233e 5746 struct mlxsw_sp_rif *rif;
a1107487
IS
5747 struct mlxsw_sp_vr *vr;
5748 u16 rif_index;
4724ba56
IS
5749 int err;
5750
e4f3c1c1
IS
5751 type = mlxsw_sp_dev_rif_type(mlxsw_sp, params->dev);
5752 ops = mlxsw_sp->router->rif_ops_arr[type];
5753
f8fa9b4e 5754 vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id ? : RT_TABLE_MAIN, extack);
c9ec53f0
IS
5755 if (IS_ERR(vr))
5756 return ERR_CAST(vr);
28a04c7b 5757 vr->rif_count++;
c9ec53f0 5758
de5ed99e 5759 err = mlxsw_sp_rif_index_alloc(mlxsw_sp, &rif_index);
f8fa9b4e
DA
5760 if (err) {
5761 NL_SET_ERR_MSG(extack, "spectrum: Exceeded number of supported router interfaces");
de5ed99e 5762 goto err_rif_index_alloc;
f8fa9b4e 5763 }
4724ba56 5764
e4f3c1c1 5765 rif = mlxsw_sp_rif_alloc(ops->rif_size, rif_index, vr->id, params->dev);
a13a594d
IS
5766 if (!rif) {
5767 err = -ENOMEM;
5768 goto err_rif_alloc;
5769 }
e4f3c1c1
IS
5770 rif->mlxsw_sp = mlxsw_sp;
5771 rif->ops = ops;
a13a594d 5772
010cadf9
PM
5773 if (ops->fid_get) {
5774 fid = ops->fid_get(rif);
5775 if (IS_ERR(fid)) {
5776 err = PTR_ERR(fid);
5777 goto err_fid_get;
5778 }
5779 rif->fid = fid;
4d93ceeb
IS
5780 }
5781
e4f3c1c1
IS
5782 if (ops->setup)
5783 ops->setup(rif, params);
5784
5785 err = ops->configure(rif);
4724ba56 5786 if (err)
e4f3c1c1 5787 goto err_configure;
4724ba56 5788
d42b0965
YG
5789 err = mlxsw_sp_mr_rif_add(vr->mr4_table, rif);
5790 if (err)
5791 goto err_mr_rif_add;
5792
e4f3c1c1 5793 mlxsw_sp_rif_counters_alloc(rif);
5f9efffb 5794 mlxsw_sp->router->rifs[rif_index] = rif;
4724ba56 5795
bf95233e 5796 return rif;
4724ba56 5797
d42b0965
YG
5798err_mr_rif_add:
5799 ops->deconfigure(rif);
e4f3c1c1 5800err_configure:
010cadf9
PM
5801 if (fid)
5802 mlxsw_sp_fid_put(fid);
a1107487 5803err_fid_get:
e4f3c1c1
IS
5804 kfree(rif);
5805err_rif_alloc:
de5ed99e 5806err_rif_index_alloc:
28a04c7b 5807 vr->rif_count--;
c9ec53f0 5808 mlxsw_sp_vr_put(vr);
4724ba56
IS
5809 return ERR_PTR(err);
5810}
5811
e4f3c1c1 5812void mlxsw_sp_rif_destroy(struct mlxsw_sp_rif *rif)
4724ba56 5813{
e4f3c1c1
IS
5814 const struct mlxsw_sp_rif_ops *ops = rif->ops;
5815 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
a1107487 5816 struct mlxsw_sp_fid *fid = rif->fid;
e4f3c1c1 5817 struct mlxsw_sp_vr *vr;
4724ba56 5818
bf95233e 5819 mlxsw_sp_router_rif_gone_sync(mlxsw_sp, rif);
e4f3c1c1 5820 vr = &mlxsw_sp->router->vrs[rif->vr_id];
e0c0afd8 5821
e4f3c1c1 5822 mlxsw_sp->router->rifs[rif->rif_index] = NULL;
e4f3c1c1 5823 mlxsw_sp_rif_counters_free(rif);
d42b0965 5824 mlxsw_sp_mr_rif_del(vr->mr4_table, rif);
e4f3c1c1 5825 ops->deconfigure(rif);
010cadf9
PM
5826 if (fid)
5827 /* Loopback RIFs are not associated with a FID. */
5828 mlxsw_sp_fid_put(fid);
e4f3c1c1 5829 kfree(rif);
28a04c7b 5830 vr->rif_count--;
c9ec53f0 5831 mlxsw_sp_vr_put(vr);
4724ba56
IS
5832}
5833
e4f3c1c1
IS
5834static void
5835mlxsw_sp_rif_subport_params_init(struct mlxsw_sp_rif_params *params,
5836 struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan)
5837{
5838 struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port;
5839
5840 params->vid = mlxsw_sp_port_vlan->vid;
5841 params->lag = mlxsw_sp_port->lagged;
5842 if (params->lag)
5843 params->lag_id = mlxsw_sp_port->lag_id;
5844 else
5845 params->system_port = mlxsw_sp_port->local_port;
5846}
5847
7cbecf24 5848static int
a1107487 5849mlxsw_sp_port_vlan_router_join(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan,
f8fa9b4e
DA
5850 struct net_device *l3_dev,
5851 struct netlink_ext_ack *extack)
4724ba56 5852{
7cbecf24 5853 struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port;
1b8f09a0 5854 struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
7cbecf24 5855 u16 vid = mlxsw_sp_port_vlan->vid;
bf95233e 5856 struct mlxsw_sp_rif *rif;
a1107487 5857 struct mlxsw_sp_fid *fid;
03ea01e9 5858 int err;
4724ba56 5859
1b8f09a0 5860 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
bf95233e 5861 if (!rif) {
e4f3c1c1
IS
5862 struct mlxsw_sp_rif_params params = {
5863 .dev = l3_dev,
5864 };
5865
5866 mlxsw_sp_rif_subport_params_init(&params, mlxsw_sp_port_vlan);
f8fa9b4e 5867 rif = mlxsw_sp_rif_create(mlxsw_sp, &params, extack);
bf95233e
AS
5868 if (IS_ERR(rif))
5869 return PTR_ERR(rif);
4724ba56
IS
5870 }
5871
a1107487 5872 /* FID was already created, just take a reference */
e4f3c1c1 5873 fid = rif->ops->fid_get(rif);
a1107487
IS
5874 err = mlxsw_sp_fid_port_vid_map(fid, mlxsw_sp_port, vid);
5875 if (err)
5876 goto err_fid_port_vid_map;
5877
7cbecf24 5878 err = mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, false);
03ea01e9
IS
5879 if (err)
5880 goto err_port_vid_learning_set;
5881
7cbecf24 5882 err = mlxsw_sp_port_vid_stp_set(mlxsw_sp_port, vid,
03ea01e9
IS
5883 BR_STATE_FORWARDING);
5884 if (err)
5885 goto err_port_vid_stp_set;
5886
a1107487 5887 mlxsw_sp_port_vlan->fid = fid;
4724ba56 5888
4724ba56 5889 return 0;
03ea01e9
IS
5890
5891err_port_vid_stp_set:
7cbecf24 5892 mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, true);
03ea01e9 5893err_port_vid_learning_set:
a1107487
IS
5894 mlxsw_sp_fid_port_vid_unmap(fid, mlxsw_sp_port, vid);
5895err_fid_port_vid_map:
5896 mlxsw_sp_fid_put(fid);
03ea01e9 5897 return err;
4724ba56
IS
5898}
5899
a1107487
IS
5900void
5901mlxsw_sp_port_vlan_router_leave(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan)
4724ba56 5902{
ce95e154 5903 struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port;
7cbecf24 5904 struct mlxsw_sp_fid *fid = mlxsw_sp_port_vlan->fid;
ce95e154 5905 u16 vid = mlxsw_sp_port_vlan->vid;
ce95e154 5906
a1107487
IS
5907 if (WARN_ON(mlxsw_sp_fid_type(fid) != MLXSW_SP_FID_TYPE_RFID))
5908 return;
4aafc368 5909
a1107487 5910 mlxsw_sp_port_vlan->fid = NULL;
7cbecf24
IS
5911 mlxsw_sp_port_vid_stp_set(mlxsw_sp_port, vid, BR_STATE_BLOCKING);
5912 mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, true);
a1107487
IS
5913 mlxsw_sp_fid_port_vid_unmap(fid, mlxsw_sp_port, vid);
5914 /* If router port holds the last reference on the rFID, then the
5915 * associated Sub-port RIF will be destroyed.
5916 */
5917 mlxsw_sp_fid_put(fid);
4724ba56
IS
5918}
5919
7cbecf24
IS
5920static int mlxsw_sp_inetaddr_port_vlan_event(struct net_device *l3_dev,
5921 struct net_device *port_dev,
f8fa9b4e
DA
5922 unsigned long event, u16 vid,
5923 struct netlink_ext_ack *extack)
4724ba56
IS
5924{
5925 struct mlxsw_sp_port *mlxsw_sp_port = netdev_priv(port_dev);
ce95e154 5926 struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan;
4724ba56 5927
ce95e154 5928 mlxsw_sp_port_vlan = mlxsw_sp_port_vlan_find_by_vid(mlxsw_sp_port, vid);
7cbecf24
IS
5929 if (WARN_ON(!mlxsw_sp_port_vlan))
5930 return -EINVAL;
4724ba56
IS
5931
5932 switch (event) {
5933 case NETDEV_UP:
a1107487 5934 return mlxsw_sp_port_vlan_router_join(mlxsw_sp_port_vlan,
f8fa9b4e 5935 l3_dev, extack);
4724ba56 5936 case NETDEV_DOWN:
a1107487 5937 mlxsw_sp_port_vlan_router_leave(mlxsw_sp_port_vlan);
4724ba56
IS
5938 break;
5939 }
5940
5941 return 0;
5942}
5943
5944static int mlxsw_sp_inetaddr_port_event(struct net_device *port_dev,
f8fa9b4e
DA
5945 unsigned long event,
5946 struct netlink_ext_ack *extack)
4724ba56 5947{
2b94e58d
JP
5948 if (netif_is_bridge_port(port_dev) ||
5949 netif_is_lag_port(port_dev) ||
5950 netif_is_ovs_port(port_dev))
4724ba56
IS
5951 return 0;
5952
f8fa9b4e
DA
5953 return mlxsw_sp_inetaddr_port_vlan_event(port_dev, port_dev, event, 1,
5954 extack);
4724ba56
IS
5955}
5956
5957static int __mlxsw_sp_inetaddr_lag_event(struct net_device *l3_dev,
5958 struct net_device *lag_dev,
f8fa9b4e
DA
5959 unsigned long event, u16 vid,
5960 struct netlink_ext_ack *extack)
4724ba56
IS
5961{
5962 struct net_device *port_dev;
5963 struct list_head *iter;
5964 int err;
5965
5966 netdev_for_each_lower_dev(lag_dev, port_dev, iter) {
5967 if (mlxsw_sp_port_dev_check(port_dev)) {
7cbecf24
IS
5968 err = mlxsw_sp_inetaddr_port_vlan_event(l3_dev,
5969 port_dev,
f8fa9b4e
DA
5970 event, vid,
5971 extack);
4724ba56
IS
5972 if (err)
5973 return err;
5974 }
5975 }
5976
5977 return 0;
5978}
5979
/* Handle an address event directly on a LAG netdev. A LAG that is a bridge
 * port is skipped; otherwise the event is applied to its members with
 * VID 1.
 */
static int mlxsw_sp_inetaddr_lag_event(struct net_device *lag_dev,
				       unsigned long event,
				       struct netlink_ext_ack *extack)
{
	if (!netif_is_bridge_port(lag_dev))
		return __mlxsw_sp_inetaddr_lag_event(lag_dev, lag_dev, event,
						     1, extack);

	return 0;
}
5990
4724ba56 5991static int mlxsw_sp_inetaddr_bridge_event(struct net_device *l3_dev,
f8fa9b4e
DA
5992 unsigned long event,
5993 struct netlink_ext_ack *extack)
4724ba56
IS
5994{
5995 struct mlxsw_sp *mlxsw_sp = mlxsw_sp_lower_get(l3_dev);
e4f3c1c1
IS
5996 struct mlxsw_sp_rif_params params = {
5997 .dev = l3_dev,
5998 };
a1107487 5999 struct mlxsw_sp_rif *rif;
4724ba56
IS
6000
6001 switch (event) {
6002 case NETDEV_UP:
f8fa9b4e 6003 rif = mlxsw_sp_rif_create(mlxsw_sp, &params, extack);
e4f3c1c1
IS
6004 if (IS_ERR(rif))
6005 return PTR_ERR(rif);
6006 break;
4724ba56 6007 case NETDEV_DOWN:
a1107487 6008 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
e4f3c1c1 6009 mlxsw_sp_rif_destroy(rif);
4724ba56
IS
6010 break;
6011 }
6012
6013 return 0;
6014}
6015
6016static int mlxsw_sp_inetaddr_vlan_event(struct net_device *vlan_dev,
f8fa9b4e
DA
6017 unsigned long event,
6018 struct netlink_ext_ack *extack)
4724ba56
IS
6019{
6020 struct net_device *real_dev = vlan_dev_real_dev(vlan_dev);
4724ba56
IS
6021 u16 vid = vlan_dev_vlan_id(vlan_dev);
6022
6b27c8ad
IS
6023 if (netif_is_bridge_port(vlan_dev))
6024 return 0;
6025
4724ba56 6026 if (mlxsw_sp_port_dev_check(real_dev))
7cbecf24 6027 return mlxsw_sp_inetaddr_port_vlan_event(vlan_dev, real_dev,
f8fa9b4e 6028 event, vid, extack);
4724ba56
IS
6029 else if (netif_is_lag_master(real_dev))
6030 return __mlxsw_sp_inetaddr_lag_event(vlan_dev, real_dev, event,
f8fa9b4e 6031 vid, extack);
c57529e1 6032 else if (netif_is_bridge_master(real_dev) && br_vlan_enabled(real_dev))
f8fa9b4e 6033 return mlxsw_sp_inetaddr_bridge_event(vlan_dev, event, extack);
4724ba56
IS
6034
6035 return 0;
6036}
6037
/* Dispatch an address event to the handler matching the netdev type:
 * mlxsw port, LAG master, bridge master or VLAN device (checked in that
 * order). Unrecognized device types are ignored and yield 0.
 */
static int __mlxsw_sp_inetaddr_event(struct net_device *dev,
				     unsigned long event,
				     struct netlink_ext_ack *extack)
{
	if (mlxsw_sp_port_dev_check(dev))
		return mlxsw_sp_inetaddr_port_event(dev, event, extack);

	if (netif_is_lag_master(dev))
		return mlxsw_sp_inetaddr_lag_event(dev, event, extack);

	if (netif_is_bridge_master(dev))
		return mlxsw_sp_inetaddr_bridge_event(dev, event, extack);

	if (is_vlan_dev(dev))
		return mlxsw_sp_inetaddr_vlan_event(dev, event, extack);

	return 0;
}
6053
4724ba56
IS
6054int mlxsw_sp_inetaddr_event(struct notifier_block *unused,
6055 unsigned long event, void *ptr)
6056{
6057 struct in_ifaddr *ifa = (struct in_ifaddr *) ptr;
6058 struct net_device *dev = ifa->ifa_dev->dev;
6059 struct mlxsw_sp *mlxsw_sp;
bf95233e 6060 struct mlxsw_sp_rif *rif;
4724ba56
IS
6061 int err = 0;
6062
89d5dd2e
DA
6063 /* NETDEV_UP event is handled by mlxsw_sp_inetaddr_valid_event */
6064 if (event == NETDEV_UP)
6065 goto out;
6066
6067 mlxsw_sp = mlxsw_sp_lower_get(dev);
6068 if (!mlxsw_sp)
6069 goto out;
6070
6071 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
6072 if (!mlxsw_sp_rif_should_config(rif, dev, event))
6073 goto out;
6074
f8fa9b4e 6075 err = __mlxsw_sp_inetaddr_event(dev, event, NULL);
89d5dd2e
DA
6076out:
6077 return notifier_from_errno(err);
6078}
6079
6080int mlxsw_sp_inetaddr_valid_event(struct notifier_block *unused,
6081 unsigned long event, void *ptr)
6082{
6083 struct in_validator_info *ivi = (struct in_validator_info *) ptr;
6084 struct net_device *dev = ivi->ivi_dev->dev;
6085 struct mlxsw_sp *mlxsw_sp;
6086 struct mlxsw_sp_rif *rif;
6087 int err = 0;
6088
4724ba56
IS
6089 mlxsw_sp = mlxsw_sp_lower_get(dev);
6090 if (!mlxsw_sp)
6091 goto out;
6092
bf95233e 6093 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
5ea1237f 6094 if (!mlxsw_sp_rif_should_config(rif, dev, event))
4724ba56
IS
6095 goto out;
6096
f8fa9b4e 6097 err = __mlxsw_sp_inetaddr_event(dev, event, ivi->extack);
4724ba56
IS
6098out:
6099 return notifier_from_errno(err);
6100}
6101
5ea1237f
AS
6102struct mlxsw_sp_inet6addr_event_work {
6103 struct work_struct work;
6104 struct net_device *dev;
6105 unsigned long event;
6106};
6107
6108static void mlxsw_sp_inet6addr_event_work(struct work_struct *work)
6109{
6110 struct mlxsw_sp_inet6addr_event_work *inet6addr_work =
6111 container_of(work, struct mlxsw_sp_inet6addr_event_work, work);
6112 struct net_device *dev = inet6addr_work->dev;
6113 unsigned long event = inet6addr_work->event;
6114 struct mlxsw_sp *mlxsw_sp;
6115 struct mlxsw_sp_rif *rif;
6116
6117 rtnl_lock();
6118 mlxsw_sp = mlxsw_sp_lower_get(dev);
6119 if (!mlxsw_sp)
6120 goto out;
6121
6122 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
6123 if (!mlxsw_sp_rif_should_config(rif, dev, event))
6124 goto out;
6125
f8fa9b4e 6126 __mlxsw_sp_inetaddr_event(dev, event, NULL);
5ea1237f
AS
6127out:
6128 rtnl_unlock();
6129 dev_put(dev);
6130 kfree(inet6addr_work);
6131}
6132
6133/* Called with rcu_read_lock() */
6134int mlxsw_sp_inet6addr_event(struct notifier_block *unused,
6135 unsigned long event, void *ptr)
6136{
6137 struct inet6_ifaddr *if6 = (struct inet6_ifaddr *) ptr;
6138 struct mlxsw_sp_inet6addr_event_work *inet6addr_work;
6139 struct net_device *dev = if6->idev->dev;
6140
89d5dd2e
DA
6141 /* NETDEV_UP event is handled by mlxsw_sp_inet6addr_valid_event */
6142 if (event == NETDEV_UP)
6143 return NOTIFY_DONE;
6144
5ea1237f
AS
6145 if (!mlxsw_sp_port_dev_lower_find_rcu(dev))
6146 return NOTIFY_DONE;
6147
6148 inet6addr_work = kzalloc(sizeof(*inet6addr_work), GFP_ATOMIC);
6149 if (!inet6addr_work)
6150 return NOTIFY_BAD;
6151
6152 INIT_WORK(&inet6addr_work->work, mlxsw_sp_inet6addr_event_work);
6153 inet6addr_work->dev = dev;
6154 inet6addr_work->event = event;
6155 dev_hold(dev);
6156 mlxsw_core_schedule_work(&inet6addr_work->work);
6157
6158 return NOTIFY_DONE;
6159}
6160
89d5dd2e
DA
6161int mlxsw_sp_inet6addr_valid_event(struct notifier_block *unused,
6162 unsigned long event, void *ptr)
6163{
6164 struct in6_validator_info *i6vi = (struct in6_validator_info *) ptr;
6165 struct net_device *dev = i6vi->i6vi_dev->dev;
6166 struct mlxsw_sp *mlxsw_sp;
6167 struct mlxsw_sp_rif *rif;
6168 int err = 0;
6169
6170 mlxsw_sp = mlxsw_sp_lower_get(dev);
6171 if (!mlxsw_sp)
6172 goto out;
6173
6174 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
6175 if (!mlxsw_sp_rif_should_config(rif, dev, event))
6176 goto out;
6177
f8fa9b4e 6178 err = __mlxsw_sp_inetaddr_event(dev, event, i6vi->extack);
89d5dd2e
DA
6179out:
6180 return notifier_from_errno(err);
6181}
6182
bf95233e 6183static int mlxsw_sp_rif_edit(struct mlxsw_sp *mlxsw_sp, u16 rif_index,
4724ba56
IS
6184 const char *mac, int mtu)
6185{
6186 char ritr_pl[MLXSW_REG_RITR_LEN];
6187 int err;
6188
bf95233e 6189 mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index);
4724ba56
IS
6190 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
6191 if (err)
6192 return err;
6193
6194 mlxsw_reg_ritr_mtu_set(ritr_pl, mtu);
6195 mlxsw_reg_ritr_if_mac_memcpy_to(ritr_pl, mac);
6196 mlxsw_reg_ritr_op_set(ritr_pl, MLXSW_REG_RITR_RIF_CREATE);
6197 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
6198}
6199
6200int mlxsw_sp_netdevice_router_port_event(struct net_device *dev)
6201{
6202 struct mlxsw_sp *mlxsw_sp;
bf95233e 6203 struct mlxsw_sp_rif *rif;
a1107487 6204 u16 fid_index;
4724ba56
IS
6205 int err;
6206
6207 mlxsw_sp = mlxsw_sp_lower_get(dev);
6208 if (!mlxsw_sp)
6209 return 0;
6210
bf95233e
AS
6211 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
6212 if (!rif)
4724ba56 6213 return 0;
a1107487 6214 fid_index = mlxsw_sp_fid_index(rif->fid);
4724ba56 6215
a1107487 6216 err = mlxsw_sp_rif_fdb_op(mlxsw_sp, rif->addr, fid_index, false);
4724ba56
IS
6217 if (err)
6218 return err;
6219
bf95233e
AS
6220 err = mlxsw_sp_rif_edit(mlxsw_sp, rif->rif_index, dev->dev_addr,
6221 dev->mtu);
4724ba56
IS
6222 if (err)
6223 goto err_rif_edit;
6224
a1107487 6225 err = mlxsw_sp_rif_fdb_op(mlxsw_sp, dev->dev_addr, fid_index, true);
4724ba56
IS
6226 if (err)
6227 goto err_rif_fdb_op;
6228
fd890fe9
YG
6229 if (rif->mtu != dev->mtu) {
6230 struct mlxsw_sp_vr *vr;
6231
6232 /* The RIF is relevant only to its mr_table instance, as unlike
6233 * unicast routing, in multicast routing a RIF cannot be shared
6234 * between several multicast routing tables.
6235 */
6236 vr = &mlxsw_sp->router->vrs[rif->vr_id];
6237 mlxsw_sp_mr_rif_mtu_update(vr->mr4_table, rif, dev->mtu);
6238 }
6239
bf95233e
AS
6240 ether_addr_copy(rif->addr, dev->dev_addr);
6241 rif->mtu = dev->mtu;
4724ba56 6242
bf95233e 6243 netdev_dbg(dev, "Updated RIF=%d\n", rif->rif_index);
4724ba56
IS
6244
6245 return 0;
6246
6247err_rif_fdb_op:
bf95233e 6248 mlxsw_sp_rif_edit(mlxsw_sp, rif->rif_index, rif->addr, rif->mtu);
4724ba56 6249err_rif_edit:
a1107487 6250 mlxsw_sp_rif_fdb_op(mlxsw_sp, rif->addr, fid_index, true);
4724ba56
IS
6251 return err;
6252}
6253
b1e45526 6254static int mlxsw_sp_port_vrf_join(struct mlxsw_sp *mlxsw_sp,
f8fa9b4e
DA
6255 struct net_device *l3_dev,
6256 struct netlink_ext_ack *extack)
7179eb5a 6257{
b1e45526 6258 struct mlxsw_sp_rif *rif;
7179eb5a 6259
b1e45526
IS
6260 /* If netdev is already associated with a RIF, then we need to
6261 * destroy it and create a new one with the new virtual router ID.
7179eb5a 6262 */
b1e45526
IS
6263 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
6264 if (rif)
f8fa9b4e 6265 __mlxsw_sp_inetaddr_event(l3_dev, NETDEV_DOWN, extack);
7179eb5a 6266
f8fa9b4e 6267 return __mlxsw_sp_inetaddr_event(l3_dev, NETDEV_UP, extack);
7179eb5a
IS
6268}
6269
b1e45526
IS
6270static void mlxsw_sp_port_vrf_leave(struct mlxsw_sp *mlxsw_sp,
6271 struct net_device *l3_dev)
7179eb5a 6272{
b1e45526 6273 struct mlxsw_sp_rif *rif;
7179eb5a 6274
b1e45526
IS
6275 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
6276 if (!rif)
7179eb5a 6277 return;
f8fa9b4e 6278 __mlxsw_sp_inetaddr_event(l3_dev, NETDEV_DOWN, NULL);
7179eb5a
IS
6279}
6280
b1e45526
IS
6281int mlxsw_sp_netdevice_vrf_event(struct net_device *l3_dev, unsigned long event,
6282 struct netdev_notifier_changeupper_info *info)
3d70e458 6283{
b1e45526
IS
6284 struct mlxsw_sp *mlxsw_sp = mlxsw_sp_lower_get(l3_dev);
6285 int err = 0;
3d70e458 6286
b1e45526
IS
6287 if (!mlxsw_sp)
6288 return 0;
3d70e458 6289
b1e45526
IS
6290 switch (event) {
6291 case NETDEV_PRECHANGEUPPER:
6292 return 0;
6293 case NETDEV_CHANGEUPPER:
f8fa9b4e
DA
6294 if (info->linking) {
6295 struct netlink_ext_ack *extack;
6296
6297 extack = netdev_notifier_info_to_extack(&info->info);
6298 err = mlxsw_sp_port_vrf_join(mlxsw_sp, l3_dev, extack);
6299 } else {
b1e45526 6300 mlxsw_sp_port_vrf_leave(mlxsw_sp, l3_dev);
f8fa9b4e 6301 }
b1e45526
IS
6302 break;
6303 }
3d70e458 6304
b1e45526 6305 return err;
3d70e458
IS
6306}
6307
e4f3c1c1
IS
6308static struct mlxsw_sp_rif_subport *
6309mlxsw_sp_rif_subport_rif(const struct mlxsw_sp_rif *rif)
a1107487 6310{
e4f3c1c1
IS
6311 return container_of(rif, struct mlxsw_sp_rif_subport, common);
6312}
6313
6314static void mlxsw_sp_rif_subport_setup(struct mlxsw_sp_rif *rif,
6315 const struct mlxsw_sp_rif_params *params)
6316{
6317 struct mlxsw_sp_rif_subport *rif_subport;
6318
6319 rif_subport = mlxsw_sp_rif_subport_rif(rif);
6320 rif_subport->vid = params->vid;
6321 rif_subport->lag = params->lag;
6322 if (params->lag)
6323 rif_subport->lag_id = params->lag_id;
a1107487 6324 else
e4f3c1c1
IS
6325 rif_subport->system_port = params->system_port;
6326}
6327
6328static int mlxsw_sp_rif_subport_op(struct mlxsw_sp_rif *rif, bool enable)
6329{
6330 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
6331 struct mlxsw_sp_rif_subport *rif_subport;
6332 char ritr_pl[MLXSW_REG_RITR_LEN];
6333
6334 rif_subport = mlxsw_sp_rif_subport_rif(rif);
6335 mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_SP_IF,
9571e828
PM
6336 rif->rif_index, rif->vr_id, rif->dev->mtu);
6337 mlxsw_reg_ritr_mac_pack(ritr_pl, rif->dev->dev_addr);
e4f3c1c1
IS
6338 mlxsw_reg_ritr_sp_if_pack(ritr_pl, rif_subport->lag,
6339 rif_subport->lag ? rif_subport->lag_id :
6340 rif_subport->system_port,
6341 rif_subport->vid);
6342
6343 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
6344}
6345
6346static int mlxsw_sp_rif_subport_configure(struct mlxsw_sp_rif *rif)
6347{
010cadf9
PM
6348 int err;
6349
6350 err = mlxsw_sp_rif_subport_op(rif, true);
6351 if (err)
6352 return err;
6353
6354 err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
6355 mlxsw_sp_fid_index(rif->fid), true);
6356 if (err)
6357 goto err_rif_fdb_op;
6358
6359 mlxsw_sp_fid_rif_set(rif->fid, rif);
6360 return 0;
6361
6362err_rif_fdb_op:
6363 mlxsw_sp_rif_subport_op(rif, false);
6364 return err;
a1107487
IS
6365}
6366
e4f3c1c1
IS
6367static void mlxsw_sp_rif_subport_deconfigure(struct mlxsw_sp_rif *rif)
6368{
010cadf9
PM
6369 struct mlxsw_sp_fid *fid = rif->fid;
6370
6371 mlxsw_sp_fid_rif_set(fid, NULL);
6372 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
6373 mlxsw_sp_fid_index(fid), false);
e4f3c1c1
IS
6374 mlxsw_sp_rif_subport_op(rif, false);
6375}
6376
6377static struct mlxsw_sp_fid *
6378mlxsw_sp_rif_subport_fid_get(struct mlxsw_sp_rif *rif)
6379{
6380 return mlxsw_sp_fid_rfid_get(rif->mlxsw_sp, rif->rif_index);
6381}
6382
6383static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_subport_ops = {
6384 .type = MLXSW_SP_RIF_TYPE_SUBPORT,
6385 .rif_size = sizeof(struct mlxsw_sp_rif_subport),
6386 .setup = mlxsw_sp_rif_subport_setup,
6387 .configure = mlxsw_sp_rif_subport_configure,
6388 .deconfigure = mlxsw_sp_rif_subport_deconfigure,
6389 .fid_get = mlxsw_sp_rif_subport_fid_get,
6390};
6391
6392static int mlxsw_sp_rif_vlan_fid_op(struct mlxsw_sp_rif *rif,
6393 enum mlxsw_reg_ritr_if_type type,
6394 u16 vid_fid, bool enable)
6395{
6396 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
6397 char ritr_pl[MLXSW_REG_RITR_LEN];
6398
6399 mlxsw_reg_ritr_pack(ritr_pl, enable, type, rif->rif_index, rif->vr_id,
9571e828
PM
6400 rif->dev->mtu);
6401 mlxsw_reg_ritr_mac_pack(ritr_pl, rif->dev->dev_addr);
e4f3c1c1
IS
6402 mlxsw_reg_ritr_fid_set(ritr_pl, type, vid_fid);
6403
6404 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
6405}
6406
b35750f1 6407u8 mlxsw_sp_router_port(const struct mlxsw_sp *mlxsw_sp)
e4f3c1c1
IS
6408{
6409 return mlxsw_core_max_ports(mlxsw_sp->core) + 1;
6410}
6411
6412static int mlxsw_sp_rif_vlan_configure(struct mlxsw_sp_rif *rif)
6413{
6414 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
6415 u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid);
6416 int err;
6417
6418 err = mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_VLAN_IF, vid, true);
6419 if (err)
6420 return err;
6421
0d284818
IS
6422 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
6423 mlxsw_sp_router_port(mlxsw_sp), true);
6424 if (err)
6425 goto err_fid_mc_flood_set;
6426
e4f3c1c1
IS
6427 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
6428 mlxsw_sp_router_port(mlxsw_sp), true);
6429 if (err)
6430 goto err_fid_bc_flood_set;
6431
010cadf9
PM
6432 err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
6433 mlxsw_sp_fid_index(rif->fid), true);
6434 if (err)
6435 goto err_rif_fdb_op;
6436
6437 mlxsw_sp_fid_rif_set(rif->fid, rif);
e4f3c1c1
IS
6438 return 0;
6439
010cadf9
PM
6440err_rif_fdb_op:
6441 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
6442 mlxsw_sp_router_port(mlxsw_sp), false);
e4f3c1c1 6443err_fid_bc_flood_set:
0d284818
IS
6444 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
6445 mlxsw_sp_router_port(mlxsw_sp), false);
6446err_fid_mc_flood_set:
e4f3c1c1
IS
6447 mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_VLAN_IF, vid, false);
6448 return err;
6449}
6450
6451static void mlxsw_sp_rif_vlan_deconfigure(struct mlxsw_sp_rif *rif)
6452{
e4f3c1c1 6453 u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid);
010cadf9
PM
6454 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
6455 struct mlxsw_sp_fid *fid = rif->fid;
e4f3c1c1 6456
010cadf9
PM
6457 mlxsw_sp_fid_rif_set(fid, NULL);
6458 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
6459 mlxsw_sp_fid_index(fid), false);
e4f3c1c1
IS
6460 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
6461 mlxsw_sp_router_port(mlxsw_sp), false);
0d284818
IS
6462 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
6463 mlxsw_sp_router_port(mlxsw_sp), false);
e4f3c1c1
IS
6464 mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_VLAN_IF, vid, false);
6465}
6466
6467static struct mlxsw_sp_fid *
6468mlxsw_sp_rif_vlan_fid_get(struct mlxsw_sp_rif *rif)
6469{
6470 u16 vid = is_vlan_dev(rif->dev) ? vlan_dev_vlan_id(rif->dev) : 1;
6471
6472 return mlxsw_sp_fid_8021q_get(rif->mlxsw_sp, vid);
6473}
6474
6475static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_vlan_ops = {
6476 .type = MLXSW_SP_RIF_TYPE_VLAN,
6477 .rif_size = sizeof(struct mlxsw_sp_rif),
6478 .configure = mlxsw_sp_rif_vlan_configure,
6479 .deconfigure = mlxsw_sp_rif_vlan_deconfigure,
6480 .fid_get = mlxsw_sp_rif_vlan_fid_get,
6481};
6482
6483static int mlxsw_sp_rif_fid_configure(struct mlxsw_sp_rif *rif)
6484{
6485 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
6486 u16 fid_index = mlxsw_sp_fid_index(rif->fid);
6487 int err;
6488
6489 err = mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_FID_IF, fid_index,
6490 true);
6491 if (err)
6492 return err;
6493
0d284818
IS
6494 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
6495 mlxsw_sp_router_port(mlxsw_sp), true);
6496 if (err)
6497 goto err_fid_mc_flood_set;
6498
e4f3c1c1
IS
6499 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
6500 mlxsw_sp_router_port(mlxsw_sp), true);
6501 if (err)
6502 goto err_fid_bc_flood_set;
6503
010cadf9
PM
6504 err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
6505 mlxsw_sp_fid_index(rif->fid), true);
6506 if (err)
6507 goto err_rif_fdb_op;
6508
6509 mlxsw_sp_fid_rif_set(rif->fid, rif);
e4f3c1c1
IS
6510 return 0;
6511
010cadf9
PM
6512err_rif_fdb_op:
6513 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
6514 mlxsw_sp_router_port(mlxsw_sp), false);
e4f3c1c1 6515err_fid_bc_flood_set:
0d284818
IS
6516 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
6517 mlxsw_sp_router_port(mlxsw_sp), false);
6518err_fid_mc_flood_set:
e4f3c1c1
IS
6519 mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_FID_IF, fid_index, false);
6520 return err;
6521}
6522
6523static void mlxsw_sp_rif_fid_deconfigure(struct mlxsw_sp_rif *rif)
6524{
e4f3c1c1 6525 u16 fid_index = mlxsw_sp_fid_index(rif->fid);
010cadf9
PM
6526 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
6527 struct mlxsw_sp_fid *fid = rif->fid;
e4f3c1c1 6528
010cadf9
PM
6529 mlxsw_sp_fid_rif_set(fid, NULL);
6530 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
6531 mlxsw_sp_fid_index(fid), false);
e4f3c1c1
IS
6532 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
6533 mlxsw_sp_router_port(mlxsw_sp), false);
0d284818
IS
6534 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
6535 mlxsw_sp_router_port(mlxsw_sp), false);
e4f3c1c1
IS
6536 mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_FID_IF, fid_index, false);
6537}
6538
6539static struct mlxsw_sp_fid *
6540mlxsw_sp_rif_fid_fid_get(struct mlxsw_sp_rif *rif)
6541{
6542 return mlxsw_sp_fid_8021d_get(rif->mlxsw_sp, rif->dev->ifindex);
6543}
6544
6545static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_fid_ops = {
6546 .type = MLXSW_SP_RIF_TYPE_FID,
6547 .rif_size = sizeof(struct mlxsw_sp_rif),
6548 .configure = mlxsw_sp_rif_fid_configure,
6549 .deconfigure = mlxsw_sp_rif_fid_deconfigure,
6550 .fid_get = mlxsw_sp_rif_fid_fid_get,
6551};
6552
6ddb7426
PM
6553static struct mlxsw_sp_rif_ipip_lb *
6554mlxsw_sp_rif_ipip_lb_rif(struct mlxsw_sp_rif *rif)
6555{
6556 return container_of(rif, struct mlxsw_sp_rif_ipip_lb, common);
6557}
6558
6559static void
6560mlxsw_sp_rif_ipip_lb_setup(struct mlxsw_sp_rif *rif,
6561 const struct mlxsw_sp_rif_params *params)
6562{
6563 struct mlxsw_sp_rif_params_ipip_lb *params_lb;
6564 struct mlxsw_sp_rif_ipip_lb *rif_lb;
6565
6566 params_lb = container_of(params, struct mlxsw_sp_rif_params_ipip_lb,
6567 common);
6568 rif_lb = mlxsw_sp_rif_ipip_lb_rif(rif);
6569 rif_lb->lb_config = params_lb->lb_config;
6570}
6571
6572static int
6573mlxsw_sp_rif_ipip_lb_op(struct mlxsw_sp_rif_ipip_lb *lb_rif,
6574 struct mlxsw_sp_vr *ul_vr, bool enable)
6575{
6576 struct mlxsw_sp_rif_ipip_lb_config lb_cf = lb_rif->lb_config;
6577 struct mlxsw_sp_rif *rif = &lb_rif->common;
6578 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
6579 char ritr_pl[MLXSW_REG_RITR_LEN];
6580 u32 saddr4;
6581
6582 switch (lb_cf.ul_protocol) {
6583 case MLXSW_SP_L3_PROTO_IPV4:
6584 saddr4 = be32_to_cpu(lb_cf.saddr.addr4);
6585 mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_LOOPBACK_IF,
6586 rif->rif_index, rif->vr_id, rif->dev->mtu);
6587 mlxsw_reg_ritr_loopback_ipip4_pack(ritr_pl, lb_cf.lb_ipipt,
6588 MLXSW_REG_RITR_LOOPBACK_IPIP_OPTIONS_GRE_KEY_PRESET,
6589 ul_vr->id, saddr4, lb_cf.okey);
6590 break;
6591
6592 case MLXSW_SP_L3_PROTO_IPV6:
6593 return -EAFNOSUPPORT;
6594 }
6595
6596 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
6597}
6598
6599static int
6600mlxsw_sp_rif_ipip_lb_configure(struct mlxsw_sp_rif *rif)
6601{
6602 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
6603 u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(rif->dev);
6604 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
6605 struct mlxsw_sp_vr *ul_vr;
6606 int err;
6607
f8fa9b4e 6608 ul_vr = mlxsw_sp_vr_get(mlxsw_sp, ul_tb_id, NULL);
6ddb7426
PM
6609 if (IS_ERR(ul_vr))
6610 return PTR_ERR(ul_vr);
6611
6612 err = mlxsw_sp_rif_ipip_lb_op(lb_rif, ul_vr, true);
6613 if (err)
6614 goto err_loopback_op;
6615
6616 lb_rif->ul_vr_id = ul_vr->id;
6617 ++ul_vr->rif_count;
6618 return 0;
6619
6620err_loopback_op:
6621 mlxsw_sp_vr_put(ul_vr);
6622 return err;
6623}
6624
6625static void mlxsw_sp_rif_ipip_lb_deconfigure(struct mlxsw_sp_rif *rif)
6626{
6627 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
6628 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
6629 struct mlxsw_sp_vr *ul_vr;
6630
6631 ul_vr = &mlxsw_sp->router->vrs[lb_rif->ul_vr_id];
6632 mlxsw_sp_rif_ipip_lb_op(lb_rif, ul_vr, false);
6633
6634 --ul_vr->rif_count;
6635 mlxsw_sp_vr_put(ul_vr);
6636}
6637
6638static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_ipip_lb_ops = {
6639 .type = MLXSW_SP_RIF_TYPE_IPIP_LB,
6640 .rif_size = sizeof(struct mlxsw_sp_rif_ipip_lb),
6641 .setup = mlxsw_sp_rif_ipip_lb_setup,
6642 .configure = mlxsw_sp_rif_ipip_lb_configure,
6643 .deconfigure = mlxsw_sp_rif_ipip_lb_deconfigure,
6644};
6645
e4f3c1c1
IS
6646static const struct mlxsw_sp_rif_ops *mlxsw_sp_rif_ops_arr[] = {
6647 [MLXSW_SP_RIF_TYPE_SUBPORT] = &mlxsw_sp_rif_subport_ops,
6648 [MLXSW_SP_RIF_TYPE_VLAN] = &mlxsw_sp_rif_vlan_ops,
6649 [MLXSW_SP_RIF_TYPE_FID] = &mlxsw_sp_rif_fid_ops,
6ddb7426 6650 [MLXSW_SP_RIF_TYPE_IPIP_LB] = &mlxsw_sp_rif_ipip_lb_ops,
e4f3c1c1
IS
6651};
6652
348b8fc3
IS
6653static int mlxsw_sp_rifs_init(struct mlxsw_sp *mlxsw_sp)
6654{
6655 u64 max_rifs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS);
6656
6657 mlxsw_sp->router->rifs = kcalloc(max_rifs,
6658 sizeof(struct mlxsw_sp_rif *),
6659 GFP_KERNEL);
6660 if (!mlxsw_sp->router->rifs)
6661 return -ENOMEM;
e4f3c1c1
IS
6662
6663 mlxsw_sp->router->rif_ops_arr = mlxsw_sp_rif_ops_arr;
6664
348b8fc3
IS
6665 return 0;
6666}
6667
6668static void mlxsw_sp_rifs_fini(struct mlxsw_sp *mlxsw_sp)
6669{
6670 int i;
6671
6672 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++)
6673 WARN_ON_ONCE(mlxsw_sp->router->rifs[i]);
6674
6675 kfree(mlxsw_sp->router->rifs);
6676}
6677
dcbda282
PM
6678static int
6679mlxsw_sp_ipip_config_tigcr(struct mlxsw_sp *mlxsw_sp)
6680{
6681 char tigcr_pl[MLXSW_REG_TIGCR_LEN];
6682
6683 mlxsw_reg_tigcr_pack(tigcr_pl, true, 0);
6684 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(tigcr), tigcr_pl);
6685}
6686
38ebc0f4
PM
6687static int mlxsw_sp_ipips_init(struct mlxsw_sp *mlxsw_sp)
6688{
6689 mlxsw_sp->router->ipip_ops_arr = mlxsw_sp_ipip_ops_arr;
1012b9ac 6690 INIT_LIST_HEAD(&mlxsw_sp->router->ipip_list);
dcbda282 6691 return mlxsw_sp_ipip_config_tigcr(mlxsw_sp);
38ebc0f4
PM
6692}
6693
6694static void mlxsw_sp_ipips_fini(struct mlxsw_sp *mlxsw_sp)
6695{
1012b9ac 6696 WARN_ON(!list_empty(&mlxsw_sp->router->ipip_list));
38ebc0f4
PM
6697}
6698
c3852ef7
IS
6699static void mlxsw_sp_router_fib_dump_flush(struct notifier_block *nb)
6700{
7e39d115 6701 struct mlxsw_sp_router *router;
c3852ef7
IS
6702
6703 /* Flush pending FIB notifications and then flush the device's
6704 * table before requesting another dump. The FIB notification
6705 * block is unregistered, so no need to take RTNL.
6706 */
6707 mlxsw_core_flush_owq();
7e39d115
IS
6708 router = container_of(nb, struct mlxsw_sp_router, fib_nb);
6709 mlxsw_sp_router_fib_flush(router->mlxsw_sp);
c3852ef7
IS
6710}
6711
#ifdef CONFIG_IP_ROUTE_MULTIPATH
/* Enable one outer-header type in the RECR2 payload. */
static void mlxsw_sp_mp_hash_header_set(char *recr2_pl, int header)
{
	mlxsw_reg_recr2_outer_header_enables_set(recr2_pl, header, true);
}

/* Enable one outer-header field in the RECR2 payload. */
static void mlxsw_sp_mp_hash_field_set(char *recr2_pl, int field)
{
	mlxsw_reg_recr2_outer_header_fields_enable_set(recr2_pl, field, true);
}

/* Set up the IPv4 part of the multipath hash. Source and destination IP
 * are always enabled; the IP protocol and TCP/UDP ports are added only
 * when init_net's fib_multipath_hash_policy sysctl is non-zero.
 */
static void mlxsw_sp_mp4_hash_init(char *recr2_pl)
{
	bool l3_only = !init_net.ipv4.sysctl_fib_multipath_hash_policy;

	mlxsw_sp_mp_hash_header_set(recr2_pl,
				    MLXSW_REG_RECR2_IPV4_EN_NOT_TCP_NOT_UDP);
	mlxsw_sp_mp_hash_header_set(recr2_pl, MLXSW_REG_RECR2_IPV4_EN_TCP_UDP);
	mlxsw_reg_recr2_ipv4_sip_enable(recr2_pl);
	mlxsw_reg_recr2_ipv4_dip_enable(recr2_pl);

	if (!l3_only) {
		mlxsw_sp_mp_hash_header_set(recr2_pl,
					    MLXSW_REG_RECR2_TCP_UDP_EN_IPV4);
		mlxsw_sp_mp_hash_field_set(recr2_pl,
					   MLXSW_REG_RECR2_IPV4_PROTOCOL);
		mlxsw_sp_mp_hash_field_set(recr2_pl,
					   MLXSW_REG_RECR2_TCP_UDP_SPORT);
		mlxsw_sp_mp_hash_field_set(recr2_pl,
					   MLXSW_REG_RECR2_TCP_UDP_DPORT);
	}
}

/* Set up the IPv6 part of the multipath hash: source and destination IP,
 * flow label and next header.
 */
static void mlxsw_sp_mp6_hash_init(char *recr2_pl)
{
	mlxsw_sp_mp_hash_header_set(recr2_pl,
				    MLXSW_REG_RECR2_IPV6_EN_NOT_TCP_NOT_UDP);
	mlxsw_sp_mp_hash_header_set(recr2_pl, MLXSW_REG_RECR2_IPV6_EN_TCP_UDP);
	mlxsw_reg_recr2_ipv6_sip_enable(recr2_pl);
	mlxsw_reg_recr2_ipv6_dip_enable(recr2_pl);
	mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_IPV6_FLOW_LABEL);
	mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_IPV6_NEXT_HEADER);
}

/* Program the multipath hash (RECR2) with a random seed and the IPv4 and
 * IPv6 hash settings. Returns the result of the register write.
 */
static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp)
{
	char recr2_pl[MLXSW_REG_RECR2_LEN];
	u32 hash_seed;

	get_random_bytes(&hash_seed, sizeof(hash_seed));
	mlxsw_reg_recr2_pack(recr2_pl, hash_seed);
	mlxsw_sp_mp4_hash_init(recr2_pl);
	mlxsw_sp_mp6_hash_init(recr2_pl);

	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(recr2), recr2_pl);
}
#else
/* Without CONFIG_IP_ROUTE_MULTIPATH there is nothing to program. */
static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp)
{
	return 0;
}
#endif
6769
4724ba56
IS
6770static int __mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp)
6771{
6772 char rgcr_pl[MLXSW_REG_RGCR_LEN];
6773 u64 max_rifs;
6774 int err;
6775
6776 if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_RIFS))
6777 return -EIO;
4724ba56 6778 max_rifs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS);
4724ba56 6779
e29237e7 6780 mlxsw_reg_rgcr_pack(rgcr_pl, true, true);
4724ba56
IS
6781 mlxsw_reg_rgcr_max_router_interfaces_set(rgcr_pl, max_rifs);
6782 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rgcr), rgcr_pl);
6783 if (err)
348b8fc3 6784 return err;
4724ba56 6785 return 0;
4724ba56
IS
6786}
6787
6788static void __mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp)
6789{
6790 char rgcr_pl[MLXSW_REG_RGCR_LEN];
4724ba56 6791
e29237e7 6792 mlxsw_reg_rgcr_pack(rgcr_pl, false, false);
4724ba56 6793 mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rgcr), rgcr_pl);
4724ba56
IS
6794}
6795
b45f64d1
JP
6796int mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp)
6797{
9011b677 6798 struct mlxsw_sp_router *router;
b45f64d1
JP
6799 int err;
6800
9011b677
IS
6801 router = kzalloc(sizeof(*mlxsw_sp->router), GFP_KERNEL);
6802 if (!router)
6803 return -ENOMEM;
6804 mlxsw_sp->router = router;
6805 router->mlxsw_sp = mlxsw_sp;
6806
6807 INIT_LIST_HEAD(&mlxsw_sp->router->nexthop_neighs_list);
b45f64d1
JP
6808 err = __mlxsw_sp_router_init(mlxsw_sp);
6809 if (err)
9011b677 6810 goto err_router_init;
b45f64d1 6811
348b8fc3
IS
6812 err = mlxsw_sp_rifs_init(mlxsw_sp);
6813 if (err)
6814 goto err_rifs_init;
6815
38ebc0f4
PM
6816 err = mlxsw_sp_ipips_init(mlxsw_sp);
6817 if (err)
6818 goto err_ipips_init;
6819
9011b677 6820 err = rhashtable_init(&mlxsw_sp->router->nexthop_ht,
c53b8e1b
IS
6821 &mlxsw_sp_nexthop_ht_params);
6822 if (err)
6823 goto err_nexthop_ht_init;
6824
9011b677 6825 err = rhashtable_init(&mlxsw_sp->router->nexthop_group_ht,
e9ad5e7d
IS
6826 &mlxsw_sp_nexthop_group_ht_params);
6827 if (err)
6828 goto err_nexthop_group_ht_init;
6829
dbe4598c 6830 INIT_LIST_HEAD(&mlxsw_sp->router->nexthop_list);
8494ab06
IS
6831 err = mlxsw_sp_lpm_init(mlxsw_sp);
6832 if (err)
6833 goto err_lpm_init;
6834
d42b0965
YG
6835 err = mlxsw_sp_mr_init(mlxsw_sp, &mlxsw_sp_mr_tcam_ops);
6836 if (err)
6837 goto err_mr_init;
6838
b45f64d1
JP
6839 err = mlxsw_sp_vrs_init(mlxsw_sp);
6840 if (err)
6841 goto err_vrs_init;
6842
8c9583a8 6843 err = mlxsw_sp_neigh_init(mlxsw_sp);
b45f64d1
JP
6844 if (err)
6845 goto err_neigh_init;
6846
48fac885
IS
6847 mlxsw_sp->router->netevent_nb.notifier_call =
6848 mlxsw_sp_router_netevent_event;
6849 err = register_netevent_notifier(&mlxsw_sp->router->netevent_nb);
6850 if (err)
6851 goto err_register_netevent_notifier;
6852
af658b6a
IS
6853 err = mlxsw_sp_mp_hash_init(mlxsw_sp);
6854 if (err)
6855 goto err_mp_hash_init;
6856
7e39d115
IS
6857 mlxsw_sp->router->fib_nb.notifier_call = mlxsw_sp_router_fib_event;
6858 err = register_fib_notifier(&mlxsw_sp->router->fib_nb,
c3852ef7
IS
6859 mlxsw_sp_router_fib_dump_flush);
6860 if (err)
6861 goto err_register_fib_notifier;
6862
b45f64d1
JP
6863 return 0;
6864
c3852ef7 6865err_register_fib_notifier:
af658b6a 6866err_mp_hash_init:
48fac885
IS
6867 unregister_netevent_notifier(&mlxsw_sp->router->netevent_nb);
6868err_register_netevent_notifier:
c3852ef7 6869 mlxsw_sp_neigh_fini(mlxsw_sp);
b45f64d1
JP
6870err_neigh_init:
6871 mlxsw_sp_vrs_fini(mlxsw_sp);
6872err_vrs_init:
d42b0965
YG
6873 mlxsw_sp_mr_fini(mlxsw_sp);
6874err_mr_init:
8494ab06
IS
6875 mlxsw_sp_lpm_fini(mlxsw_sp);
6876err_lpm_init:
9011b677 6877 rhashtable_destroy(&mlxsw_sp->router->nexthop_group_ht);
e9ad5e7d 6878err_nexthop_group_ht_init:
9011b677 6879 rhashtable_destroy(&mlxsw_sp->router->nexthop_ht);
c53b8e1b 6880err_nexthop_ht_init:
38ebc0f4
PM
6881 mlxsw_sp_ipips_fini(mlxsw_sp);
6882err_ipips_init:
348b8fc3
IS
6883 mlxsw_sp_rifs_fini(mlxsw_sp);
6884err_rifs_init:
b45f64d1 6885 __mlxsw_sp_router_fini(mlxsw_sp);
9011b677
IS
6886err_router_init:
6887 kfree(mlxsw_sp->router);
b45f64d1
JP
6888 return err;
6889}
6890
6891void mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp)
6892{
7e39d115 6893 unregister_fib_notifier(&mlxsw_sp->router->fib_nb);
48fac885 6894 unregister_netevent_notifier(&mlxsw_sp->router->netevent_nb);
b45f64d1
JP
6895 mlxsw_sp_neigh_fini(mlxsw_sp);
6896 mlxsw_sp_vrs_fini(mlxsw_sp);
d42b0965 6897 mlxsw_sp_mr_fini(mlxsw_sp);
8494ab06 6898 mlxsw_sp_lpm_fini(mlxsw_sp);
9011b677
IS
6899 rhashtable_destroy(&mlxsw_sp->router->nexthop_group_ht);
6900 rhashtable_destroy(&mlxsw_sp->router->nexthop_ht);
38ebc0f4 6901 mlxsw_sp_ipips_fini(mlxsw_sp);
348b8fc3 6902 mlxsw_sp_rifs_fini(mlxsw_sp);
b45f64d1 6903 __mlxsw_sp_router_fini(mlxsw_sp);
9011b677 6904 kfree(mlxsw_sp->router);
b45f64d1 6905}