mlxsw: spectrum_router: Create IPv6 multipath routes in one go
[linux-2.6-block.git] / drivers / net / ethernet / mellanox / mlxsw / spectrum_router.c
CommitLineData
9948a064
JP
1// SPDX-License-Identifier: BSD-3-Clause OR GPL-2.0
2/* Copyright (c) 2016-2018 Mellanox Technologies. All rights reserved */
464dce18
IS
3
4#include <linux/kernel.h>
5#include <linux/types.h>
5e9c16cc
JP
6#include <linux/rhashtable.h>
7#include <linux/bitops.h>
8#include <linux/in6.h>
c723c735 9#include <linux/notifier.h>
df6dd79b 10#include <linux/inetdevice.h>
9db032bb 11#include <linux/netdevice.h>
03ea01e9 12#include <linux/if_bridge.h>
b5f3e0d4 13#include <linux/socket.h>
428b851f 14#include <linux/route.h>
eb789980 15#include <linux/gcd.h>
2db99378 16#include <linux/if_macvlan.h>
32fd4b49 17#include <linux/refcount.h>
fa73989f 18#include <linux/jhash.h>
c723c735 19#include <net/netevent.h>
6cf3c971
JP
20#include <net/neighbour.h>
21#include <net/arp.h>
b45f64d1 22#include <net/ip_fib.h>
583419fd 23#include <net/ip6_fib.h>
5481d73f 24#include <net/nexthop.h>
5d7bfd14 25#include <net/fib_rules.h>
6ddb7426 26#include <net/ip_tunnels.h>
57837885 27#include <net/l3mdev.h>
5ea1237f 28#include <net/addrconf.h>
d5eb89cf
AS
29#include <net/ndisc.h>
30#include <net/ipv6.h>
04b1d4e5 31#include <net/fib_notifier.h>
2db99378 32#include <net/switchdev.h>
464dce18
IS
33
34#include "spectrum.h"
35#include "core.h"
36#include "reg.h"
e0c0afd8
AS
37#include "spectrum_cnt.h"
38#include "spectrum_dpipe.h"
38ebc0f4 39#include "spectrum_ipip.h"
d42b0965
YG
40#include "spectrum_mr.h"
41#include "spectrum_mr_tcam.h"
e0c0afd8 42#include "spectrum_router.h"
803335ac 43#include "spectrum_span.h"
464dce18 44
2b52ce02 45struct mlxsw_sp_fib;
9011b677
IS
46struct mlxsw_sp_vr;
47struct mlxsw_sp_lpm_tree;
e4f3c1c1 48struct mlxsw_sp_rif_ops;
9011b677
IS
49
50struct mlxsw_sp_router {
51 struct mlxsw_sp *mlxsw_sp;
5f9efffb 52 struct mlxsw_sp_rif **rifs;
9011b677
IS
53 struct mlxsw_sp_vr *vrs;
54 struct rhashtable neigh_ht;
55 struct rhashtable nexthop_group_ht;
56 struct rhashtable nexthop_ht;
dbe4598c 57 struct list_head nexthop_list;
9011b677 58 struct {
2b52ce02
IS
59 /* One tree for each protocol: IPv4 and IPv6 */
60 struct mlxsw_sp_lpm_tree *proto_trees[2];
9011b677
IS
61 struct mlxsw_sp_lpm_tree *trees;
62 unsigned int tree_count;
63 } lpm;
64 struct {
65 struct delayed_work dw;
66 unsigned long interval; /* ms */
67 } neighs_update;
68 struct delayed_work nexthop_probe_dw;
69#define MLXSW_SP_UNRESOLVED_NH_PROBE_INTERVAL 5000 /* ms */
70 struct list_head nexthop_neighs_list;
1012b9ac 71 struct list_head ipip_list;
9011b677 72 bool aborted;
7e39d115 73 struct notifier_block fib_nb;
48fac885 74 struct notifier_block netevent_nb;
965fa8e6
IS
75 struct notifier_block inetaddr_nb;
76 struct notifier_block inet6addr_nb;
e4f3c1c1 77 const struct mlxsw_sp_rif_ops **rif_ops_arr;
38ebc0f4 78 const struct mlxsw_sp_ipip_ops **ipip_ops_arr;
9011b677
IS
79};
80
4724ba56
IS
81struct mlxsw_sp_rif {
82 struct list_head nexthop_list;
83 struct list_head neigh_list;
73b8f493 84 struct net_device *dev; /* NULL for underlay RIF */
a1107487 85 struct mlxsw_sp_fid *fid;
4724ba56
IS
86 unsigned char addr[ETH_ALEN];
87 int mtu;
bf95233e 88 u16 rif_index;
6913229e 89 u16 vr_id;
e4f3c1c1
IS
90 const struct mlxsw_sp_rif_ops *ops;
91 struct mlxsw_sp *mlxsw_sp;
92
e0c0afd8
AS
93 unsigned int counter_ingress;
94 bool counter_ingress_valid;
95 unsigned int counter_egress;
96 bool counter_egress_valid;
4724ba56
IS
97};
98
e4f3c1c1
IS
99struct mlxsw_sp_rif_params {
100 struct net_device *dev;
101 union {
102 u16 system_port;
103 u16 lag_id;
104 };
105 u16 vid;
106 bool lag;
107};
108
4d93ceeb
IS
109struct mlxsw_sp_rif_subport {
110 struct mlxsw_sp_rif common;
32fd4b49 111 refcount_t ref_count;
4d93ceeb
IS
112 union {
113 u16 system_port;
114 u16 lag_id;
115 };
116 u16 vid;
117 bool lag;
118};
119
6ddb7426
PM
120struct mlxsw_sp_rif_ipip_lb {
121 struct mlxsw_sp_rif common;
122 struct mlxsw_sp_rif_ipip_lb_config lb_config;
123 u16 ul_vr_id; /* Reserved for Spectrum-2. */
25f844dd 124 u16 ul_rif_id; /* Reserved for Spectrum. */
6ddb7426
PM
125};
126
127struct mlxsw_sp_rif_params_ipip_lb {
128 struct mlxsw_sp_rif_params common;
129 struct mlxsw_sp_rif_ipip_lb_config lb_config;
130};
131
e4f3c1c1
IS
132struct mlxsw_sp_rif_ops {
133 enum mlxsw_sp_rif_type type;
134 size_t rif_size;
135
136 void (*setup)(struct mlxsw_sp_rif *rif,
137 const struct mlxsw_sp_rif_params *params);
138 int (*configure)(struct mlxsw_sp_rif *rif);
139 void (*deconfigure)(struct mlxsw_sp_rif *rif);
5f15e257
PM
140 struct mlxsw_sp_fid * (*fid_get)(struct mlxsw_sp_rif *rif,
141 struct netlink_ext_ack *extack);
2db99378 142 void (*fdb_del)(struct mlxsw_sp_rif *rif, const char *mac);
e4f3c1c1
IS
143};
144
32fd4b49 145static void mlxsw_sp_rif_destroy(struct mlxsw_sp_rif *rif);
2b52ce02
IS
146static void mlxsw_sp_lpm_tree_hold(struct mlxsw_sp_lpm_tree *lpm_tree);
147static void mlxsw_sp_lpm_tree_put(struct mlxsw_sp *mlxsw_sp,
148 struct mlxsw_sp_lpm_tree *lpm_tree);
149static int mlxsw_sp_vr_lpm_tree_bind(struct mlxsw_sp *mlxsw_sp,
150 const struct mlxsw_sp_fib *fib,
151 u8 tree_id);
152static int mlxsw_sp_vr_lpm_tree_unbind(struct mlxsw_sp *mlxsw_sp,
153 const struct mlxsw_sp_fib *fib);
154
e0c0afd8
AS
155static unsigned int *
156mlxsw_sp_rif_p_counter_get(struct mlxsw_sp_rif *rif,
157 enum mlxsw_sp_rif_counter_dir dir)
158{
159 switch (dir) {
160 case MLXSW_SP_RIF_COUNTER_EGRESS:
161 return &rif->counter_egress;
162 case MLXSW_SP_RIF_COUNTER_INGRESS:
163 return &rif->counter_ingress;
164 }
165 return NULL;
166}
167
168static bool
169mlxsw_sp_rif_counter_valid_get(struct mlxsw_sp_rif *rif,
170 enum mlxsw_sp_rif_counter_dir dir)
171{
172 switch (dir) {
173 case MLXSW_SP_RIF_COUNTER_EGRESS:
174 return rif->counter_egress_valid;
175 case MLXSW_SP_RIF_COUNTER_INGRESS:
176 return rif->counter_ingress_valid;
177 }
178 return false;
179}
180
181static void
182mlxsw_sp_rif_counter_valid_set(struct mlxsw_sp_rif *rif,
183 enum mlxsw_sp_rif_counter_dir dir,
184 bool valid)
185{
186 switch (dir) {
187 case MLXSW_SP_RIF_COUNTER_EGRESS:
188 rif->counter_egress_valid = valid;
189 break;
190 case MLXSW_SP_RIF_COUNTER_INGRESS:
191 rif->counter_ingress_valid = valid;
192 break;
193 }
194}
195
196static int mlxsw_sp_rif_counter_edit(struct mlxsw_sp *mlxsw_sp, u16 rif_index,
197 unsigned int counter_index, bool enable,
198 enum mlxsw_sp_rif_counter_dir dir)
199{
200 char ritr_pl[MLXSW_REG_RITR_LEN];
201 bool is_egress = false;
202 int err;
203
204 if (dir == MLXSW_SP_RIF_COUNTER_EGRESS)
205 is_egress = true;
206 mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index);
207 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
208 if (err)
209 return err;
210
211 mlxsw_reg_ritr_counter_pack(ritr_pl, counter_index, enable,
212 is_egress);
213 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
214}
215
216int mlxsw_sp_rif_counter_value_get(struct mlxsw_sp *mlxsw_sp,
217 struct mlxsw_sp_rif *rif,
218 enum mlxsw_sp_rif_counter_dir dir, u64 *cnt)
219{
220 char ricnt_pl[MLXSW_REG_RICNT_LEN];
221 unsigned int *p_counter_index;
222 bool valid;
223 int err;
224
225 valid = mlxsw_sp_rif_counter_valid_get(rif, dir);
226 if (!valid)
227 return -EINVAL;
228
229 p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
230 if (!p_counter_index)
231 return -EINVAL;
232 mlxsw_reg_ricnt_pack(ricnt_pl, *p_counter_index,
233 MLXSW_REG_RICNT_OPCODE_NOP);
234 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ricnt), ricnt_pl);
235 if (err)
236 return err;
237 *cnt = mlxsw_reg_ricnt_good_unicast_packets_get(ricnt_pl);
238 return 0;
239}
240
241static int mlxsw_sp_rif_counter_clear(struct mlxsw_sp *mlxsw_sp,
242 unsigned int counter_index)
243{
244 char ricnt_pl[MLXSW_REG_RICNT_LEN];
245
246 mlxsw_reg_ricnt_pack(ricnt_pl, counter_index,
247 MLXSW_REG_RICNT_OPCODE_CLEAR);
248 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ricnt), ricnt_pl);
249}
250
251int mlxsw_sp_rif_counter_alloc(struct mlxsw_sp *mlxsw_sp,
252 struct mlxsw_sp_rif *rif,
253 enum mlxsw_sp_rif_counter_dir dir)
254{
255 unsigned int *p_counter_index;
256 int err;
257
258 p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
259 if (!p_counter_index)
260 return -EINVAL;
261 err = mlxsw_sp_counter_alloc(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
262 p_counter_index);
263 if (err)
264 return err;
265
266 err = mlxsw_sp_rif_counter_clear(mlxsw_sp, *p_counter_index);
267 if (err)
268 goto err_counter_clear;
269
270 err = mlxsw_sp_rif_counter_edit(mlxsw_sp, rif->rif_index,
271 *p_counter_index, true, dir);
272 if (err)
273 goto err_counter_edit;
274 mlxsw_sp_rif_counter_valid_set(rif, dir, true);
275 return 0;
276
277err_counter_edit:
278err_counter_clear:
279 mlxsw_sp_counter_free(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
280 *p_counter_index);
281 return err;
282}
283
284void mlxsw_sp_rif_counter_free(struct mlxsw_sp *mlxsw_sp,
285 struct mlxsw_sp_rif *rif,
286 enum mlxsw_sp_rif_counter_dir dir)
287{
288 unsigned int *p_counter_index;
289
6b1206bb
AS
290 if (!mlxsw_sp_rif_counter_valid_get(rif, dir))
291 return;
292
e0c0afd8
AS
293 p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
294 if (WARN_ON(!p_counter_index))
295 return;
296 mlxsw_sp_rif_counter_edit(mlxsw_sp, rif->rif_index,
297 *p_counter_index, false, dir);
298 mlxsw_sp_counter_free(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
299 *p_counter_index);
300 mlxsw_sp_rif_counter_valid_set(rif, dir, false);
301}
302
e4f3c1c1
IS
303static void mlxsw_sp_rif_counters_alloc(struct mlxsw_sp_rif *rif)
304{
305 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
306 struct devlink *devlink;
307
308 devlink = priv_to_devlink(mlxsw_sp->core);
309 if (!devlink_dpipe_table_counter_enabled(devlink,
310 MLXSW_SP_DPIPE_TABLE_NAME_ERIF))
311 return;
312 mlxsw_sp_rif_counter_alloc(mlxsw_sp, rif, MLXSW_SP_RIF_COUNTER_EGRESS);
313}
314
315static void mlxsw_sp_rif_counters_free(struct mlxsw_sp_rif *rif)
316{
317 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
318
319 mlxsw_sp_rif_counter_free(mlxsw_sp, rif, MLXSW_SP_RIF_COUNTER_EGRESS);
320}
321
7dcc18ad 322#define MLXSW_SP_PREFIX_COUNT (sizeof(struct in6_addr) * BITS_PER_BYTE + 1)
9011b677
IS
323
324struct mlxsw_sp_prefix_usage {
325 DECLARE_BITMAP(b, MLXSW_SP_PREFIX_COUNT);
326};
327
53342023
JP
328#define mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage) \
329 for_each_set_bit(prefix, (prefix_usage)->b, MLXSW_SP_PREFIX_COUNT)
330
331static bool
332mlxsw_sp_prefix_usage_eq(struct mlxsw_sp_prefix_usage *prefix_usage1,
333 struct mlxsw_sp_prefix_usage *prefix_usage2)
334{
335 return !memcmp(prefix_usage1, prefix_usage2, sizeof(*prefix_usage1));
336}
337
6b75c480
JP
338static void
339mlxsw_sp_prefix_usage_cpy(struct mlxsw_sp_prefix_usage *prefix_usage1,
340 struct mlxsw_sp_prefix_usage *prefix_usage2)
341{
342 memcpy(prefix_usage1, prefix_usage2, sizeof(*prefix_usage1));
343}
344
5e9c16cc
JP
345static void
346mlxsw_sp_prefix_usage_set(struct mlxsw_sp_prefix_usage *prefix_usage,
347 unsigned char prefix_len)
348{
349 set_bit(prefix_len, prefix_usage->b);
350}
351
352static void
353mlxsw_sp_prefix_usage_clear(struct mlxsw_sp_prefix_usage *prefix_usage,
354 unsigned char prefix_len)
355{
356 clear_bit(prefix_len, prefix_usage->b);
357}
358
359struct mlxsw_sp_fib_key {
360 unsigned char addr[sizeof(struct in6_addr)];
361 unsigned char prefix_len;
362};
363
61c503f9
JP
/* Kinds of FIB entries handled by the router. */
enum mlxsw_sp_fib_entry_type {
	MLXSW_SP_FIB_ENTRY_TYPE_REMOTE,
	MLXSW_SP_FIB_ENTRY_TYPE_LOCAL,
	MLXSW_SP_FIB_ENTRY_TYPE_TRAP,
	MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE,

	/* This is a special case of local delivery, where a packet should be
	 * decapsulated on reception. Note that there is no corresponding ENCAP,
	 * because that's a type of next hop, not of FIB entry. (There can be
	 * several next hops in a REMOTE entry, and some of them may be
	 * encapsulating entries.)
	 */
	MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP,
	MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP,
};
379
a7ff87ac
JP
380struct mlxsw_sp_nexthop_group;
381
9aecce1c
IS
382struct mlxsw_sp_fib_node {
383 struct list_head entry_list;
b45f64d1 384 struct list_head list;
9aecce1c 385 struct rhash_head ht_node;
76610ebb 386 struct mlxsw_sp_fib *fib;
5e9c16cc 387 struct mlxsw_sp_fib_key key;
9aecce1c
IS
388};
389
4607f6d2
PM
390struct mlxsw_sp_fib_entry_decap {
391 struct mlxsw_sp_ipip_entry *ipip_entry;
392 u32 tunnel_index;
393};
394
9aecce1c
IS
395struct mlxsw_sp_fib_entry {
396 struct list_head list;
397 struct mlxsw_sp_fib_node *fib_node;
61c503f9 398 enum mlxsw_sp_fib_entry_type type;
a7ff87ac
JP
399 struct list_head nexthop_group_node;
400 struct mlxsw_sp_nexthop_group *nh_group;
4607f6d2 401 struct mlxsw_sp_fib_entry_decap decap; /* Valid for decap entries. */
5e9c16cc
JP
402};
403
4f1c7f1f
IS
404struct mlxsw_sp_fib4_entry {
405 struct mlxsw_sp_fib_entry common;
406 u32 tb_id;
407 u32 prio;
408 u8 tos;
409 u8 type;
410};
411
428b851f
IS
412struct mlxsw_sp_fib6_entry {
413 struct mlxsw_sp_fib_entry common;
414 struct list_head rt6_list;
415 unsigned int nrt6;
416};
417
418struct mlxsw_sp_rt6 {
419 struct list_head list;
8d1c802b 420 struct fib6_info *rt;
428b851f
IS
421};
422
9011b677
IS
423struct mlxsw_sp_lpm_tree {
424 u8 id; /* tree ID */
425 unsigned int ref_count;
426 enum mlxsw_sp_l3proto proto;
2b52ce02 427 unsigned long prefix_ref_count[MLXSW_SP_PREFIX_COUNT];
9011b677
IS
428 struct mlxsw_sp_prefix_usage prefix_usage;
429};
430
5e9c16cc
JP
431struct mlxsw_sp_fib {
432 struct rhashtable ht;
9aecce1c 433 struct list_head node_list;
76610ebb
IS
434 struct mlxsw_sp_vr *vr;
435 struct mlxsw_sp_lpm_tree *lpm_tree;
76610ebb 436 enum mlxsw_sp_l3proto proto;
5e9c16cc
JP
437};
438
9011b677
IS
439struct mlxsw_sp_vr {
440 u16 id; /* virtual router ID */
441 u32 tb_id; /* kernel fib table id */
442 unsigned int rif_count;
443 struct mlxsw_sp_fib *fib4;
a3d9bc50 444 struct mlxsw_sp_fib *fib6;
9742f866 445 struct mlxsw_sp_mr_table *mr_table[MLXSW_SP_L3_PROTO_MAX];
a5040a90
ND
446 struct mlxsw_sp_rif *ul_rif;
447 refcount_t ul_rif_refcnt;
9011b677
IS
448};
449
9aecce1c 450static const struct rhashtable_params mlxsw_sp_fib_ht_params;
5e9c16cc 451
2b52ce02
IS
452static struct mlxsw_sp_fib *mlxsw_sp_fib_create(struct mlxsw_sp *mlxsw_sp,
453 struct mlxsw_sp_vr *vr,
76610ebb 454 enum mlxsw_sp_l3proto proto)
5e9c16cc 455{
2b52ce02 456 struct mlxsw_sp_lpm_tree *lpm_tree;
5e9c16cc
JP
457 struct mlxsw_sp_fib *fib;
458 int err;
459
2b52ce02 460 lpm_tree = mlxsw_sp->router->lpm.proto_trees[proto];
5e9c16cc
JP
461 fib = kzalloc(sizeof(*fib), GFP_KERNEL);
462 if (!fib)
463 return ERR_PTR(-ENOMEM);
464 err = rhashtable_init(&fib->ht, &mlxsw_sp_fib_ht_params);
465 if (err)
466 goto err_rhashtable_init;
9aecce1c 467 INIT_LIST_HEAD(&fib->node_list);
76610ebb
IS
468 fib->proto = proto;
469 fib->vr = vr;
2b52ce02
IS
470 fib->lpm_tree = lpm_tree;
471 mlxsw_sp_lpm_tree_hold(lpm_tree);
472 err = mlxsw_sp_vr_lpm_tree_bind(mlxsw_sp, fib, lpm_tree->id);
473 if (err)
474 goto err_lpm_tree_bind;
5e9c16cc
JP
475 return fib;
476
2b52ce02
IS
477err_lpm_tree_bind:
478 mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
5e9c16cc
JP
479err_rhashtable_init:
480 kfree(fib);
481 return ERR_PTR(err);
482}
483
2b52ce02
IS
484static void mlxsw_sp_fib_destroy(struct mlxsw_sp *mlxsw_sp,
485 struct mlxsw_sp_fib *fib)
5e9c16cc 486{
2b52ce02
IS
487 mlxsw_sp_vr_lpm_tree_unbind(mlxsw_sp, fib);
488 mlxsw_sp_lpm_tree_put(mlxsw_sp, fib->lpm_tree);
9aecce1c 489 WARN_ON(!list_empty(&fib->node_list));
5e9c16cc
JP
490 rhashtable_destroy(&fib->ht);
491 kfree(fib);
492}
493
53342023 494static struct mlxsw_sp_lpm_tree *
382dbb40 495mlxsw_sp_lpm_tree_find_unused(struct mlxsw_sp *mlxsw_sp)
53342023
JP
496{
497 static struct mlxsw_sp_lpm_tree *lpm_tree;
498 int i;
499
9011b677
IS
500 for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
501 lpm_tree = &mlxsw_sp->router->lpm.trees[i];
382dbb40
IS
502 if (lpm_tree->ref_count == 0)
503 return lpm_tree;
53342023
JP
504 }
505 return NULL;
506}
507
508static int mlxsw_sp_lpm_tree_alloc(struct mlxsw_sp *mlxsw_sp,
509 struct mlxsw_sp_lpm_tree *lpm_tree)
510{
511 char ralta_pl[MLXSW_REG_RALTA_LEN];
512
1a9234e6
IS
513 mlxsw_reg_ralta_pack(ralta_pl, true,
514 (enum mlxsw_reg_ralxx_protocol) lpm_tree->proto,
515 lpm_tree->id);
53342023
JP
516 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
517}
518
cc702670
IS
519static void mlxsw_sp_lpm_tree_free(struct mlxsw_sp *mlxsw_sp,
520 struct mlxsw_sp_lpm_tree *lpm_tree)
53342023
JP
521{
522 char ralta_pl[MLXSW_REG_RALTA_LEN];
523
1a9234e6
IS
524 mlxsw_reg_ralta_pack(ralta_pl, false,
525 (enum mlxsw_reg_ralxx_protocol) lpm_tree->proto,
526 lpm_tree->id);
cc702670 527 mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
53342023
JP
528}
529
530static int
531mlxsw_sp_lpm_tree_left_struct_set(struct mlxsw_sp *mlxsw_sp,
532 struct mlxsw_sp_prefix_usage *prefix_usage,
533 struct mlxsw_sp_lpm_tree *lpm_tree)
534{
535 char ralst_pl[MLXSW_REG_RALST_LEN];
536 u8 root_bin = 0;
537 u8 prefix;
538 u8 last_prefix = MLXSW_REG_RALST_BIN_NO_CHILD;
539
540 mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage)
541 root_bin = prefix;
542
543 mlxsw_reg_ralst_pack(ralst_pl, root_bin, lpm_tree->id);
544 mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage) {
545 if (prefix == 0)
546 continue;
547 mlxsw_reg_ralst_bin_pack(ralst_pl, prefix, last_prefix,
548 MLXSW_REG_RALST_BIN_NO_CHILD);
549 last_prefix = prefix;
550 }
551 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralst), ralst_pl);
552}
553
554static struct mlxsw_sp_lpm_tree *
555mlxsw_sp_lpm_tree_create(struct mlxsw_sp *mlxsw_sp,
556 struct mlxsw_sp_prefix_usage *prefix_usage,
382dbb40 557 enum mlxsw_sp_l3proto proto)
53342023
JP
558{
559 struct mlxsw_sp_lpm_tree *lpm_tree;
560 int err;
561
382dbb40 562 lpm_tree = mlxsw_sp_lpm_tree_find_unused(mlxsw_sp);
53342023
JP
563 if (!lpm_tree)
564 return ERR_PTR(-EBUSY);
565 lpm_tree->proto = proto;
566 err = mlxsw_sp_lpm_tree_alloc(mlxsw_sp, lpm_tree);
567 if (err)
568 return ERR_PTR(err);
569
570 err = mlxsw_sp_lpm_tree_left_struct_set(mlxsw_sp, prefix_usage,
571 lpm_tree);
572 if (err)
573 goto err_left_struct_set;
2083d367
JP
574 memcpy(&lpm_tree->prefix_usage, prefix_usage,
575 sizeof(lpm_tree->prefix_usage));
2b52ce02
IS
576 memset(&lpm_tree->prefix_ref_count, 0,
577 sizeof(lpm_tree->prefix_ref_count));
578 lpm_tree->ref_count = 1;
53342023
JP
579 return lpm_tree;
580
581err_left_struct_set:
582 mlxsw_sp_lpm_tree_free(mlxsw_sp, lpm_tree);
583 return ERR_PTR(err);
584}
585
cc702670
IS
/* Release @lpm_tree in the device; called once its last reference is gone. */
static void mlxsw_sp_lpm_tree_destroy(struct mlxsw_sp *mlxsw_sp,
				      struct mlxsw_sp_lpm_tree *lpm_tree)
{
	mlxsw_sp_lpm_tree_free(mlxsw_sp, lpm_tree);
}
591
592static struct mlxsw_sp_lpm_tree *
593mlxsw_sp_lpm_tree_get(struct mlxsw_sp *mlxsw_sp,
594 struct mlxsw_sp_prefix_usage *prefix_usage,
382dbb40 595 enum mlxsw_sp_l3proto proto)
53342023
JP
596{
597 struct mlxsw_sp_lpm_tree *lpm_tree;
598 int i;
599
9011b677
IS
600 for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
601 lpm_tree = &mlxsw_sp->router->lpm.trees[i];
8b99becd
JP
602 if (lpm_tree->ref_count != 0 &&
603 lpm_tree->proto == proto &&
53342023 604 mlxsw_sp_prefix_usage_eq(&lpm_tree->prefix_usage,
2b52ce02
IS
605 prefix_usage)) {
606 mlxsw_sp_lpm_tree_hold(lpm_tree);
fc922bb0 607 return lpm_tree;
2b52ce02 608 }
53342023 609 }
fc922bb0
IS
610 return mlxsw_sp_lpm_tree_create(mlxsw_sp, prefix_usage, proto);
611}
53342023 612
fc922bb0
IS
613static void mlxsw_sp_lpm_tree_hold(struct mlxsw_sp_lpm_tree *lpm_tree)
614{
53342023 615 lpm_tree->ref_count++;
53342023
JP
616}
617
cc702670
IS
618static void mlxsw_sp_lpm_tree_put(struct mlxsw_sp *mlxsw_sp,
619 struct mlxsw_sp_lpm_tree *lpm_tree)
53342023
JP
620{
621 if (--lpm_tree->ref_count == 0)
cc702670 622 mlxsw_sp_lpm_tree_destroy(mlxsw_sp, lpm_tree);
53342023
JP
623}
624
d7a60306 625#define MLXSW_SP_LPM_TREE_MIN 1 /* tree 0 is reserved */
8494ab06
IS
626
627static int mlxsw_sp_lpm_init(struct mlxsw_sp *mlxsw_sp)
53342023 628{
2b52ce02 629 struct mlxsw_sp_prefix_usage req_prefix_usage = {{ 0 } };
53342023 630 struct mlxsw_sp_lpm_tree *lpm_tree;
8494ab06 631 u64 max_trees;
2b52ce02 632 int err, i;
53342023 633
8494ab06
IS
634 if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_LPM_TREES))
635 return -EIO;
636
637 max_trees = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_LPM_TREES);
9011b677
IS
638 mlxsw_sp->router->lpm.tree_count = max_trees - MLXSW_SP_LPM_TREE_MIN;
639 mlxsw_sp->router->lpm.trees = kcalloc(mlxsw_sp->router->lpm.tree_count,
8494ab06
IS
640 sizeof(struct mlxsw_sp_lpm_tree),
641 GFP_KERNEL);
9011b677 642 if (!mlxsw_sp->router->lpm.trees)
8494ab06
IS
643 return -ENOMEM;
644
9011b677
IS
645 for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
646 lpm_tree = &mlxsw_sp->router->lpm.trees[i];
53342023
JP
647 lpm_tree->id = i + MLXSW_SP_LPM_TREE_MIN;
648 }
8494ab06 649
2b52ce02
IS
650 lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
651 MLXSW_SP_L3_PROTO_IPV4);
652 if (IS_ERR(lpm_tree)) {
653 err = PTR_ERR(lpm_tree);
654 goto err_ipv4_tree_get;
655 }
656 mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV4] = lpm_tree;
657
658 lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
659 MLXSW_SP_L3_PROTO_IPV6);
660 if (IS_ERR(lpm_tree)) {
661 err = PTR_ERR(lpm_tree);
662 goto err_ipv6_tree_get;
663 }
664 mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV6] = lpm_tree;
665
8494ab06 666 return 0;
2b52ce02
IS
667
668err_ipv6_tree_get:
669 lpm_tree = mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV4];
670 mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
671err_ipv4_tree_get:
672 kfree(mlxsw_sp->router->lpm.trees);
673 return err;
8494ab06
IS
674}
675
676static void mlxsw_sp_lpm_fini(struct mlxsw_sp *mlxsw_sp)
677{
2b52ce02
IS
678 struct mlxsw_sp_lpm_tree *lpm_tree;
679
680 lpm_tree = mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV6];
681 mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
682
683 lpm_tree = mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV4];
684 mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
685
9011b677 686 kfree(mlxsw_sp->router->lpm.trees);
53342023
JP
687}
688
76610ebb
IS
689static bool mlxsw_sp_vr_is_used(const struct mlxsw_sp_vr *vr)
690{
9742f866
YM
691 return !!vr->fib4 || !!vr->fib6 ||
692 !!vr->mr_table[MLXSW_SP_L3_PROTO_IPV4] ||
693 !!vr->mr_table[MLXSW_SP_L3_PROTO_IPV6];
76610ebb
IS
694}
695
6b75c480
JP
696static struct mlxsw_sp_vr *mlxsw_sp_vr_find_unused(struct mlxsw_sp *mlxsw_sp)
697{
698 struct mlxsw_sp_vr *vr;
699 int i;
700
c1a38311 701 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
9011b677 702 vr = &mlxsw_sp->router->vrs[i];
76610ebb 703 if (!mlxsw_sp_vr_is_used(vr))
6b75c480
JP
704 return vr;
705 }
706 return NULL;
707}
708
709static int mlxsw_sp_vr_lpm_tree_bind(struct mlxsw_sp *mlxsw_sp,
0adb214b 710 const struct mlxsw_sp_fib *fib, u8 tree_id)
6b75c480
JP
711{
712 char raltb_pl[MLXSW_REG_RALTB_LEN];
713
76610ebb
IS
714 mlxsw_reg_raltb_pack(raltb_pl, fib->vr->id,
715 (enum mlxsw_reg_ralxx_protocol) fib->proto,
0adb214b 716 tree_id);
6b75c480
JP
717 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb), raltb_pl);
718}
719
720static int mlxsw_sp_vr_lpm_tree_unbind(struct mlxsw_sp *mlxsw_sp,
76610ebb 721 const struct mlxsw_sp_fib *fib)
6b75c480
JP
722{
723 char raltb_pl[MLXSW_REG_RALTB_LEN];
724
725 /* Bind to tree 0 which is default */
76610ebb
IS
726 mlxsw_reg_raltb_pack(raltb_pl, fib->vr->id,
727 (enum mlxsw_reg_ralxx_protocol) fib->proto, 0);
6b75c480
JP
728 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb), raltb_pl);
729}
730
731static u32 mlxsw_sp_fix_tb_id(u32 tb_id)
732{
7e50d435
YG
733 /* For our purpose, squash main, default and local tables into one */
734 if (tb_id == RT_TABLE_LOCAL || tb_id == RT_TABLE_DEFAULT)
6b75c480
JP
735 tb_id = RT_TABLE_MAIN;
736 return tb_id;
737}
738
739static struct mlxsw_sp_vr *mlxsw_sp_vr_find(struct mlxsw_sp *mlxsw_sp,
76610ebb 740 u32 tb_id)
6b75c480
JP
741{
742 struct mlxsw_sp_vr *vr;
743 int i;
744
745 tb_id = mlxsw_sp_fix_tb_id(tb_id);
9497c042 746
c1a38311 747 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
9011b677 748 vr = &mlxsw_sp->router->vrs[i];
76610ebb 749 if (mlxsw_sp_vr_is_used(vr) && vr->tb_id == tb_id)
6b75c480
JP
750 return vr;
751 }
752 return NULL;
753}
754
88782f75
IS
755int mlxsw_sp_router_tb_id_vr_id(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
756 u16 *vr_id)
757{
758 struct mlxsw_sp_vr *vr;
759
760 vr = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
761 if (!vr)
762 return -ESRCH;
763 *vr_id = vr->id;
764
765 return 0;
766}
767
76610ebb
IS
768static struct mlxsw_sp_fib *mlxsw_sp_vr_fib(const struct mlxsw_sp_vr *vr,
769 enum mlxsw_sp_l3proto proto)
770{
771 switch (proto) {
772 case MLXSW_SP_L3_PROTO_IPV4:
773 return vr->fib4;
774 case MLXSW_SP_L3_PROTO_IPV6:
a3d9bc50 775 return vr->fib6;
76610ebb
IS
776 }
777 return NULL;
778}
779
6b75c480 780static struct mlxsw_sp_vr *mlxsw_sp_vr_create(struct mlxsw_sp *mlxsw_sp,
f8fa9b4e
DA
781 u32 tb_id,
782 struct netlink_ext_ack *extack)
6b75c480 783{
9742f866 784 struct mlxsw_sp_mr_table *mr4_table, *mr6_table;
0f2d2b27
JP
785 struct mlxsw_sp_fib *fib4;
786 struct mlxsw_sp_fib *fib6;
6b75c480 787 struct mlxsw_sp_vr *vr;
a3d9bc50 788 int err;
6b75c480
JP
789
790 vr = mlxsw_sp_vr_find_unused(mlxsw_sp);
f8fa9b4e 791 if (!vr) {
6c677750 792 NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported virtual routers");
6b75c480 793 return ERR_PTR(-EBUSY);
f8fa9b4e 794 }
0f2d2b27
JP
795 fib4 = mlxsw_sp_fib_create(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV4);
796 if (IS_ERR(fib4))
797 return ERR_CAST(fib4);
798 fib6 = mlxsw_sp_fib_create(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV6);
799 if (IS_ERR(fib6)) {
800 err = PTR_ERR(fib6);
a3d9bc50
IS
801 goto err_fib6_create;
802 }
0f2d2b27
JP
803 mr4_table = mlxsw_sp_mr_table_create(mlxsw_sp, vr->id,
804 MLXSW_SP_L3_PROTO_IPV4);
805 if (IS_ERR(mr4_table)) {
806 err = PTR_ERR(mr4_table);
9742f866 807 goto err_mr4_table_create;
d42b0965 808 }
9742f866
YM
809 mr6_table = mlxsw_sp_mr_table_create(mlxsw_sp, vr->id,
810 MLXSW_SP_L3_PROTO_IPV6);
811 if (IS_ERR(mr6_table)) {
812 err = PTR_ERR(mr6_table);
813 goto err_mr6_table_create;
814 }
815
0f2d2b27
JP
816 vr->fib4 = fib4;
817 vr->fib6 = fib6;
9742f866
YM
818 vr->mr_table[MLXSW_SP_L3_PROTO_IPV4] = mr4_table;
819 vr->mr_table[MLXSW_SP_L3_PROTO_IPV6] = mr6_table;
6b75c480 820 vr->tb_id = tb_id;
6b75c480 821 return vr;
a3d9bc50 822
9742f866
YM
823err_mr6_table_create:
824 mlxsw_sp_mr_table_destroy(mr4_table);
825err_mr4_table_create:
0f2d2b27 826 mlxsw_sp_fib_destroy(mlxsw_sp, fib6);
a3d9bc50 827err_fib6_create:
0f2d2b27 828 mlxsw_sp_fib_destroy(mlxsw_sp, fib4);
a3d9bc50 829 return ERR_PTR(err);
6b75c480
JP
830}
831
2b52ce02
IS
832static void mlxsw_sp_vr_destroy(struct mlxsw_sp *mlxsw_sp,
833 struct mlxsw_sp_vr *vr)
6b75c480 834{
9742f866
YM
835 mlxsw_sp_mr_table_destroy(vr->mr_table[MLXSW_SP_L3_PROTO_IPV6]);
836 vr->mr_table[MLXSW_SP_L3_PROTO_IPV6] = NULL;
837 mlxsw_sp_mr_table_destroy(vr->mr_table[MLXSW_SP_L3_PROTO_IPV4]);
838 vr->mr_table[MLXSW_SP_L3_PROTO_IPV4] = NULL;
2b52ce02 839 mlxsw_sp_fib_destroy(mlxsw_sp, vr->fib6);
a3d9bc50 840 vr->fib6 = NULL;
2b52ce02 841 mlxsw_sp_fib_destroy(mlxsw_sp, vr->fib4);
76610ebb 842 vr->fib4 = NULL;
6b75c480
JP
843}
844
f8fa9b4e
DA
845static struct mlxsw_sp_vr *mlxsw_sp_vr_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
846 struct netlink_ext_ack *extack)
6b75c480
JP
847{
848 struct mlxsw_sp_vr *vr;
6b75c480
JP
849
850 tb_id = mlxsw_sp_fix_tb_id(tb_id);
76610ebb
IS
851 vr = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
852 if (!vr)
f8fa9b4e 853 vr = mlxsw_sp_vr_create(mlxsw_sp, tb_id, extack);
6b75c480
JP
854 return vr;
855}
856
2b52ce02 857static void mlxsw_sp_vr_put(struct mlxsw_sp *mlxsw_sp, struct mlxsw_sp_vr *vr)
6b75c480 858{
a3d9bc50 859 if (!vr->rif_count && list_empty(&vr->fib4->node_list) &&
d42b0965 860 list_empty(&vr->fib6->node_list) &&
9742f866
YM
861 mlxsw_sp_mr_table_empty(vr->mr_table[MLXSW_SP_L3_PROTO_IPV4]) &&
862 mlxsw_sp_mr_table_empty(vr->mr_table[MLXSW_SP_L3_PROTO_IPV6]))
2b52ce02 863 mlxsw_sp_vr_destroy(mlxsw_sp, vr);
6b75c480
JP
864}
865
fc922bb0
IS
866static bool
867mlxsw_sp_vr_lpm_tree_should_replace(struct mlxsw_sp_vr *vr,
868 enum mlxsw_sp_l3proto proto, u8 tree_id)
869{
870 struct mlxsw_sp_fib *fib = mlxsw_sp_vr_fib(vr, proto);
871
872 if (!mlxsw_sp_vr_is_used(vr))
873 return false;
2b52ce02 874 if (fib->lpm_tree->id == tree_id)
fc922bb0
IS
875 return true;
876 return false;
877}
878
879static int mlxsw_sp_vr_lpm_tree_replace(struct mlxsw_sp *mlxsw_sp,
880 struct mlxsw_sp_fib *fib,
881 struct mlxsw_sp_lpm_tree *new_tree)
882{
883 struct mlxsw_sp_lpm_tree *old_tree = fib->lpm_tree;
884 int err;
885
fc922bb0
IS
886 fib->lpm_tree = new_tree;
887 mlxsw_sp_lpm_tree_hold(new_tree);
ed604c5d
IS
888 err = mlxsw_sp_vr_lpm_tree_bind(mlxsw_sp, fib, new_tree->id);
889 if (err)
890 goto err_tree_bind;
fc922bb0
IS
891 mlxsw_sp_lpm_tree_put(mlxsw_sp, old_tree);
892 return 0;
ed604c5d
IS
893
894err_tree_bind:
895 mlxsw_sp_lpm_tree_put(mlxsw_sp, new_tree);
896 fib->lpm_tree = old_tree;
897 return err;
fc922bb0
IS
898}
899
900static int mlxsw_sp_vrs_lpm_tree_replace(struct mlxsw_sp *mlxsw_sp,
901 struct mlxsw_sp_fib *fib,
902 struct mlxsw_sp_lpm_tree *new_tree)
903{
fc922bb0 904 enum mlxsw_sp_l3proto proto = fib->proto;
2b52ce02 905 struct mlxsw_sp_lpm_tree *old_tree;
fc922bb0
IS
906 u8 old_id, new_id = new_tree->id;
907 struct mlxsw_sp_vr *vr;
908 int i, err;
909
2b52ce02 910 old_tree = mlxsw_sp->router->lpm.proto_trees[proto];
fc922bb0
IS
911 old_id = old_tree->id;
912
913 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
914 vr = &mlxsw_sp->router->vrs[i];
915 if (!mlxsw_sp_vr_lpm_tree_should_replace(vr, proto, old_id))
916 continue;
917 err = mlxsw_sp_vr_lpm_tree_replace(mlxsw_sp,
918 mlxsw_sp_vr_fib(vr, proto),
919 new_tree);
920 if (err)
921 goto err_tree_replace;
922 }
923
2b52ce02
IS
924 memcpy(new_tree->prefix_ref_count, old_tree->prefix_ref_count,
925 sizeof(new_tree->prefix_ref_count));
926 mlxsw_sp->router->lpm.proto_trees[proto] = new_tree;
927 mlxsw_sp_lpm_tree_put(mlxsw_sp, old_tree);
928
fc922bb0
IS
929 return 0;
930
931err_tree_replace:
932 for (i--; i >= 0; i--) {
933 if (!mlxsw_sp_vr_lpm_tree_should_replace(vr, proto, new_id))
934 continue;
935 mlxsw_sp_vr_lpm_tree_replace(mlxsw_sp,
936 mlxsw_sp_vr_fib(vr, proto),
937 old_tree);
938 }
939 return err;
fc922bb0
IS
940}
941
9497c042 942static int mlxsw_sp_vrs_init(struct mlxsw_sp *mlxsw_sp)
6b75c480
JP
943{
944 struct mlxsw_sp_vr *vr;
c1a38311 945 u64 max_vrs;
6b75c480
JP
946 int i;
947
c1a38311 948 if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_VRS))
9497c042
NF
949 return -EIO;
950
c1a38311 951 max_vrs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS);
9011b677
IS
952 mlxsw_sp->router->vrs = kcalloc(max_vrs, sizeof(struct mlxsw_sp_vr),
953 GFP_KERNEL);
954 if (!mlxsw_sp->router->vrs)
9497c042
NF
955 return -ENOMEM;
956
c1a38311 957 for (i = 0; i < max_vrs; i++) {
9011b677 958 vr = &mlxsw_sp->router->vrs[i];
6b75c480
JP
959 vr->id = i;
960 }
9497c042
NF
961
962 return 0;
963}
964
ac571de9
IS
965static void mlxsw_sp_router_fib_flush(struct mlxsw_sp *mlxsw_sp);
966
9497c042
NF
967static void mlxsw_sp_vrs_fini(struct mlxsw_sp *mlxsw_sp)
968{
3057224e
IS
969 /* At this stage we're guaranteed not to have new incoming
970 * FIB notifications and the work queue is free from FIBs
971 * sitting on top of mlxsw netdevs. However, we can still
972 * have other FIBs queued. Flush the queue before flushing
973 * the device's tables. No need for locks, as we're the only
974 * writer.
975 */
976 mlxsw_core_flush_owq();
ac571de9 977 mlxsw_sp_router_fib_flush(mlxsw_sp);
9011b677 978 kfree(mlxsw_sp->router->vrs);
6b75c480
JP
979}
980
6ddb7426
PM
981static struct net_device *
982__mlxsw_sp_ipip_netdev_ul_dev_get(const struct net_device *ol_dev)
983{
984 struct ip_tunnel *tun = netdev_priv(ol_dev);
985 struct net *net = dev_net(ol_dev);
986
987 return __dev_get_by_index(net, tun->parms.link);
988}
989
4cf04f3f 990u32 mlxsw_sp_ipip_dev_ul_tb_id(const struct net_device *ol_dev)
6ddb7426
PM
991{
992 struct net_device *d = __mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
993
994 if (d)
995 return l3mdev_fib_table(d) ? : RT_TABLE_MAIN;
996 else
997 return l3mdev_fib_table(ol_dev) ? : RT_TABLE_MAIN;
998}
999
1012b9ac
PM
1000static struct mlxsw_sp_rif *
1001mlxsw_sp_rif_create(struct mlxsw_sp *mlxsw_sp,
f8fa9b4e
DA
1002 const struct mlxsw_sp_rif_params *params,
1003 struct netlink_ext_ack *extack);
1012b9ac
PM
1004
1005static struct mlxsw_sp_rif_ipip_lb *
1006mlxsw_sp_ipip_ol_ipip_lb_create(struct mlxsw_sp *mlxsw_sp,
1007 enum mlxsw_sp_ipip_type ipipt,
7e75af63
PM
1008 struct net_device *ol_dev,
1009 struct netlink_ext_ack *extack)
1012b9ac
PM
1010{
1011 struct mlxsw_sp_rif_params_ipip_lb lb_params;
1012 const struct mlxsw_sp_ipip_ops *ipip_ops;
1013 struct mlxsw_sp_rif *rif;
1014
1015 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipipt];
1016 lb_params = (struct mlxsw_sp_rif_params_ipip_lb) {
1017 .common.dev = ol_dev,
1018 .common.lag = false,
1019 .lb_config = ipip_ops->ol_loopback_config(mlxsw_sp, ol_dev),
1020 };
1021
7e75af63 1022 rif = mlxsw_sp_rif_create(mlxsw_sp, &lb_params.common, extack);
1012b9ac
PM
1023 if (IS_ERR(rif))
1024 return ERR_CAST(rif);
1025 return container_of(rif, struct mlxsw_sp_rif_ipip_lb, common);
1026}
1027
1028static struct mlxsw_sp_ipip_entry *
1029mlxsw_sp_ipip_entry_alloc(struct mlxsw_sp *mlxsw_sp,
1030 enum mlxsw_sp_ipip_type ipipt,
1031 struct net_device *ol_dev)
1032{
e437f3b6 1033 const struct mlxsw_sp_ipip_ops *ipip_ops;
1012b9ac
PM
1034 struct mlxsw_sp_ipip_entry *ipip_entry;
1035 struct mlxsw_sp_ipip_entry *ret = NULL;
1036
e437f3b6 1037 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipipt];
1012b9ac
PM
1038 ipip_entry = kzalloc(sizeof(*ipip_entry), GFP_KERNEL);
1039 if (!ipip_entry)
1040 return ERR_PTR(-ENOMEM);
1041
1042 ipip_entry->ol_lb = mlxsw_sp_ipip_ol_ipip_lb_create(mlxsw_sp, ipipt,
7e75af63 1043 ol_dev, NULL);
1012b9ac
PM
1044 if (IS_ERR(ipip_entry->ol_lb)) {
1045 ret = ERR_CAST(ipip_entry->ol_lb);
1046 goto err_ol_ipip_lb_create;
1047 }
1048
1049 ipip_entry->ipipt = ipipt;
1050 ipip_entry->ol_dev = ol_dev;
e437f3b6
PM
1051
1052 switch (ipip_ops->ul_proto) {
1053 case MLXSW_SP_L3_PROTO_IPV4:
1054 ipip_entry->parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev);
1055 break;
1056 case MLXSW_SP_L3_PROTO_IPV6:
1057 WARN_ON(1);
1058 break;
1059 }
1012b9ac
PM
1060
1061 return ipip_entry;
1062
1063err_ol_ipip_lb_create:
1064 kfree(ipip_entry);
1065 return ret;
1066}
1067
1068static void
4cccb737 1069mlxsw_sp_ipip_entry_dealloc(struct mlxsw_sp_ipip_entry *ipip_entry)
1012b9ac 1070{
1012b9ac
PM
1071 mlxsw_sp_rif_destroy(&ipip_entry->ol_lb->common);
1072 kfree(ipip_entry);
1073}
1074
1012b9ac
PM
1075static bool
1076mlxsw_sp_ipip_entry_saddr_matches(struct mlxsw_sp *mlxsw_sp,
1077 const enum mlxsw_sp_l3proto ul_proto,
1078 union mlxsw_sp_l3addr saddr,
1079 u32 ul_tb_id,
1080 struct mlxsw_sp_ipip_entry *ipip_entry)
1081{
1082 u32 tun_ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
1083 enum mlxsw_sp_ipip_type ipipt = ipip_entry->ipipt;
1084 union mlxsw_sp_l3addr tun_saddr;
1085
1086 if (mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto != ul_proto)
1087 return false;
1088
1089 tun_saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ipip_entry->ol_dev);
1090 return tun_ul_tb_id == ul_tb_id &&
1091 mlxsw_sp_l3addr_eq(&tun_saddr, &saddr);
1092}
1093
4607f6d2
PM
1094static int
1095mlxsw_sp_fib_entry_decap_init(struct mlxsw_sp *mlxsw_sp,
1096 struct mlxsw_sp_fib_entry *fib_entry,
1097 struct mlxsw_sp_ipip_entry *ipip_entry)
1098{
1099 u32 tunnel_index;
1100 int err;
1101
4b6b1869
JP
1102 err = mlxsw_sp_kvdl_alloc(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
1103 1, &tunnel_index);
4607f6d2
PM
1104 if (err)
1105 return err;
1106
1107 ipip_entry->decap_fib_entry = fib_entry;
1108 fib_entry->decap.ipip_entry = ipip_entry;
1109 fib_entry->decap.tunnel_index = tunnel_index;
1110 return 0;
1111}
1112
1113static void mlxsw_sp_fib_entry_decap_fini(struct mlxsw_sp *mlxsw_sp,
1114 struct mlxsw_sp_fib_entry *fib_entry)
1115{
1116 /* Unlink this node from the IPIP entry that it's the decap entry of. */
1117 fib_entry->decap.ipip_entry->decap_fib_entry = NULL;
1118 fib_entry->decap.ipip_entry = NULL;
4b6b1869 1119 mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
0304c005 1120 1, fib_entry->decap.tunnel_index);
4607f6d2
PM
1121}
1122
1cc38fb1
PM
1123static struct mlxsw_sp_fib_node *
1124mlxsw_sp_fib_node_lookup(struct mlxsw_sp_fib *fib, const void *addr,
1125 size_t addr_len, unsigned char prefix_len);
4607f6d2
PM
1126static int mlxsw_sp_fib_entry_update(struct mlxsw_sp *mlxsw_sp,
1127 struct mlxsw_sp_fib_entry *fib_entry);
1128
1129static void
1130mlxsw_sp_ipip_entry_demote_decap(struct mlxsw_sp *mlxsw_sp,
1131 struct mlxsw_sp_ipip_entry *ipip_entry)
1132{
1133 struct mlxsw_sp_fib_entry *fib_entry = ipip_entry->decap_fib_entry;
1134
1135 mlxsw_sp_fib_entry_decap_fini(mlxsw_sp, fib_entry);
1136 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
1137
1138 mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
1139}
1140
1cc38fb1
PM
1141static void
1142mlxsw_sp_ipip_entry_promote_decap(struct mlxsw_sp *mlxsw_sp,
1143 struct mlxsw_sp_ipip_entry *ipip_entry,
1144 struct mlxsw_sp_fib_entry *decap_fib_entry)
1145{
1146 if (mlxsw_sp_fib_entry_decap_init(mlxsw_sp, decap_fib_entry,
1147 ipip_entry))
1148 return;
1149 decap_fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP;
1150
1151 if (mlxsw_sp_fib_entry_update(mlxsw_sp, decap_fib_entry))
1152 mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
1153}
1154
0c69e0fc
IS
1155static struct mlxsw_sp_fib_entry *
1156mlxsw_sp_router_ip2me_fib_entry_find(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
1157 enum mlxsw_sp_l3proto proto,
1158 const union mlxsw_sp_l3addr *addr,
1159 enum mlxsw_sp_fib_entry_type type)
1160{
1161 struct mlxsw_sp_fib_entry *fib_entry;
1162 struct mlxsw_sp_fib_node *fib_node;
1163 unsigned char addr_prefix_len;
1164 struct mlxsw_sp_fib *fib;
1165 struct mlxsw_sp_vr *vr;
1166 const void *addrp;
1167 size_t addr_len;
1168 u32 addr4;
1169
1170 vr = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
1171 if (!vr)
1172 return NULL;
1173 fib = mlxsw_sp_vr_fib(vr, proto);
1174
1175 switch (proto) {
1176 case MLXSW_SP_L3_PROTO_IPV4:
1177 addr4 = be32_to_cpu(addr->addr4);
1178 addrp = &addr4;
1179 addr_len = 4;
1180 addr_prefix_len = 32;
1181 break;
1182 case MLXSW_SP_L3_PROTO_IPV6: /* fall through */
1183 default:
1184 WARN_ON(1);
1185 return NULL;
1186 }
1187
1188 fib_node = mlxsw_sp_fib_node_lookup(fib, addrp, addr_len,
1189 addr_prefix_len);
1190 if (!fib_node || list_empty(&fib_node->entry_list))
1191 return NULL;
1192
1193 fib_entry = list_first_entry(&fib_node->entry_list,
1194 struct mlxsw_sp_fib_entry, list);
1195 if (fib_entry->type != type)
1196 return NULL;
1197
1198 return fib_entry;
1199}
1200
1cc38fb1
PM
1201/* Given an IPIP entry, find the corresponding decap route. */
1202static struct mlxsw_sp_fib_entry *
1203mlxsw_sp_ipip_entry_find_decap(struct mlxsw_sp *mlxsw_sp,
1204 struct mlxsw_sp_ipip_entry *ipip_entry)
1205{
1206 static struct mlxsw_sp_fib_node *fib_node;
1207 const struct mlxsw_sp_ipip_ops *ipip_ops;
1208 struct mlxsw_sp_fib_entry *fib_entry;
1209 unsigned char saddr_prefix_len;
1210 union mlxsw_sp_l3addr saddr;
1211 struct mlxsw_sp_fib *ul_fib;
1212 struct mlxsw_sp_vr *ul_vr;
1213 const void *saddrp;
1214 size_t saddr_len;
1215 u32 ul_tb_id;
1216 u32 saddr4;
1217
1218 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
1219
1220 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
1221 ul_vr = mlxsw_sp_vr_find(mlxsw_sp, ul_tb_id);
1222 if (!ul_vr)
1223 return NULL;
1224
1225 ul_fib = mlxsw_sp_vr_fib(ul_vr, ipip_ops->ul_proto);
1226 saddr = mlxsw_sp_ipip_netdev_saddr(ipip_ops->ul_proto,
1227 ipip_entry->ol_dev);
1228
1229 switch (ipip_ops->ul_proto) {
1230 case MLXSW_SP_L3_PROTO_IPV4:
1231 saddr4 = be32_to_cpu(saddr.addr4);
1232 saddrp = &saddr4;
1233 saddr_len = 4;
1234 saddr_prefix_len = 32;
1235 break;
1236 case MLXSW_SP_L3_PROTO_IPV6:
1237 WARN_ON(1);
1238 return NULL;
1239 }
1240
1241 fib_node = mlxsw_sp_fib_node_lookup(ul_fib, saddrp, saddr_len,
1242 saddr_prefix_len);
1243 if (!fib_node || list_empty(&fib_node->entry_list))
1244 return NULL;
1245
1246 fib_entry = list_first_entry(&fib_node->entry_list,
1247 struct mlxsw_sp_fib_entry, list);
1248 if (fib_entry->type != MLXSW_SP_FIB_ENTRY_TYPE_TRAP)
1249 return NULL;
1250
1251 return fib_entry;
1252}
1253
1012b9ac 1254static struct mlxsw_sp_ipip_entry *
4cccb737
PM
1255mlxsw_sp_ipip_entry_create(struct mlxsw_sp *mlxsw_sp,
1256 enum mlxsw_sp_ipip_type ipipt,
1257 struct net_device *ol_dev)
1012b9ac 1258{
1012b9ac 1259 struct mlxsw_sp_ipip_entry *ipip_entry;
1012b9ac
PM
1260
1261 ipip_entry = mlxsw_sp_ipip_entry_alloc(mlxsw_sp, ipipt, ol_dev);
1262 if (IS_ERR(ipip_entry))
1263 return ipip_entry;
1264
1265 list_add_tail(&ipip_entry->ipip_list_node,
1266 &mlxsw_sp->router->ipip_list);
1267
1012b9ac
PM
1268 return ipip_entry;
1269}
1270
1271static void
4cccb737
PM
1272mlxsw_sp_ipip_entry_destroy(struct mlxsw_sp *mlxsw_sp,
1273 struct mlxsw_sp_ipip_entry *ipip_entry)
1012b9ac 1274{
4cccb737
PM
1275 list_del(&ipip_entry->ipip_list_node);
1276 mlxsw_sp_ipip_entry_dealloc(ipip_entry);
1012b9ac
PM
1277}
1278
4607f6d2
PM
1279static bool
1280mlxsw_sp_ipip_entry_matches_decap(struct mlxsw_sp *mlxsw_sp,
1281 const struct net_device *ul_dev,
1282 enum mlxsw_sp_l3proto ul_proto,
1283 union mlxsw_sp_l3addr ul_dip,
1284 struct mlxsw_sp_ipip_entry *ipip_entry)
1285{
1286 u32 ul_tb_id = l3mdev_fib_table(ul_dev) ? : RT_TABLE_MAIN;
1287 enum mlxsw_sp_ipip_type ipipt = ipip_entry->ipipt;
4607f6d2
PM
1288
1289 if (mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto != ul_proto)
1290 return false;
1291
4607f6d2 1292 return mlxsw_sp_ipip_entry_saddr_matches(mlxsw_sp, ul_proto, ul_dip,
da93d291 1293 ul_tb_id, ipip_entry);
4607f6d2
PM
1294}
1295
1296/* Given decap parameters, find the corresponding IPIP entry. */
1297static struct mlxsw_sp_ipip_entry *
1298mlxsw_sp_ipip_entry_find_by_decap(struct mlxsw_sp *mlxsw_sp,
1299 const struct net_device *ul_dev,
1300 enum mlxsw_sp_l3proto ul_proto,
1301 union mlxsw_sp_l3addr ul_dip)
1302{
1303 struct mlxsw_sp_ipip_entry *ipip_entry;
1304
1305 list_for_each_entry(ipip_entry, &mlxsw_sp->router->ipip_list,
1306 ipip_list_node)
1307 if (mlxsw_sp_ipip_entry_matches_decap(mlxsw_sp, ul_dev,
1308 ul_proto, ul_dip,
1309 ipip_entry))
1310 return ipip_entry;
1311
1312 return NULL;
1313}
1314
6698c168
PM
1315static bool mlxsw_sp_netdev_ipip_type(const struct mlxsw_sp *mlxsw_sp,
1316 const struct net_device *dev,
1317 enum mlxsw_sp_ipip_type *p_type)
1318{
1319 struct mlxsw_sp_router *router = mlxsw_sp->router;
1320 const struct mlxsw_sp_ipip_ops *ipip_ops;
1321 enum mlxsw_sp_ipip_type ipipt;
1322
1323 for (ipipt = 0; ipipt < MLXSW_SP_IPIP_TYPE_MAX; ++ipipt) {
1324 ipip_ops = router->ipip_ops_arr[ipipt];
1325 if (dev->type == ipip_ops->dev_type) {
1326 if (p_type)
1327 *p_type = ipipt;
1328 return true;
1329 }
1330 }
1331 return false;
1332}
1333
796ec776
PM
1334bool mlxsw_sp_netdev_is_ipip_ol(const struct mlxsw_sp *mlxsw_sp,
1335 const struct net_device *dev)
0063587d
PM
1336{
1337 return mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, NULL);
1338}
1339
1340static struct mlxsw_sp_ipip_entry *
1341mlxsw_sp_ipip_entry_find_by_ol_dev(struct mlxsw_sp *mlxsw_sp,
1342 const struct net_device *ol_dev)
1343{
1344 struct mlxsw_sp_ipip_entry *ipip_entry;
1345
1346 list_for_each_entry(ipip_entry, &mlxsw_sp->router->ipip_list,
1347 ipip_list_node)
1348 if (ipip_entry->ol_dev == ol_dev)
1349 return ipip_entry;
1350
1351 return NULL;
1352}
1353
61481f2f
PM
1354static struct mlxsw_sp_ipip_entry *
1355mlxsw_sp_ipip_entry_find_by_ul_dev(const struct mlxsw_sp *mlxsw_sp,
1356 const struct net_device *ul_dev,
1357 struct mlxsw_sp_ipip_entry *start)
1358{
1359 struct mlxsw_sp_ipip_entry *ipip_entry;
1360
1361 ipip_entry = list_prepare_entry(start, &mlxsw_sp->router->ipip_list,
1362 ipip_list_node);
1363 list_for_each_entry_continue(ipip_entry, &mlxsw_sp->router->ipip_list,
1364 ipip_list_node) {
1365 struct net_device *ipip_ul_dev =
1366 __mlxsw_sp_ipip_netdev_ul_dev_get(ipip_entry->ol_dev);
1367
1368 if (ipip_ul_dev == ul_dev)
1369 return ipip_entry;
1370 }
1371
1372 return NULL;
1373}
1374
1375bool mlxsw_sp_netdev_is_ipip_ul(const struct mlxsw_sp *mlxsw_sp,
1376 const struct net_device *dev)
1377{
1378 return mlxsw_sp_ipip_entry_find_by_ul_dev(mlxsw_sp, dev, NULL);
1379}
1380
cafdb2a0
PM
1381static bool mlxsw_sp_netdevice_ipip_can_offload(struct mlxsw_sp *mlxsw_sp,
1382 const struct net_device *ol_dev,
1383 enum mlxsw_sp_ipip_type ipipt)
1384{
1385 const struct mlxsw_sp_ipip_ops *ops
1386 = mlxsw_sp->router->ipip_ops_arr[ipipt];
1387
1388 /* For deciding whether decap should be offloaded, we don't care about
1389 * overlay protocol, so ask whether either one is supported.
1390 */
1391 return ops->can_offload(mlxsw_sp, ol_dev, MLXSW_SP_L3_PROTO_IPV4) ||
1392 ops->can_offload(mlxsw_sp, ol_dev, MLXSW_SP_L3_PROTO_IPV6);
1393}
1394
796ec776
PM
1395static int mlxsw_sp_netdevice_ipip_ol_reg_event(struct mlxsw_sp *mlxsw_sp,
1396 struct net_device *ol_dev)
0063587d 1397{
0063587d 1398 struct mlxsw_sp_ipip_entry *ipip_entry;
af641713 1399 enum mlxsw_sp_l3proto ul_proto;
0063587d 1400 enum mlxsw_sp_ipip_type ipipt;
af641713
PM
1401 union mlxsw_sp_l3addr saddr;
1402 u32 ul_tb_id;
0063587d
PM
1403
1404 mlxsw_sp_netdev_ipip_type(mlxsw_sp, ol_dev, &ipipt);
cafdb2a0 1405 if (mlxsw_sp_netdevice_ipip_can_offload(mlxsw_sp, ol_dev, ipipt)) {
af641713
PM
1406 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ol_dev);
1407 ul_proto = mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto;
1408 saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ol_dev);
1409 if (!mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp, ul_proto,
1410 saddr, ul_tb_id,
1411 NULL)) {
1412 ipip_entry = mlxsw_sp_ipip_entry_create(mlxsw_sp, ipipt,
1413 ol_dev);
1414 if (IS_ERR(ipip_entry))
1415 return PTR_ERR(ipip_entry);
1416 }
0063587d
PM
1417 }
1418
1419 return 0;
1420}
1421
796ec776
PM
/* Handle unregistration of an overlay device: destroy its IPIP entry, if
 * it has one.
 */
static void mlxsw_sp_netdevice_ipip_ol_unreg_event(struct mlxsw_sp *mlxsw_sp,
						   struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *entry;

	entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!entry)
		return;

	mlxsw_sp_ipip_entry_destroy(mlxsw_sp, entry);
}
1431
47518ca5
PM
/* The overlay device of @ipip_entry came up: if a matching trap route
 * exists, promote it to a decap route.
 */
static void
mlxsw_sp_ipip_entry_ol_up_event(struct mlxsw_sp *mlxsw_sp,
				struct mlxsw_sp_ipip_entry *ipip_entry)
{
	struct mlxsw_sp_fib_entry *decap;

	decap = mlxsw_sp_ipip_entry_find_decap(mlxsw_sp, ipip_entry);
	if (!decap)
		return;

	mlxsw_sp_ipip_entry_promote_decap(mlxsw_sp, ipip_entry, decap);
}
1443
22b99058 1444static int
3c747500
ND
1445mlxsw_sp_rif_ipip_lb_op(struct mlxsw_sp_rif_ipip_lb *lb_rif, u16 ul_vr_id,
1446 u16 ul_rif_id, bool enable)
22b99058
PM
1447{
1448 struct mlxsw_sp_rif_ipip_lb_config lb_cf = lb_rif->lb_config;
1449 struct mlxsw_sp_rif *rif = &lb_rif->common;
1450 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
1451 char ritr_pl[MLXSW_REG_RITR_LEN];
1452 u32 saddr4;
1453
1454 switch (lb_cf.ul_protocol) {
1455 case MLXSW_SP_L3_PROTO_IPV4:
1456 saddr4 = be32_to_cpu(lb_cf.saddr.addr4);
1457 mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_LOOPBACK_IF,
1458 rif->rif_index, rif->vr_id, rif->dev->mtu);
1459 mlxsw_reg_ritr_loopback_ipip4_pack(ritr_pl, lb_cf.lb_ipipt,
1460 MLXSW_REG_RITR_LOOPBACK_IPIP_OPTIONS_GRE_KEY_PRESET,
3c747500 1461 ul_vr_id, ul_rif_id, saddr4, lb_cf.okey);
22b99058
PM
1462 break;
1463
1464 case MLXSW_SP_L3_PROTO_IPV6:
1465 return -EAFNOSUPPORT;
1466 }
1467
1468 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
1469}
1470
68c3cd92
PM
1471static int mlxsw_sp_netdevice_ipip_ol_update_mtu(struct mlxsw_sp *mlxsw_sp,
1472 struct net_device *ol_dev)
1473{
1474 struct mlxsw_sp_ipip_entry *ipip_entry;
1475 struct mlxsw_sp_rif_ipip_lb *lb_rif;
68c3cd92
PM
1476 int err = 0;
1477
1478 ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
1479 if (ipip_entry) {
1480 lb_rif = ipip_entry->ol_lb;
25f844dd
ND
1481 err = mlxsw_sp_rif_ipip_lb_op(lb_rif, lb_rif->ul_vr_id,
1482 lb_rif->ul_rif_id, true);
68c3cd92
PM
1483 if (err)
1484 goto out;
1485 lb_rif->common.mtu = ol_dev->mtu;
1486 }
1487
1488out:
1489 return err;
1490}
1491
6d4de445
PM
/* Handle an overlay device going up: forward the event to its IPIP entry,
 * if it has one.
 */
static void mlxsw_sp_netdevice_ipip_ol_up_event(struct mlxsw_sp *mlxsw_sp,
						struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *entry;

	entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!entry)
		return;

	mlxsw_sp_ipip_entry_ol_up_event(mlxsw_sp, entry);
}
1501
a3fe198e
PM
1502static void
1503mlxsw_sp_ipip_entry_ol_down_event(struct mlxsw_sp *mlxsw_sp,
1504 struct mlxsw_sp_ipip_entry *ipip_entry)
1505{
1506 if (ipip_entry->decap_fib_entry)
1507 mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
1508}
1509
796ec776
PM
/* Handle an overlay device going down: forward the event to its IPIP
 * entry, if it has one.
 */
static void mlxsw_sp_netdevice_ipip_ol_down_event(struct mlxsw_sp *mlxsw_sp,
						  struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *entry;

	entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!entry)
		return;

	mlxsw_sp_ipip_entry_ol_down_event(mlxsw_sp, entry);
}
1519
09dbf629
PM
1520static void mlxsw_sp_nexthop_rif_migrate(struct mlxsw_sp *mlxsw_sp,
1521 struct mlxsw_sp_rif *old_rif,
1522 struct mlxsw_sp_rif *new_rif);
65a6121b
PM
1523static int
1524mlxsw_sp_ipip_entry_ol_lb_update(struct mlxsw_sp *mlxsw_sp,
1525 struct mlxsw_sp_ipip_entry *ipip_entry,
0c5f1cd5 1526 bool keep_encap,
65a6121b
PM
1527 struct netlink_ext_ack *extack)
1528{
1529 struct mlxsw_sp_rif_ipip_lb *old_lb_rif = ipip_entry->ol_lb;
1530 struct mlxsw_sp_rif_ipip_lb *new_lb_rif;
1531
1532 new_lb_rif = mlxsw_sp_ipip_ol_ipip_lb_create(mlxsw_sp,
1533 ipip_entry->ipipt,
1534 ipip_entry->ol_dev,
1535 extack);
1536 if (IS_ERR(new_lb_rif))
1537 return PTR_ERR(new_lb_rif);
1538 ipip_entry->ol_lb = new_lb_rif;
0c5f1cd5 1539
09dbf629
PM
1540 if (keep_encap)
1541 mlxsw_sp_nexthop_rif_migrate(mlxsw_sp, &old_lb_rif->common,
1542 &new_lb_rif->common);
0c5f1cd5 1543
65a6121b 1544 mlxsw_sp_rif_destroy(&old_lb_rif->common);
f63ce4e5 1545
65a6121b
PM
1546 return 0;
1547}
1548
09dbf629
PM
1549static void mlxsw_sp_nexthop_rif_update(struct mlxsw_sp *mlxsw_sp,
1550 struct mlxsw_sp_rif *rif);
1551
0c5f1cd5
PM
1552/**
1553 * Update the offload related to an IPIP entry. This always updates decap, and
1554 * in addition to that it also:
1555 * @recreate_loopback: recreates the associated loopback RIF
1556 * @keep_encap: updates next hops that use the tunnel netdevice. This is only
1557 * relevant when recreate_loopback is true.
1558 * @update_nexthops: updates next hops, keeping the current loopback RIF. This
1559 * is only relevant when recreate_loopback is false.
1560 */
65a6121b
PM
1561int __mlxsw_sp_ipip_entry_update_tunnel(struct mlxsw_sp *mlxsw_sp,
1562 struct mlxsw_sp_ipip_entry *ipip_entry,
0c5f1cd5
PM
1563 bool recreate_loopback,
1564 bool keep_encap,
1565 bool update_nexthops,
65a6121b
PM
1566 struct netlink_ext_ack *extack)
1567{
1568 int err;
f63ce4e5 1569
65a6121b
PM
1570 /* RIFs can't be edited, so to update loopback, we need to destroy and
1571 * recreate it. That creates a window of opportunity where RALUE and
1572 * RATR registers end up referencing a RIF that's already gone. RATRs
1573 * are handled in mlxsw_sp_ipip_entry_ol_lb_update(), and to take care
f63ce4e5
PM
1574 * of RALUE, demote the decap route back.
1575 */
1576 if (ipip_entry->decap_fib_entry)
1577 mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
1578
0c5f1cd5
PM
1579 if (recreate_loopback) {
1580 err = mlxsw_sp_ipip_entry_ol_lb_update(mlxsw_sp, ipip_entry,
1581 keep_encap, extack);
1582 if (err)
1583 return err;
1584 } else if (update_nexthops) {
1585 mlxsw_sp_nexthop_rif_update(mlxsw_sp,
1586 &ipip_entry->ol_lb->common);
1587 }
65a6121b
PM
1588
1589 if (ipip_entry->ol_dev->flags & IFF_UP)
1590 mlxsw_sp_ipip_entry_ol_up_event(mlxsw_sp, ipip_entry);
f63ce4e5
PM
1591
1592 return 0;
1593}
1594
65a6121b
PM
1595static int mlxsw_sp_netdevice_ipip_ol_vrf_event(struct mlxsw_sp *mlxsw_sp,
1596 struct net_device *ol_dev,
1597 struct netlink_ext_ack *extack)
1598{
1599 struct mlxsw_sp_ipip_entry *ipip_entry =
1600 mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
cab43d9c
PM
1601 enum mlxsw_sp_l3proto ul_proto;
1602 union mlxsw_sp_l3addr saddr;
1603 u32 ul_tb_id;
65a6121b
PM
1604
1605 if (!ipip_entry)
1606 return 0;
cab43d9c
PM
1607
1608 /* For flat configuration cases, moving overlay to a different VRF might
1609 * cause local address conflict, and the conflicting tunnels need to be
1610 * demoted.
1611 */
1612 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ol_dev);
1613 ul_proto = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt]->ul_proto;
1614 saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ol_dev);
1615 if (mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp, ul_proto,
1616 saddr, ul_tb_id,
1617 ipip_entry)) {
1618 mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
1619 return 0;
1620 }
1621
65a6121b 1622 return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
0c5f1cd5 1623 true, false, false, extack);
65a6121b
PM
1624}
1625
61481f2f
PM
1626static int
1627mlxsw_sp_netdevice_ipip_ul_vrf_event(struct mlxsw_sp *mlxsw_sp,
1628 struct mlxsw_sp_ipip_entry *ipip_entry,
1629 struct net_device *ul_dev,
1630 struct netlink_ext_ack *extack)
1631{
1632 return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
1633 true, true, false, extack);
1634}
1635
44b0fff1
PM
1636static int
1637mlxsw_sp_netdevice_ipip_ul_up_event(struct mlxsw_sp *mlxsw_sp,
1638 struct mlxsw_sp_ipip_entry *ipip_entry,
1639 struct net_device *ul_dev)
1640{
1641 return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
1642 false, false, true, NULL);
1643}
1644
1645static int
1646mlxsw_sp_netdevice_ipip_ul_down_event(struct mlxsw_sp *mlxsw_sp,
1647 struct mlxsw_sp_ipip_entry *ipip_entry,
1648 struct net_device *ul_dev)
1649{
1650 /* A down underlay device causes encapsulated packets to not be
1651 * forwarded, but decap still works. So refresh next hops without
1652 * touching anything else.
1653 */
1654 return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
1655 false, false, true, NULL);
1656}
1657
4cf04f3f
PM
1658static int
1659mlxsw_sp_netdevice_ipip_ol_change_event(struct mlxsw_sp *mlxsw_sp,
1660 struct net_device *ol_dev,
1661 struct netlink_ext_ack *extack)
1662{
1663 const struct mlxsw_sp_ipip_ops *ipip_ops;
1664 struct mlxsw_sp_ipip_entry *ipip_entry;
1665 int err;
1666
1667 ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
1668 if (!ipip_entry)
1669 /* A change might make a tunnel eligible for offloading, but
1670 * that is currently not implemented. What falls to slow path
1671 * stays there.
1672 */
1673 return 0;
1674
1675 /* A change might make a tunnel not eligible for offloading. */
1676 if (!mlxsw_sp_netdevice_ipip_can_offload(mlxsw_sp, ol_dev,
1677 ipip_entry->ipipt)) {
1678 mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
1679 return 0;
1680 }
1681
1682 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
1683 err = ipip_ops->ol_netdev_change(mlxsw_sp, ipip_entry, extack);
1684 return err;
1685}
1686
af641713
PM
1687void mlxsw_sp_ipip_entry_demote_tunnel(struct mlxsw_sp *mlxsw_sp,
1688 struct mlxsw_sp_ipip_entry *ipip_entry)
1689{
1690 struct net_device *ol_dev = ipip_entry->ol_dev;
1691
1692 if (ol_dev->flags & IFF_UP)
1693 mlxsw_sp_ipip_entry_ol_down_event(mlxsw_sp, ipip_entry);
1694 mlxsw_sp_ipip_entry_destroy(mlxsw_sp, ipip_entry);
1695}
1696
1697/* The configuration where several tunnels have the same local address in the
1698 * same underlay table needs special treatment in the HW. That is currently not
1699 * implemented in the driver. This function finds and demotes the first tunnel
1700 * with a given source address, except the one passed in in the argument
1701 * `except'.
1702 */
1703bool
1704mlxsw_sp_ipip_demote_tunnel_by_saddr(struct mlxsw_sp *mlxsw_sp,
1705 enum mlxsw_sp_l3proto ul_proto,
1706 union mlxsw_sp_l3addr saddr,
1707 u32 ul_tb_id,
1708 const struct mlxsw_sp_ipip_entry *except)
1709{
1710 struct mlxsw_sp_ipip_entry *ipip_entry, *tmp;
1711
1712 list_for_each_entry_safe(ipip_entry, tmp, &mlxsw_sp->router->ipip_list,
1713 ipip_list_node) {
1714 if (ipip_entry != except &&
1715 mlxsw_sp_ipip_entry_saddr_matches(mlxsw_sp, ul_proto, saddr,
1716 ul_tb_id, ipip_entry)) {
1717 mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
1718 return true;
1719 }
1720 }
1721
1722 return false;
1723}
1724
61481f2f
PM
1725static void mlxsw_sp_ipip_demote_tunnel_by_ul_netdev(struct mlxsw_sp *mlxsw_sp,
1726 struct net_device *ul_dev)
1727{
1728 struct mlxsw_sp_ipip_entry *ipip_entry, *tmp;
1729
1730 list_for_each_entry_safe(ipip_entry, tmp, &mlxsw_sp->router->ipip_list,
1731 ipip_list_node) {
1732 struct net_device *ipip_ul_dev =
1733 __mlxsw_sp_ipip_netdev_ul_dev_get(ipip_entry->ol_dev);
1734
1735 if (ipip_ul_dev == ul_dev)
1736 mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
1737 }
1738}
1739
7e75af63
PM
1740int mlxsw_sp_netdevice_ipip_ol_event(struct mlxsw_sp *mlxsw_sp,
1741 struct net_device *ol_dev,
1742 unsigned long event,
1743 struct netdev_notifier_info *info)
0063587d 1744{
7e75af63
PM
1745 struct netdev_notifier_changeupper_info *chup;
1746 struct netlink_ext_ack *extack;
1747
0063587d
PM
1748 switch (event) {
1749 case NETDEV_REGISTER:
796ec776 1750 return mlxsw_sp_netdevice_ipip_ol_reg_event(mlxsw_sp, ol_dev);
0063587d 1751 case NETDEV_UNREGISTER:
796ec776 1752 mlxsw_sp_netdevice_ipip_ol_unreg_event(mlxsw_sp, ol_dev);
0063587d
PM
1753 return 0;
1754 case NETDEV_UP:
6d4de445
PM
1755 mlxsw_sp_netdevice_ipip_ol_up_event(mlxsw_sp, ol_dev);
1756 return 0;
0063587d 1757 case NETDEV_DOWN:
796ec776 1758 mlxsw_sp_netdevice_ipip_ol_down_event(mlxsw_sp, ol_dev);
0063587d 1759 return 0;
f63ce4e5 1760 case NETDEV_CHANGEUPPER:
7e75af63
PM
1761 chup = container_of(info, typeof(*chup), info);
1762 extack = info->extack;
1763 if (netif_is_l3_master(chup->upper_dev))
796ec776 1764 return mlxsw_sp_netdevice_ipip_ol_vrf_event(mlxsw_sp,
7e75af63
PM
1765 ol_dev,
1766 extack);
f63ce4e5 1767 return 0;
4cf04f3f
PM
1768 case NETDEV_CHANGE:
1769 extack = info->extack;
1770 return mlxsw_sp_netdevice_ipip_ol_change_event(mlxsw_sp,
1771 ol_dev, extack);
68c3cd92
PM
1772 case NETDEV_CHANGEMTU:
1773 return mlxsw_sp_netdevice_ipip_ol_update_mtu(mlxsw_sp, ol_dev);
0063587d
PM
1774 }
1775 return 0;
1776}
1777
61481f2f
PM
1778static int
1779__mlxsw_sp_netdevice_ipip_ul_event(struct mlxsw_sp *mlxsw_sp,
1780 struct mlxsw_sp_ipip_entry *ipip_entry,
1781 struct net_device *ul_dev,
1782 unsigned long event,
1783 struct netdev_notifier_info *info)
1784{
1785 struct netdev_notifier_changeupper_info *chup;
1786 struct netlink_ext_ack *extack;
1787
1788 switch (event) {
1789 case NETDEV_CHANGEUPPER:
1790 chup = container_of(info, typeof(*chup), info);
1791 extack = info->extack;
1792 if (netif_is_l3_master(chup->upper_dev))
1793 return mlxsw_sp_netdevice_ipip_ul_vrf_event(mlxsw_sp,
1794 ipip_entry,
1795 ul_dev,
1796 extack);
1797 break;
44b0fff1
PM
1798
1799 case NETDEV_UP:
1800 return mlxsw_sp_netdevice_ipip_ul_up_event(mlxsw_sp, ipip_entry,
1801 ul_dev);
1802 case NETDEV_DOWN:
1803 return mlxsw_sp_netdevice_ipip_ul_down_event(mlxsw_sp,
1804 ipip_entry,
1805 ul_dev);
61481f2f
PM
1806 }
1807 return 0;
1808}
1809
1810int
1811mlxsw_sp_netdevice_ipip_ul_event(struct mlxsw_sp *mlxsw_sp,
1812 struct net_device *ul_dev,
1813 unsigned long event,
1814 struct netdev_notifier_info *info)
1815{
1816 struct mlxsw_sp_ipip_entry *ipip_entry = NULL;
1817 int err;
1818
1819 while ((ipip_entry = mlxsw_sp_ipip_entry_find_by_ul_dev(mlxsw_sp,
1820 ul_dev,
1821 ipip_entry))) {
1822 err = __mlxsw_sp_netdevice_ipip_ul_event(mlxsw_sp, ipip_entry,
1823 ul_dev, event, info);
1824 if (err) {
1825 mlxsw_sp_ipip_demote_tunnel_by_ul_netdev(mlxsw_sp,
1826 ul_dev);
1827 return err;
1828 }
1829 }
1830
1831 return 0;
1832}
1833
0c69e0fc
IS
1834int mlxsw_sp_router_nve_promote_decap(struct mlxsw_sp *mlxsw_sp, u32 ul_tb_id,
1835 enum mlxsw_sp_l3proto ul_proto,
1836 const union mlxsw_sp_l3addr *ul_sip,
1837 u32 tunnel_index)
1838{
1839 enum mlxsw_sp_fib_entry_type type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
1840 struct mlxsw_sp_fib_entry *fib_entry;
1841 int err;
1842
1843 /* It is valid to create a tunnel with a local IP and only later
1844 * assign this IP address to a local interface
1845 */
1846 fib_entry = mlxsw_sp_router_ip2me_fib_entry_find(mlxsw_sp, ul_tb_id,
1847 ul_proto, ul_sip,
1848 type);
1849 if (!fib_entry)
1850 return 0;
1851
1852 fib_entry->decap.tunnel_index = tunnel_index;
1853 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP;
1854
1855 err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
1856 if (err)
1857 goto err_fib_entry_update;
1858
1859 return 0;
1860
1861err_fib_entry_update:
1862 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
1863 mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
1864 return err;
1865}
1866
1867void mlxsw_sp_router_nve_demote_decap(struct mlxsw_sp *mlxsw_sp, u32 ul_tb_id,
1868 enum mlxsw_sp_l3proto ul_proto,
1869 const union mlxsw_sp_l3addr *ul_sip)
1870{
1871 enum mlxsw_sp_fib_entry_type type = MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP;
1872 struct mlxsw_sp_fib_entry *fib_entry;
1873
1874 fib_entry = mlxsw_sp_router_ip2me_fib_entry_find(mlxsw_sp, ul_tb_id,
1875 ul_proto, ul_sip,
1876 type);
1877 if (!fib_entry)
1878 return;
1879
1880 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
1881 mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
1882}
1883
/* Hash key of a neighbour entry: the kernel neighbour pointer itself. */
struct mlxsw_sp_neigh_key {
	struct neighbour *n;	/* kernel neighbour this entry mirrors */
};
1887
1888struct mlxsw_sp_neigh_entry {
9665b745 1889 struct list_head rif_list_node;
6cf3c971
JP
1890 struct rhash_head ht_node;
1891 struct mlxsw_sp_neigh_key key;
1892 u16 rif;
5c8802f1 1893 bool connected;
a6bf9e93 1894 unsigned char ha[ETH_ALEN];
a7ff87ac
JP
1895 struct list_head nexthop_list; /* list of nexthops using
1896 * this neigh entry
1897 */
b2157149 1898 struct list_head nexthop_neighs_list_node;
7cfcbc75
AS
1899 unsigned int counter_index;
1900 bool counter_valid;
6cf3c971
JP
1901};
1902
1903static const struct rhashtable_params mlxsw_sp_neigh_ht_params = {
1904 .key_offset = offsetof(struct mlxsw_sp_neigh_entry, key),
1905 .head_offset = offsetof(struct mlxsw_sp_neigh_entry, ht_node),
1906 .key_len = sizeof(struct mlxsw_sp_neigh_key),
1907};
1908
f17cc84d
AS
1909struct mlxsw_sp_neigh_entry *
1910mlxsw_sp_rif_neigh_next(struct mlxsw_sp_rif *rif,
1911 struct mlxsw_sp_neigh_entry *neigh_entry)
1912{
1913 if (!neigh_entry) {
1914 if (list_empty(&rif->neigh_list))
1915 return NULL;
1916 else
1917 return list_first_entry(&rif->neigh_list,
1918 typeof(*neigh_entry),
1919 rif_list_node);
1920 }
ec2437f4 1921 if (list_is_last(&neigh_entry->rif_list_node, &rif->neigh_list))
f17cc84d
AS
1922 return NULL;
1923 return list_next_entry(neigh_entry, rif_list_node);
1924}
1925
1926int mlxsw_sp_neigh_entry_type(struct mlxsw_sp_neigh_entry *neigh_entry)
1927{
1928 return neigh_entry->key.n->tbl->family;
1929}
1930
1931unsigned char *
1932mlxsw_sp_neigh_entry_ha(struct mlxsw_sp_neigh_entry *neigh_entry)
1933{
1934 return neigh_entry->ha;
1935}
1936
1937u32 mlxsw_sp_neigh4_entry_dip(struct mlxsw_sp_neigh_entry *neigh_entry)
1938{
1939 struct neighbour *n;
1940
1941 n = neigh_entry->key.n;
1942 return ntohl(*((__be32 *) n->primary_key));
1943}
1944
0250768c
AS
1945struct in6_addr *
1946mlxsw_sp_neigh6_entry_dip(struct mlxsw_sp_neigh_entry *neigh_entry)
1947{
1948 struct neighbour *n;
1949
1950 n = neigh_entry->key.n;
1951 return (struct in6_addr *) &n->primary_key;
1952}
1953
7cfcbc75
AS
1954int mlxsw_sp_neigh_counter_get(struct mlxsw_sp *mlxsw_sp,
1955 struct mlxsw_sp_neigh_entry *neigh_entry,
1956 u64 *p_counter)
1957{
1958 if (!neigh_entry->counter_valid)
1959 return -EINVAL;
1960
1961 return mlxsw_sp_flow_counter_get(mlxsw_sp, neigh_entry->counter_index,
1962 p_counter, NULL);
1963}
1964
6cf3c971 1965static struct mlxsw_sp_neigh_entry *
5c8802f1
IS
1966mlxsw_sp_neigh_entry_alloc(struct mlxsw_sp *mlxsw_sp, struct neighbour *n,
1967 u16 rif)
6cf3c971
JP
1968{
1969 struct mlxsw_sp_neigh_entry *neigh_entry;
1970
5c8802f1 1971 neigh_entry = kzalloc(sizeof(*neigh_entry), GFP_KERNEL);
6cf3c971
JP
1972 if (!neigh_entry)
1973 return NULL;
5c8802f1 1974
33b1341c 1975 neigh_entry->key.n = n;
6cf3c971 1976 neigh_entry->rif = rif;
a7ff87ac 1977 INIT_LIST_HEAD(&neigh_entry->nexthop_list);
5c8802f1 1978
6cf3c971
JP
1979 return neigh_entry;
1980}
1981
/* Release the memory of @neigh_entry. Nothing else is undone here; the
 * entry is simply handed to kfree().
 */
static void mlxsw_sp_neigh_entry_free(struct mlxsw_sp_neigh_entry *neigh_entry)
{
	kfree(neigh_entry);
}
1986
5c8802f1
IS
1987static int
1988mlxsw_sp_neigh_entry_insert(struct mlxsw_sp *mlxsw_sp,
1989 struct mlxsw_sp_neigh_entry *neigh_entry)
6cf3c971 1990{
9011b677 1991 return rhashtable_insert_fast(&mlxsw_sp->router->neigh_ht,
5c8802f1
IS
1992 &neigh_entry->ht_node,
1993 mlxsw_sp_neigh_ht_params);
1994}
6cf3c971 1995
5c8802f1
IS
1996static void
1997mlxsw_sp_neigh_entry_remove(struct mlxsw_sp *mlxsw_sp,
1998 struct mlxsw_sp_neigh_entry *neigh_entry)
1999{
9011b677 2000 rhashtable_remove_fast(&mlxsw_sp->router->neigh_ht,
5c8802f1
IS
2001 &neigh_entry->ht_node,
2002 mlxsw_sp_neigh_ht_params);
6cf3c971
JP
2003}
2004
7cfcbc75 2005static bool
1ed5574c
AS
2006mlxsw_sp_neigh_counter_should_alloc(struct mlxsw_sp *mlxsw_sp,
2007 struct mlxsw_sp_neigh_entry *neigh_entry)
7cfcbc75
AS
2008{
2009 struct devlink *devlink;
1ed5574c
AS
2010 const char *table_name;
2011
2012 switch (mlxsw_sp_neigh_entry_type(neigh_entry)) {
2013 case AF_INET:
2014 table_name = MLXSW_SP_DPIPE_TABLE_NAME_HOST4;
2015 break;
2016 case AF_INET6:
2017 table_name = MLXSW_SP_DPIPE_TABLE_NAME_HOST6;
2018 break;
2019 default:
2020 WARN_ON(1);
2021 return false;
2022 }
7cfcbc75
AS
2023
2024 devlink = priv_to_devlink(mlxsw_sp->core);
1ed5574c 2025 return devlink_dpipe_table_counter_enabled(devlink, table_name);
7cfcbc75
AS
2026}
2027
2028static void
2029mlxsw_sp_neigh_counter_alloc(struct mlxsw_sp *mlxsw_sp,
2030 struct mlxsw_sp_neigh_entry *neigh_entry)
2031{
1ed5574c 2032 if (!mlxsw_sp_neigh_counter_should_alloc(mlxsw_sp, neigh_entry))
7cfcbc75
AS
2033 return;
2034
2035 if (mlxsw_sp_flow_counter_alloc(mlxsw_sp, &neigh_entry->counter_index))
2036 return;
2037
2038 neigh_entry->counter_valid = true;
2039}
2040
2041static void
2042mlxsw_sp_neigh_counter_free(struct mlxsw_sp *mlxsw_sp,
2043 struct mlxsw_sp_neigh_entry *neigh_entry)
2044{
2045 if (!neigh_entry->counter_valid)
2046 return;
2047 mlxsw_sp_flow_counter_free(mlxsw_sp,
2048 neigh_entry->counter_index);
2049 neigh_entry->counter_valid = false;
2050}
2051
5c8802f1
IS
2052static struct mlxsw_sp_neigh_entry *
2053mlxsw_sp_neigh_entry_create(struct mlxsw_sp *mlxsw_sp, struct neighbour *n)
6cf3c971 2054{
6cf3c971 2055 struct mlxsw_sp_neigh_entry *neigh_entry;
bf95233e 2056 struct mlxsw_sp_rif *rif;
6cf3c971
JP
2057 int err;
2058
bf95233e
AS
2059 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, n->dev);
2060 if (!rif)
5c8802f1 2061 return ERR_PTR(-EINVAL);
6cf3c971 2062
bf95233e 2063 neigh_entry = mlxsw_sp_neigh_entry_alloc(mlxsw_sp, n, rif->rif_index);
6cf3c971 2064 if (!neigh_entry)
5c8802f1
IS
2065 return ERR_PTR(-ENOMEM);
2066
6cf3c971
JP
2067 err = mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry);
2068 if (err)
2069 goto err_neigh_entry_insert;
5c8802f1 2070
7cfcbc75 2071 mlxsw_sp_neigh_counter_alloc(mlxsw_sp, neigh_entry);
bf95233e 2072 list_add(&neigh_entry->rif_list_node, &rif->neigh_list);
9665b745 2073
5c8802f1 2074 return neigh_entry;
6cf3c971
JP
2075
2076err_neigh_entry_insert:
5c8802f1
IS
2077 mlxsw_sp_neigh_entry_free(neigh_entry);
2078 return ERR_PTR(err);
6cf3c971
JP
2079}
2080
5c8802f1
IS
2081static void
2082mlxsw_sp_neigh_entry_destroy(struct mlxsw_sp *mlxsw_sp,
2083 struct mlxsw_sp_neigh_entry *neigh_entry)
6cf3c971 2084{
9665b745 2085 list_del(&neigh_entry->rif_list_node);
7cfcbc75 2086 mlxsw_sp_neigh_counter_free(mlxsw_sp, neigh_entry);
5c8802f1
IS
2087 mlxsw_sp_neigh_entry_remove(mlxsw_sp, neigh_entry);
2088 mlxsw_sp_neigh_entry_free(neigh_entry);
2089}
6cf3c971 2090
5c8802f1
IS
2091static struct mlxsw_sp_neigh_entry *
2092mlxsw_sp_neigh_entry_lookup(struct mlxsw_sp *mlxsw_sp, struct neighbour *n)
2093{
2094 struct mlxsw_sp_neigh_key key;
6cf3c971 2095
5c8802f1 2096 key.n = n;
9011b677 2097 return rhashtable_lookup_fast(&mlxsw_sp->router->neigh_ht,
5c8802f1 2098 &key, mlxsw_sp_neigh_ht_params);
6cf3c971
JP
2099}
2100
c723c735
YG
2101static void
2102mlxsw_sp_router_neighs_update_interval_init(struct mlxsw_sp *mlxsw_sp)
2103{
a6c9b5d1 2104 unsigned long interval;
c723c735 2105
b5f3e0d4 2106#if IS_ENABLED(CONFIG_IPV6)
a6c9b5d1
AS
2107 interval = min_t(unsigned long,
2108 NEIGH_VAR(&arp_tbl.parms, DELAY_PROBE_TIME),
2109 NEIGH_VAR(&nd_tbl.parms, DELAY_PROBE_TIME));
b5f3e0d4
IS
2110#else
2111 interval = NEIGH_VAR(&arp_tbl.parms, DELAY_PROBE_TIME);
2112#endif
9011b677 2113 mlxsw_sp->router->neighs_update.interval = jiffies_to_msecs(interval);
c723c735
YG
2114}
2115
2116static void mlxsw_sp_router_neigh_ent_ipv4_process(struct mlxsw_sp *mlxsw_sp,
2117 char *rauhtd_pl,
2118 int ent_index)
2119{
2120 struct net_device *dev;
2121 struct neighbour *n;
2122 __be32 dipn;
2123 u32 dip;
2124 u16 rif;
2125
2126 mlxsw_reg_rauhtd_ent_ipv4_unpack(rauhtd_pl, ent_index, &rif, &dip);
2127
5f9efffb 2128 if (!mlxsw_sp->router->rifs[rif]) {
c723c735
YG
2129 dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Incorrect RIF in neighbour entry\n");
2130 return;
2131 }
2132
2133 dipn = htonl(dip);
5f9efffb 2134 dev = mlxsw_sp->router->rifs[rif]->dev;
c723c735 2135 n = neigh_lookup(&arp_tbl, &dipn, dev);
1ecdaea0 2136 if (!n)
c723c735 2137 return;
c723c735
YG
2138
2139 netdev_dbg(dev, "Updating neighbour with IP=%pI4h\n", &dip);
2140 neigh_event_send(n, NULL);
2141 neigh_release(n);
2142}
2143
df9a21f1 2144#if IS_ENABLED(CONFIG_IPV6)
60f040ca
AS
2145static void mlxsw_sp_router_neigh_ent_ipv6_process(struct mlxsw_sp *mlxsw_sp,
2146 char *rauhtd_pl,
2147 int rec_index)
2148{
2149 struct net_device *dev;
2150 struct neighbour *n;
2151 struct in6_addr dip;
2152 u16 rif;
2153
2154 mlxsw_reg_rauhtd_ent_ipv6_unpack(rauhtd_pl, rec_index, &rif,
2155 (char *) &dip);
2156
2157 if (!mlxsw_sp->router->rifs[rif]) {
2158 dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Incorrect RIF in neighbour entry\n");
2159 return;
2160 }
2161
2162 dev = mlxsw_sp->router->rifs[rif]->dev;
2163 n = neigh_lookup(&nd_tbl, &dip, dev);
1ecdaea0 2164 if (!n)
60f040ca 2165 return;
60f040ca
AS
2166
2167 netdev_dbg(dev, "Updating neighbour with IP=%pI6c\n", &dip);
2168 neigh_event_send(n, NULL);
2169 neigh_release(n);
2170}
b5f3e0d4
IS
2171#else
2172static void mlxsw_sp_router_neigh_ent_ipv6_process(struct mlxsw_sp *mlxsw_sp,
2173 char *rauhtd_pl,
2174 int rec_index)
2175{
2176}
2177#endif
60f040ca 2178
c723c735
YG
2179static void mlxsw_sp_router_neigh_rec_ipv4_process(struct mlxsw_sp *mlxsw_sp,
2180 char *rauhtd_pl,
2181 int rec_index)
2182{
2183 u8 num_entries;
2184 int i;
2185
2186 num_entries = mlxsw_reg_rauhtd_ipv4_rec_num_entries_get(rauhtd_pl,
2187 rec_index);
2188 /* Hardware starts counting at 0, so add 1. */
2189 num_entries++;
2190
2191 /* Each record consists of several neighbour entries. */
2192 for (i = 0; i < num_entries; i++) {
2193 int ent_index;
2194
2195 ent_index = rec_index * MLXSW_REG_RAUHTD_IPV4_ENT_PER_REC + i;
2196 mlxsw_sp_router_neigh_ent_ipv4_process(mlxsw_sp, rauhtd_pl,
2197 ent_index);
2198 }
2199
2200}
2201
60f040ca
AS
/* Process the IPv6 record at @rec_index of a RAUHTD dump. An IPv6 record
 * holds exactly one entry, so the record index doubles as the entry index.
 */
static void mlxsw_sp_router_neigh_rec_ipv6_process(struct mlxsw_sp *mlxsw_sp,
						   char *rauhtd_pl,
						   int rec_index)
{
	mlxsw_sp_router_neigh_ent_ipv6_process(mlxsw_sp, rauhtd_pl, rec_index);
}
2210
c723c735
YG
2211static void mlxsw_sp_router_neigh_rec_process(struct mlxsw_sp *mlxsw_sp,
2212 char *rauhtd_pl, int rec_index)
2213{
2214 switch (mlxsw_reg_rauhtd_rec_type_get(rauhtd_pl, rec_index)) {
2215 case MLXSW_REG_RAUHTD_TYPE_IPV4:
2216 mlxsw_sp_router_neigh_rec_ipv4_process(mlxsw_sp, rauhtd_pl,
2217 rec_index);
2218 break;
2219 case MLXSW_REG_RAUHTD_TYPE_IPV6:
60f040ca
AS
2220 mlxsw_sp_router_neigh_rec_ipv6_process(mlxsw_sp, rauhtd_pl,
2221 rec_index);
c723c735
YG
2222 break;
2223 }
2224}
2225
42cdb338
AS
2226static bool mlxsw_sp_router_rauhtd_is_full(char *rauhtd_pl)
2227{
2228 u8 num_rec, last_rec_index, num_entries;
2229
2230 num_rec = mlxsw_reg_rauhtd_num_rec_get(rauhtd_pl);
2231 last_rec_index = num_rec - 1;
2232
2233 if (num_rec < MLXSW_REG_RAUHTD_REC_MAX_NUM)
2234 return false;
2235 if (mlxsw_reg_rauhtd_rec_type_get(rauhtd_pl, last_rec_index) ==
2236 MLXSW_REG_RAUHTD_TYPE_IPV6)
2237 return true;
2238
2239 num_entries = mlxsw_reg_rauhtd_ipv4_rec_num_entries_get(rauhtd_pl,
2240 last_rec_index);
2241 if (++num_entries == MLXSW_REG_RAUHTD_IPV4_ENT_PER_REC)
2242 return true;
2243 return false;
2244}
2245
60f040ca
AS
2246static int
2247__mlxsw_sp_router_neighs_update_rauhtd(struct mlxsw_sp *mlxsw_sp,
2248 char *rauhtd_pl,
2249 enum mlxsw_reg_rauhtd_type type)
c723c735 2250{
60f040ca
AS
2251 int i, num_rec;
2252 int err;
c723c735
YG
2253
2254 /* Make sure the neighbour's netdev isn't removed in the
2255 * process.
2256 */
2257 rtnl_lock();
2258 do {
60f040ca 2259 mlxsw_reg_rauhtd_pack(rauhtd_pl, type);
c723c735
YG
2260 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(rauhtd),
2261 rauhtd_pl);
2262 if (err) {
7ff176f8 2263 dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Failed to dump neighbour table\n");
c723c735
YG
2264 break;
2265 }
2266 num_rec = mlxsw_reg_rauhtd_num_rec_get(rauhtd_pl);
2267 for (i = 0; i < num_rec; i++)
2268 mlxsw_sp_router_neigh_rec_process(mlxsw_sp, rauhtd_pl,
2269 i);
42cdb338 2270 } while (mlxsw_sp_router_rauhtd_is_full(rauhtd_pl));
c723c735
YG
2271 rtnl_unlock();
2272
60f040ca
AS
2273 return err;
2274}
2275
2276static int mlxsw_sp_router_neighs_update_rauhtd(struct mlxsw_sp *mlxsw_sp)
2277{
2278 enum mlxsw_reg_rauhtd_type type;
2279 char *rauhtd_pl;
2280 int err;
2281
2282 rauhtd_pl = kmalloc(MLXSW_REG_RAUHTD_LEN, GFP_KERNEL);
2283 if (!rauhtd_pl)
2284 return -ENOMEM;
2285
2286 type = MLXSW_REG_RAUHTD_TYPE_IPV4;
2287 err = __mlxsw_sp_router_neighs_update_rauhtd(mlxsw_sp, rauhtd_pl, type);
2288 if (err)
2289 goto out;
2290
2291 type = MLXSW_REG_RAUHTD_TYPE_IPV6;
2292 err = __mlxsw_sp_router_neighs_update_rauhtd(mlxsw_sp, rauhtd_pl, type);
2293out:
c723c735 2294 kfree(rauhtd_pl);
b2157149
YG
2295 return err;
2296}
2297
2298static void mlxsw_sp_router_neighs_update_nh(struct mlxsw_sp *mlxsw_sp)
2299{
2300 struct mlxsw_sp_neigh_entry *neigh_entry;
2301
2302 /* Take RTNL mutex here to prevent lists from changes */
2303 rtnl_lock();
9011b677 2304 list_for_each_entry(neigh_entry, &mlxsw_sp->router->nexthop_neighs_list,
8a0b7275 2305 nexthop_neighs_list_node)
b2157149
YG
2306 /* If this neigh have nexthops, make the kernel think this neigh
2307 * is active regardless of the traffic.
2308 */
8a0b7275 2309 neigh_event_send(neigh_entry->key.n, NULL);
b2157149
YG
2310 rtnl_unlock();
2311}
2312
2313static void
2314mlxsw_sp_router_neighs_update_work_schedule(struct mlxsw_sp *mlxsw_sp)
2315{
9011b677 2316 unsigned long interval = mlxsw_sp->router->neighs_update.interval;
b2157149 2317
9011b677 2318 mlxsw_core_schedule_dw(&mlxsw_sp->router->neighs_update.dw,
b2157149
YG
2319 msecs_to_jiffies(interval));
2320}
2321
2322static void mlxsw_sp_router_neighs_update_work(struct work_struct *work)
2323{
9011b677 2324 struct mlxsw_sp_router *router;
b2157149
YG
2325 int err;
2326
9011b677
IS
2327 router = container_of(work, struct mlxsw_sp_router,
2328 neighs_update.dw.work);
2329 err = mlxsw_sp_router_neighs_update_rauhtd(router->mlxsw_sp);
b2157149 2330 if (err)
9011b677 2331 dev_err(router->mlxsw_sp->bus_info->dev, "Could not update kernel for neigh activity");
b2157149 2332
9011b677 2333 mlxsw_sp_router_neighs_update_nh(router->mlxsw_sp);
b2157149 2334
9011b677 2335 mlxsw_sp_router_neighs_update_work_schedule(router->mlxsw_sp);
c723c735
YG
2336}
2337
0b2361d9
YG
2338static void mlxsw_sp_router_probe_unresolved_nexthops(struct work_struct *work)
2339{
2340 struct mlxsw_sp_neigh_entry *neigh_entry;
9011b677 2341 struct mlxsw_sp_router *router;
0b2361d9 2342
9011b677
IS
2343 router = container_of(work, struct mlxsw_sp_router,
2344 nexthop_probe_dw.work);
0b2361d9
YG
2345 /* Iterate over nexthop neighbours, find those who are unresolved and
2346 * send arp on them. This solves the chicken-egg problem when
2347 * the nexthop wouldn't get offloaded until the neighbor is resolved
2348 * but it wouldn't get resolved ever in case traffic is flowing in HW
2349 * using different nexthop.
2350 *
2351 * Take RTNL mutex here to prevent lists from changes.
2352 */
2353 rtnl_lock();
9011b677 2354 list_for_each_entry(neigh_entry, &router->nexthop_neighs_list,
8a0b7275 2355 nexthop_neighs_list_node)
01b1aa35 2356 if (!neigh_entry->connected)
33b1341c 2357 neigh_event_send(neigh_entry->key.n, NULL);
0b2361d9
YG
2358 rtnl_unlock();
2359
9011b677 2360 mlxsw_core_schedule_dw(&router->nexthop_probe_dw,
0b2361d9
YG
2361 MLXSW_SP_UNRESOLVED_NH_PROBE_INTERVAL);
2362}
2363
a7ff87ac
JP
2364static void
2365mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp,
2366 struct mlxsw_sp_neigh_entry *neigh_entry,
83d57826 2367 bool removing, bool dead);
a7ff87ac 2368
5c8802f1
IS
2369static enum mlxsw_reg_rauht_op mlxsw_sp_rauht_op(bool adding)
2370{
2371 return adding ? MLXSW_REG_RAUHT_OP_WRITE_ADD :
2372 MLXSW_REG_RAUHT_OP_WRITE_DELETE;
2373}
2374
a85e84e0 2375static int
5c8802f1
IS
2376mlxsw_sp_router_neigh_entry_op4(struct mlxsw_sp *mlxsw_sp,
2377 struct mlxsw_sp_neigh_entry *neigh_entry,
2378 enum mlxsw_reg_rauht_op op)
a6bf9e93 2379{
33b1341c 2380 struct neighbour *n = neigh_entry->key.n;
5c8802f1 2381 u32 dip = ntohl(*((__be32 *) n->primary_key));
a6bf9e93 2382 char rauht_pl[MLXSW_REG_RAUHT_LEN];
5c8802f1
IS
2383
2384 mlxsw_reg_rauht_pack4(rauht_pl, op, neigh_entry->rif, neigh_entry->ha,
2385 dip);
7cfcbc75
AS
2386 if (neigh_entry->counter_valid)
2387 mlxsw_reg_rauht_pack_counter(rauht_pl,
2388 neigh_entry->counter_index);
a85e84e0 2389 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rauht), rauht_pl);
5c8802f1
IS
2390}
2391
a85e84e0 2392static int
d5eb89cf
AS
2393mlxsw_sp_router_neigh_entry_op6(struct mlxsw_sp *mlxsw_sp,
2394 struct mlxsw_sp_neigh_entry *neigh_entry,
2395 enum mlxsw_reg_rauht_op op)
2396{
2397 struct neighbour *n = neigh_entry->key.n;
2398 char rauht_pl[MLXSW_REG_RAUHT_LEN];
2399 const char *dip = n->primary_key;
2400
2401 mlxsw_reg_rauht_pack6(rauht_pl, op, neigh_entry->rif, neigh_entry->ha,
2402 dip);
7cfcbc75
AS
2403 if (neigh_entry->counter_valid)
2404 mlxsw_reg_rauht_pack_counter(rauht_pl,
2405 neigh_entry->counter_index);
a85e84e0 2406 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rauht), rauht_pl);
d5eb89cf
AS
2407}
2408
1d1056d8 2409bool mlxsw_sp_neigh_ipv6_ignore(struct mlxsw_sp_neigh_entry *neigh_entry)
d5eb89cf 2410{
1d1056d8
AS
2411 struct neighbour *n = neigh_entry->key.n;
2412
d5eb89cf
AS
2413 /* Packets with a link-local destination address are trapped
2414 * after LPM lookup and never reach the neighbour table, so
2415 * there is no need to program such neighbours to the device.
2416 */
2417 if (ipv6_addr_type((struct in6_addr *) &n->primary_key) &
2418 IPV6_ADDR_LINKLOCAL)
2419 return true;
2420 return false;
2421}
2422
5c8802f1
IS
2423static void
2424mlxsw_sp_neigh_entry_update(struct mlxsw_sp *mlxsw_sp,
2425 struct mlxsw_sp_neigh_entry *neigh_entry,
2426 bool adding)
2427{
a85e84e0
IS
2428 enum mlxsw_reg_rauht_op op = mlxsw_sp_rauht_op(adding);
2429 int err;
2430
5c8802f1
IS
2431 if (!adding && !neigh_entry->connected)
2432 return;
2433 neigh_entry->connected = adding;
b5f3e0d4 2434 if (neigh_entry->key.n->tbl->family == AF_INET) {
a85e84e0
IS
2435 err = mlxsw_sp_router_neigh_entry_op4(mlxsw_sp, neigh_entry,
2436 op);
2437 if (err)
2438 return;
b5f3e0d4 2439 } else if (neigh_entry->key.n->tbl->family == AF_INET6) {
1d1056d8 2440 if (mlxsw_sp_neigh_ipv6_ignore(neigh_entry))
d5eb89cf 2441 return;
a85e84e0
IS
2442 err = mlxsw_sp_router_neigh_entry_op6(mlxsw_sp, neigh_entry,
2443 op);
2444 if (err)
2445 return;
d5eb89cf 2446 } else {
5c8802f1 2447 WARN_ON_ONCE(1);
caf345a1 2448 return;
d5eb89cf 2449 }
caf345a1
IS
2450
2451 if (adding)
2452 neigh_entry->key.n->flags |= NTF_OFFLOADED;
2453 else
2454 neigh_entry->key.n->flags &= ~NTF_OFFLOADED;
5c8802f1
IS
2455}
2456
a481d713
AS
2457void
2458mlxsw_sp_neigh_entry_counter_update(struct mlxsw_sp *mlxsw_sp,
2459 struct mlxsw_sp_neigh_entry *neigh_entry,
2460 bool adding)
2461{
2462 if (adding)
2463 mlxsw_sp_neigh_counter_alloc(mlxsw_sp, neigh_entry);
2464 else
2465 mlxsw_sp_neigh_counter_free(mlxsw_sp, neigh_entry);
2466 mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, true);
2467}
2468
ceb8881d 2469struct mlxsw_sp_netevent_work {
5c8802f1
IS
2470 struct work_struct work;
2471 struct mlxsw_sp *mlxsw_sp;
2472 struct neighbour *n;
2473};
2474
2475static void mlxsw_sp_router_neigh_event_work(struct work_struct *work)
2476{
ceb8881d
IS
2477 struct mlxsw_sp_netevent_work *net_work =
2478 container_of(work, struct mlxsw_sp_netevent_work, work);
2479 struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp;
5c8802f1 2480 struct mlxsw_sp_neigh_entry *neigh_entry;
ceb8881d 2481 struct neighbour *n = net_work->n;
5c8802f1 2482 unsigned char ha[ETH_ALEN];
a6bf9e93 2483 bool entry_connected;
93a87e5e 2484 u8 nud_state, dead;
a6bf9e93 2485
5c8802f1
IS
2486 /* If these parameters are changed after we release the lock,
2487 * then we are guaranteed to receive another event letting us
2488 * know about it.
2489 */
a6bf9e93 2490 read_lock_bh(&n->lock);
5c8802f1 2491 memcpy(ha, n->ha, ETH_ALEN);
a6bf9e93 2492 nud_state = n->nud_state;
93a87e5e 2493 dead = n->dead;
a6bf9e93
YG
2494 read_unlock_bh(&n->lock);
2495
5c8802f1 2496 rtnl_lock();
803335ac
PM
2497 mlxsw_sp_span_respin(mlxsw_sp);
2498
93a87e5e 2499 entry_connected = nud_state & NUD_VALID && !dead;
5c8802f1
IS
2500 neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, n);
2501 if (!entry_connected && !neigh_entry)
2502 goto out;
2503 if (!neigh_entry) {
2504 neigh_entry = mlxsw_sp_neigh_entry_create(mlxsw_sp, n);
2505 if (IS_ERR(neigh_entry))
2506 goto out;
a6bf9e93
YG
2507 }
2508
5c8802f1
IS
2509 memcpy(neigh_entry->ha, ha, ETH_ALEN);
2510 mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, entry_connected);
83d57826
IS
2511 mlxsw_sp_nexthop_neigh_update(mlxsw_sp, neigh_entry, !entry_connected,
2512 dead);
5c8802f1
IS
2513
2514 if (!neigh_entry->connected && list_empty(&neigh_entry->nexthop_list))
2515 mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry);
2516
2517out:
2518 rtnl_unlock();
a6bf9e93 2519 neigh_release(n);
ceb8881d 2520 kfree(net_work);
a6bf9e93
YG
2521}
2522
28678f07
IS
2523static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp);
2524
2525static void mlxsw_sp_router_mp_hash_event_work(struct work_struct *work)
2526{
2527 struct mlxsw_sp_netevent_work *net_work =
2528 container_of(work, struct mlxsw_sp_netevent_work, work);
2529 struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp;
2530
2531 mlxsw_sp_mp_hash_init(mlxsw_sp);
2532 kfree(net_work);
2533}
2534
64953423
PM
2535static int __mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp);
2536
2537static void mlxsw_sp_router_update_priority_work(struct work_struct *work)
2538{
2539 struct mlxsw_sp_netevent_work *net_work =
2540 container_of(work, struct mlxsw_sp_netevent_work, work);
2541 struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp;
2542
2543 __mlxsw_sp_router_init(mlxsw_sp);
2544 kfree(net_work);
2545}
2546
1f65a33f
PM
2547static int mlxsw_sp_router_schedule_work(struct net *net,
2548 struct notifier_block *nb,
2549 void (*cb)(struct work_struct *))
2550{
2551 struct mlxsw_sp_netevent_work *net_work;
2552 struct mlxsw_sp_router *router;
2553
2554 if (!net_eq(net, &init_net))
2555 return NOTIFY_DONE;
2556
2557 net_work = kzalloc(sizeof(*net_work), GFP_ATOMIC);
2558 if (!net_work)
2559 return NOTIFY_BAD;
2560
2561 router = container_of(nb, struct mlxsw_sp_router, netevent_nb);
2562 INIT_WORK(&net_work->work, cb);
2563 net_work->mlxsw_sp = router->mlxsw_sp;
2564 mlxsw_core_schedule_work(&net_work->work);
2565 return NOTIFY_DONE;
2566}
2567
28678f07 2568static int mlxsw_sp_router_netevent_event(struct notifier_block *nb,
48fac885 2569 unsigned long event, void *ptr)
c723c735 2570{
ceb8881d 2571 struct mlxsw_sp_netevent_work *net_work;
c723c735
YG
2572 struct mlxsw_sp_port *mlxsw_sp_port;
2573 struct mlxsw_sp *mlxsw_sp;
2574 unsigned long interval;
2575 struct neigh_parms *p;
a6bf9e93 2576 struct neighbour *n;
c723c735
YG
2577
2578 switch (event) {
2579 case NETEVENT_DELAY_PROBE_TIME_UPDATE:
2580 p = ptr;
2581
2582 /* We don't care about changes in the default table. */
b5f3e0d4
IS
2583 if (!p->dev || (p->tbl->family != AF_INET &&
2584 p->tbl->family != AF_INET6))
c723c735
YG
2585 return NOTIFY_DONE;
2586
2587 /* We are in atomic context and can't take RTNL mutex,
2588 * so use RCU variant to walk the device chain.
2589 */
2590 mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(p->dev);
2591 if (!mlxsw_sp_port)
2592 return NOTIFY_DONE;
2593
2594 mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
2595 interval = jiffies_to_msecs(NEIGH_VAR(p, DELAY_PROBE_TIME));
9011b677 2596 mlxsw_sp->router->neighs_update.interval = interval;
c723c735
YG
2597
2598 mlxsw_sp_port_dev_put(mlxsw_sp_port);
2599 break;
a6bf9e93
YG
2600 case NETEVENT_NEIGH_UPDATE:
2601 n = ptr;
a6bf9e93 2602
b5f3e0d4 2603 if (n->tbl->family != AF_INET && n->tbl->family != AF_INET6)
a6bf9e93
YG
2604 return NOTIFY_DONE;
2605
5c8802f1 2606 mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(n->dev);
a6bf9e93
YG
2607 if (!mlxsw_sp_port)
2608 return NOTIFY_DONE;
2609
ceb8881d
IS
2610 net_work = kzalloc(sizeof(*net_work), GFP_ATOMIC);
2611 if (!net_work) {
a6bf9e93 2612 mlxsw_sp_port_dev_put(mlxsw_sp_port);
5c8802f1 2613 return NOTIFY_BAD;
a6bf9e93 2614 }
5c8802f1 2615
ceb8881d
IS
2616 INIT_WORK(&net_work->work, mlxsw_sp_router_neigh_event_work);
2617 net_work->mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
2618 net_work->n = n;
a6bf9e93
YG
2619
2620 /* Take a reference to ensure the neighbour won't be
2621 * destructed until we drop the reference in delayed
2622 * work.
2623 */
2624 neigh_clone(n);
ceb8881d 2625 mlxsw_core_schedule_work(&net_work->work);
5c8802f1 2626 mlxsw_sp_port_dev_put(mlxsw_sp_port);
a6bf9e93 2627 break;
3192dac6 2628 case NETEVENT_IPV4_MPATH_HASH_UPDATE:
5e18b9c5 2629 case NETEVENT_IPV6_MPATH_HASH_UPDATE:
1f65a33f
PM
2630 return mlxsw_sp_router_schedule_work(ptr, nb,
2631 mlxsw_sp_router_mp_hash_event_work);
28678f07 2632
64953423
PM
2633 case NETEVENT_IPV4_FWD_UPDATE_PRIORITY_UPDATE:
2634 return mlxsw_sp_router_schedule_work(ptr, nb,
2635 mlxsw_sp_router_update_priority_work);
c723c735
YG
2636 }
2637
2638 return NOTIFY_DONE;
2639}
2640
6cf3c971
JP
2641static int mlxsw_sp_neigh_init(struct mlxsw_sp *mlxsw_sp)
2642{
c723c735
YG
2643 int err;
2644
9011b677 2645 err = rhashtable_init(&mlxsw_sp->router->neigh_ht,
c723c735
YG
2646 &mlxsw_sp_neigh_ht_params);
2647 if (err)
2648 return err;
2649
2650 /* Initialize the polling interval according to the default
2651 * table.
2652 */
2653 mlxsw_sp_router_neighs_update_interval_init(mlxsw_sp);
2654
0b2361d9 2655 /* Create the delayed works for the activity_update */
9011b677 2656 INIT_DELAYED_WORK(&mlxsw_sp->router->neighs_update.dw,
c723c735 2657 mlxsw_sp_router_neighs_update_work);
9011b677 2658 INIT_DELAYED_WORK(&mlxsw_sp->router->nexthop_probe_dw,
0b2361d9 2659 mlxsw_sp_router_probe_unresolved_nexthops);
9011b677
IS
2660 mlxsw_core_schedule_dw(&mlxsw_sp->router->neighs_update.dw, 0);
2661 mlxsw_core_schedule_dw(&mlxsw_sp->router->nexthop_probe_dw, 0);
c723c735 2662 return 0;
6cf3c971
JP
2663}
2664
2665static void mlxsw_sp_neigh_fini(struct mlxsw_sp *mlxsw_sp)
2666{
9011b677
IS
2667 cancel_delayed_work_sync(&mlxsw_sp->router->neighs_update.dw);
2668 cancel_delayed_work_sync(&mlxsw_sp->router->nexthop_probe_dw);
2669 rhashtable_destroy(&mlxsw_sp->router->neigh_ht);
6cf3c971
JP
2670}
2671
9665b745 2672static void mlxsw_sp_neigh_rif_gone_sync(struct mlxsw_sp *mlxsw_sp,
bf95233e 2673 struct mlxsw_sp_rif *rif)
9665b745
IS
2674{
2675 struct mlxsw_sp_neigh_entry *neigh_entry, *tmp;
2676
bf95233e 2677 list_for_each_entry_safe(neigh_entry, tmp, &rif->neigh_list,
8ba6b30e
PM
2678 rif_list_node) {
2679 mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, false);
9665b745 2680 mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry);
8ba6b30e 2681 }
9665b745
IS
2682}
2683
35225e47
PM
/* Kind of a nexthop, stored in struct mlxsw_sp_nexthop::type. */
enum mlxsw_sp_nexthop_type {
	MLXSW_SP_NEXTHOP_TYPE_ETH,
	MLXSW_SP_NEXTHOP_TYPE_IPIP,
};
2688
c53b8e1b
IS
/* Key stored in struct mlxsw_sp_nexthop::key: the kernel IPv4 nexthop. */
struct mlxsw_sp_nexthop_key {
	struct fib_nh *fib_nh;
};
2692
a7ff87ac
JP
2693struct mlxsw_sp_nexthop {
2694 struct list_head neigh_list_node; /* member of neigh entry list */
9665b745 2695 struct list_head rif_list_node;
dbe4598c 2696 struct list_head router_list_node;
a7ff87ac
JP
2697 struct mlxsw_sp_nexthop_group *nh_grp; /* pointer back to the group
2698 * this belongs to
2699 */
c53b8e1b
IS
2700 struct rhash_head ht_node;
2701 struct mlxsw_sp_nexthop_key key;
58adf2c4 2702 unsigned char gw_addr[sizeof(struct in6_addr)];
e6f3b379 2703 int ifindex;
408bd946 2704 int nh_weight;
eb789980
IS
2705 int norm_nh_weight;
2706 int num_adj_entries;
bf95233e 2707 struct mlxsw_sp_rif *rif;
a7ff87ac
JP
2708 u8 should_offload:1, /* set indicates this neigh is connected and
2709 * should be put to KVD linear area of this group.
2710 */
2711 offloaded:1, /* set in case the neigh is actually put into
2712 * KVD linear area of this group.
2713 */
2714 update:1; /* set indicates that MAC of this neigh should be
2715 * updated in HW
2716 */
35225e47
PM
2717 enum mlxsw_sp_nexthop_type type;
2718 union {
2719 struct mlxsw_sp_neigh_entry *neigh_entry;
1012b9ac 2720 struct mlxsw_sp_ipip_entry *ipip_entry;
35225e47 2721 };
a5390278
AS
2722 unsigned int counter_index;
2723 bool counter_valid;
a7ff87ac
JP
2724};
2725
2726struct mlxsw_sp_nexthop_group {
ba31d366 2727 void *priv;
e9ad5e7d 2728 struct rhash_head ht_node;
a7ff87ac 2729 struct list_head fib_list; /* list of fib entries that use this group */
58adf2c4 2730 struct neigh_table *neigh_tbl;
b3e8d1eb
IS
2731 u8 adj_index_valid:1,
2732 gateway:1; /* routes using the group use a gateway */
a7ff87ac
JP
2733 u32 adj_index;
2734 u16 ecmp_size;
2735 u16 count;
eb789980 2736 int sum_norm_weight;
a7ff87ac 2737 struct mlxsw_sp_nexthop nexthops[0];
bf95233e 2738#define nh_rif nexthops[0].rif
a7ff87ac
JP
2739};
2740
427e652a
AS
2741void mlxsw_sp_nexthop_counter_alloc(struct mlxsw_sp *mlxsw_sp,
2742 struct mlxsw_sp_nexthop *nh)
a5390278
AS
2743{
2744 struct devlink *devlink;
2745
2746 devlink = priv_to_devlink(mlxsw_sp->core);
2747 if (!devlink_dpipe_table_counter_enabled(devlink,
2748 MLXSW_SP_DPIPE_TABLE_NAME_ADJ))
2749 return;
2750
2751 if (mlxsw_sp_flow_counter_alloc(mlxsw_sp, &nh->counter_index))
2752 return;
2753
2754 nh->counter_valid = true;
2755}
2756
427e652a
AS
2757void mlxsw_sp_nexthop_counter_free(struct mlxsw_sp *mlxsw_sp,
2758 struct mlxsw_sp_nexthop *nh)
a5390278
AS
2759{
2760 if (!nh->counter_valid)
2761 return;
2762 mlxsw_sp_flow_counter_free(mlxsw_sp, nh->counter_index);
2763 nh->counter_valid = false;
2764}
2765
2766int mlxsw_sp_nexthop_counter_get(struct mlxsw_sp *mlxsw_sp,
2767 struct mlxsw_sp_nexthop *nh, u64 *p_counter)
2768{
2769 if (!nh->counter_valid)
2770 return -EINVAL;
2771
2772 return mlxsw_sp_flow_counter_get(mlxsw_sp, nh->counter_index,
2773 p_counter, NULL);
2774}
2775
c556cd28
AS
2776struct mlxsw_sp_nexthop *mlxsw_sp_nexthop_next(struct mlxsw_sp_router *router,
2777 struct mlxsw_sp_nexthop *nh)
2778{
2779 if (!nh) {
2780 if (list_empty(&router->nexthop_list))
2781 return NULL;
2782 else
2783 return list_first_entry(&router->nexthop_list,
2784 typeof(*nh), router_list_node);
2785 }
2786 if (list_is_last(&nh->router_list_node, &router->nexthop_list))
2787 return NULL;
2788 return list_next_entry(nh, router_list_node);
2789}
2790
2791bool mlxsw_sp_nexthop_offload(struct mlxsw_sp_nexthop *nh)
2792{
2793 return nh->offloaded;
2794}
2795
2796unsigned char *mlxsw_sp_nexthop_ha(struct mlxsw_sp_nexthop *nh)
2797{
2798 if (!nh->offloaded)
2799 return NULL;
2800 return nh->neigh_entry->ha;
2801}
2802
2803int mlxsw_sp_nexthop_indexes(struct mlxsw_sp_nexthop *nh, u32 *p_adj_index,
e69cd9d7 2804 u32 *p_adj_size, u32 *p_adj_hash_index)
c556cd28
AS
2805{
2806 struct mlxsw_sp_nexthop_group *nh_grp = nh->nh_grp;
2807 u32 adj_hash_index = 0;
2808 int i;
2809
2810 if (!nh->offloaded || !nh_grp->adj_index_valid)
2811 return -EINVAL;
2812
2813 *p_adj_index = nh_grp->adj_index;
e69cd9d7 2814 *p_adj_size = nh_grp->ecmp_size;
c556cd28
AS
2815
2816 for (i = 0; i < nh_grp->count; i++) {
2817 struct mlxsw_sp_nexthop *nh_iter = &nh_grp->nexthops[i];
2818
2819 if (nh_iter == nh)
2820 break;
2821 if (nh_iter->offloaded)
eb789980 2822 adj_hash_index += nh_iter->num_adj_entries;
c556cd28
AS
2823 }
2824
2825 *p_adj_hash_index = adj_hash_index;
2826 return 0;
2827}
2828
2829struct mlxsw_sp_rif *mlxsw_sp_nexthop_rif(struct mlxsw_sp_nexthop *nh)
2830{
2831 return nh->rif;
2832}
2833
2834bool mlxsw_sp_nexthop_group_has_ipip(struct mlxsw_sp_nexthop *nh)
2835{
2836 struct mlxsw_sp_nexthop_group *nh_grp = nh->nh_grp;
2837 int i;
2838
2839 for (i = 0; i < nh_grp->count; i++) {
2840 struct mlxsw_sp_nexthop *nh_iter = &nh_grp->nexthops[i];
2841
2842 if (nh_iter->type == MLXSW_SP_NEXTHOP_TYPE_IPIP)
2843 return true;
2844 }
2845 return false;
2846}
2847
ba31d366
AS
2848static struct fib_info *
2849mlxsw_sp_nexthop4_group_fi(const struct mlxsw_sp_nexthop_group *nh_grp)
2850{
2851 return nh_grp->priv;
2852}
2853
2854struct mlxsw_sp_nexthop_group_cmp_arg {
e6f3b379
AS
2855 enum mlxsw_sp_l3proto proto;
2856 union {
2857 struct fib_info *fi;
2858 struct mlxsw_sp_fib6_entry *fib6_entry;
2859 };
ba31d366
AS
2860};
2861
e6f3b379
AS
2862static bool
2863mlxsw_sp_nexthop6_group_has_nexthop(const struct mlxsw_sp_nexthop_group *nh_grp,
3743d88a
IS
2864 const struct in6_addr *gw, int ifindex,
2865 int weight)
e6f3b379
AS
2866{
2867 int i;
2868
2869 for (i = 0; i < nh_grp->count; i++) {
2870 const struct mlxsw_sp_nexthop *nh;
2871
2872 nh = &nh_grp->nexthops[i];
3743d88a 2873 if (nh->ifindex == ifindex && nh->nh_weight == weight &&
e6f3b379
AS
2874 ipv6_addr_equal(gw, (struct in6_addr *) nh->gw_addr))
2875 return true;
2876 }
2877
2878 return false;
2879}
2880
2881static bool
2882mlxsw_sp_nexthop6_group_cmp(const struct mlxsw_sp_nexthop_group *nh_grp,
2883 const struct mlxsw_sp_fib6_entry *fib6_entry)
2884{
2885 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
2886
2887 if (nh_grp->count != fib6_entry->nrt6)
2888 return false;
2889
2890 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
1cf844c7 2891 struct fib6_nh *fib6_nh = mlxsw_sp_rt6->rt->fib6_nh;
e6f3b379 2892 struct in6_addr *gw;
3743d88a 2893 int ifindex, weight;
e6f3b379 2894
ad1601ae
DA
2895 ifindex = fib6_nh->fib_nh_dev->ifindex;
2896 weight = fib6_nh->fib_nh_weight;
2897 gw = &fib6_nh->fib_nh_gw6;
3743d88a
IS
2898 if (!mlxsw_sp_nexthop6_group_has_nexthop(nh_grp, gw, ifindex,
2899 weight))
e6f3b379
AS
2900 return false;
2901 }
2902
2903 return true;
2904}
2905
ba31d366
AS
2906static int
2907mlxsw_sp_nexthop_group_cmp(struct rhashtable_compare_arg *arg, const void *ptr)
2908{
2909 const struct mlxsw_sp_nexthop_group_cmp_arg *cmp_arg = arg->key;
2910 const struct mlxsw_sp_nexthop_group *nh_grp = ptr;
2911
e6f3b379
AS
2912 switch (cmp_arg->proto) {
2913 case MLXSW_SP_L3_PROTO_IPV4:
2914 return cmp_arg->fi != mlxsw_sp_nexthop4_group_fi(nh_grp);
2915 case MLXSW_SP_L3_PROTO_IPV6:
2916 return !mlxsw_sp_nexthop6_group_cmp(nh_grp,
2917 cmp_arg->fib6_entry);
2918 default:
2919 WARN_ON(1);
2920 return 1;
2921 }
2922}
2923
2924static int
2925mlxsw_sp_nexthop_group_type(const struct mlxsw_sp_nexthop_group *nh_grp)
2926{
2927 return nh_grp->neigh_tbl->family;
ba31d366
AS
2928}
2929
2930static u32 mlxsw_sp_nexthop_group_hash_obj(const void *data, u32 len, u32 seed)
2931{
2932 const struct mlxsw_sp_nexthop_group *nh_grp = data;
e6f3b379
AS
2933 const struct mlxsw_sp_nexthop *nh;
2934 struct fib_info *fi;
2935 unsigned int val;
2936 int i;
ba31d366 2937
e6f3b379
AS
2938 switch (mlxsw_sp_nexthop_group_type(nh_grp)) {
2939 case AF_INET:
2940 fi = mlxsw_sp_nexthop4_group_fi(nh_grp);
2941 return jhash(&fi, sizeof(fi), seed);
2942 case AF_INET6:
2943 val = nh_grp->count;
2944 for (i = 0; i < nh_grp->count; i++) {
2945 nh = &nh_grp->nexthops[i];
2946 val ^= nh->ifindex;
2947 }
2948 return jhash(&val, sizeof(val), seed);
2949 default:
2950 WARN_ON(1);
2951 return 0;
2952 }
2953}
2954
2955static u32
2956mlxsw_sp_nexthop6_group_hash(struct mlxsw_sp_fib6_entry *fib6_entry, u32 seed)
2957{
2958 unsigned int val = fib6_entry->nrt6;
2959 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
2960 struct net_device *dev;
2961
2962 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
1cf844c7 2963 dev = mlxsw_sp_rt6->rt->fib6_nh->fib_nh_dev;
e6f3b379
AS
2964 val ^= dev->ifindex;
2965 }
2966
2967 return jhash(&val, sizeof(val), seed);
ba31d366
AS
2968}
2969
2970static u32
2971mlxsw_sp_nexthop_group_hash(const void *data, u32 len, u32 seed)
2972{
2973 const struct mlxsw_sp_nexthop_group_cmp_arg *cmp_arg = data;
2974
e6f3b379
AS
2975 switch (cmp_arg->proto) {
2976 case MLXSW_SP_L3_PROTO_IPV4:
2977 return jhash(&cmp_arg->fi, sizeof(cmp_arg->fi), seed);
2978 case MLXSW_SP_L3_PROTO_IPV6:
2979 return mlxsw_sp_nexthop6_group_hash(cmp_arg->fib6_entry, seed);
2980 default:
2981 WARN_ON(1);
2982 return 0;
2983 }
ba31d366
AS
2984}
2985
e9ad5e7d 2986static const struct rhashtable_params mlxsw_sp_nexthop_group_ht_params = {
e9ad5e7d 2987 .head_offset = offsetof(struct mlxsw_sp_nexthop_group, ht_node),
ba31d366
AS
2988 .hashfn = mlxsw_sp_nexthop_group_hash,
2989 .obj_hashfn = mlxsw_sp_nexthop_group_hash_obj,
2990 .obj_cmpfn = mlxsw_sp_nexthop_group_cmp,
e9ad5e7d
IS
2991};
2992
2993static int mlxsw_sp_nexthop_group_insert(struct mlxsw_sp *mlxsw_sp,
2994 struct mlxsw_sp_nexthop_group *nh_grp)
2995{
e6f3b379
AS
2996 if (mlxsw_sp_nexthop_group_type(nh_grp) == AF_INET6 &&
2997 !nh_grp->gateway)
2998 return 0;
2999
9011b677 3000 return rhashtable_insert_fast(&mlxsw_sp->router->nexthop_group_ht,
e9ad5e7d
IS
3001 &nh_grp->ht_node,
3002 mlxsw_sp_nexthop_group_ht_params);
3003}
3004
3005static void mlxsw_sp_nexthop_group_remove(struct mlxsw_sp *mlxsw_sp,
3006 struct mlxsw_sp_nexthop_group *nh_grp)
3007{
e6f3b379
AS
3008 if (mlxsw_sp_nexthop_group_type(nh_grp) == AF_INET6 &&
3009 !nh_grp->gateway)
3010 return;
3011
9011b677 3012 rhashtable_remove_fast(&mlxsw_sp->router->nexthop_group_ht,
e9ad5e7d
IS
3013 &nh_grp->ht_node,
3014 mlxsw_sp_nexthop_group_ht_params);
3015}
3016
3017static struct mlxsw_sp_nexthop_group *
ba31d366
AS
3018mlxsw_sp_nexthop4_group_lookup(struct mlxsw_sp *mlxsw_sp,
3019 struct fib_info *fi)
e9ad5e7d 3020{
ba31d366
AS
3021 struct mlxsw_sp_nexthop_group_cmp_arg cmp_arg;
3022
e6f3b379 3023 cmp_arg.proto = MLXSW_SP_L3_PROTO_IPV4;
ba31d366
AS
3024 cmp_arg.fi = fi;
3025 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_group_ht,
3026 &cmp_arg,
e9ad5e7d
IS
3027 mlxsw_sp_nexthop_group_ht_params);
3028}
3029
e6f3b379
AS
3030static struct mlxsw_sp_nexthop_group *
3031mlxsw_sp_nexthop6_group_lookup(struct mlxsw_sp *mlxsw_sp,
3032 struct mlxsw_sp_fib6_entry *fib6_entry)
3033{
3034 struct mlxsw_sp_nexthop_group_cmp_arg cmp_arg;
3035
3036 cmp_arg.proto = MLXSW_SP_L3_PROTO_IPV6;
3037 cmp_arg.fib6_entry = fib6_entry;
3038 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_group_ht,
3039 &cmp_arg,
3040 mlxsw_sp_nexthop_group_ht_params);
3041}
3042
c53b8e1b
IS
3043static const struct rhashtable_params mlxsw_sp_nexthop_ht_params = {
3044 .key_offset = offsetof(struct mlxsw_sp_nexthop, key),
3045 .head_offset = offsetof(struct mlxsw_sp_nexthop, ht_node),
3046 .key_len = sizeof(struct mlxsw_sp_nexthop_key),
3047};
3048
3049static int mlxsw_sp_nexthop_insert(struct mlxsw_sp *mlxsw_sp,
3050 struct mlxsw_sp_nexthop *nh)
3051{
9011b677 3052 return rhashtable_insert_fast(&mlxsw_sp->router->nexthop_ht,
c53b8e1b
IS
3053 &nh->ht_node, mlxsw_sp_nexthop_ht_params);
3054}
3055
3056static void mlxsw_sp_nexthop_remove(struct mlxsw_sp *mlxsw_sp,
3057 struct mlxsw_sp_nexthop *nh)
3058{
9011b677 3059 rhashtable_remove_fast(&mlxsw_sp->router->nexthop_ht, &nh->ht_node,
c53b8e1b
IS
3060 mlxsw_sp_nexthop_ht_params);
3061}
3062
ad178c8e
IS
3063static struct mlxsw_sp_nexthop *
3064mlxsw_sp_nexthop_lookup(struct mlxsw_sp *mlxsw_sp,
3065 struct mlxsw_sp_nexthop_key key)
3066{
9011b677 3067 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_ht, &key,
ad178c8e
IS
3068 mlxsw_sp_nexthop_ht_params);
3069}
3070
a7ff87ac 3071static int mlxsw_sp_adj_index_mass_update_vr(struct mlxsw_sp *mlxsw_sp,
76610ebb 3072 const struct mlxsw_sp_fib *fib,
a7ff87ac
JP
3073 u32 adj_index, u16 ecmp_size,
3074 u32 new_adj_index,
3075 u16 new_ecmp_size)
3076{
3077 char raleu_pl[MLXSW_REG_RALEU_LEN];
3078
1a9234e6 3079 mlxsw_reg_raleu_pack(raleu_pl,
76610ebb
IS
3080 (enum mlxsw_reg_ralxx_protocol) fib->proto,
3081 fib->vr->id, adj_index, ecmp_size, new_adj_index,
1a9234e6 3082 new_ecmp_size);
a7ff87ac
JP
3083 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raleu), raleu_pl);
3084}
3085
3086static int mlxsw_sp_adj_index_mass_update(struct mlxsw_sp *mlxsw_sp,
3087 struct mlxsw_sp_nexthop_group *nh_grp,
3088 u32 old_adj_index, u16 old_ecmp_size)
3089{
3090 struct mlxsw_sp_fib_entry *fib_entry;
76610ebb 3091 struct mlxsw_sp_fib *fib = NULL;
a7ff87ac
JP
3092 int err;
3093
3094 list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) {
76610ebb 3095 if (fib == fib_entry->fib_node->fib)
a7ff87ac 3096 continue;
76610ebb
IS
3097 fib = fib_entry->fib_node->fib;
3098 err = mlxsw_sp_adj_index_mass_update_vr(mlxsw_sp, fib,
a7ff87ac
JP
3099 old_adj_index,
3100 old_ecmp_size,
3101 nh_grp->adj_index,
3102 nh_grp->ecmp_size);
3103 if (err)
3104 return err;
3105 }
3106 return 0;
3107}
3108
eb789980
IS
3109static int __mlxsw_sp_nexthop_update(struct mlxsw_sp *mlxsw_sp, u32 adj_index,
3110 struct mlxsw_sp_nexthop *nh)
a7ff87ac
JP
3111{
3112 struct mlxsw_sp_neigh_entry *neigh_entry = nh->neigh_entry;
3113 char ratr_pl[MLXSW_REG_RATR_LEN];
3114
3115 mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY,
89e41982
PM
3116 true, MLXSW_REG_RATR_TYPE_ETHERNET,
3117 adj_index, neigh_entry->rif);
a7ff87ac 3118 mlxsw_reg_ratr_eth_entry_pack(ratr_pl, neigh_entry->ha);
a5390278
AS
3119 if (nh->counter_valid)
3120 mlxsw_reg_ratr_counter_pack(ratr_pl, nh->counter_index, true);
3121 else
3122 mlxsw_reg_ratr_counter_pack(ratr_pl, 0, false);
3123
a7ff87ac
JP
3124 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl);
3125}
3126
eb789980
IS
3127int mlxsw_sp_nexthop_update(struct mlxsw_sp *mlxsw_sp, u32 adj_index,
3128 struct mlxsw_sp_nexthop *nh)
3129{
3130 int i;
3131
3132 for (i = 0; i < nh->num_adj_entries; i++) {
3133 int err;
3134
3135 err = __mlxsw_sp_nexthop_update(mlxsw_sp, adj_index + i, nh);
3136 if (err)
3137 return err;
3138 }
3139
3140 return 0;
3141}
3142
3143static int __mlxsw_sp_nexthop_ipip_update(struct mlxsw_sp *mlxsw_sp,
3144 u32 adj_index,
3145 struct mlxsw_sp_nexthop *nh)
1012b9ac
PM
3146{
3147 const struct mlxsw_sp_ipip_ops *ipip_ops;
3148
3149 ipip_ops = mlxsw_sp->router->ipip_ops_arr[nh->ipip_entry->ipipt];
3150 return ipip_ops->nexthop_update(mlxsw_sp, adj_index, nh->ipip_entry);
3151}
3152
eb789980
IS
3153static int mlxsw_sp_nexthop_ipip_update(struct mlxsw_sp *mlxsw_sp,
3154 u32 adj_index,
3155 struct mlxsw_sp_nexthop *nh)
3156{
3157 int i;
3158
3159 for (i = 0; i < nh->num_adj_entries; i++) {
3160 int err;
3161
3162 err = __mlxsw_sp_nexthop_ipip_update(mlxsw_sp, adj_index + i,
3163 nh);
3164 if (err)
3165 return err;
3166 }
3167
3168 return 0;
3169}
3170
a7ff87ac 3171static int
35225e47
PM
3172mlxsw_sp_nexthop_group_update(struct mlxsw_sp *mlxsw_sp,
3173 struct mlxsw_sp_nexthop_group *nh_grp,
3174 bool reallocate)
a7ff87ac
JP
3175{
3176 u32 adj_index = nh_grp->adj_index; /* base */
3177 struct mlxsw_sp_nexthop *nh;
3178 int i;
3179 int err;
3180
3181 for (i = 0; i < nh_grp->count; i++) {
3182 nh = &nh_grp->nexthops[i];
3183
3184 if (!nh->should_offload) {
3185 nh->offloaded = 0;
3186 continue;
3187 }
3188
a59b7e02 3189 if (nh->update || reallocate) {
35225e47
PM
3190 switch (nh->type) {
3191 case MLXSW_SP_NEXTHOP_TYPE_ETH:
a5390278 3192 err = mlxsw_sp_nexthop_update
35225e47
PM
3193 (mlxsw_sp, adj_index, nh);
3194 break;
1012b9ac
PM
3195 case MLXSW_SP_NEXTHOP_TYPE_IPIP:
3196 err = mlxsw_sp_nexthop_ipip_update
3197 (mlxsw_sp, adj_index, nh);
3198 break;
35225e47 3199 }
a7ff87ac
JP
3200 if (err)
3201 return err;
3202 nh->update = 0;
3203 nh->offloaded = 1;
3204 }
eb789980 3205 adj_index += nh->num_adj_entries;
a7ff87ac
JP
3206 }
3207 return 0;
3208}
3209
1819ae3d
IS
3210static bool
3211mlxsw_sp_fib_node_entry_is_first(const struct mlxsw_sp_fib_node *fib_node,
3212 const struct mlxsw_sp_fib_entry *fib_entry);
3213
a7ff87ac
JP
3214static int
3215mlxsw_sp_nexthop_fib_entries_update(struct mlxsw_sp *mlxsw_sp,
3216 struct mlxsw_sp_nexthop_group *nh_grp)
3217{
3218 struct mlxsw_sp_fib_entry *fib_entry;
3219 int err;
3220
3221 list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) {
1819ae3d
IS
3222 if (!mlxsw_sp_fib_node_entry_is_first(fib_entry->fib_node,
3223 fib_entry))
3224 continue;
a7ff87ac
JP
3225 err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
3226 if (err)
3227 return err;
3228 }
3229 return 0;
3230}
3231
77d964e6
IS
3232static void
3233mlxsw_sp_fib_entry_offload_refresh(struct mlxsw_sp_fib_entry *fib_entry,
3234 enum mlxsw_reg_ralue_op op, int err);
3235
3236static void
3237mlxsw_sp_nexthop_fib_entries_refresh(struct mlxsw_sp_nexthop_group *nh_grp)
3238{
3239 enum mlxsw_reg_ralue_op op = MLXSW_REG_RALUE_OP_WRITE_WRITE;
3240 struct mlxsw_sp_fib_entry *fib_entry;
3241
3242 list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) {
3243 if (!mlxsw_sp_fib_node_entry_is_first(fib_entry->fib_node,
3244 fib_entry))
3245 continue;
3246 mlxsw_sp_fib_entry_offload_refresh(fib_entry, op, 0);
3247 }
3248}
3249
425a08c6
IS
/* Round the requested adjacency group size up, in place, to the nearest
 * size accepted for an adjacency group: 1-64, 512, 1024, 2048 or 4096.
 * Anything above 2048 becomes 4096.
 */
static void mlxsw_sp_adj_grp_size_round_up(u16 *p_adj_grp_size)
{
	u16 requested = *p_adj_grp_size;

	/* Sizes up to 64 are valid as they are. */
	if (requested <= 64)
		return;

	if (requested > 2048)
		*p_adj_grp_size = 4096;
	else if (requested > 1024)
		*p_adj_grp_size = 2048;
	else if (requested > 512)
		*p_adj_grp_size = 1024;
	else
		*p_adj_grp_size = 512;
}
3266
/* Set the adjacency group size to the largest of 512, 1024, 2048 and 4096
 * that fits in @alloc_size. When @alloc_size is below 512 the size is left
 * untouched.
 */
static void mlxsw_sp_adj_grp_size_round_down(u16 *p_adj_grp_size,
					     unsigned int alloc_size)
{
	if (alloc_size < 512)
		return;

	if (alloc_size < 1024)
		*p_adj_grp_size = 512;
	else if (alloc_size < 2048)
		*p_adj_grp_size = 1024;
	else if (alloc_size < 4096)
		*p_adj_grp_size = 2048;
	else
		*p_adj_grp_size = 4096;
}
3279
3280static int mlxsw_sp_fix_adj_grp_size(struct mlxsw_sp *mlxsw_sp,
3281 u16 *p_adj_grp_size)
3282{
3283 unsigned int alloc_size;
3284 int err;
3285
3286 /* Round up the requested group size to the next size supported
3287 * by the device and make sure the request can be satisfied.
3288 */
3289 mlxsw_sp_adj_grp_size_round_up(p_adj_grp_size);
4b6b1869
JP
3290 err = mlxsw_sp_kvdl_alloc_count_query(mlxsw_sp,
3291 MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
3292 *p_adj_grp_size, &alloc_size);
425a08c6
IS
3293 if (err)
3294 return err;
3295 /* It is possible the allocation results in more allocated
3296 * entries than requested. Try to use as much of them as
3297 * possible.
3298 */
3299 mlxsw_sp_adj_grp_size_round_down(p_adj_grp_size, alloc_size);
3300
3301 return 0;
3302}
3303
eb789980
IS
3304static void
3305mlxsw_sp_nexthop_group_normalize(struct mlxsw_sp_nexthop_group *nh_grp)
3306{
3307 int i, g = 0, sum_norm_weight = 0;
3308 struct mlxsw_sp_nexthop *nh;
3309
3310 for (i = 0; i < nh_grp->count; i++) {
3311 nh = &nh_grp->nexthops[i];
3312
3313 if (!nh->should_offload)
3314 continue;
3315 if (g > 0)
3316 g = gcd(nh->nh_weight, g);
3317 else
3318 g = nh->nh_weight;
3319 }
3320
3321 for (i = 0; i < nh_grp->count; i++) {
3322 nh = &nh_grp->nexthops[i];
3323
3324 if (!nh->should_offload)
3325 continue;
3326 nh->norm_nh_weight = nh->nh_weight / g;
3327 sum_norm_weight += nh->norm_nh_weight;
3328 }
3329
3330 nh_grp->sum_norm_weight = sum_norm_weight;
3331}
3332
3333static void
3334mlxsw_sp_nexthop_group_rebalance(struct mlxsw_sp_nexthop_group *nh_grp)
3335{
3336 int total = nh_grp->sum_norm_weight;
3337 u16 ecmp_size = nh_grp->ecmp_size;
3338 int i, weight = 0, lower_bound = 0;
3339
3340 for (i = 0; i < nh_grp->count; i++) {
3341 struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
3342 int upper_bound;
3343
3344 if (!nh->should_offload)
3345 continue;
3346 weight += nh->norm_nh_weight;
3347 upper_bound = DIV_ROUND_CLOSEST(ecmp_size * weight, total);
3348 nh->num_adj_entries = upper_bound - lower_bound;
3349 lower_bound = upper_bound;
3350 }
3351}
3352
a7ff87ac
JP
3353static void
3354mlxsw_sp_nexthop_group_refresh(struct mlxsw_sp *mlxsw_sp,
3355 struct mlxsw_sp_nexthop_group *nh_grp)
3356{
eb789980 3357 u16 ecmp_size, old_ecmp_size;
a7ff87ac
JP
3358 struct mlxsw_sp_nexthop *nh;
3359 bool offload_change = false;
3360 u32 adj_index;
a7ff87ac
JP
3361 bool old_adj_index_valid;
3362 u32 old_adj_index;
a7ff87ac
JP
3363 int i;
3364 int err;
3365
b3e8d1eb
IS
3366 if (!nh_grp->gateway) {
3367 mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp);
3368 return;
3369 }
3370
a7ff87ac
JP
3371 for (i = 0; i < nh_grp->count; i++) {
3372 nh = &nh_grp->nexthops[i];
3373
56b8a9ed 3374 if (nh->should_offload != nh->offloaded) {
a7ff87ac
JP
3375 offload_change = true;
3376 if (nh->should_offload)
3377 nh->update = 1;
3378 }
a7ff87ac
JP
3379 }
3380 if (!offload_change) {
3381 /* Nothing was added or removed, so no need to reallocate. Just
3382 * update MAC on existing adjacency indexes.
3383 */
35225e47 3384 err = mlxsw_sp_nexthop_group_update(mlxsw_sp, nh_grp, false);
a7ff87ac
JP
3385 if (err) {
3386 dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n");
3387 goto set_trap;
3388 }
3389 return;
3390 }
eb789980
IS
3391 mlxsw_sp_nexthop_group_normalize(nh_grp);
3392 if (!nh_grp->sum_norm_weight)
a7ff87ac
JP
3393 /* No neigh of this group is connected so we just set
3394 * the trap and let everthing flow through kernel.
3395 */
3396 goto set_trap;
3397
eb789980 3398 ecmp_size = nh_grp->sum_norm_weight;
425a08c6
IS
3399 err = mlxsw_sp_fix_adj_grp_size(mlxsw_sp, &ecmp_size);
3400 if (err)
3401 /* No valid allocation size available. */
3402 goto set_trap;
3403
4b6b1869
JP
3404 err = mlxsw_sp_kvdl_alloc(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
3405 ecmp_size, &adj_index);
13124443 3406 if (err) {
a7ff87ac
JP
3407 /* We ran out of KVD linear space, just set the
3408 * trap and let everything flow through kernel.
3409 */
3410 dev_warn(mlxsw_sp->bus_info->dev, "Failed to allocate KVD linear area for nexthop group.\n");
3411 goto set_trap;
3412 }
a7ff87ac
JP
3413 old_adj_index_valid = nh_grp->adj_index_valid;
3414 old_adj_index = nh_grp->adj_index;
3415 old_ecmp_size = nh_grp->ecmp_size;
3416 nh_grp->adj_index_valid = 1;
3417 nh_grp->adj_index = adj_index;
3418 nh_grp->ecmp_size = ecmp_size;
eb789980 3419 mlxsw_sp_nexthop_group_rebalance(nh_grp);
35225e47 3420 err = mlxsw_sp_nexthop_group_update(mlxsw_sp, nh_grp, true);
a7ff87ac
JP
3421 if (err) {
3422 dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n");
3423 goto set_trap;
3424 }
3425
3426 if (!old_adj_index_valid) {
3427 /* The trap was set for fib entries, so we have to call
3428 * fib entry update to unset it and use adjacency index.
3429 */
3430 err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp);
3431 if (err) {
3432 dev_warn(mlxsw_sp->bus_info->dev, "Failed to add adjacency index to fib entries.\n");
3433 goto set_trap;
3434 }
3435 return;
3436 }
3437
3438 err = mlxsw_sp_adj_index_mass_update(mlxsw_sp, nh_grp,
3439 old_adj_index, old_ecmp_size);
4b6b1869 3440 mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
0304c005 3441 old_ecmp_size, old_adj_index);
a7ff87ac
JP
3442 if (err) {
3443 dev_warn(mlxsw_sp->bus_info->dev, "Failed to mass-update adjacency index for nexthop group.\n");
3444 goto set_trap;
3445 }
77d964e6
IS
3446
3447 /* Offload state within the group changed, so update the flags. */
3448 mlxsw_sp_nexthop_fib_entries_refresh(nh_grp);
3449
a7ff87ac
JP
3450 return;
3451
3452set_trap:
3453 old_adj_index_valid = nh_grp->adj_index_valid;
3454 nh_grp->adj_index_valid = 0;
3455 for (i = 0; i < nh_grp->count; i++) {
3456 nh = &nh_grp->nexthops[i];
3457 nh->offloaded = 0;
3458 }
3459 err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp);
3460 if (err)
3461 dev_warn(mlxsw_sp->bus_info->dev, "Failed to set traps for fib entries.\n");
3462 if (old_adj_index_valid)
4b6b1869 3463 mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
0304c005 3464 nh_grp->ecmp_size, nh_grp->adj_index);
a7ff87ac
JP
3465}
3466
3467static void __mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp_nexthop *nh,
3468 bool removing)
3469{
213666a3 3470 if (!removing)
a7ff87ac 3471 nh->should_offload = 1;
8764a826 3472 else
a7ff87ac
JP
3473 nh->should_offload = 0;
3474 nh->update = 1;
3475}
3476
83d57826
IS
3477static int
3478mlxsw_sp_nexthop_dead_neigh_replace(struct mlxsw_sp *mlxsw_sp,
3479 struct mlxsw_sp_neigh_entry *neigh_entry)
3480{
3481 struct neighbour *n, *old_n = neigh_entry->key.n;
3482 struct mlxsw_sp_nexthop *nh;
3483 bool entry_connected;
3484 u8 nud_state, dead;
3485 int err;
3486
3487 nh = list_first_entry(&neigh_entry->nexthop_list,
3488 struct mlxsw_sp_nexthop, neigh_list_node);
3489
3490 n = neigh_lookup(nh->nh_grp->neigh_tbl, &nh->gw_addr, nh->rif->dev);
3491 if (!n) {
3492 n = neigh_create(nh->nh_grp->neigh_tbl, &nh->gw_addr,
3493 nh->rif->dev);
3494 if (IS_ERR(n))
3495 return PTR_ERR(n);
3496 neigh_event_send(n, NULL);
3497 }
3498
3499 mlxsw_sp_neigh_entry_remove(mlxsw_sp, neigh_entry);
3500 neigh_entry->key.n = n;
3501 err = mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry);
3502 if (err)
3503 goto err_neigh_entry_insert;
3504
3505 read_lock_bh(&n->lock);
3506 nud_state = n->nud_state;
3507 dead = n->dead;
3508 read_unlock_bh(&n->lock);
3509 entry_connected = nud_state & NUD_VALID && !dead;
3510
3511 list_for_each_entry(nh, &neigh_entry->nexthop_list,
3512 neigh_list_node) {
3513 neigh_release(old_n);
3514 neigh_clone(n);
3515 __mlxsw_sp_nexthop_neigh_update(nh, !entry_connected);
3516 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
3517 }
3518
3519 neigh_release(n);
3520
3521 return 0;
3522
3523err_neigh_entry_insert:
3524 neigh_entry->key.n = old_n;
3525 mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry);
3526 neigh_release(n);
3527 return err;
3528}
3529
a7ff87ac
JP
3530static void
3531mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp,
3532 struct mlxsw_sp_neigh_entry *neigh_entry,
83d57826 3533 bool removing, bool dead)
a7ff87ac
JP
3534{
3535 struct mlxsw_sp_nexthop *nh;
3536
83d57826
IS
3537 if (list_empty(&neigh_entry->nexthop_list))
3538 return;
3539
3540 if (dead) {
3541 int err;
3542
3543 err = mlxsw_sp_nexthop_dead_neigh_replace(mlxsw_sp,
3544 neigh_entry);
3545 if (err)
3546 dev_err(mlxsw_sp->bus_info->dev, "Failed to replace dead neigh\n");
3547 return;
3548 }
3549
a7ff87ac
JP
3550 list_for_each_entry(nh, &neigh_entry->nexthop_list,
3551 neigh_list_node) {
3552 __mlxsw_sp_nexthop_neigh_update(nh, removing);
3553 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
3554 }
a7ff87ac
JP
3555}
3556
9665b745 3557static void mlxsw_sp_nexthop_rif_init(struct mlxsw_sp_nexthop *nh,
bf95233e 3558 struct mlxsw_sp_rif *rif)
9665b745 3559{
bf95233e 3560 if (nh->rif)
9665b745
IS
3561 return;
3562
bf95233e
AS
3563 nh->rif = rif;
3564 list_add(&nh->rif_list_node, &rif->nexthop_list);
9665b745
IS
3565}
3566
3567static void mlxsw_sp_nexthop_rif_fini(struct mlxsw_sp_nexthop *nh)
3568{
bf95233e 3569 if (!nh->rif)
9665b745
IS
3570 return;
3571
3572 list_del(&nh->rif_list_node);
bf95233e 3573 nh->rif = NULL;
9665b745
IS
3574}
3575
a8c97014
IS
3576static int mlxsw_sp_nexthop_neigh_init(struct mlxsw_sp *mlxsw_sp,
3577 struct mlxsw_sp_nexthop *nh)
a7ff87ac
JP
3578{
3579 struct mlxsw_sp_neigh_entry *neigh_entry;
a7ff87ac 3580 struct neighbour *n;
93a87e5e 3581 u8 nud_state, dead;
c53b8e1b
IS
3582 int err;
3583
ad178c8e 3584 if (!nh->nh_grp->gateway || nh->neigh_entry)
b8399a1e
IS
3585 return 0;
3586
33b1341c 3587 /* Take a reference of neigh here ensuring that neigh would
8de3c178 3588 * not be destructed before the nexthop entry is finished.
33b1341c 3589 * The reference is taken either in neigh_lookup() or
fd76d910 3590 * in neigh_create() in case n is not found.
33b1341c 3591 */
58adf2c4 3592 n = neigh_lookup(nh->nh_grp->neigh_tbl, &nh->gw_addr, nh->rif->dev);
33b1341c 3593 if (!n) {
58adf2c4
IS
3594 n = neigh_create(nh->nh_grp->neigh_tbl, &nh->gw_addr,
3595 nh->rif->dev);
a8c97014
IS
3596 if (IS_ERR(n))
3597 return PTR_ERR(n);
a7ff87ac 3598 neigh_event_send(n, NULL);
33b1341c
JP
3599 }
3600 neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, n);
3601 if (!neigh_entry) {
5c8802f1
IS
3602 neigh_entry = mlxsw_sp_neigh_entry_create(mlxsw_sp, n);
3603 if (IS_ERR(neigh_entry)) {
c53b8e1b
IS
3604 err = -EINVAL;
3605 goto err_neigh_entry_create;
5c8802f1 3606 }
a7ff87ac 3607 }
b2157149
YG
3608
3609 /* If that is the first nexthop connected to that neigh, add to
3610 * nexthop_neighs_list
3611 */
3612 if (list_empty(&neigh_entry->nexthop_list))
3613 list_add_tail(&neigh_entry->nexthop_neighs_list_node,
9011b677 3614 &mlxsw_sp->router->nexthop_neighs_list);
b2157149 3615
a7ff87ac
JP
3616 nh->neigh_entry = neigh_entry;
3617 list_add_tail(&nh->neigh_list_node, &neigh_entry->nexthop_list);
3618 read_lock_bh(&n->lock);
3619 nud_state = n->nud_state;
93a87e5e 3620 dead = n->dead;
a7ff87ac 3621 read_unlock_bh(&n->lock);
93a87e5e 3622 __mlxsw_sp_nexthop_neigh_update(nh, !(nud_state & NUD_VALID && !dead));
a7ff87ac
JP
3623
3624 return 0;
c53b8e1b
IS
3625
3626err_neigh_entry_create:
3627 neigh_release(n);
c53b8e1b 3628 return err;
a7ff87ac
JP
3629}
3630
a8c97014
IS
3631static void mlxsw_sp_nexthop_neigh_fini(struct mlxsw_sp *mlxsw_sp,
3632 struct mlxsw_sp_nexthop *nh)
a7ff87ac
JP
3633{
3634 struct mlxsw_sp_neigh_entry *neigh_entry = nh->neigh_entry;
a8c97014 3635 struct neighbour *n;
a7ff87ac 3636
b8399a1e 3637 if (!neigh_entry)
a8c97014
IS
3638 return;
3639 n = neigh_entry->key.n;
b8399a1e 3640
58312125 3641 __mlxsw_sp_nexthop_neigh_update(nh, true);
a7ff87ac 3642 list_del(&nh->neigh_list_node);
e58be79e 3643 nh->neigh_entry = NULL;
b2157149
YG
3644
3645 /* If that is the last nexthop connected to that neigh, remove from
3646 * nexthop_neighs_list
3647 */
e58be79e
IS
3648 if (list_empty(&neigh_entry->nexthop_list))
3649 list_del(&neigh_entry->nexthop_neighs_list_node);
b2157149 3650
5c8802f1
IS
3651 if (!neigh_entry->connected && list_empty(&neigh_entry->nexthop_list))
3652 mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry);
3653
3654 neigh_release(n);
a8c97014 3655}
c53b8e1b 3656
44b0fff1
PM
3657static bool mlxsw_sp_ipip_netdev_ul_up(struct net_device *ol_dev)
3658{
3659 struct net_device *ul_dev = __mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
3660
3661 return ul_dev ? (ul_dev->flags & IFF_UP) : true;
3662}
3663
d97cda5f
PM
3664static void mlxsw_sp_nexthop_ipip_init(struct mlxsw_sp *mlxsw_sp,
3665 struct mlxsw_sp_nexthop *nh,
3666 struct mlxsw_sp_ipip_entry *ipip_entry)
1012b9ac 3667{
44b0fff1
PM
3668 bool removing;
3669
1012b9ac 3670 if (!nh->nh_grp->gateway || nh->ipip_entry)
d97cda5f 3671 return;
1012b9ac 3672
d97cda5f
PM
3673 nh->ipip_entry = ipip_entry;
3674 removing = !mlxsw_sp_ipip_netdev_ul_up(ipip_entry->ol_dev);
44b0fff1 3675 __mlxsw_sp_nexthop_neigh_update(nh, removing);
d97cda5f 3676 mlxsw_sp_nexthop_rif_init(nh, &ipip_entry->ol_lb->common);
1012b9ac
PM
3677}
3678
3679static void mlxsw_sp_nexthop_ipip_fini(struct mlxsw_sp *mlxsw_sp,
3680 struct mlxsw_sp_nexthop *nh)
3681{
3682 struct mlxsw_sp_ipip_entry *ipip_entry = nh->ipip_entry;
3683
3684 if (!ipip_entry)
3685 return;
3686
3687 __mlxsw_sp_nexthop_neigh_update(nh, true);
1012b9ac
PM
3688 nh->ipip_entry = NULL;
3689}
3690
3691static bool mlxsw_sp_nexthop4_ipip_type(const struct mlxsw_sp *mlxsw_sp,
3692 const struct fib_nh *fib_nh,
3693 enum mlxsw_sp_ipip_type *p_ipipt)
3694{
b75ed8b1 3695 struct net_device *dev = fib_nh->fib_nh_dev;
1012b9ac
PM
3696
3697 return dev &&
3698 fib_nh->nh_parent->fib_type == RTN_UNICAST &&
3699 mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, p_ipipt);
3700}
3701
35225e47
PM
3702static void mlxsw_sp_nexthop_type_fini(struct mlxsw_sp *mlxsw_sp,
3703 struct mlxsw_sp_nexthop *nh)
3704{
3705 switch (nh->type) {
3706 case MLXSW_SP_NEXTHOP_TYPE_ETH:
3707 mlxsw_sp_nexthop_neigh_fini(mlxsw_sp, nh);
3708 mlxsw_sp_nexthop_rif_fini(nh);
3709 break;
1012b9ac 3710 case MLXSW_SP_NEXTHOP_TYPE_IPIP:
de0f43c0 3711 mlxsw_sp_nexthop_rif_fini(nh);
1012b9ac
PM
3712 mlxsw_sp_nexthop_ipip_fini(mlxsw_sp, nh);
3713 break;
35225e47
PM
3714 }
3715}
3716
3717static int mlxsw_sp_nexthop4_type_init(struct mlxsw_sp *mlxsw_sp,
3718 struct mlxsw_sp_nexthop *nh,
3719 struct fib_nh *fib_nh)
3720{
d97cda5f 3721 const struct mlxsw_sp_ipip_ops *ipip_ops;
b75ed8b1 3722 struct net_device *dev = fib_nh->fib_nh_dev;
d97cda5f 3723 struct mlxsw_sp_ipip_entry *ipip_entry;
35225e47
PM
3724 struct mlxsw_sp_rif *rif;
3725 int err;
3726
d97cda5f
PM
3727 ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, dev);
3728 if (ipip_entry) {
3729 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
3730 if (ipip_ops->can_offload(mlxsw_sp, dev,
3731 MLXSW_SP_L3_PROTO_IPV4)) {
3732 nh->type = MLXSW_SP_NEXTHOP_TYPE_IPIP;
3733 mlxsw_sp_nexthop_ipip_init(mlxsw_sp, nh, ipip_entry);
3734 return 0;
3735 }
1012b9ac
PM
3736 }
3737
35225e47
PM
3738 nh->type = MLXSW_SP_NEXTHOP_TYPE_ETH;
3739 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
3740 if (!rif)
3741 return 0;
3742
3743 mlxsw_sp_nexthop_rif_init(nh, rif);
3744 err = mlxsw_sp_nexthop_neigh_init(mlxsw_sp, nh);
3745 if (err)
3746 goto err_neigh_init;
3747
3748 return 0;
3749
3750err_neigh_init:
3751 mlxsw_sp_nexthop_rif_fini(nh);
3752 return err;
3753}
3754
/* IPv4 wrapper around the generic type-specific nexthop teardown. */
static void mlxsw_sp_nexthop4_type_fini(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_nexthop *nh)
{
	/* Nothing IPv4-specific to undo. */
	mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh);
}
3760
0e6ea2a4
IS
3761static int mlxsw_sp_nexthop4_init(struct mlxsw_sp *mlxsw_sp,
3762 struct mlxsw_sp_nexthop_group *nh_grp,
3763 struct mlxsw_sp_nexthop *nh,
3764 struct fib_nh *fib_nh)
a8c97014 3765{
b75ed8b1 3766 struct net_device *dev = fib_nh->fib_nh_dev;
df6dd79b 3767 struct in_device *in_dev;
a8c97014
IS
3768 int err;
3769
3770 nh->nh_grp = nh_grp;
3771 nh->key.fib_nh = fib_nh;
408bd946 3772#ifdef CONFIG_IP_ROUTE_MULTIPATH
b75ed8b1 3773 nh->nh_weight = fib_nh->fib_nh_weight;
408bd946
IS
3774#else
3775 nh->nh_weight = 1;
3776#endif
b75ed8b1 3777 memcpy(&nh->gw_addr, &fib_nh->fib_nh_gw4, sizeof(fib_nh->fib_nh_gw4));
a8c97014
IS
3778 err = mlxsw_sp_nexthop_insert(mlxsw_sp, nh);
3779 if (err)
3780 return err;
3781
a5390278 3782 mlxsw_sp_nexthop_counter_alloc(mlxsw_sp, nh);
dbe4598c
AS
3783 list_add_tail(&nh->router_list_node, &mlxsw_sp->router->nexthop_list);
3784
97989ee0
IS
3785 if (!dev)
3786 return 0;
3787
df6dd79b
IS
3788 in_dev = __in_dev_get_rtnl(dev);
3789 if (in_dev && IN_DEV_IGNORE_ROUTES_WITH_LINKDOWN(in_dev) &&
b75ed8b1 3790 fib_nh->fib_nh_flags & RTNH_F_LINKDOWN)
df6dd79b
IS
3791 return 0;
3792
35225e47 3793 err = mlxsw_sp_nexthop4_type_init(mlxsw_sp, nh, fib_nh);
a8c97014
IS
3794 if (err)
3795 goto err_nexthop_neigh_init;
3796
3797 return 0;
3798
3799err_nexthop_neigh_init:
3800 mlxsw_sp_nexthop_remove(mlxsw_sp, nh);
3801 return err;
3802}
3803
0e6ea2a4
IS
3804static void mlxsw_sp_nexthop4_fini(struct mlxsw_sp *mlxsw_sp,
3805 struct mlxsw_sp_nexthop *nh)
a8c97014 3806{
35225e47 3807 mlxsw_sp_nexthop4_type_fini(mlxsw_sp, nh);
dbe4598c 3808 list_del(&nh->router_list_node);
a5390278 3809 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh);
c53b8e1b 3810 mlxsw_sp_nexthop_remove(mlxsw_sp, nh);
a7ff87ac
JP
3811}
3812
0e6ea2a4
IS
3813static void mlxsw_sp_nexthop4_event(struct mlxsw_sp *mlxsw_sp,
3814 unsigned long event, struct fib_nh *fib_nh)
ad178c8e
IS
3815{
3816 struct mlxsw_sp_nexthop_key key;
3817 struct mlxsw_sp_nexthop *nh;
ad178c8e 3818
9011b677 3819 if (mlxsw_sp->router->aborted)
ad178c8e
IS
3820 return;
3821
3822 key.fib_nh = fib_nh;
3823 nh = mlxsw_sp_nexthop_lookup(mlxsw_sp, key);
3824 if (WARN_ON_ONCE(!nh))
3825 return;
3826
ad178c8e
IS
3827 switch (event) {
3828 case FIB_EVENT_NH_ADD:
35225e47 3829 mlxsw_sp_nexthop4_type_init(mlxsw_sp, nh, fib_nh);
ad178c8e
IS
3830 break;
3831 case FIB_EVENT_NH_DEL:
35225e47 3832 mlxsw_sp_nexthop4_type_fini(mlxsw_sp, nh);
ad178c8e
IS
3833 break;
3834 }
3835
3836 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
3837}
3838
0c5f1cd5
PM
3839static void mlxsw_sp_nexthop_rif_update(struct mlxsw_sp *mlxsw_sp,
3840 struct mlxsw_sp_rif *rif)
3841{
3842 struct mlxsw_sp_nexthop *nh;
44b0fff1 3843 bool removing;
0c5f1cd5
PM
3844
3845 list_for_each_entry(nh, &rif->nexthop_list, rif_list_node) {
44b0fff1
PM
3846 switch (nh->type) {
3847 case MLXSW_SP_NEXTHOP_TYPE_ETH:
3848 removing = false;
3849 break;
3850 case MLXSW_SP_NEXTHOP_TYPE_IPIP:
3851 removing = !mlxsw_sp_ipip_netdev_ul_up(rif->dev);
3852 break;
3853 default:
3854 WARN_ON(1);
3855 continue;
3856 }
3857
3858 __mlxsw_sp_nexthop_neigh_update(nh, removing);
0c5f1cd5
PM
3859 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
3860 }
3861}
3862
09dbf629
PM
3863static void mlxsw_sp_nexthop_rif_migrate(struct mlxsw_sp *mlxsw_sp,
3864 struct mlxsw_sp_rif *old_rif,
3865 struct mlxsw_sp_rif *new_rif)
3866{
3867 struct mlxsw_sp_nexthop *nh;
3868
3869 list_splice_init(&old_rif->nexthop_list, &new_rif->nexthop_list);
3870 list_for_each_entry(nh, &new_rif->nexthop_list, rif_list_node)
3871 nh->rif = new_rif;
3872 mlxsw_sp_nexthop_rif_update(mlxsw_sp, new_rif);
3873}
3874
9665b745 3875static void mlxsw_sp_nexthop_rif_gone_sync(struct mlxsw_sp *mlxsw_sp,
bf95233e 3876 struct mlxsw_sp_rif *rif)
9665b745
IS
3877{
3878 struct mlxsw_sp_nexthop *nh, *tmp;
3879
bf95233e 3880 list_for_each_entry_safe(nh, tmp, &rif->nexthop_list, rif_list_node) {
35225e47 3881 mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh);
9665b745
IS
3882 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp);
3883 }
3884}
3885
9b01451a 3886static bool mlxsw_sp_fi_is_gateway(const struct mlxsw_sp *mlxsw_sp,
5481d73f 3887 struct fib_info *fi)
9b01451a 3888{
5481d73f
DA
3889 const struct fib_nh *nh = fib_info_nh(fi, 0);
3890
3891 return nh->fib_nh_scope == RT_SCOPE_LINK ||
3892 mlxsw_sp_nexthop4_ipip_type(mlxsw_sp, nh, NULL);
9b01451a
PM
3893}
3894
a7ff87ac 3895static struct mlxsw_sp_nexthop_group *
0e6ea2a4 3896mlxsw_sp_nexthop4_group_create(struct mlxsw_sp *mlxsw_sp, struct fib_info *fi)
a7ff87ac 3897{
5481d73f 3898 unsigned int nhs = fib_info_num_path(fi);
a7ff87ac
JP
3899 struct mlxsw_sp_nexthop_group *nh_grp;
3900 struct mlxsw_sp_nexthop *nh;
3901 struct fib_nh *fib_nh;
a7ff87ac
JP
3902 int i;
3903 int err;
3904
5481d73f 3905 nh_grp = kzalloc(struct_size(nh_grp, nexthops, nhs), GFP_KERNEL);
a7ff87ac
JP
3906 if (!nh_grp)
3907 return ERR_PTR(-ENOMEM);
ba31d366 3908 nh_grp->priv = fi;
a7ff87ac 3909 INIT_LIST_HEAD(&nh_grp->fib_list);
58adf2c4
IS
3910 nh_grp->neigh_tbl = &arp_tbl;
3911
9b01451a 3912 nh_grp->gateway = mlxsw_sp_fi_is_gateway(mlxsw_sp, fi);
5481d73f 3913 nh_grp->count = nhs;
7387dbbc 3914 fib_info_hold(fi);
a7ff87ac
JP
3915 for (i = 0; i < nh_grp->count; i++) {
3916 nh = &nh_grp->nexthops[i];
5481d73f 3917 fib_nh = fib_info_nh(fi, i);
0e6ea2a4 3918 err = mlxsw_sp_nexthop4_init(mlxsw_sp, nh_grp, nh, fib_nh);
a7ff87ac 3919 if (err)
0e6ea2a4 3920 goto err_nexthop4_init;
a7ff87ac 3921 }
e9ad5e7d
IS
3922 err = mlxsw_sp_nexthop_group_insert(mlxsw_sp, nh_grp);
3923 if (err)
3924 goto err_nexthop_group_insert;
a7ff87ac
JP
3925 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
3926 return nh_grp;
3927
e9ad5e7d 3928err_nexthop_group_insert:
0e6ea2a4 3929err_nexthop4_init:
df6dd79b
IS
3930 for (i--; i >= 0; i--) {
3931 nh = &nh_grp->nexthops[i];
0e6ea2a4 3932 mlxsw_sp_nexthop4_fini(mlxsw_sp, nh);
df6dd79b 3933 }
ba31d366 3934 fib_info_put(fi);
a7ff87ac
JP
3935 kfree(nh_grp);
3936 return ERR_PTR(err);
3937}
3938
3939static void
0e6ea2a4
IS
3940mlxsw_sp_nexthop4_group_destroy(struct mlxsw_sp *mlxsw_sp,
3941 struct mlxsw_sp_nexthop_group *nh_grp)
a7ff87ac
JP
3942{
3943 struct mlxsw_sp_nexthop *nh;
3944 int i;
3945
e9ad5e7d 3946 mlxsw_sp_nexthop_group_remove(mlxsw_sp, nh_grp);
a7ff87ac
JP
3947 for (i = 0; i < nh_grp->count; i++) {
3948 nh = &nh_grp->nexthops[i];
0e6ea2a4 3949 mlxsw_sp_nexthop4_fini(mlxsw_sp, nh);
a7ff87ac 3950 }
58312125
IS
3951 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
3952 WARN_ON_ONCE(nh_grp->adj_index_valid);
ba31d366 3953 fib_info_put(mlxsw_sp_nexthop4_group_fi(nh_grp));
a7ff87ac
JP
3954 kfree(nh_grp);
3955}
3956
0e6ea2a4
IS
3957static int mlxsw_sp_nexthop4_group_get(struct mlxsw_sp *mlxsw_sp,
3958 struct mlxsw_sp_fib_entry *fib_entry,
3959 struct fib_info *fi)
a7ff87ac
JP
3960{
3961 struct mlxsw_sp_nexthop_group *nh_grp;
3962
ba31d366 3963 nh_grp = mlxsw_sp_nexthop4_group_lookup(mlxsw_sp, fi);
a7ff87ac 3964 if (!nh_grp) {
0e6ea2a4 3965 nh_grp = mlxsw_sp_nexthop4_group_create(mlxsw_sp, fi);
a7ff87ac
JP
3966 if (IS_ERR(nh_grp))
3967 return PTR_ERR(nh_grp);
3968 }
3969 list_add_tail(&fib_entry->nexthop_group_node, &nh_grp->fib_list);
3970 fib_entry->nh_group = nh_grp;
3971 return 0;
3972}
3973
0e6ea2a4
IS
3974static void mlxsw_sp_nexthop4_group_put(struct mlxsw_sp *mlxsw_sp,
3975 struct mlxsw_sp_fib_entry *fib_entry)
a7ff87ac
JP
3976{
3977 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
3978
3979 list_del(&fib_entry->nexthop_group_node);
3980 if (!list_empty(&nh_grp->fib_list))
3981 return;
0e6ea2a4 3982 mlxsw_sp_nexthop4_group_destroy(mlxsw_sp, nh_grp);
a7ff87ac
JP
3983}
3984
4f1c7f1f
IS
3985static bool
3986mlxsw_sp_fib4_entry_should_offload(const struct mlxsw_sp_fib_entry *fib_entry)
3987{
3988 struct mlxsw_sp_fib4_entry *fib4_entry;
3989
3990 fib4_entry = container_of(fib_entry, struct mlxsw_sp_fib4_entry,
3991 common);
3992 return !fib4_entry->tos;
3993}
3994
013b20f9
IS
3995static bool
3996mlxsw_sp_fib_entry_should_offload(const struct mlxsw_sp_fib_entry *fib_entry)
3997{
3998 struct mlxsw_sp_nexthop_group *nh_group = fib_entry->nh_group;
3999
4f1c7f1f
IS
4000 switch (fib_entry->fib_node->fib->proto) {
4001 case MLXSW_SP_L3_PROTO_IPV4:
4002 if (!mlxsw_sp_fib4_entry_should_offload(fib_entry))
4003 return false;
4004 break;
4005 case MLXSW_SP_L3_PROTO_IPV6:
4006 break;
4007 }
9aecce1c 4008
013b20f9
IS
4009 switch (fib_entry->type) {
4010 case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE:
4011 return !!nh_group->adj_index_valid;
4012 case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL:
70ad3506 4013 return !!nh_group->nh_rif;
2810c3b2 4014 case MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE:
4607f6d2 4015 case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP:
0c69e0fc 4016 case MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP:
4607f6d2 4017 return true;
013b20f9
IS
4018 default:
4019 return false;
4020 }
4021}
4022
428b851f
IS
4023static struct mlxsw_sp_nexthop *
4024mlxsw_sp_rt6_nexthop(struct mlxsw_sp_nexthop_group *nh_grp,
4025 const struct mlxsw_sp_rt6 *mlxsw_sp_rt6)
4026{
4027 int i;
4028
4029 for (i = 0; i < nh_grp->count; i++) {
4030 struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
8d1c802b 4031 struct fib6_info *rt = mlxsw_sp_rt6->rt;
428b851f 4032
1cf844c7 4033 if (nh->rif && nh->rif->dev == rt->fib6_nh->fib_nh_dev &&
428b851f 4034 ipv6_addr_equal((const struct in6_addr *) &nh->gw_addr,
1cf844c7 4035 &rt->fib6_nh->fib_nh_gw6))
428b851f
IS
4036 return nh;
4037 continue;
4038 }
4039
4040 return NULL;
4041}
4042
3984d1a8
IS
4043static void
4044mlxsw_sp_fib4_entry_offload_set(struct mlxsw_sp_fib_entry *fib_entry)
4045{
4046 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
4047 int i;
4048
4607f6d2 4049 if (fib_entry->type == MLXSW_SP_FIB_ENTRY_TYPE_LOCAL ||
2810c3b2 4050 fib_entry->type == MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE ||
0c69e0fc
IS
4051 fib_entry->type == MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP ||
4052 fib_entry->type == MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP) {
b75ed8b1 4053 nh_grp->nexthops->key.fib_nh->fib_nh_flags |= RTNH_F_OFFLOAD;
3984d1a8
IS
4054 return;
4055 }
4056
4057 for (i = 0; i < nh_grp->count; i++) {
4058 struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
4059
4060 if (nh->offloaded)
b75ed8b1 4061 nh->key.fib_nh->fib_nh_flags |= RTNH_F_OFFLOAD;
3984d1a8 4062 else
b75ed8b1 4063 nh->key.fib_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD;
3984d1a8
IS
4064 }
4065}
4066
4067static void
4068mlxsw_sp_fib4_entry_offload_unset(struct mlxsw_sp_fib_entry *fib_entry)
4069{
4070 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
4071 int i;
4072
d1c95af3
IS
4073 if (!list_is_singular(&nh_grp->fib_list))
4074 return;
4075
3984d1a8
IS
4076 for (i = 0; i < nh_grp->count; i++) {
4077 struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i];
4078
b75ed8b1 4079 nh->key.fib_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD;
3984d1a8
IS
4080 }
4081}
4082
428b851f
IS
4083static void
4084mlxsw_sp_fib6_entry_offload_set(struct mlxsw_sp_fib_entry *fib_entry)
4085{
4086 struct mlxsw_sp_fib6_entry *fib6_entry;
4087 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
4088
4089 fib6_entry = container_of(fib_entry, struct mlxsw_sp_fib6_entry,
4090 common);
4091
2810c3b2
IS
4092 if (fib_entry->type == MLXSW_SP_FIB_ENTRY_TYPE_LOCAL ||
4093 fib_entry->type == MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE) {
428b851f 4094 list_first_entry(&fib6_entry->rt6_list, struct mlxsw_sp_rt6,
1cf844c7 4095 list)->rt->fib6_nh->fib_nh_flags |= RTNH_F_OFFLOAD;
428b851f
IS
4096 return;
4097 }
4098
4099 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
4100 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
1cf844c7 4101 struct fib6_nh *fib6_nh = mlxsw_sp_rt6->rt->fib6_nh;
428b851f
IS
4102 struct mlxsw_sp_nexthop *nh;
4103
4104 nh = mlxsw_sp_rt6_nexthop(nh_grp, mlxsw_sp_rt6);
4105 if (nh && nh->offloaded)
ad1601ae 4106 fib6_nh->fib_nh_flags |= RTNH_F_OFFLOAD;
428b851f 4107 else
ad1601ae 4108 fib6_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD;
428b851f
IS
4109 }
4110}
4111
4112static void
4113mlxsw_sp_fib6_entry_offload_unset(struct mlxsw_sp_fib_entry *fib_entry)
4114{
4115 struct mlxsw_sp_fib6_entry *fib6_entry;
4116 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
4117
4118 fib6_entry = container_of(fib_entry, struct mlxsw_sp_fib6_entry,
4119 common);
4120 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
8d1c802b 4121 struct fib6_info *rt = mlxsw_sp_rt6->rt;
428b851f 4122
1cf844c7 4123 rt->fib6_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD;
428b851f
IS
4124 }
4125}
4126
013b20f9
IS
4127static void mlxsw_sp_fib_entry_offload_set(struct mlxsw_sp_fib_entry *fib_entry)
4128{
76610ebb 4129 switch (fib_entry->fib_node->fib->proto) {
013b20f9 4130 case MLXSW_SP_L3_PROTO_IPV4:
3984d1a8 4131 mlxsw_sp_fib4_entry_offload_set(fib_entry);
013b20f9
IS
4132 break;
4133 case MLXSW_SP_L3_PROTO_IPV6:
428b851f
IS
4134 mlxsw_sp_fib6_entry_offload_set(fib_entry);
4135 break;
013b20f9
IS
4136 }
4137}
4138
4139static void
4140mlxsw_sp_fib_entry_offload_unset(struct mlxsw_sp_fib_entry *fib_entry)
4141{
76610ebb 4142 switch (fib_entry->fib_node->fib->proto) {
013b20f9 4143 case MLXSW_SP_L3_PROTO_IPV4:
3984d1a8 4144 mlxsw_sp_fib4_entry_offload_unset(fib_entry);
013b20f9
IS
4145 break;
4146 case MLXSW_SP_L3_PROTO_IPV6:
428b851f
IS
4147 mlxsw_sp_fib6_entry_offload_unset(fib_entry);
4148 break;
013b20f9 4149 }
013b20f9
IS
4150}
4151
4152static void
4153mlxsw_sp_fib_entry_offload_refresh(struct mlxsw_sp_fib_entry *fib_entry,
4154 enum mlxsw_reg_ralue_op op, int err)
4155{
4156 switch (op) {
4157 case MLXSW_REG_RALUE_OP_WRITE_DELETE:
013b20f9
IS
4158 return mlxsw_sp_fib_entry_offload_unset(fib_entry);
4159 case MLXSW_REG_RALUE_OP_WRITE_WRITE:
4160 if (err)
4161 return;
1353ee70 4162 if (mlxsw_sp_fib_entry_should_offload(fib_entry))
013b20f9 4163 mlxsw_sp_fib_entry_offload_set(fib_entry);
85f44a15 4164 else
013b20f9
IS
4165 mlxsw_sp_fib_entry_offload_unset(fib_entry);
4166 return;
4167 default:
4168 return;
4169 }
4170}
4171
9dbf4d76
IS
4172static void
4173mlxsw_sp_fib_entry_ralue_pack(char *ralue_pl,
4174 const struct mlxsw_sp_fib_entry *fib_entry,
4175 enum mlxsw_reg_ralue_op op)
a7ff87ac 4176{
76610ebb 4177 struct mlxsw_sp_fib *fib = fib_entry->fib_node->fib;
9dbf4d76
IS
4178 enum mlxsw_reg_ralxx_protocol proto;
4179 u32 *p_dip;
4180
4181 proto = (enum mlxsw_reg_ralxx_protocol) fib->proto;
4182
4183 switch (fib->proto) {
4184 case MLXSW_SP_L3_PROTO_IPV4:
4185 p_dip = (u32 *) fib_entry->fib_node->key.addr;
4186 mlxsw_reg_ralue_pack4(ralue_pl, proto, op, fib->vr->id,
4187 fib_entry->fib_node->key.prefix_len,
4188 *p_dip);
4189 break;
4190 case MLXSW_SP_L3_PROTO_IPV6:
4191 mlxsw_reg_ralue_pack6(ralue_pl, proto, op, fib->vr->id,
4192 fib_entry->fib_node->key.prefix_len,
4193 fib_entry->fib_node->key.addr);
4194 break;
4195 }
4196}
4197
4198static int mlxsw_sp_fib_entry_op_remote(struct mlxsw_sp *mlxsw_sp,
4199 struct mlxsw_sp_fib_entry *fib_entry,
4200 enum mlxsw_reg_ralue_op op)
4201{
4202 char ralue_pl[MLXSW_REG_RALUE_LEN];
a7ff87ac
JP
4203 enum mlxsw_reg_ralue_trap_action trap_action;
4204 u16 trap_id = 0;
4205 u32 adjacency_index = 0;
4206 u16 ecmp_size = 0;
4207
4208 /* In case the nexthop group adjacency index is valid, use it
4209 * with provided ECMP size. Otherwise, setup trap and pass
4210 * traffic to kernel.
4211 */
4b411477 4212 if (mlxsw_sp_fib_entry_should_offload(fib_entry)) {
a7ff87ac
JP
4213 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP;
4214 adjacency_index = fib_entry->nh_group->adj_index;
4215 ecmp_size = fib_entry->nh_group->ecmp_size;
4216 } else {
4217 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP;
4218 trap_id = MLXSW_TRAP_ID_RTR_INGRESS0;
4219 }
4220
9dbf4d76 4221 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
a7ff87ac
JP
4222 mlxsw_reg_ralue_act_remote_pack(ralue_pl, trap_action, trap_id,
4223 adjacency_index, ecmp_size);
4224 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
4225}
4226
9dbf4d76
IS
4227static int mlxsw_sp_fib_entry_op_local(struct mlxsw_sp *mlxsw_sp,
4228 struct mlxsw_sp_fib_entry *fib_entry,
4229 enum mlxsw_reg_ralue_op op)
61c503f9 4230{
bf95233e 4231 struct mlxsw_sp_rif *rif = fib_entry->nh_group->nh_rif;
70ad3506 4232 enum mlxsw_reg_ralue_trap_action trap_action;
61c503f9 4233 char ralue_pl[MLXSW_REG_RALUE_LEN];
70ad3506 4234 u16 trap_id = 0;
bf95233e 4235 u16 rif_index = 0;
70ad3506
IS
4236
4237 if (mlxsw_sp_fib_entry_should_offload(fib_entry)) {
4238 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP;
bf95233e 4239 rif_index = rif->rif_index;
70ad3506
IS
4240 } else {
4241 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP;
4242 trap_id = MLXSW_TRAP_ID_RTR_INGRESS0;
4243 }
61c503f9 4244
9dbf4d76 4245 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
bf95233e
AS
4246 mlxsw_reg_ralue_act_local_pack(ralue_pl, trap_action, trap_id,
4247 rif_index);
61c503f9
JP
4248 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
4249}
4250
9dbf4d76
IS
4251static int mlxsw_sp_fib_entry_op_trap(struct mlxsw_sp *mlxsw_sp,
4252 struct mlxsw_sp_fib_entry *fib_entry,
4253 enum mlxsw_reg_ralue_op op)
61c503f9
JP
4254{
4255 char ralue_pl[MLXSW_REG_RALUE_LEN];
61c503f9 4256
9dbf4d76 4257 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
61c503f9
JP
4258 mlxsw_reg_ralue_act_ip2me_pack(ralue_pl);
4259 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
4260}
4261
2810c3b2
IS
4262static int mlxsw_sp_fib_entry_op_blackhole(struct mlxsw_sp *mlxsw_sp,
4263 struct mlxsw_sp_fib_entry *fib_entry,
4264 enum mlxsw_reg_ralue_op op)
4265{
4266 enum mlxsw_reg_ralue_trap_action trap_action;
4267 char ralue_pl[MLXSW_REG_RALUE_LEN];
4268
4269 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_DISCARD_ERROR;
4270 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
4271 mlxsw_reg_ralue_act_local_pack(ralue_pl, trap_action, 0, 0);
4272 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
4273}
4274
4607f6d2
PM
4275static int
4276mlxsw_sp_fib_entry_op_ipip_decap(struct mlxsw_sp *mlxsw_sp,
4277 struct mlxsw_sp_fib_entry *fib_entry,
4278 enum mlxsw_reg_ralue_op op)
4279{
4280 struct mlxsw_sp_ipip_entry *ipip_entry = fib_entry->decap.ipip_entry;
4281 const struct mlxsw_sp_ipip_ops *ipip_ops;
4282
4283 if (WARN_ON(!ipip_entry))
4284 return -EINVAL;
4285
4286 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
4287 return ipip_ops->fib_entry_op(mlxsw_sp, ipip_entry, op,
4288 fib_entry->decap.tunnel_index);
4289}
4290
0c69e0fc
IS
4291static int mlxsw_sp_fib_entry_op_nve_decap(struct mlxsw_sp *mlxsw_sp,
4292 struct mlxsw_sp_fib_entry *fib_entry,
4293 enum mlxsw_reg_ralue_op op)
4294{
4295 char ralue_pl[MLXSW_REG_RALUE_LEN];
4296
4297 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op);
4298 mlxsw_reg_ralue_act_ip2me_tun_pack(ralue_pl,
4299 fib_entry->decap.tunnel_index);
4300 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
4301}
4302
9dbf4d76
IS
4303static int __mlxsw_sp_fib_entry_op(struct mlxsw_sp *mlxsw_sp,
4304 struct mlxsw_sp_fib_entry *fib_entry,
4305 enum mlxsw_reg_ralue_op op)
61c503f9
JP
4306{
4307 switch (fib_entry->type) {
4308 case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE:
9dbf4d76 4309 return mlxsw_sp_fib_entry_op_remote(mlxsw_sp, fib_entry, op);
61c503f9 4310 case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL:
9dbf4d76 4311 return mlxsw_sp_fib_entry_op_local(mlxsw_sp, fib_entry, op);
61c503f9 4312 case MLXSW_SP_FIB_ENTRY_TYPE_TRAP:
9dbf4d76 4313 return mlxsw_sp_fib_entry_op_trap(mlxsw_sp, fib_entry, op);
2810c3b2
IS
4314 case MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE:
4315 return mlxsw_sp_fib_entry_op_blackhole(mlxsw_sp, fib_entry, op);
4607f6d2
PM
4316 case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP:
4317 return mlxsw_sp_fib_entry_op_ipip_decap(mlxsw_sp,
4318 fib_entry, op);
0c69e0fc
IS
4319 case MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP:
4320 return mlxsw_sp_fib_entry_op_nve_decap(mlxsw_sp, fib_entry, op);
61c503f9
JP
4321 }
4322 return -EINVAL;
4323}
4324
4325static int mlxsw_sp_fib_entry_op(struct mlxsw_sp *mlxsw_sp,
4326 struct mlxsw_sp_fib_entry *fib_entry,
4327 enum mlxsw_reg_ralue_op op)
4328{
9dbf4d76 4329 int err = __mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry, op);
013b20f9 4330
013b20f9 4331 mlxsw_sp_fib_entry_offload_refresh(fib_entry, op, err);
9dbf4d76 4332
013b20f9 4333 return err;
61c503f9
JP
4334}
4335
4336static int mlxsw_sp_fib_entry_update(struct mlxsw_sp *mlxsw_sp,
4337 struct mlxsw_sp_fib_entry *fib_entry)
4338{
7146da31
JP
4339 return mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry,
4340 MLXSW_REG_RALUE_OP_WRITE_WRITE);
61c503f9
JP
4341}
4342
4343static int mlxsw_sp_fib_entry_del(struct mlxsw_sp *mlxsw_sp,
4344 struct mlxsw_sp_fib_entry *fib_entry)
4345{
4346 return mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry,
4347 MLXSW_REG_RALUE_OP_WRITE_DELETE);
4348}
4349
61c503f9 4350static int
013b20f9
IS
4351mlxsw_sp_fib4_entry_type_set(struct mlxsw_sp *mlxsw_sp,
4352 const struct fib_entry_notifier_info *fen_info,
4353 struct mlxsw_sp_fib_entry *fib_entry)
61c503f9 4354{
5481d73f 4355 struct net_device *dev = fib_info_nh(fen_info->fi, 0)->fib_nh_dev;
4607f6d2 4356 union mlxsw_sp_l3addr dip = { .addr4 = htonl(fen_info->dst) };
4cf178d7 4357 u32 tb_id = mlxsw_sp_fix_tb_id(fen_info->tb_id);
4607f6d2 4358 struct mlxsw_sp_ipip_entry *ipip_entry;
b45f64d1 4359 struct fib_info *fi = fen_info->fi;
61c503f9 4360
97989ee0 4361 switch (fen_info->type) {
97989ee0 4362 case RTN_LOCAL:
4607f6d2
PM
4363 ipip_entry = mlxsw_sp_ipip_entry_find_by_decap(mlxsw_sp, dev,
4364 MLXSW_SP_L3_PROTO_IPV4, dip);
57c77ce4 4365 if (ipip_entry && ipip_entry->ol_dev->flags & IFF_UP) {
4607f6d2
PM
4366 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP;
4367 return mlxsw_sp_fib_entry_decap_init(mlxsw_sp,
4368 fib_entry,
4369 ipip_entry);
4370 }
4cf178d7
IS
4371 if (mlxsw_sp_nve_ipv4_route_is_decap(mlxsw_sp, tb_id,
4372 dip.addr4)) {
4373 u32 t_index;
4374
4375 t_index = mlxsw_sp_nve_decap_tunnel_index_get(mlxsw_sp);
4376 fib_entry->decap.tunnel_index = t_index;
4377 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP;
4378 return 0;
4379 }
4607f6d2
PM
4380 /* fall through */
4381 case RTN_BROADCAST:
61c503f9
JP
4382 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
4383 return 0;
2810c3b2
IS
4384 case RTN_BLACKHOLE:
4385 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE;
4386 return 0;
97989ee0 4387 case RTN_UNREACHABLE: /* fall through */
97989ee0
IS
4388 case RTN_PROHIBIT:
4389 /* Packets hitting these routes need to be trapped, but
4390 * can do so with a lower priority than packets directed
4391 * at the host, so use action type local instead of trap.
4392 */
61c503f9 4393 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
97989ee0
IS
4394 return 0;
4395 case RTN_UNICAST:
9b01451a 4396 if (mlxsw_sp_fi_is_gateway(mlxsw_sp, fi))
97989ee0 4397 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_REMOTE;
9b01451a
PM
4398 else
4399 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
97989ee0
IS
4400 return 0;
4401 default:
4402 return -EINVAL;
4403 }
a7ff87ac
JP
4404}
4405
4f1c7f1f 4406static struct mlxsw_sp_fib4_entry *
9aecce1c
IS
4407mlxsw_sp_fib4_entry_create(struct mlxsw_sp *mlxsw_sp,
4408 struct mlxsw_sp_fib_node *fib_node,
4409 const struct fib_entry_notifier_info *fen_info)
61c503f9 4410{
4f1c7f1f 4411 struct mlxsw_sp_fib4_entry *fib4_entry;
61c503f9 4412 struct mlxsw_sp_fib_entry *fib_entry;
61c503f9
JP
4413 int err;
4414
4f1c7f1f
IS
4415 fib4_entry = kzalloc(sizeof(*fib4_entry), GFP_KERNEL);
4416 if (!fib4_entry)
4417 return ERR_PTR(-ENOMEM);
4418 fib_entry = &fib4_entry->common;
61c503f9 4419
013b20f9 4420 err = mlxsw_sp_fib4_entry_type_set(mlxsw_sp, fen_info, fib_entry);
61c503f9 4421 if (err)
013b20f9 4422 goto err_fib4_entry_type_set;
61c503f9 4423
0e6ea2a4 4424 err = mlxsw_sp_nexthop4_group_get(mlxsw_sp, fib_entry, fen_info->fi);
b8399a1e 4425 if (err)
0e6ea2a4 4426 goto err_nexthop4_group_get;
b8399a1e 4427
4f1c7f1f
IS
4428 fib4_entry->prio = fen_info->fi->fib_priority;
4429 fib4_entry->tb_id = fen_info->tb_id;
4430 fib4_entry->type = fen_info->type;
4431 fib4_entry->tos = fen_info->tos;
9aecce1c
IS
4432
4433 fib_entry->fib_node = fib_node;
4434
4f1c7f1f 4435 return fib4_entry;
5b004412 4436
0e6ea2a4 4437err_nexthop4_group_get:
013b20f9 4438err_fib4_entry_type_set:
4f1c7f1f 4439 kfree(fib4_entry);
5b004412
JP
4440 return ERR_PTR(err);
4441}
4442
9aecce1c 4443static void mlxsw_sp_fib4_entry_destroy(struct mlxsw_sp *mlxsw_sp,
4f1c7f1f 4444 struct mlxsw_sp_fib4_entry *fib4_entry)
9aecce1c 4445{
0e6ea2a4 4446 mlxsw_sp_nexthop4_group_put(mlxsw_sp, &fib4_entry->common);
4f1c7f1f 4447 kfree(fib4_entry);
9aecce1c
IS
4448}
4449
4f1c7f1f 4450static struct mlxsw_sp_fib4_entry *
9aecce1c
IS
4451mlxsw_sp_fib4_entry_lookup(struct mlxsw_sp *mlxsw_sp,
4452 const struct fib_entry_notifier_info *fen_info)
5b004412 4453{
4f1c7f1f 4454 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 4455 struct mlxsw_sp_fib_node *fib_node;
160e22aa
IS
4456 struct mlxsw_sp_fib *fib;
4457 struct mlxsw_sp_vr *vr;
4458
4459 vr = mlxsw_sp_vr_find(mlxsw_sp, fen_info->tb_id);
4460 if (!vr)
4461 return NULL;
4462 fib = mlxsw_sp_vr_fib(vr, MLXSW_SP_L3_PROTO_IPV4);
5b004412 4463
160e22aa
IS
4464 fib_node = mlxsw_sp_fib_node_lookup(fib, &fen_info->dst,
4465 sizeof(fen_info->dst),
4466 fen_info->dst_len);
4467 if (!fib_node)
9aecce1c
IS
4468 return NULL;
4469
4f1c7f1f
IS
4470 list_for_each_entry(fib4_entry, &fib_node->entry_list, common.list) {
4471 if (fib4_entry->tb_id == fen_info->tb_id &&
4472 fib4_entry->tos == fen_info->tos &&
4473 fib4_entry->type == fen_info->type &&
ba31d366
AS
4474 mlxsw_sp_nexthop4_group_fi(fib4_entry->common.nh_group) ==
4475 fen_info->fi) {
4f1c7f1f 4476 return fib4_entry;
9aecce1c
IS
4477 }
4478 }
4479
4480 return NULL;
4481}
4482
4483static const struct rhashtable_params mlxsw_sp_fib_ht_params = {
4484 .key_offset = offsetof(struct mlxsw_sp_fib_node, key),
4485 .head_offset = offsetof(struct mlxsw_sp_fib_node, ht_node),
4486 .key_len = sizeof(struct mlxsw_sp_fib_key),
4487 .automatic_shrinking = true,
4488};
4489
4490static int mlxsw_sp_fib_node_insert(struct mlxsw_sp_fib *fib,
4491 struct mlxsw_sp_fib_node *fib_node)
4492{
4493 return rhashtable_insert_fast(&fib->ht, &fib_node->ht_node,
4494 mlxsw_sp_fib_ht_params);
4495}
4496
4497static void mlxsw_sp_fib_node_remove(struct mlxsw_sp_fib *fib,
4498 struct mlxsw_sp_fib_node *fib_node)
4499{
4500 rhashtable_remove_fast(&fib->ht, &fib_node->ht_node,
4501 mlxsw_sp_fib_ht_params);
4502}
4503
4504static struct mlxsw_sp_fib_node *
4505mlxsw_sp_fib_node_lookup(struct mlxsw_sp_fib *fib, const void *addr,
4506 size_t addr_len, unsigned char prefix_len)
4507{
4508 struct mlxsw_sp_fib_key key;
4509
4510 memset(&key, 0, sizeof(key));
4511 memcpy(key.addr, addr, addr_len);
4512 key.prefix_len = prefix_len;
4513 return rhashtable_lookup_fast(&fib->ht, &key, mlxsw_sp_fib_ht_params);
4514}
4515
4516static struct mlxsw_sp_fib_node *
76610ebb 4517mlxsw_sp_fib_node_create(struct mlxsw_sp_fib *fib, const void *addr,
9aecce1c
IS
4518 size_t addr_len, unsigned char prefix_len)
4519{
4520 struct mlxsw_sp_fib_node *fib_node;
4521
4522 fib_node = kzalloc(sizeof(*fib_node), GFP_KERNEL);
4523 if (!fib_node)
5b004412
JP
4524 return NULL;
4525
9aecce1c 4526 INIT_LIST_HEAD(&fib_node->entry_list);
76610ebb 4527 list_add(&fib_node->list, &fib->node_list);
9aecce1c
IS
4528 memcpy(fib_node->key.addr, addr, addr_len);
4529 fib_node->key.prefix_len = prefix_len;
9aecce1c
IS
4530
4531 return fib_node;
4532}
4533
4534static void mlxsw_sp_fib_node_destroy(struct mlxsw_sp_fib_node *fib_node)
4535{
9aecce1c
IS
4536 list_del(&fib_node->list);
4537 WARN_ON(!list_empty(&fib_node->entry_list));
4538 kfree(fib_node);
4539}
4540
4541static bool
4542mlxsw_sp_fib_node_entry_is_first(const struct mlxsw_sp_fib_node *fib_node,
4543 const struct mlxsw_sp_fib_entry *fib_entry)
4544{
4545 return list_first_entry(&fib_node->entry_list,
4546 struct mlxsw_sp_fib_entry, list) == fib_entry;
4547}
4548
fc922bb0 4549static int mlxsw_sp_fib_lpm_tree_link(struct mlxsw_sp *mlxsw_sp,
fc922bb0
IS
4550 struct mlxsw_sp_fib_node *fib_node)
4551{
2b52ce02 4552 struct mlxsw_sp_prefix_usage req_prefix_usage;
3aad95df 4553 struct mlxsw_sp_fib *fib = fib_node->fib;
fc922bb0
IS
4554 struct mlxsw_sp_lpm_tree *lpm_tree;
4555 int err;
4556
2b52ce02
IS
4557 lpm_tree = mlxsw_sp->router->lpm.proto_trees[fib->proto];
4558 if (lpm_tree->prefix_ref_count[fib_node->key.prefix_len] != 0)
4559 goto out;
fc922bb0 4560
2b52ce02
IS
4561 mlxsw_sp_prefix_usage_cpy(&req_prefix_usage, &lpm_tree->prefix_usage);
4562 mlxsw_sp_prefix_usage_set(&req_prefix_usage, fib_node->key.prefix_len);
fc922bb0
IS
4563 lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
4564 fib->proto);
4565 if (IS_ERR(lpm_tree))
4566 return PTR_ERR(lpm_tree);
4567
fc922bb0
IS
4568 err = mlxsw_sp_vrs_lpm_tree_replace(mlxsw_sp, fib, lpm_tree);
4569 if (err)
2b52ce02 4570 goto err_lpm_tree_replace;
fc922bb0 4571
2b52ce02
IS
4572out:
4573 lpm_tree->prefix_ref_count[fib_node->key.prefix_len]++;
fc922bb0 4574 return 0;
2b52ce02
IS
4575
4576err_lpm_tree_replace:
4577 mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
4578 return err;
fc922bb0
IS
4579}
4580
4581static void mlxsw_sp_fib_lpm_tree_unlink(struct mlxsw_sp *mlxsw_sp,
3aad95df 4582 struct mlxsw_sp_fib_node *fib_node)
fc922bb0 4583{
2b52ce02
IS
4584 struct mlxsw_sp_lpm_tree *lpm_tree = fib_node->fib->lpm_tree;
4585 struct mlxsw_sp_prefix_usage req_prefix_usage;
3aad95df 4586 struct mlxsw_sp_fib *fib = fib_node->fib;
2b52ce02 4587 int err;
3aad95df 4588
2b52ce02 4589 if (--lpm_tree->prefix_ref_count[fib_node->key.prefix_len] != 0)
fc922bb0 4590 return;
2b52ce02
IS
4591 /* Try to construct a new LPM tree from the current prefix usage
4592 * minus the unused one. If we fail, continue using the old one.
4fd00312 4593 */
2b52ce02
IS
4594 mlxsw_sp_prefix_usage_cpy(&req_prefix_usage, &lpm_tree->prefix_usage);
4595 mlxsw_sp_prefix_usage_clear(&req_prefix_usage,
4596 fib_node->key.prefix_len);
4597 lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
4598 fib->proto);
4599 if (IS_ERR(lpm_tree))
4600 return;
9aecce1c 4601
2b52ce02
IS
4602 err = mlxsw_sp_vrs_lpm_tree_replace(mlxsw_sp, fib, lpm_tree);
4603 if (err)
4604 goto err_lpm_tree_replace;
9aecce1c 4605
2b52ce02 4606 return;
9aecce1c 4607
2b52ce02
IS
4608err_lpm_tree_replace:
4609 mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
5b004412
JP
4610}
4611
76610ebb
IS
4612static int mlxsw_sp_fib_node_init(struct mlxsw_sp *mlxsw_sp,
4613 struct mlxsw_sp_fib_node *fib_node,
4614 struct mlxsw_sp_fib *fib)
4615{
76610ebb
IS
4616 int err;
4617
4618 err = mlxsw_sp_fib_node_insert(fib, fib_node);
4619 if (err)
4620 return err;
4621 fib_node->fib = fib;
4622
3aad95df 4623 err = mlxsw_sp_fib_lpm_tree_link(mlxsw_sp, fib_node);
fc922bb0
IS
4624 if (err)
4625 goto err_fib_lpm_tree_link;
76610ebb 4626
76610ebb
IS
4627 return 0;
4628
fc922bb0 4629err_fib_lpm_tree_link:
76610ebb
IS
4630 fib_node->fib = NULL;
4631 mlxsw_sp_fib_node_remove(fib, fib_node);
4632 return err;
4633}
4634
4635static void mlxsw_sp_fib_node_fini(struct mlxsw_sp *mlxsw_sp,
4636 struct mlxsw_sp_fib_node *fib_node)
4637{
76610ebb
IS
4638 struct mlxsw_sp_fib *fib = fib_node->fib;
4639
3aad95df 4640 mlxsw_sp_fib_lpm_tree_unlink(mlxsw_sp, fib_node);
76610ebb
IS
4641 fib_node->fib = NULL;
4642 mlxsw_sp_fib_node_remove(fib, fib_node);
4643}
4644
9aecce1c 4645static struct mlxsw_sp_fib_node *
731ea1ca
IS
4646mlxsw_sp_fib_node_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id, const void *addr,
4647 size_t addr_len, unsigned char prefix_len,
4648 enum mlxsw_sp_l3proto proto)
5b004412 4649{
9aecce1c 4650 struct mlxsw_sp_fib_node *fib_node;
76610ebb 4651 struct mlxsw_sp_fib *fib;
9aecce1c
IS
4652 struct mlxsw_sp_vr *vr;
4653 int err;
4654
f8fa9b4e 4655 vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id, NULL);
9aecce1c
IS
4656 if (IS_ERR(vr))
4657 return ERR_CAST(vr);
731ea1ca 4658 fib = mlxsw_sp_vr_fib(vr, proto);
9aecce1c 4659
731ea1ca 4660 fib_node = mlxsw_sp_fib_node_lookup(fib, addr, addr_len, prefix_len);
9aecce1c
IS
4661 if (fib_node)
4662 return fib_node;
5b004412 4663
731ea1ca 4664 fib_node = mlxsw_sp_fib_node_create(fib, addr, addr_len, prefix_len);
9aecce1c
IS
4665 if (!fib_node) {
4666 err = -ENOMEM;
4667 goto err_fib_node_create;
5b004412 4668 }
9aecce1c 4669
76610ebb
IS
4670 err = mlxsw_sp_fib_node_init(mlxsw_sp, fib_node, fib);
4671 if (err)
4672 goto err_fib_node_init;
4673
9aecce1c
IS
4674 return fib_node;
4675
76610ebb
IS
4676err_fib_node_init:
4677 mlxsw_sp_fib_node_destroy(fib_node);
9aecce1c 4678err_fib_node_create:
2b52ce02 4679 mlxsw_sp_vr_put(mlxsw_sp, vr);
9aecce1c 4680 return ERR_PTR(err);
5b004412
JP
4681}
4682
731ea1ca
IS
4683static void mlxsw_sp_fib_node_put(struct mlxsw_sp *mlxsw_sp,
4684 struct mlxsw_sp_fib_node *fib_node)
5b004412 4685{
76610ebb 4686 struct mlxsw_sp_vr *vr = fib_node->fib->vr;
5b004412 4687
9aecce1c
IS
4688 if (!list_empty(&fib_node->entry_list))
4689 return;
76610ebb 4690 mlxsw_sp_fib_node_fini(mlxsw_sp, fib_node);
9aecce1c 4691 mlxsw_sp_fib_node_destroy(fib_node);
2b52ce02 4692 mlxsw_sp_vr_put(mlxsw_sp, vr);
61c503f9
JP
4693}
4694
4f1c7f1f 4695static struct mlxsw_sp_fib4_entry *
9aecce1c 4696mlxsw_sp_fib4_node_entry_find(const struct mlxsw_sp_fib_node *fib_node,
4f1c7f1f 4697 const struct mlxsw_sp_fib4_entry *new4_entry)
61c503f9 4698{
4f1c7f1f 4699 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 4700
4f1c7f1f
IS
4701 list_for_each_entry(fib4_entry, &fib_node->entry_list, common.list) {
4702 if (fib4_entry->tb_id > new4_entry->tb_id)
9aecce1c 4703 continue;
4f1c7f1f 4704 if (fib4_entry->tb_id != new4_entry->tb_id)
9aecce1c 4705 break;
4f1c7f1f 4706 if (fib4_entry->tos > new4_entry->tos)
9aecce1c 4707 continue;
4f1c7f1f
IS
4708 if (fib4_entry->prio >= new4_entry->prio ||
4709 fib4_entry->tos < new4_entry->tos)
4710 return fib4_entry;
9aecce1c
IS
4711 }
4712
4713 return NULL;
4714}
4715
4f1c7f1f
IS
4716static int
4717mlxsw_sp_fib4_node_list_append(struct mlxsw_sp_fib4_entry *fib4_entry,
4718 struct mlxsw_sp_fib4_entry *new4_entry)
4283bce5
IS
4719{
4720 struct mlxsw_sp_fib_node *fib_node;
4721
4f1c7f1f 4722 if (WARN_ON(!fib4_entry))
4283bce5
IS
4723 return -EINVAL;
4724
4f1c7f1f
IS
4725 fib_node = fib4_entry->common.fib_node;
4726 list_for_each_entry_from(fib4_entry, &fib_node->entry_list,
4727 common.list) {
4728 if (fib4_entry->tb_id != new4_entry->tb_id ||
4729 fib4_entry->tos != new4_entry->tos ||
4730 fib4_entry->prio != new4_entry->prio)
4283bce5
IS
4731 break;
4732 }
4733
4f1c7f1f 4734 list_add_tail(&new4_entry->common.list, &fib4_entry->common.list);
4283bce5
IS
4735 return 0;
4736}
4737
9aecce1c 4738static int
9efbee6f 4739mlxsw_sp_fib4_node_list_insert(struct mlxsw_sp_fib4_entry *new4_entry,
599cf8f9 4740 bool replace, bool append)
9aecce1c 4741{
9efbee6f 4742 struct mlxsw_sp_fib_node *fib_node = new4_entry->common.fib_node;
4f1c7f1f 4743 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 4744
4f1c7f1f 4745 fib4_entry = mlxsw_sp_fib4_node_entry_find(fib_node, new4_entry);
9aecce1c 4746
4283bce5 4747 if (append)
4f1c7f1f
IS
4748 return mlxsw_sp_fib4_node_list_append(fib4_entry, new4_entry);
4749 if (replace && WARN_ON(!fib4_entry))
599cf8f9 4750 return -EINVAL;
4283bce5 4751
599cf8f9
IS
4752 /* Insert new entry before replaced one, so that we can later
4753 * remove the second.
4754 */
4f1c7f1f
IS
4755 if (fib4_entry) {
4756 list_add_tail(&new4_entry->common.list,
4757 &fib4_entry->common.list);
9aecce1c 4758 } else {
4f1c7f1f 4759 struct mlxsw_sp_fib4_entry *last;
9aecce1c 4760
4f1c7f1f
IS
4761 list_for_each_entry(last, &fib_node->entry_list, common.list) {
4762 if (new4_entry->tb_id > last->tb_id)
9aecce1c 4763 break;
4f1c7f1f 4764 fib4_entry = last;
9aecce1c
IS
4765 }
4766
4f1c7f1f
IS
4767 if (fib4_entry)
4768 list_add(&new4_entry->common.list,
4769 &fib4_entry->common.list);
9aecce1c 4770 else
4f1c7f1f
IS
4771 list_add(&new4_entry->common.list,
4772 &fib_node->entry_list);
9aecce1c
IS
4773 }
4774
4775 return 0;
4776}
4777
4778static void
4f1c7f1f 4779mlxsw_sp_fib4_node_list_remove(struct mlxsw_sp_fib4_entry *fib4_entry)
9aecce1c 4780{
4f1c7f1f 4781 list_del(&fib4_entry->common.list);
9aecce1c
IS
4782}
4783
80c238f9
IS
4784static int mlxsw_sp_fib_node_entry_add(struct mlxsw_sp *mlxsw_sp,
4785 struct mlxsw_sp_fib_entry *fib_entry)
9aecce1c 4786{
9efbee6f
IS
4787 struct mlxsw_sp_fib_node *fib_node = fib_entry->fib_node;
4788
9aecce1c
IS
4789 if (!mlxsw_sp_fib_node_entry_is_first(fib_node, fib_entry))
4790 return 0;
4791
4792 /* To prevent packet loss, overwrite the previously offloaded
4793 * entry.
4794 */
4795 if (!list_is_singular(&fib_node->entry_list)) {
4796 enum mlxsw_reg_ralue_op op = MLXSW_REG_RALUE_OP_WRITE_DELETE;
4797 struct mlxsw_sp_fib_entry *n = list_next_entry(fib_entry, list);
4798
4799 mlxsw_sp_fib_entry_offload_refresh(n, op, 0);
4800 }
4801
4802 return mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
4803}
4804
80c238f9
IS
4805static void mlxsw_sp_fib_node_entry_del(struct mlxsw_sp *mlxsw_sp,
4806 struct mlxsw_sp_fib_entry *fib_entry)
9aecce1c 4807{
9efbee6f
IS
4808 struct mlxsw_sp_fib_node *fib_node = fib_entry->fib_node;
4809
9aecce1c
IS
4810 if (!mlxsw_sp_fib_node_entry_is_first(fib_node, fib_entry))
4811 return;
4812
4813 /* Promote the next entry by overwriting the deleted entry */
4814 if (!list_is_singular(&fib_node->entry_list)) {
4815 struct mlxsw_sp_fib_entry *n = list_next_entry(fib_entry, list);
4816 enum mlxsw_reg_ralue_op op = MLXSW_REG_RALUE_OP_WRITE_DELETE;
4817
4818 mlxsw_sp_fib_entry_update(mlxsw_sp, n);
4819 mlxsw_sp_fib_entry_offload_refresh(fib_entry, op, 0);
4820 return;
4821 }
4822
4823 mlxsw_sp_fib_entry_del(mlxsw_sp, fib_entry);
4824}
4825
4826static int mlxsw_sp_fib4_node_entry_link(struct mlxsw_sp *mlxsw_sp,
4f1c7f1f 4827 struct mlxsw_sp_fib4_entry *fib4_entry,
599cf8f9 4828 bool replace, bool append)
9aecce1c 4829{
9aecce1c
IS
4830 int err;
4831
9efbee6f 4832 err = mlxsw_sp_fib4_node_list_insert(fib4_entry, replace, append);
9aecce1c
IS
4833 if (err)
4834 return err;
4835
80c238f9 4836 err = mlxsw_sp_fib_node_entry_add(mlxsw_sp, &fib4_entry->common);
9aecce1c 4837 if (err)
80c238f9 4838 goto err_fib_node_entry_add;
9aecce1c 4839
9aecce1c
IS
4840 return 0;
4841
80c238f9 4842err_fib_node_entry_add:
4f1c7f1f 4843 mlxsw_sp_fib4_node_list_remove(fib4_entry);
9aecce1c
IS
4844 return err;
4845}
4846
4847static void
4848mlxsw_sp_fib4_node_entry_unlink(struct mlxsw_sp *mlxsw_sp,
4f1c7f1f 4849 struct mlxsw_sp_fib4_entry *fib4_entry)
9aecce1c 4850{
80c238f9 4851 mlxsw_sp_fib_node_entry_del(mlxsw_sp, &fib4_entry->common);
4f1c7f1f 4852 mlxsw_sp_fib4_node_list_remove(fib4_entry);
4607f6d2
PM
4853
4854 if (fib4_entry->common.type == MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP)
4855 mlxsw_sp_fib_entry_decap_fini(mlxsw_sp, &fib4_entry->common);
9aecce1c
IS
4856}
4857
599cf8f9 4858static void mlxsw_sp_fib4_entry_replace(struct mlxsw_sp *mlxsw_sp,
4f1c7f1f 4859 struct mlxsw_sp_fib4_entry *fib4_entry,
599cf8f9
IS
4860 bool replace)
4861{
4f1c7f1f
IS
4862 struct mlxsw_sp_fib_node *fib_node = fib4_entry->common.fib_node;
4863 struct mlxsw_sp_fib4_entry *replaced;
599cf8f9
IS
4864
4865 if (!replace)
4866 return;
4867
4868 /* We inserted the new entry before replaced one */
4f1c7f1f 4869 replaced = list_next_entry(fib4_entry, common.list);
599cf8f9
IS
4870
4871 mlxsw_sp_fib4_node_entry_unlink(mlxsw_sp, replaced);
4872 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, replaced);
731ea1ca 4873 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
599cf8f9
IS
4874}
4875
9aecce1c
IS
4876static int
4877mlxsw_sp_router_fib4_add(struct mlxsw_sp *mlxsw_sp,
4283bce5 4878 const struct fib_entry_notifier_info *fen_info,
599cf8f9 4879 bool replace, bool append)
9aecce1c 4880{
4f1c7f1f 4881 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 4882 struct mlxsw_sp_fib_node *fib_node;
61c503f9
JP
4883 int err;
4884
9011b677 4885 if (mlxsw_sp->router->aborted)
b45f64d1
JP
4886 return 0;
4887
731ea1ca
IS
4888 fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, fen_info->tb_id,
4889 &fen_info->dst, sizeof(fen_info->dst),
4890 fen_info->dst_len,
4891 MLXSW_SP_L3_PROTO_IPV4);
9aecce1c
IS
4892 if (IS_ERR(fib_node)) {
4893 dev_warn(mlxsw_sp->bus_info->dev, "Failed to get FIB node\n");
4894 return PTR_ERR(fib_node);
b45f64d1 4895 }
61c503f9 4896
4f1c7f1f
IS
4897 fib4_entry = mlxsw_sp_fib4_entry_create(mlxsw_sp, fib_node, fen_info);
4898 if (IS_ERR(fib4_entry)) {
9aecce1c 4899 dev_warn(mlxsw_sp->bus_info->dev, "Failed to create FIB entry\n");
4f1c7f1f 4900 err = PTR_ERR(fib4_entry);
9aecce1c
IS
4901 goto err_fib4_entry_create;
4902 }
5b004412 4903
4f1c7f1f 4904 err = mlxsw_sp_fib4_node_entry_link(mlxsw_sp, fib4_entry, replace,
599cf8f9 4905 append);
b45f64d1 4906 if (err) {
9aecce1c
IS
4907 dev_warn(mlxsw_sp->bus_info->dev, "Failed to link FIB entry to node\n");
4908 goto err_fib4_node_entry_link;
b45f64d1 4909 }
9aecce1c 4910
4f1c7f1f 4911 mlxsw_sp_fib4_entry_replace(mlxsw_sp, fib4_entry, replace);
599cf8f9 4912
61c503f9
JP
4913 return 0;
4914
9aecce1c 4915err_fib4_node_entry_link:
4f1c7f1f 4916 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
9aecce1c 4917err_fib4_entry_create:
731ea1ca 4918 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
61c503f9
JP
4919 return err;
4920}
4921
37956d78
JP
4922static void mlxsw_sp_router_fib4_del(struct mlxsw_sp *mlxsw_sp,
4923 struct fib_entry_notifier_info *fen_info)
61c503f9 4924{
4f1c7f1f 4925 struct mlxsw_sp_fib4_entry *fib4_entry;
9aecce1c 4926 struct mlxsw_sp_fib_node *fib_node;
61c503f9 4927
9011b677 4928 if (mlxsw_sp->router->aborted)
37956d78 4929 return;
b45f64d1 4930
4f1c7f1f
IS
4931 fib4_entry = mlxsw_sp_fib4_entry_lookup(mlxsw_sp, fen_info);
4932 if (WARN_ON(!fib4_entry))
37956d78 4933 return;
4f1c7f1f 4934 fib_node = fib4_entry->common.fib_node;
5b004412 4935
4f1c7f1f
IS
4936 mlxsw_sp_fib4_node_entry_unlink(mlxsw_sp, fib4_entry);
4937 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
731ea1ca 4938 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
61c503f9 4939}
b45f64d1 4940
8d1c802b 4941static bool mlxsw_sp_fib6_rt_should_ignore(const struct fib6_info *rt)
428b851f
IS
4942{
4943 /* Packets with link-local destination IP arriving to the router
4944 * are trapped to the CPU, so no need to program specific routes
4945 * for them.
4946 */
93c2fb25 4947 if (ipv6_addr_type(&rt->fib6_dst.addr) & IPV6_ADDR_LINKLOCAL)
428b851f
IS
4948 return true;
4949
4950 /* Multicast routes aren't supported, so ignore them. Neighbour
4951 * Discovery packets are specifically trapped.
4952 */
93c2fb25 4953 if (ipv6_addr_type(&rt->fib6_dst.addr) & IPV6_ADDR_MULTICAST)
428b851f
IS
4954 return true;
4955
4956 /* Cloned routes are irrelevant in the forwarding path. */
93c2fb25 4957 if (rt->fib6_flags & RTF_CACHE)
428b851f
IS
4958 return true;
4959
4960 return false;
4961}
4962
8d1c802b 4963static struct mlxsw_sp_rt6 *mlxsw_sp_rt6_create(struct fib6_info *rt)
428b851f
IS
4964{
4965 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
4966
4967 mlxsw_sp_rt6 = kzalloc(sizeof(*mlxsw_sp_rt6), GFP_KERNEL);
4968 if (!mlxsw_sp_rt6)
4969 return ERR_PTR(-ENOMEM);
4970
4971 /* In case of route replace, replaced route is deleted with
4972 * no notification. Take reference to prevent accessing freed
4973 * memory.
4974 */
4975 mlxsw_sp_rt6->rt = rt;
8d1c802b 4976 fib6_info_hold(rt);
428b851f
IS
4977
4978 return mlxsw_sp_rt6;
4979}
4980
4981#if IS_ENABLED(CONFIG_IPV6)
8d1c802b 4982static void mlxsw_sp_rt6_release(struct fib6_info *rt)
428b851f 4983{
8d1c802b 4984 fib6_info_release(rt);
428b851f
IS
4985}
4986#else
8d1c802b 4987static void mlxsw_sp_rt6_release(struct fib6_info *rt)
428b851f
IS
4988{
4989}
4990#endif
4991
4992static void mlxsw_sp_rt6_destroy(struct mlxsw_sp_rt6 *mlxsw_sp_rt6)
4993{
4994 mlxsw_sp_rt6_release(mlxsw_sp_rt6->rt);
4995 kfree(mlxsw_sp_rt6);
4996}
4997
33bd5ac5
DA
4998static bool mlxsw_sp_fib6_rt_can_mp(const struct fib6_info *rt)
4999{
5000 /* RTF_CACHE routes are ignored */
1cf844c7
DA
5001 return !(rt->fib6_flags & RTF_ADDRCONF) &&
5002 rt->fib6_nh->fib_nh_gw_family;
33bd5ac5
DA
5003}
5004
8d1c802b 5005static struct fib6_info *
428b851f
IS
5006mlxsw_sp_fib6_entry_rt(const struct mlxsw_sp_fib6_entry *fib6_entry)
5007{
5008 return list_first_entry(&fib6_entry->rt6_list, struct mlxsw_sp_rt6,
5009 list)->rt;
5010}
5011
5012static struct mlxsw_sp_fib6_entry *
5013mlxsw_sp_fib6_node_mp_entry_find(const struct mlxsw_sp_fib_node *fib_node,
33bd5ac5 5014 const struct fib6_info *nrt, bool replace)
428b851f
IS
5015{
5016 struct mlxsw_sp_fib6_entry *fib6_entry;
5017
33bd5ac5 5018 if (!mlxsw_sp_fib6_rt_can_mp(nrt) || replace)
428b851f
IS
5019 return NULL;
5020
5021 list_for_each_entry(fib6_entry, &fib_node->entry_list, common.list) {
8d1c802b 5022 struct fib6_info *rt = mlxsw_sp_fib6_entry_rt(fib6_entry);
428b851f
IS
5023
5024 /* RT6_TABLE_LOCAL and RT6_TABLE_MAIN share the same
5025 * virtual router.
5026 */
93c2fb25 5027 if (rt->fib6_table->tb6_id > nrt->fib6_table->tb6_id)
428b851f 5028 continue;
93c2fb25 5029 if (rt->fib6_table->tb6_id != nrt->fib6_table->tb6_id)
428b851f 5030 break;
93c2fb25 5031 if (rt->fib6_metric < nrt->fib6_metric)
428b851f 5032 continue;
33bd5ac5
DA
5033 if (rt->fib6_metric == nrt->fib6_metric &&
5034 mlxsw_sp_fib6_rt_can_mp(rt))
428b851f 5035 return fib6_entry;
93c2fb25 5036 if (rt->fib6_metric > nrt->fib6_metric)
428b851f
IS
5037 break;
5038 }
5039
5040 return NULL;
5041}
5042
5043static struct mlxsw_sp_rt6 *
5044mlxsw_sp_fib6_entry_rt_find(const struct mlxsw_sp_fib6_entry *fib6_entry,
8d1c802b 5045 const struct fib6_info *rt)
428b851f
IS
5046{
5047 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
5048
5049 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) {
5050 if (mlxsw_sp_rt6->rt == rt)
5051 return mlxsw_sp_rt6;
5052 }
5053
5054 return NULL;
5055}
5056
8f28a309 5057static bool mlxsw_sp_nexthop6_ipip_type(const struct mlxsw_sp *mlxsw_sp,
8d1c802b 5058 const struct fib6_info *rt,
8f28a309
PM
5059 enum mlxsw_sp_ipip_type *ret)
5060{
1cf844c7
DA
5061 return rt->fib6_nh->fib_nh_dev &&
5062 mlxsw_sp_netdev_ipip_type(mlxsw_sp, rt->fib6_nh->fib_nh_dev, ret);
8f28a309
PM
5063}
5064
35225e47
PM
5065static int mlxsw_sp_nexthop6_type_init(struct mlxsw_sp *mlxsw_sp,
5066 struct mlxsw_sp_nexthop_group *nh_grp,
5067 struct mlxsw_sp_nexthop *nh,
8d1c802b 5068 const struct fib6_info *rt)
428b851f 5069{
d97cda5f
PM
5070 const struct mlxsw_sp_ipip_ops *ipip_ops;
5071 struct mlxsw_sp_ipip_entry *ipip_entry;
1cf844c7 5072 struct net_device *dev = rt->fib6_nh->fib_nh_dev;
428b851f
IS
5073 struct mlxsw_sp_rif *rif;
5074 int err;
5075
d97cda5f
PM
5076 ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, dev);
5077 if (ipip_entry) {
5078 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
5079 if (ipip_ops->can_offload(mlxsw_sp, dev,
5080 MLXSW_SP_L3_PROTO_IPV6)) {
5081 nh->type = MLXSW_SP_NEXTHOP_TYPE_IPIP;
5082 mlxsw_sp_nexthop_ipip_init(mlxsw_sp, nh, ipip_entry);
5083 return 0;
5084 }
8f28a309
PM
5085 }
5086
35225e47 5087 nh->type = MLXSW_SP_NEXTHOP_TYPE_ETH;
428b851f
IS
5088 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
5089 if (!rif)
5090 return 0;
5091 mlxsw_sp_nexthop_rif_init(nh, rif);
5092
5093 err = mlxsw_sp_nexthop_neigh_init(mlxsw_sp, nh);
5094 if (err)
5095 goto err_nexthop_neigh_init;
5096
5097 return 0;
5098
5099err_nexthop_neigh_init:
5100 mlxsw_sp_nexthop_rif_fini(nh);
5101 return err;
5102}
5103
/* Tear down the type-specific state of an IPv6 nexthop.
 *
 * Thin wrapper that forwards to the protocol-independent
 * mlxsw_sp_nexthop_type_fini().
 */
static void mlxsw_sp_nexthop6_type_fini(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_nexthop *nh)
{
	mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh);
}
5109
5110static int mlxsw_sp_nexthop6_init(struct mlxsw_sp *mlxsw_sp,
5111 struct mlxsw_sp_nexthop_group *nh_grp,
5112 struct mlxsw_sp_nexthop *nh,
8d1c802b 5113 const struct fib6_info *rt)
35225e47 5114{
1cf844c7 5115 struct net_device *dev = rt->fib6_nh->fib_nh_dev;
35225e47
PM
5116
5117 nh->nh_grp = nh_grp;
1cf844c7
DA
5118 nh->nh_weight = rt->fib6_nh->fib_nh_weight;
5119 memcpy(&nh->gw_addr, &rt->fib6_nh->fib_nh_gw6, sizeof(nh->gw_addr));
a5390278 5120 mlxsw_sp_nexthop_counter_alloc(mlxsw_sp, nh);
35225e47 5121
dbe4598c
AS
5122 list_add_tail(&nh->router_list_node, &mlxsw_sp->router->nexthop_list);
5123
35225e47
PM
5124 if (!dev)
5125 return 0;
5126 nh->ifindex = dev->ifindex;
5127
5128 return mlxsw_sp_nexthop6_type_init(mlxsw_sp, nh_grp, nh, rt);
5129}
5130
428b851f
IS
5131static void mlxsw_sp_nexthop6_fini(struct mlxsw_sp *mlxsw_sp,
5132 struct mlxsw_sp_nexthop *nh)
5133{
35225e47 5134 mlxsw_sp_nexthop6_type_fini(mlxsw_sp, nh);
dbe4598c 5135 list_del(&nh->router_list_node);
a5390278 5136 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh);
428b851f
IS
5137}
5138
f6050ee6 5139static bool mlxsw_sp_rt6_is_gateway(const struct mlxsw_sp *mlxsw_sp,
8d1c802b 5140 const struct fib6_info *rt)
f6050ee6 5141{
1cf844c7 5142 return rt->fib6_nh->fib_nh_gw_family ||
8f28a309 5143 mlxsw_sp_nexthop6_ipip_type(mlxsw_sp, rt, NULL);
f6050ee6
PM
5144}
5145
428b851f
IS
5146static struct mlxsw_sp_nexthop_group *
5147mlxsw_sp_nexthop6_group_create(struct mlxsw_sp *mlxsw_sp,
5148 struct mlxsw_sp_fib6_entry *fib6_entry)
5149{
5150 struct mlxsw_sp_nexthop_group *nh_grp;
5151 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
5152 struct mlxsw_sp_nexthop *nh;
428b851f
IS
5153 int i = 0;
5154 int err;
5155
9e475293
GS
5156 nh_grp = kzalloc(struct_size(nh_grp, nexthops, fib6_entry->nrt6),
5157 GFP_KERNEL);
428b851f
IS
5158 if (!nh_grp)
5159 return ERR_PTR(-ENOMEM);
5160 INIT_LIST_HEAD(&nh_grp->fib_list);
5161#if IS_ENABLED(CONFIG_IPV6)
5162 nh_grp->neigh_tbl = &nd_tbl;
5163#endif
5164 mlxsw_sp_rt6 = list_first_entry(&fib6_entry->rt6_list,
5165 struct mlxsw_sp_rt6, list);
f6050ee6 5166 nh_grp->gateway = mlxsw_sp_rt6_is_gateway(mlxsw_sp, mlxsw_sp_rt6->rt);
428b851f
IS
5167 nh_grp->count = fib6_entry->nrt6;
5168 for (i = 0; i < nh_grp->count; i++) {
8d1c802b 5169 struct fib6_info *rt = mlxsw_sp_rt6->rt;
428b851f
IS
5170
5171 nh = &nh_grp->nexthops[i];
5172 err = mlxsw_sp_nexthop6_init(mlxsw_sp, nh_grp, nh, rt);
5173 if (err)
5174 goto err_nexthop6_init;
5175 mlxsw_sp_rt6 = list_next_entry(mlxsw_sp_rt6, list);
5176 }
e6f3b379
AS
5177
5178 err = mlxsw_sp_nexthop_group_insert(mlxsw_sp, nh_grp);
5179 if (err)
5180 goto err_nexthop_group_insert;
5181
428b851f
IS
5182 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
5183 return nh_grp;
5184
e6f3b379 5185err_nexthop_group_insert:
428b851f
IS
5186err_nexthop6_init:
5187 for (i--; i >= 0; i--) {
5188 nh = &nh_grp->nexthops[i];
5189 mlxsw_sp_nexthop6_fini(mlxsw_sp, nh);
5190 }
5191 kfree(nh_grp);
5192 return ERR_PTR(err);
5193}
5194
5195static void
5196mlxsw_sp_nexthop6_group_destroy(struct mlxsw_sp *mlxsw_sp,
5197 struct mlxsw_sp_nexthop_group *nh_grp)
5198{
5199 struct mlxsw_sp_nexthop *nh;
5200 int i = nh_grp->count;
5201
e6f3b379 5202 mlxsw_sp_nexthop_group_remove(mlxsw_sp, nh_grp);
428b851f
IS
5203 for (i--; i >= 0; i--) {
5204 nh = &nh_grp->nexthops[i];
5205 mlxsw_sp_nexthop6_fini(mlxsw_sp, nh);
5206 }
5207 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp);
5208 WARN_ON(nh_grp->adj_index_valid);
5209 kfree(nh_grp);
5210}
5211
5212static int mlxsw_sp_nexthop6_group_get(struct mlxsw_sp *mlxsw_sp,
5213 struct mlxsw_sp_fib6_entry *fib6_entry)
5214{
5215 struct mlxsw_sp_nexthop_group *nh_grp;
5216
e6f3b379
AS
5217 nh_grp = mlxsw_sp_nexthop6_group_lookup(mlxsw_sp, fib6_entry);
5218 if (!nh_grp) {
5219 nh_grp = mlxsw_sp_nexthop6_group_create(mlxsw_sp, fib6_entry);
5220 if (IS_ERR(nh_grp))
5221 return PTR_ERR(nh_grp);
5222 }
428b851f
IS
5223
5224 list_add_tail(&fib6_entry->common.nexthop_group_node,
5225 &nh_grp->fib_list);
5226 fib6_entry->common.nh_group = nh_grp;
5227
5228 return 0;
5229}
5230
5231static void mlxsw_sp_nexthop6_group_put(struct mlxsw_sp *mlxsw_sp,
5232 struct mlxsw_sp_fib_entry *fib_entry)
5233{
5234 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group;
5235
5236 list_del(&fib_entry->nexthop_group_node);
5237 if (!list_empty(&nh_grp->fib_list))
5238 return;
5239 mlxsw_sp_nexthop6_group_destroy(mlxsw_sp, nh_grp);
5240}
5241
5242static int
5243mlxsw_sp_nexthop6_group_update(struct mlxsw_sp *mlxsw_sp,
5244 struct mlxsw_sp_fib6_entry *fib6_entry)
5245{
5246 struct mlxsw_sp_nexthop_group *old_nh_grp = fib6_entry->common.nh_group;
5247 int err;
5248
5249 fib6_entry->common.nh_group = NULL;
5250 list_del(&fib6_entry->common.nexthop_group_node);
5251
5252 err = mlxsw_sp_nexthop6_group_get(mlxsw_sp, fib6_entry);
5253 if (err)
5254 goto err_nexthop6_group_get;
5255
5256 /* In case this entry is offloaded, then the adjacency index
5257 * currently associated with it in the device's table is that
5258 * of the old group. Start using the new one instead.
5259 */
5260 err = mlxsw_sp_fib_node_entry_add(mlxsw_sp, &fib6_entry->common);
5261 if (err)
5262 goto err_fib_node_entry_add;
5263
5264 if (list_empty(&old_nh_grp->fib_list))
5265 mlxsw_sp_nexthop6_group_destroy(mlxsw_sp, old_nh_grp);
5266
5267 return 0;
5268
5269err_fib_node_entry_add:
5270 mlxsw_sp_nexthop6_group_put(mlxsw_sp, &fib6_entry->common);
5271err_nexthop6_group_get:
5272 list_add_tail(&fib6_entry->common.nexthop_group_node,
5273 &old_nh_grp->fib_list);
5274 fib6_entry->common.nh_group = old_nh_grp;
5275 return err;
5276}
5277
5278static int
5279mlxsw_sp_fib6_entry_nexthop_add(struct mlxsw_sp *mlxsw_sp,
5280 struct mlxsw_sp_fib6_entry *fib6_entry,
d21afd30 5281 struct fib6_info **rt_arr, unsigned int nrt6)
428b851f
IS
5282{
5283 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
d21afd30 5284 int err, i;
428b851f 5285
d21afd30
IS
5286 for (i = 0; i < nrt6; i++) {
5287 mlxsw_sp_rt6 = mlxsw_sp_rt6_create(rt_arr[i]);
5288 if (IS_ERR(mlxsw_sp_rt6)) {
5289 err = PTR_ERR(mlxsw_sp_rt6);
5290 goto err_rt6_create;
5291 }
428b851f 5292
d21afd30
IS
5293 list_add_tail(&mlxsw_sp_rt6->list, &fib6_entry->rt6_list);
5294 fib6_entry->nrt6++;
5295 }
428b851f
IS
5296
5297 err = mlxsw_sp_nexthop6_group_update(mlxsw_sp, fib6_entry);
5298 if (err)
5299 goto err_nexthop6_group_update;
5300
5301 return 0;
5302
5303err_nexthop6_group_update:
d21afd30
IS
5304 i = nrt6;
5305err_rt6_create:
5306 for (i--; i >= 0; i--) {
5307 fib6_entry->nrt6--;
5308 mlxsw_sp_rt6 = list_last_entry(&fib6_entry->rt6_list,
5309 struct mlxsw_sp_rt6, list);
5310 list_del(&mlxsw_sp_rt6->list);
5311 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
5312 }
428b851f
IS
5313 return err;
5314}
5315
5316static void
5317mlxsw_sp_fib6_entry_nexthop_del(struct mlxsw_sp *mlxsw_sp,
5318 struct mlxsw_sp_fib6_entry *fib6_entry,
d21afd30 5319 struct fib6_info **rt_arr, unsigned int nrt6)
428b851f
IS
5320{
5321 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
d21afd30 5322 int i;
428b851f 5323
d21afd30
IS
5324 for (i = 0; i < nrt6; i++) {
5325 mlxsw_sp_rt6 = mlxsw_sp_fib6_entry_rt_find(fib6_entry,
5326 rt_arr[i]);
5327 if (WARN_ON_ONCE(!mlxsw_sp_rt6))
5328 continue;
5329
5330 fib6_entry->nrt6--;
5331 list_del(&mlxsw_sp_rt6->list);
5332 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
5333 }
428b851f 5334
428b851f 5335 mlxsw_sp_nexthop6_group_update(mlxsw_sp, fib6_entry);
428b851f
IS
5336}
5337
f6050ee6
PM
5338static void mlxsw_sp_fib6_entry_type_set(struct mlxsw_sp *mlxsw_sp,
5339 struct mlxsw_sp_fib_entry *fib_entry,
8d1c802b 5340 const struct fib6_info *rt)
428b851f
IS
5341{
5342 /* Packets hitting RTF_REJECT routes need to be discarded by the
5343 * stack. We can rely on their destination device not having a
5344 * RIF (it's the loopback device) and can thus use action type
5345 * local, which will cause them to be trapped with a lower
5346 * priority than packets that need to be locally received.
5347 */
93c2fb25 5348 if (rt->fib6_flags & (RTF_LOCAL | RTF_ANYCAST))
428b851f 5349 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;
2810c3b2
IS
5350 else if (rt->fib6_type == RTN_BLACKHOLE)
5351 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE;
93c2fb25 5352 else if (rt->fib6_flags & RTF_REJECT)
428b851f 5353 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
f6050ee6 5354 else if (mlxsw_sp_rt6_is_gateway(mlxsw_sp, rt))
428b851f
IS
5355 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_REMOTE;
5356 else
5357 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL;
5358}
5359
5360static void
5361mlxsw_sp_fib6_entry_rt_destroy_all(struct mlxsw_sp_fib6_entry *fib6_entry)
5362{
5363 struct mlxsw_sp_rt6 *mlxsw_sp_rt6, *tmp;
5364
5365 list_for_each_entry_safe(mlxsw_sp_rt6, tmp, &fib6_entry->rt6_list,
5366 list) {
5367 fib6_entry->nrt6--;
5368 list_del(&mlxsw_sp_rt6->list);
5369 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
5370 }
5371}
5372
5373static struct mlxsw_sp_fib6_entry *
5374mlxsw_sp_fib6_entry_create(struct mlxsw_sp *mlxsw_sp,
5375 struct mlxsw_sp_fib_node *fib_node,
2d9dd7ec 5376 struct fib6_info **rt_arr, unsigned int nrt6)
428b851f
IS
5377{
5378 struct mlxsw_sp_fib6_entry *fib6_entry;
5379 struct mlxsw_sp_fib_entry *fib_entry;
5380 struct mlxsw_sp_rt6 *mlxsw_sp_rt6;
2d9dd7ec 5381 int err, i;
428b851f
IS
5382
5383 fib6_entry = kzalloc(sizeof(*fib6_entry), GFP_KERNEL);
5384 if (!fib6_entry)
5385 return ERR_PTR(-ENOMEM);
5386 fib_entry = &fib6_entry->common;
5387
2d9dd7ec
IS
5388 INIT_LIST_HEAD(&fib6_entry->rt6_list);
5389
5390 for (i = 0; i < nrt6; i++) {
5391 mlxsw_sp_rt6 = mlxsw_sp_rt6_create(rt_arr[i]);
5392 if (IS_ERR(mlxsw_sp_rt6)) {
5393 err = PTR_ERR(mlxsw_sp_rt6);
5394 goto err_rt6_create;
5395 }
5396 list_add_tail(&mlxsw_sp_rt6->list, &fib6_entry->rt6_list);
5397 fib6_entry->nrt6++;
428b851f
IS
5398 }
5399
2d9dd7ec 5400 mlxsw_sp_fib6_entry_type_set(mlxsw_sp, fib_entry, rt_arr[0]);
428b851f 5401
428b851f
IS
5402 err = mlxsw_sp_nexthop6_group_get(mlxsw_sp, fib6_entry);
5403 if (err)
5404 goto err_nexthop6_group_get;
5405
5406 fib_entry->fib_node = fib_node;
5407
5408 return fib6_entry;
5409
5410err_nexthop6_group_get:
2d9dd7ec 5411 i = nrt6;
428b851f 5412err_rt6_create:
2d9dd7ec
IS
5413 for (i--; i >= 0; i--) {
5414 fib6_entry->nrt6--;
5415 mlxsw_sp_rt6 = list_last_entry(&fib6_entry->rt6_list,
5416 struct mlxsw_sp_rt6, list);
5417 list_del(&mlxsw_sp_rt6->list);
5418 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6);
5419 }
428b851f
IS
5420 kfree(fib6_entry);
5421 return ERR_PTR(err);
5422}
5423
5424static void mlxsw_sp_fib6_entry_destroy(struct mlxsw_sp *mlxsw_sp,
5425 struct mlxsw_sp_fib6_entry *fib6_entry)
5426{
5427 mlxsw_sp_nexthop6_group_put(mlxsw_sp, &fib6_entry->common);
5428 mlxsw_sp_fib6_entry_rt_destroy_all(fib6_entry);
5429 WARN_ON(fib6_entry->nrt6);
5430 kfree(fib6_entry);
5431}
5432
5433static struct mlxsw_sp_fib6_entry *
5434mlxsw_sp_fib6_node_entry_find(const struct mlxsw_sp_fib_node *fib_node,
8d1c802b 5435 const struct fib6_info *nrt, bool replace)
428b851f 5436{
33bd5ac5 5437 struct mlxsw_sp_fib6_entry *fib6_entry, *fallback = NULL;
428b851f
IS
5438
5439 list_for_each_entry(fib6_entry, &fib_node->entry_list, common.list) {
8d1c802b 5440 struct fib6_info *rt = mlxsw_sp_fib6_entry_rt(fib6_entry);
428b851f 5441
93c2fb25 5442 if (rt->fib6_table->tb6_id > nrt->fib6_table->tb6_id)
428b851f 5443 continue;
93c2fb25 5444 if (rt->fib6_table->tb6_id != nrt->fib6_table->tb6_id)
428b851f 5445 break;
33bd5ac5
DA
5446 if (replace && rt->fib6_metric == nrt->fib6_metric) {
5447 if (mlxsw_sp_fib6_rt_can_mp(rt) ==
5448 mlxsw_sp_fib6_rt_can_mp(nrt))
5449 return fib6_entry;
5450 if (mlxsw_sp_fib6_rt_can_mp(nrt))
5451 fallback = fallback ?: fib6_entry;
5452 }
93c2fb25 5453 if (rt->fib6_metric > nrt->fib6_metric)
33bd5ac5 5454 return fallback ?: fib6_entry;
428b851f
IS
5455 }
5456
33bd5ac5 5457 return fallback;
428b851f
IS
5458}
5459
5460static int
0a7fd1ac 5461mlxsw_sp_fib6_node_list_insert(struct mlxsw_sp_fib6_entry *new6_entry,
94d628d1 5462 bool *p_replace)
428b851f
IS
5463{
5464 struct mlxsw_sp_fib_node *fib_node = new6_entry->common.fib_node;
8d1c802b 5465 struct fib6_info *nrt = mlxsw_sp_fib6_entry_rt(new6_entry);
428b851f
IS
5466 struct mlxsw_sp_fib6_entry *fib6_entry;
5467
94d628d1 5468 fib6_entry = mlxsw_sp_fib6_node_entry_find(fib_node, nrt, *p_replace);
0a7fd1ac 5469
94d628d1
IS
5470 if (*p_replace && !fib6_entry)
5471 *p_replace = false;
428b851f
IS
5472
5473 if (fib6_entry) {
5474 list_add_tail(&new6_entry->common.list,
5475 &fib6_entry->common.list);
5476 } else {
5477 struct mlxsw_sp_fib6_entry *last;
5478
5479 list_for_each_entry(last, &fib_node->entry_list, common.list) {
8d1c802b 5480 struct fib6_info *rt = mlxsw_sp_fib6_entry_rt(last);
428b851f 5481
93c2fb25 5482 if (nrt->fib6_table->tb6_id > rt->fib6_table->tb6_id)
428b851f
IS
5483 break;
5484 fib6_entry = last;
5485 }
5486
5487 if (fib6_entry)
5488 list_add(&new6_entry->common.list,
5489 &fib6_entry->common.list);
5490 else
5491 list_add(&new6_entry->common.list,
5492 &fib_node->entry_list);
5493 }
5494
5495 return 0;
5496}
5497
5498static void
5499mlxsw_sp_fib6_node_list_remove(struct mlxsw_sp_fib6_entry *fib6_entry)
5500{
5501 list_del(&fib6_entry->common.list);
5502}
5503
5504static int mlxsw_sp_fib6_node_entry_link(struct mlxsw_sp *mlxsw_sp,
0a7fd1ac 5505 struct mlxsw_sp_fib6_entry *fib6_entry,
94d628d1 5506 bool *p_replace)
428b851f
IS
5507{
5508 int err;
5509
94d628d1 5510 err = mlxsw_sp_fib6_node_list_insert(fib6_entry, p_replace);
428b851f
IS
5511 if (err)
5512 return err;
5513
5514 err = mlxsw_sp_fib_node_entry_add(mlxsw_sp, &fib6_entry->common);
5515 if (err)
5516 goto err_fib_node_entry_add;
5517
5518 return 0;
5519
5520err_fib_node_entry_add:
5521 mlxsw_sp_fib6_node_list_remove(fib6_entry);
5522 return err;
5523}
5524
5525static void
5526mlxsw_sp_fib6_node_entry_unlink(struct mlxsw_sp *mlxsw_sp,
5527 struct mlxsw_sp_fib6_entry *fib6_entry)
5528{
5529 mlxsw_sp_fib_node_entry_del(mlxsw_sp, &fib6_entry->common);
5530 mlxsw_sp_fib6_node_list_remove(fib6_entry);
5531}
5532
5533static struct mlxsw_sp_fib6_entry *
5534mlxsw_sp_fib6_entry_lookup(struct mlxsw_sp *mlxsw_sp,
8d1c802b 5535 const struct fib6_info *rt)
428b851f
IS
5536{
5537 struct mlxsw_sp_fib6_entry *fib6_entry;
5538 struct mlxsw_sp_fib_node *fib_node;
5539 struct mlxsw_sp_fib *fib;
5540 struct mlxsw_sp_vr *vr;
5541
93c2fb25 5542 vr = mlxsw_sp_vr_find(mlxsw_sp, rt->fib6_table->tb6_id);
428b851f
IS
5543 if (!vr)
5544 return NULL;
5545 fib = mlxsw_sp_vr_fib(vr, MLXSW_SP_L3_PROTO_IPV6);
5546
93c2fb25
DA
5547 fib_node = mlxsw_sp_fib_node_lookup(fib, &rt->fib6_dst.addr,
5548 sizeof(rt->fib6_dst.addr),
5549 rt->fib6_dst.plen);
428b851f
IS
5550 if (!fib_node)
5551 return NULL;
5552
5553 list_for_each_entry(fib6_entry, &fib_node->entry_list, common.list) {
8d1c802b 5554 struct fib6_info *iter_rt = mlxsw_sp_fib6_entry_rt(fib6_entry);
428b851f 5555
93c2fb25
DA
5556 if (rt->fib6_table->tb6_id == iter_rt->fib6_table->tb6_id &&
5557 rt->fib6_metric == iter_rt->fib6_metric &&
428b851f
IS
5558 mlxsw_sp_fib6_entry_rt_find(fib6_entry, rt))
5559 return fib6_entry;
5560 }
5561
5562 return NULL;
5563}
5564
0a7fd1ac
IS
5565static void mlxsw_sp_fib6_entry_replace(struct mlxsw_sp *mlxsw_sp,
5566 struct mlxsw_sp_fib6_entry *fib6_entry,
5567 bool replace)
5568{
5569 struct mlxsw_sp_fib_node *fib_node = fib6_entry->common.fib_node;
5570 struct mlxsw_sp_fib6_entry *replaced;
5571
5572 if (!replace)
5573 return;
5574
5575 replaced = list_next_entry(fib6_entry, common.list);
5576
5577 mlxsw_sp_fib6_node_entry_unlink(mlxsw_sp, replaced);
5578 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, replaced);
5579 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
5580}
5581
428b851f 5582static int mlxsw_sp_router_fib6_add(struct mlxsw_sp *mlxsw_sp,
921bc539
IS
5583 struct fib6_info **rt_arr,
5584 unsigned int nrt6, bool replace)
428b851f
IS
5585{
5586 struct mlxsw_sp_fib6_entry *fib6_entry;
5587 struct mlxsw_sp_fib_node *fib_node;
921bc539 5588 struct fib6_info *rt = rt_arr[0];
428b851f
IS
5589 int err;
5590
5591 if (mlxsw_sp->router->aborted)
5592 return 0;
5593
93c2fb25 5594 if (rt->fib6_src.plen)
f36f5ac6
IS
5595 return -EINVAL;
5596
428b851f
IS
5597 if (mlxsw_sp_fib6_rt_should_ignore(rt))
5598 return 0;
5599
93c2fb25
DA
5600 fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, rt->fib6_table->tb6_id,
5601 &rt->fib6_dst.addr,
5602 sizeof(rt->fib6_dst.addr),
5603 rt->fib6_dst.plen,
428b851f
IS
5604 MLXSW_SP_L3_PROTO_IPV6);
5605 if (IS_ERR(fib_node))
5606 return PTR_ERR(fib_node);
5607
5608 /* Before creating a new entry, try to append route to an existing
5609 * multipath entry.
5610 */
33bd5ac5 5611 fib6_entry = mlxsw_sp_fib6_node_mp_entry_find(fib_node, rt, replace);
428b851f 5612 if (fib6_entry) {
d21afd30
IS
5613 err = mlxsw_sp_fib6_entry_nexthop_add(mlxsw_sp, fib6_entry,
5614 rt_arr, nrt6);
428b851f
IS
5615 if (err)
5616 goto err_fib6_entry_nexthop_add;
5617 return 0;
5618 }
5619
2d9dd7ec
IS
5620 fib6_entry = mlxsw_sp_fib6_entry_create(mlxsw_sp, fib_node, rt_arr,
5621 nrt6);
428b851f
IS
5622 if (IS_ERR(fib6_entry)) {
5623 err = PTR_ERR(fib6_entry);
5624 goto err_fib6_entry_create;
5625 }
5626
94d628d1 5627 err = mlxsw_sp_fib6_node_entry_link(mlxsw_sp, fib6_entry, &replace);
428b851f
IS
5628 if (err)
5629 goto err_fib6_node_entry_link;
5630
0a7fd1ac
IS
5631 mlxsw_sp_fib6_entry_replace(mlxsw_sp, fib6_entry, replace);
5632
428b851f
IS
5633 return 0;
5634
5635err_fib6_node_entry_link:
5636 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
5637err_fib6_entry_create:
5638err_fib6_entry_nexthop_add:
5639 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
5640 return err;
5641}
5642
5643static void mlxsw_sp_router_fib6_del(struct mlxsw_sp *mlxsw_sp,
921bc539
IS
5644 struct fib6_info **rt_arr,
5645 unsigned int nrt6)
428b851f
IS
5646{
5647 struct mlxsw_sp_fib6_entry *fib6_entry;
5648 struct mlxsw_sp_fib_node *fib_node;
921bc539 5649 struct fib6_info *rt = rt_arr[0];
428b851f
IS
5650
5651 if (mlxsw_sp->router->aborted)
5652 return;
5653
5654 if (mlxsw_sp_fib6_rt_should_ignore(rt))
5655 return;
5656
5657 fib6_entry = mlxsw_sp_fib6_entry_lookup(mlxsw_sp, rt);
5658 if (WARN_ON(!fib6_entry))
5659 return;
5660
d21afd30
IS
5661 /* If not all the nexthops are deleted, then only reduce the nexthop
5662 * group.
428b851f 5663 */
d21afd30
IS
5664 if (nrt6 != fib6_entry->nrt6) {
5665 mlxsw_sp_fib6_entry_nexthop_del(mlxsw_sp, fib6_entry, rt_arr,
5666 nrt6);
428b851f
IS
5667 return;
5668 }
5669
5670 fib_node = fib6_entry->common.fib_node;
5671
5672 mlxsw_sp_fib6_node_entry_unlink(mlxsw_sp, fib6_entry);
5673 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
5674 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
5675}
5676
bc65a8a4
IS
5677static int __mlxsw_sp_router_set_abort_trap(struct mlxsw_sp *mlxsw_sp,
5678 enum mlxsw_reg_ralxx_protocol proto,
5679 u8 tree_id)
b45f64d1
JP
5680{
5681 char ralta_pl[MLXSW_REG_RALTA_LEN];
5682 char ralst_pl[MLXSW_REG_RALST_LEN];
b5d90e6d 5683 int i, err;
b45f64d1 5684
bc65a8a4 5685 mlxsw_reg_ralta_pack(ralta_pl, true, proto, tree_id);
b45f64d1
JP
5686 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
5687 if (err)
5688 return err;
5689
bc65a8a4 5690 mlxsw_reg_ralst_pack(ralst_pl, 0xff, tree_id);
b45f64d1
JP
5691 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralst), ralst_pl);
5692 if (err)
5693 return err;
5694
b5d90e6d 5695 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
9011b677 5696 struct mlxsw_sp_vr *vr = &mlxsw_sp->router->vrs[i];
b5d90e6d
IS
5697 char raltb_pl[MLXSW_REG_RALTB_LEN];
5698 char ralue_pl[MLXSW_REG_RALUE_LEN];
b45f64d1 5699
bc65a8a4 5700 mlxsw_reg_raltb_pack(raltb_pl, vr->id, proto, tree_id);
b5d90e6d
IS
5701 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb),
5702 raltb_pl);
5703 if (err)
5704 return err;
5705
bc65a8a4
IS
5706 mlxsw_reg_ralue_pack(ralue_pl, proto,
5707 MLXSW_REG_RALUE_OP_WRITE_WRITE, vr->id, 0);
b5d90e6d
IS
5708 mlxsw_reg_ralue_act_ip2me_pack(ralue_pl);
5709 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue),
5710 ralue_pl);
5711 if (err)
5712 return err;
5713 }
5714
5715 return 0;
b45f64d1
JP
5716}
5717
eb35da0c
YM
5718static struct mlxsw_sp_mr_table *
5719mlxsw_sp_router_fibmr_family_to_table(struct mlxsw_sp_vr *vr, int family)
5720{
64ed1b9e 5721 if (family == RTNL_FAMILY_IPMR)
eb35da0c 5722 return vr->mr_table[MLXSW_SP_L3_PROTO_IPV4];
64ed1b9e
YM
5723 else
5724 return vr->mr_table[MLXSW_SP_L3_PROTO_IPV6];
eb35da0c
YM
5725}
5726
d42b0965
YG
5727static int mlxsw_sp_router_fibmr_add(struct mlxsw_sp *mlxsw_sp,
5728 struct mfc_entry_notifier_info *men_info,
5729 bool replace)
5730{
eb35da0c 5731 struct mlxsw_sp_mr_table *mrt;
d42b0965
YG
5732 struct mlxsw_sp_vr *vr;
5733
5734 if (mlxsw_sp->router->aborted)
5735 return 0;
5736
f8fa9b4e 5737 vr = mlxsw_sp_vr_get(mlxsw_sp, men_info->tb_id, NULL);
d42b0965
YG
5738 if (IS_ERR(vr))
5739 return PTR_ERR(vr);
5740
eb35da0c
YM
5741 mrt = mlxsw_sp_router_fibmr_family_to_table(vr, men_info->info.family);
5742 return mlxsw_sp_mr_route_add(mrt, men_info->mfc, replace);
d42b0965
YG
5743}
5744
5745static void mlxsw_sp_router_fibmr_del(struct mlxsw_sp *mlxsw_sp,
5746 struct mfc_entry_notifier_info *men_info)
5747{
eb35da0c 5748 struct mlxsw_sp_mr_table *mrt;
d42b0965
YG
5749 struct mlxsw_sp_vr *vr;
5750
5751 if (mlxsw_sp->router->aborted)
5752 return;
5753
5754 vr = mlxsw_sp_vr_find(mlxsw_sp, men_info->tb_id);
5755 if (WARN_ON(!vr))
5756 return;
5757
eb35da0c
YM
5758 mrt = mlxsw_sp_router_fibmr_family_to_table(vr, men_info->info.family);
5759 mlxsw_sp_mr_route_del(mrt, men_info->mfc);
2b52ce02 5760 mlxsw_sp_vr_put(mlxsw_sp, vr);
d42b0965
YG
5761}
5762
5763static int
5764mlxsw_sp_router_fibmr_vif_add(struct mlxsw_sp *mlxsw_sp,
5765 struct vif_entry_notifier_info *ven_info)
5766{
eb35da0c 5767 struct mlxsw_sp_mr_table *mrt;
d42b0965
YG
5768 struct mlxsw_sp_rif *rif;
5769 struct mlxsw_sp_vr *vr;
5770
5771 if (mlxsw_sp->router->aborted)
5772 return 0;
5773
f8fa9b4e 5774 vr = mlxsw_sp_vr_get(mlxsw_sp, ven_info->tb_id, NULL);
d42b0965
YG
5775 if (IS_ERR(vr))
5776 return PTR_ERR(vr);
5777
eb35da0c 5778 mrt = mlxsw_sp_router_fibmr_family_to_table(vr, ven_info->info.family);
d42b0965 5779 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, ven_info->dev);
eb35da0c 5780 return mlxsw_sp_mr_vif_add(mrt, ven_info->dev,
d42b0965
YG
5781 ven_info->vif_index,
5782 ven_info->vif_flags, rif);
5783}
5784
5785static void
5786mlxsw_sp_router_fibmr_vif_del(struct mlxsw_sp *mlxsw_sp,
5787 struct vif_entry_notifier_info *ven_info)
5788{
eb35da0c 5789 struct mlxsw_sp_mr_table *mrt;
d42b0965
YG
5790 struct mlxsw_sp_vr *vr;
5791
5792 if (mlxsw_sp->router->aborted)
5793 return;
5794
5795 vr = mlxsw_sp_vr_find(mlxsw_sp, ven_info->tb_id);
5796 if (WARN_ON(!vr))
5797 return;
5798
eb35da0c
YM
5799 mrt = mlxsw_sp_router_fibmr_family_to_table(vr, ven_info->info.family);
5800 mlxsw_sp_mr_vif_del(mrt, ven_info->vif_index);
2b52ce02 5801 mlxsw_sp_vr_put(mlxsw_sp, vr);
d42b0965
YG
5802}
5803
bc65a8a4
IS
5804static int mlxsw_sp_router_set_abort_trap(struct mlxsw_sp *mlxsw_sp)
5805{
5806 enum mlxsw_reg_ralxx_protocol proto = MLXSW_REG_RALXX_PROTOCOL_IPV4;
5807 int err;
5808
5809 err = __mlxsw_sp_router_set_abort_trap(mlxsw_sp, proto,
5810 MLXSW_SP_LPM_TREE_MIN);
5811 if (err)
5812 return err;
5813
d42b0965
YG
5814 /* The multicast router code does not need an abort trap as by default,
5815 * packets that don't match any routes are trapped to the CPU.
5816 */
5817
bc65a8a4
IS
5818 proto = MLXSW_REG_RALXX_PROTOCOL_IPV6;
5819 return __mlxsw_sp_router_set_abort_trap(mlxsw_sp, proto,
5820 MLXSW_SP_LPM_TREE_MIN + 1);
5821}
5822
9aecce1c
IS
5823static void mlxsw_sp_fib4_node_flush(struct mlxsw_sp *mlxsw_sp,
5824 struct mlxsw_sp_fib_node *fib_node)
5825{
4f1c7f1f 5826 struct mlxsw_sp_fib4_entry *fib4_entry, *tmp;
9aecce1c 5827
4f1c7f1f
IS
5828 list_for_each_entry_safe(fib4_entry, tmp, &fib_node->entry_list,
5829 common.list) {
5830 bool do_break = &tmp->common.list == &fib_node->entry_list;
9aecce1c 5831
4f1c7f1f
IS
5832 mlxsw_sp_fib4_node_entry_unlink(mlxsw_sp, fib4_entry);
5833 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry);
731ea1ca 5834 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
9aecce1c
IS
5835 /* Break when entry list is empty and node was freed.
5836 * Otherwise, we'll access freed memory in the next
5837 * iteration.
5838 */
5839 if (do_break)
5840 break;
5841 }
5842}
5843
428b851f
IS
5844static void mlxsw_sp_fib6_node_flush(struct mlxsw_sp *mlxsw_sp,
5845 struct mlxsw_sp_fib_node *fib_node)
5846{
5847 struct mlxsw_sp_fib6_entry *fib6_entry, *tmp;
5848
5849 list_for_each_entry_safe(fib6_entry, tmp, &fib_node->entry_list,
5850 common.list) {
5851 bool do_break = &tmp->common.list == &fib_node->entry_list;
5852
5853 mlxsw_sp_fib6_node_entry_unlink(mlxsw_sp, fib6_entry);
5854 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry);
5855 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
5856 if (do_break)
5857 break;
5858 }
5859}
5860
9aecce1c
IS
5861static void mlxsw_sp_fib_node_flush(struct mlxsw_sp *mlxsw_sp,
5862 struct mlxsw_sp_fib_node *fib_node)
5863{
76610ebb 5864 switch (fib_node->fib->proto) {
9aecce1c
IS
5865 case MLXSW_SP_L3_PROTO_IPV4:
5866 mlxsw_sp_fib4_node_flush(mlxsw_sp, fib_node);
5867 break;
5868 case MLXSW_SP_L3_PROTO_IPV6:
428b851f 5869 mlxsw_sp_fib6_node_flush(mlxsw_sp, fib_node);
9aecce1c
IS
5870 break;
5871 }
5872}
5873
76610ebb
IS
5874static void mlxsw_sp_vr_fib_flush(struct mlxsw_sp *mlxsw_sp,
5875 struct mlxsw_sp_vr *vr,
5876 enum mlxsw_sp_l3proto proto)
b45f64d1 5877{
76610ebb 5878 struct mlxsw_sp_fib *fib = mlxsw_sp_vr_fib(vr, proto);
9aecce1c 5879 struct mlxsw_sp_fib_node *fib_node, *tmp;
76610ebb
IS
5880
5881 list_for_each_entry_safe(fib_node, tmp, &fib->node_list, list) {
5882 bool do_break = &tmp->list == &fib->node_list;
5883
5884 mlxsw_sp_fib_node_flush(mlxsw_sp, fib_node);
5885 if (do_break)
5886 break;
5887 }
5888}
5889
5890static void mlxsw_sp_router_fib_flush(struct mlxsw_sp *mlxsw_sp)
5891{
9742f866 5892 int i, j;
b45f64d1 5893
c1a38311 5894 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
9011b677 5895 struct mlxsw_sp_vr *vr = &mlxsw_sp->router->vrs[i];
ac571de9 5896
76610ebb 5897 if (!mlxsw_sp_vr_is_used(vr))
b45f64d1 5898 continue;
d42b0965 5899
9742f866
YM
5900 for (j = 0; j < MLXSW_SP_L3_PROTO_MAX; j++)
5901 mlxsw_sp_mr_table_flush(vr->mr_table[j]);
76610ebb 5902 mlxsw_sp_vr_fib_flush(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV4);
a3d9bc50
IS
5903
5904 /* If virtual router was only used for IPv4, then it's no
5905 * longer used.
5906 */
5907 if (!mlxsw_sp_vr_is_used(vr))
5908 continue;
5909 mlxsw_sp_vr_fib_flush(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV6);
b45f64d1 5910 }
ac571de9
IS
5911}
5912
bc65a8a4 5913static void mlxsw_sp_router_fib_abort(struct mlxsw_sp *mlxsw_sp)
ac571de9
IS
5914{
5915 int err;
5916
9011b677 5917 if (mlxsw_sp->router->aborted)
d331d303
IS
5918 return;
5919 dev_warn(mlxsw_sp->bus_info->dev, "FIB abort triggered. Note that FIB entries are no longer being offloaded to this device.\n");
ac571de9 5920 mlxsw_sp_router_fib_flush(mlxsw_sp);
9011b677 5921 mlxsw_sp->router->aborted = true;
b45f64d1
JP
5922 err = mlxsw_sp_router_set_abort_trap(mlxsw_sp);
5923 if (err)
5924 dev_warn(mlxsw_sp->bus_info->dev, "Failed to set abort trap.\n");
5925}
5926
928c0b53
IS
/* IPv6 payload of a deferred FIB event.
 *
 * @rt_arr: array of routes the event refers to (the notified route followed
 *	    by its siblings); a reference is held on each one while queued.
 * @nrt6: number of elements in @rt_arr.
 */
struct mlxsw_sp_fib6_event_work {
	struct fib6_info **rt_arr;
	unsigned int nrt6;
};
5931
3057224e 5932struct mlxsw_sp_fib_event_work {
a0e4761d 5933 struct work_struct work;
ad178c8e 5934 union {
928c0b53 5935 struct mlxsw_sp_fib6_event_work fib6_work;
ad178c8e 5936 struct fib_entry_notifier_info fen_info;
5d7bfd14 5937 struct fib_rule_notifier_info fr_info;
ad178c8e 5938 struct fib_nh_notifier_info fnh_info;
d42b0965
YG
5939 struct mfc_entry_notifier_info men_info;
5940 struct vif_entry_notifier_info ven_info;
ad178c8e 5941 };
3057224e
IS
5942 struct mlxsw_sp *mlxsw_sp;
5943 unsigned long event;
5944};
5945
928c0b53
IS
5946static int
5947mlxsw_sp_router_fib6_work_init(struct mlxsw_sp_fib6_event_work *fib6_work,
5948 struct fib6_entry_notifier_info *fen6_info)
5949{
5950 struct fib6_info *rt = fen6_info->rt;
5951 struct fib6_info **rt_arr;
5952 struct fib6_info *iter;
5953 unsigned int nrt6;
5954 int i = 0;
5955
5956 nrt6 = fen6_info->nsiblings + 1;
5957
5958 rt_arr = kcalloc(nrt6, sizeof(struct fib6_info *), GFP_ATOMIC);
5959 if (!rt_arr)
5960 return -ENOMEM;
5961
5962 fib6_work->rt_arr = rt_arr;
5963 fib6_work->nrt6 = nrt6;
5964
5965 rt_arr[0] = rt;
5966 fib6_info_hold(rt);
5967
5968 if (!fen6_info->nsiblings)
5969 return 0;
5970
5971 list_for_each_entry(iter, &rt->fib6_siblings, fib6_siblings) {
5972 if (i == fen6_info->nsiblings)
5973 break;
5974
5975 rt_arr[i + 1] = iter;
5976 fib6_info_hold(iter);
5977 i++;
5978 }
5979 WARN_ON_ONCE(i != fen6_info->nsiblings);
5980
5981 return 0;
5982}
5983
5984static void
5985mlxsw_sp_router_fib6_work_fini(struct mlxsw_sp_fib6_event_work *fib6_work)
5986{
5987 int i;
5988
5989 for (i = 0; i < fib6_work->nrt6; i++)
5990 mlxsw_sp_rt6_release(fib6_work->rt_arr[i]);
5991 kfree(fib6_work->rt_arr);
5992}
5993
66a5763a 5994static void mlxsw_sp_router_fib4_event_work(struct work_struct *work)
b45f64d1 5995{
3057224e 5996 struct mlxsw_sp_fib_event_work *fib_work =
a0e4761d 5997 container_of(work, struct mlxsw_sp_fib_event_work, work);
3057224e 5998 struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp;
599cf8f9 5999 bool replace, append;
b45f64d1
JP
6000 int err;
6001
3057224e
IS
6002 /* Protect internal structures from changes */
6003 rtnl_lock();
803335ac
PM
6004 mlxsw_sp_span_respin(mlxsw_sp);
6005
3057224e 6006 switch (fib_work->event) {
599cf8f9 6007 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
4283bce5 6008 case FIB_EVENT_ENTRY_APPEND: /* fall through */
b45f64d1 6009 case FIB_EVENT_ENTRY_ADD:
599cf8f9 6010 replace = fib_work->event == FIB_EVENT_ENTRY_REPLACE;
4283bce5
IS
6011 append = fib_work->event == FIB_EVENT_ENTRY_APPEND;
6012 err = mlxsw_sp_router_fib4_add(mlxsw_sp, &fib_work->fen_info,
599cf8f9 6013 replace, append);
b45f64d1 6014 if (err)
bc65a8a4 6015 mlxsw_sp_router_fib_abort(mlxsw_sp);
3057224e 6016 fib_info_put(fib_work->fen_info.fi);
b45f64d1
JP
6017 break;
6018 case FIB_EVENT_ENTRY_DEL:
3057224e
IS
6019 mlxsw_sp_router_fib4_del(mlxsw_sp, &fib_work->fen_info);
6020 fib_info_put(fib_work->fen_info.fi);
b45f64d1 6021 break;
1f279233
DA
6022 case FIB_EVENT_RULE_ADD:
6023 /* if we get here, a rule was added that we do not support.
6024 * just do the fib_abort
6025 */
6026 mlxsw_sp_router_fib_abort(mlxsw_sp);
b45f64d1 6027 break;
ad178c8e
IS
6028 case FIB_EVENT_NH_ADD: /* fall through */
6029 case FIB_EVENT_NH_DEL:
0e6ea2a4
IS
6030 mlxsw_sp_nexthop4_event(mlxsw_sp, fib_work->event,
6031 fib_work->fnh_info.fib_nh);
ad178c8e
IS
6032 fib_info_put(fib_work->fnh_info.fib_nh->nh_parent);
6033 break;
b45f64d1 6034 }
3057224e
IS
6035 rtnl_unlock();
6036 kfree(fib_work);
6037}
6038
66a5763a
IS
6039static void mlxsw_sp_router_fib6_event_work(struct work_struct *work)
6040{
583419fd
IS
6041 struct mlxsw_sp_fib_event_work *fib_work =
6042 container_of(work, struct mlxsw_sp_fib_event_work, work);
6043 struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp;
33bd5ac5 6044 bool replace;
428b851f 6045 int err;
583419fd
IS
6046
6047 rtnl_lock();
803335ac
PM
6048 mlxsw_sp_span_respin(mlxsw_sp);
6049
583419fd 6050 switch (fib_work->event) {
0a7fd1ac 6051 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
428b851f 6052 case FIB_EVENT_ENTRY_ADD:
0a7fd1ac 6053 replace = fib_work->event == FIB_EVENT_ENTRY_REPLACE;
428b851f 6054 err = mlxsw_sp_router_fib6_add(mlxsw_sp,
921bc539
IS
6055 fib_work->fib6_work.rt_arr,
6056 fib_work->fib6_work.nrt6,
928c0b53 6057 replace);
428b851f
IS
6058 if (err)
6059 mlxsw_sp_router_fib_abort(mlxsw_sp);
928c0b53 6060 mlxsw_sp_router_fib6_work_fini(&fib_work->fib6_work);
428b851f
IS
6061 break;
6062 case FIB_EVENT_ENTRY_DEL:
928c0b53 6063 mlxsw_sp_router_fib6_del(mlxsw_sp,
921bc539
IS
6064 fib_work->fib6_work.rt_arr,
6065 fib_work->fib6_work.nrt6);
928c0b53 6066 mlxsw_sp_router_fib6_work_fini(&fib_work->fib6_work);
428b851f 6067 break;
1f279233
DA
6068 case FIB_EVENT_RULE_ADD:
6069 /* if we get here, a rule was added that we do not support.
6070 * just do the fib_abort
6071 */
6072 mlxsw_sp_router_fib_abort(mlxsw_sp);
583419fd
IS
6073 break;
6074 }
6075 rtnl_unlock();
6076 kfree(fib_work);
66a5763a
IS
6077}
6078
d42b0965
YG
6079static void mlxsw_sp_router_fibmr_event_work(struct work_struct *work)
6080{
6081 struct mlxsw_sp_fib_event_work *fib_work =
6082 container_of(work, struct mlxsw_sp_fib_event_work, work);
6083 struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp;
d42b0965
YG
6084 bool replace;
6085 int err;
6086
6087 rtnl_lock();
6088 switch (fib_work->event) {
6089 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
6090 case FIB_EVENT_ENTRY_ADD:
6091 replace = fib_work->event == FIB_EVENT_ENTRY_REPLACE;
6092
6093 err = mlxsw_sp_router_fibmr_add(mlxsw_sp, &fib_work->men_info,
6094 replace);
6095 if (err)
6096 mlxsw_sp_router_fib_abort(mlxsw_sp);
8c13af2a 6097 mr_cache_put(fib_work->men_info.mfc);
d42b0965
YG
6098 break;
6099 case FIB_EVENT_ENTRY_DEL:
6100 mlxsw_sp_router_fibmr_del(mlxsw_sp, &fib_work->men_info);
8c13af2a 6101 mr_cache_put(fib_work->men_info.mfc);
d42b0965
YG
6102 break;
6103 case FIB_EVENT_VIF_ADD:
6104 err = mlxsw_sp_router_fibmr_vif_add(mlxsw_sp,
6105 &fib_work->ven_info);
6106 if (err)
6107 mlxsw_sp_router_fib_abort(mlxsw_sp);
6108 dev_put(fib_work->ven_info.dev);
6109 break;
6110 case FIB_EVENT_VIF_DEL:
6111 mlxsw_sp_router_fibmr_vif_del(mlxsw_sp,
6112 &fib_work->ven_info);
6113 dev_put(fib_work->ven_info.dev);
6114 break;
1f279233
DA
6115 case FIB_EVENT_RULE_ADD:
6116 /* if we get here, a rule was added that we do not support.
6117 * just do the fib_abort
6118 */
6119 mlxsw_sp_router_fib_abort(mlxsw_sp);
d42b0965
YG
6120 break;
6121 }
6122 rtnl_unlock();
6123 kfree(fib_work);
6124}
6125
66a5763a
IS
6126static void mlxsw_sp_router_fib4_event(struct mlxsw_sp_fib_event_work *fib_work,
6127 struct fib_notifier_info *info)
6128{
3c75f9b1 6129 struct fib_entry_notifier_info *fen_info;
3c75f9b1
DA
6130 struct fib_nh_notifier_info *fnh_info;
6131
66a5763a
IS
6132 switch (fib_work->event) {
6133 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
6134 case FIB_EVENT_ENTRY_APPEND: /* fall through */
6135 case FIB_EVENT_ENTRY_ADD: /* fall through */
6136 case FIB_EVENT_ENTRY_DEL:
3c75f9b1
DA
6137 fen_info = container_of(info, struct fib_entry_notifier_info,
6138 info);
6139 fib_work->fen_info = *fen_info;
6140 /* Take reference on fib_info to prevent it from being
66a5763a
IS
6141 * freed while work is queued. Release it afterwards.
6142 */
6143 fib_info_hold(fib_work->fen_info.fi);
6144 break;
66a5763a
IS
6145 case FIB_EVENT_NH_ADD: /* fall through */
6146 case FIB_EVENT_NH_DEL:
3c75f9b1
DA
6147 fnh_info = container_of(info, struct fib_nh_notifier_info,
6148 info);
6149 fib_work->fnh_info = *fnh_info;
66a5763a
IS
6150 fib_info_hold(fib_work->fnh_info.fib_nh->nh_parent);
6151 break;
6152 }
6153}
6154
ccd56a5f
IS
6155static int mlxsw_sp_router_fib6_event(struct mlxsw_sp_fib_event_work *fib_work,
6156 struct fib_notifier_info *info)
66a5763a 6157{
3c75f9b1 6158 struct fib6_entry_notifier_info *fen6_info;
928c0b53 6159 int err;
3c75f9b1 6160
583419fd 6161 switch (fib_work->event) {
0a7fd1ac 6162 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
428b851f
IS
6163 case FIB_EVENT_ENTRY_ADD: /* fall through */
6164 case FIB_EVENT_ENTRY_DEL:
3c75f9b1
DA
6165 fen6_info = container_of(info, struct fib6_entry_notifier_info,
6166 info);
928c0b53
IS
6167 err = mlxsw_sp_router_fib6_work_init(&fib_work->fib6_work,
6168 fen6_info);
6169 if (err)
6170 return err;
428b851f 6171 break;
583419fd 6172 }
ccd56a5f
IS
6173
6174 return 0;
66a5763a
IS
6175}
6176
d42b0965
YG
6177static void
6178mlxsw_sp_router_fibmr_event(struct mlxsw_sp_fib_event_work *fib_work,
6179 struct fib_notifier_info *info)
6180{
6181 switch (fib_work->event) {
6182 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
6183 case FIB_EVENT_ENTRY_ADD: /* fall through */
6184 case FIB_EVENT_ENTRY_DEL:
6185 memcpy(&fib_work->men_info, info, sizeof(fib_work->men_info));
8c13af2a 6186 mr_cache_hold(fib_work->men_info.mfc);
d42b0965
YG
6187 break;
6188 case FIB_EVENT_VIF_ADD: /* fall through */
6189 case FIB_EVENT_VIF_DEL:
6190 memcpy(&fib_work->ven_info, info, sizeof(fib_work->ven_info));
6191 dev_hold(fib_work->ven_info.dev);
6192 break;
1f279233
DA
6193 }
6194}
6195
6196static int mlxsw_sp_router_fib_rule_event(unsigned long event,
6197 struct fib_notifier_info *info,
6198 struct mlxsw_sp *mlxsw_sp)
6199{
6200 struct netlink_ext_ack *extack = info->extack;
6201 struct fib_rule_notifier_info *fr_info;
6202 struct fib_rule *rule;
6203 int err = 0;
6204
6205 /* nothing to do at the moment */
6206 if (event == FIB_EVENT_RULE_DEL)
6207 return 0;
6208
6209 if (mlxsw_sp->router->aborted)
6210 return 0;
6211
6212 fr_info = container_of(info, struct fib_rule_notifier_info, info);
6213 rule = fr_info->rule;
6214
05414dd1
IS
6215 /* Rule only affects locally generated traffic */
6216 if (rule->iifindex == info->net->loopback_dev->ifindex)
6217 return 0;
6218
1f279233
DA
6219 switch (info->family) {
6220 case AF_INET:
6221 if (!fib4_rule_default(rule) && !rule->l3mdev)
6290182b 6222 err = -EOPNOTSUPP;
1f279233
DA
6223 break;
6224 case AF_INET6:
6225 if (!fib6_rule_default(rule) && !rule->l3mdev)
6290182b 6226 err = -EOPNOTSUPP;
1f279233
DA
6227 break;
6228 case RTNL_FAMILY_IPMR:
6229 if (!ipmr_rule_default(rule) && !rule->l3mdev)
6290182b 6230 err = -EOPNOTSUPP;
d42b0965 6231 break;
64ed1b9e
YM
6232 case RTNL_FAMILY_IP6MR:
6233 if (!ip6mr_rule_default(rule) && !rule->l3mdev)
6290182b 6234 err = -EOPNOTSUPP;
64ed1b9e 6235 break;
d42b0965 6236 }
1f279233
DA
6237
6238 if (err < 0)
6290182b 6239 NL_SET_ERR_MSG_MOD(extack, "FIB rules not supported");
1f279233
DA
6240
6241 return err;
d42b0965
YG
6242}
6243
3057224e
IS
6244/* Called with rcu_read_lock() */
6245static int mlxsw_sp_router_fib_event(struct notifier_block *nb,
6246 unsigned long event, void *ptr)
6247{
3057224e
IS
6248 struct mlxsw_sp_fib_event_work *fib_work;
6249 struct fib_notifier_info *info = ptr;
7e39d115 6250 struct mlxsw_sp_router *router;
1f279233 6251 int err;
3057224e 6252
8e29f979 6253 if (!net_eq(info->net, &init_net) ||
664375e9 6254 (info->family != AF_INET && info->family != AF_INET6 &&
64ed1b9e
YM
6255 info->family != RTNL_FAMILY_IPMR &&
6256 info->family != RTNL_FAMILY_IP6MR))
3057224e
IS
6257 return NOTIFY_DONE;
6258
1f279233
DA
6259 router = container_of(nb, struct mlxsw_sp_router, fib_nb);
6260
6261 switch (event) {
6262 case FIB_EVENT_RULE_ADD: /* fall through */
6263 case FIB_EVENT_RULE_DEL:
6264 err = mlxsw_sp_router_fib_rule_event(event, info,
6265 router->mlxsw_sp);
6290182b
IS
6266 if (!err || info->extack)
6267 return notifier_from_errno(err);
50d10711
IS
6268 break;
6269 case FIB_EVENT_ENTRY_ADD:
7973d9e7
DA
6270 case FIB_EVENT_ENTRY_REPLACE: /* fall through */
6271 case FIB_EVENT_ENTRY_APPEND: /* fall through */
50d10711
IS
6272 if (router->aborted) {
6273 NL_SET_ERR_MSG_MOD(info->extack, "FIB offload was aborted. Not configuring route");
6274 return notifier_from_errno(-EINVAL);
6275 }
19a9d136
DA
6276 if (info->family == AF_INET) {
6277 struct fib_entry_notifier_info *fen_info = ptr;
6278
6279 if (fen_info->fi->fib_nh_is_v6) {
6280 NL_SET_ERR_MSG_MOD(info->extack, "IPv6 gateway with IPv4 route is not supported");
6281 return notifier_from_errno(-EINVAL);
6282 }
54250805
DA
6283 if (fen_info->fi->nh) {
6284 NL_SET_ERR_MSG_MOD(info->extack, "IPv4 route with nexthop objects is not supported");
6285 return notifier_from_errno(-EINVAL);
6286 }
6287 } else if (info->family == AF_INET6) {
6288 struct fib6_entry_notifier_info *fen6_info;
6289
6290 fen6_info = container_of(info,
6291 struct fib6_entry_notifier_info,
6292 info);
6293 if (fen6_info->rt->nh) {
6294 NL_SET_ERR_MSG_MOD(info->extack, "IPv6 route with nexthop objects is not supported");
6295 return notifier_from_errno(-EINVAL);
6296 }
f6c3bb75
IS
6297 if (fen6_info->multipath_rt)
6298 return NOTIFY_DONE;
19a9d136 6299 }
50d10711 6300 break;
1f279233
DA
6301 }
6302
3057224e
IS
6303 fib_work = kzalloc(sizeof(*fib_work), GFP_ATOMIC);
6304 if (WARN_ON(!fib_work))
6305 return NOTIFY_BAD;
6306
7e39d115 6307 fib_work->mlxsw_sp = router->mlxsw_sp;
3057224e
IS
6308 fib_work->event = event;
6309
66a5763a
IS
6310 switch (info->family) {
6311 case AF_INET:
6312 INIT_WORK(&fib_work->work, mlxsw_sp_router_fib4_event_work);
6313 mlxsw_sp_router_fib4_event(fib_work, info);
3057224e 6314 break;
66a5763a
IS
6315 case AF_INET6:
6316 INIT_WORK(&fib_work->work, mlxsw_sp_router_fib6_event_work);
ccd56a5f
IS
6317 err = mlxsw_sp_router_fib6_event(fib_work, info);
6318 if (err)
6319 goto err_fib_event;
ad178c8e 6320 break;
64ed1b9e 6321 case RTNL_FAMILY_IP6MR:
d42b0965
YG
6322 case RTNL_FAMILY_IPMR:
6323 INIT_WORK(&fib_work->work, mlxsw_sp_router_fibmr_event_work);
6324 mlxsw_sp_router_fibmr_event(fib_work, info);
6325 break;
3057224e
IS
6326 }
6327
a0e4761d 6328 mlxsw_core_schedule_work(&fib_work->work);
3057224e 6329
b45f64d1 6330 return NOTIFY_DONE;
ccd56a5f
IS
6331
6332err_fib_event:
6333 kfree(fib_work);
6334 return NOTIFY_BAD;
b45f64d1
JP
6335}
6336
0c41292b 6337struct mlxsw_sp_rif *
4724ba56
IS
6338mlxsw_sp_rif_find_by_dev(const struct mlxsw_sp *mlxsw_sp,
6339 const struct net_device *dev)
6340{
6341 int i;
6342
6343 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++)
5f9efffb
IS
6344 if (mlxsw_sp->router->rifs[i] &&
6345 mlxsw_sp->router->rifs[i]->dev == dev)
6346 return mlxsw_sp->router->rifs[i];
4724ba56
IS
6347
6348 return NULL;
6349}
6350
6351static int mlxsw_sp_router_rif_disable(struct mlxsw_sp *mlxsw_sp, u16 rif)
6352{
6353 char ritr_pl[MLXSW_REG_RITR_LEN];
6354 int err;
6355
6356 mlxsw_reg_ritr_rif_pack(ritr_pl, rif);
6357 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
24f91ce0 6358 if (err)
4724ba56
IS
6359 return err;
6360
6361 mlxsw_reg_ritr_enable_set(ritr_pl, false);
6362 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
6363}
6364
6365static void mlxsw_sp_router_rif_gone_sync(struct mlxsw_sp *mlxsw_sp,
bf95233e 6366 struct mlxsw_sp_rif *rif)
4724ba56 6367{
bf95233e
AS
6368 mlxsw_sp_router_rif_disable(mlxsw_sp, rif->rif_index);
6369 mlxsw_sp_nexthop_rif_gone_sync(mlxsw_sp, rif);
6370 mlxsw_sp_neigh_rif_gone_sync(mlxsw_sp, rif);
4724ba56
IS
6371}
6372
5ea1237f
AS
6373static bool
6374mlxsw_sp_rif_should_config(struct mlxsw_sp_rif *rif, struct net_device *dev,
6375 unsigned long event)
4724ba56 6376{
5ea1237f
AS
6377 struct inet6_dev *inet6_dev;
6378 bool addr_list_empty = true;
6379 struct in_device *idev;
6380
4724ba56
IS
6381 switch (event) {
6382 case NETDEV_UP:
f1b1f273 6383 return rif == NULL;
4724ba56 6384 case NETDEV_DOWN:
5ea1237f
AS
6385 idev = __in_dev_get_rtnl(dev);
6386 if (idev && idev->ifa_list)
6387 addr_list_empty = false;
6388
6389 inet6_dev = __in6_dev_get(dev);
6390 if (addr_list_empty && inet6_dev &&
6391 !list_empty(&inet6_dev->addr_list))
6392 addr_list_empty = false;
6393
2db99378
IS
6394 /* macvlans do not have a RIF, but rather piggy back on the
6395 * RIF of their lower device.
6396 */
6397 if (netif_is_macvlan(dev) && addr_list_empty)
6398 return true;
6399
5ea1237f 6400 if (rif && addr_list_empty &&
bf95233e 6401 !netif_is_l3_slave(rif->dev))
4724ba56
IS
6402 return true;
6403 /* It is possible we already removed the RIF ourselves
6404 * if it was assigned to a netdev that is now a bridge
6405 * or LAG slave.
6406 */
6407 return false;
6408 }
6409
6410 return false;
6411}
6412
e4f3c1c1
IS
6413static enum mlxsw_sp_rif_type
6414mlxsw_sp_dev_rif_type(const struct mlxsw_sp *mlxsw_sp,
6415 const struct net_device *dev)
6416{
6417 enum mlxsw_sp_fid_type type;
6418
6ddb7426
PM
6419 if (mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, NULL))
6420 return MLXSW_SP_RIF_TYPE_IPIP_LB;
6421
6422 /* Otherwise RIF type is derived from the type of the underlying FID. */
e4f3c1c1
IS
6423 if (is_vlan_dev(dev) && netif_is_bridge_master(vlan_dev_real_dev(dev)))
6424 type = MLXSW_SP_FID_TYPE_8021Q;
6425 else if (netif_is_bridge_master(dev) && br_vlan_enabled(dev))
6426 type = MLXSW_SP_FID_TYPE_8021Q;
6427 else if (netif_is_bridge_master(dev))
6428 type = MLXSW_SP_FID_TYPE_8021D;
6429 else
6430 type = MLXSW_SP_FID_TYPE_RFID;
6431
6432 return mlxsw_sp_fid_type_rif_type(mlxsw_sp, type);
6433}
6434
de5ed99e 6435static int mlxsw_sp_rif_index_alloc(struct mlxsw_sp *mlxsw_sp, u16 *p_rif_index)
4724ba56
IS
6436{
6437 int i;
6438
de5ed99e
IS
6439 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++) {
6440 if (!mlxsw_sp->router->rifs[i]) {
6441 *p_rif_index = i;
6442 return 0;
6443 }
6444 }
4724ba56 6445
de5ed99e 6446 return -ENOBUFS;
4724ba56
IS
6447}
6448
e4f3c1c1
IS
6449static struct mlxsw_sp_rif *mlxsw_sp_rif_alloc(size_t rif_size, u16 rif_index,
6450 u16 vr_id,
6451 struct net_device *l3_dev)
4724ba56 6452{
bf95233e 6453 struct mlxsw_sp_rif *rif;
4724ba56 6454
e4f3c1c1 6455 rif = kzalloc(rif_size, GFP_KERNEL);
bf95233e 6456 if (!rif)
4724ba56
IS
6457 return NULL;
6458
bf95233e
AS
6459 INIT_LIST_HEAD(&rif->nexthop_list);
6460 INIT_LIST_HEAD(&rif->neigh_list);
73b8f493
ND
6461 if (l3_dev) {
6462 ether_addr_copy(rif->addr, l3_dev->dev_addr);
6463 rif->mtu = l3_dev->mtu;
6464 rif->dev = l3_dev;
6465 }
bf95233e 6466 rif->vr_id = vr_id;
bf95233e 6467 rif->rif_index = rif_index;
4724ba56 6468
bf95233e 6469 return rif;
4724ba56
IS
6470}
6471
5f9efffb
IS
6472struct mlxsw_sp_rif *mlxsw_sp_rif_by_index(const struct mlxsw_sp *mlxsw_sp,
6473 u16 rif_index)
6474{
6475 return mlxsw_sp->router->rifs[rif_index];
6476}
6477
fd1b9d41
AS
6478u16 mlxsw_sp_rif_index(const struct mlxsw_sp_rif *rif)
6479{
6480 return rif->rif_index;
6481}
6482
92107cfb
PM
6483u16 mlxsw_sp_ipip_lb_rif_index(const struct mlxsw_sp_rif_ipip_lb *lb_rif)
6484{
6485 return lb_rif->common.rif_index;
6486}
6487
6488u16 mlxsw_sp_ipip_lb_ul_vr_id(const struct mlxsw_sp_rif_ipip_lb *lb_rif)
6489{
33c04afe
ND
6490 u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(lb_rif->common.dev);
6491 struct mlxsw_sp_vr *ul_vr;
6492
6493 ul_vr = mlxsw_sp_vr_get(lb_rif->common.mlxsw_sp, ul_tb_id, NULL);
6494 if (WARN_ON(IS_ERR(ul_vr)))
6495 return 0;
6496
6497 return ul_vr->id;
92107cfb
PM
6498}
6499
311596f5
ND
6500u16 mlxsw_sp_ipip_lb_ul_rif_id(const struct mlxsw_sp_rif_ipip_lb *lb_rif)
6501{
6502 return lb_rif->ul_rif_id;
6503}
6504
fd1b9d41
AS
6505int mlxsw_sp_rif_dev_ifindex(const struct mlxsw_sp_rif *rif)
6506{
6507 return rif->dev->ifindex;
6508}
6509
91e4d59a
YG
6510const struct net_device *mlxsw_sp_rif_dev(const struct mlxsw_sp_rif *rif)
6511{
6512 return rif->dev;
6513}
6514
a28b1ebe
PM
6515struct mlxsw_sp_fid *mlxsw_sp_rif_fid(const struct mlxsw_sp_rif *rif)
6516{
6517 return rif->fid;
6518}
6519
4724ba56 6520static struct mlxsw_sp_rif *
e4f3c1c1 6521mlxsw_sp_rif_create(struct mlxsw_sp *mlxsw_sp,
f8fa9b4e
DA
6522 const struct mlxsw_sp_rif_params *params,
6523 struct netlink_ext_ack *extack)
4724ba56 6524{
e4f3c1c1
IS
6525 u32 tb_id = l3mdev_fib_table(params->dev);
6526 const struct mlxsw_sp_rif_ops *ops;
010cadf9 6527 struct mlxsw_sp_fid *fid = NULL;
e4f3c1c1 6528 enum mlxsw_sp_rif_type type;
bf95233e 6529 struct mlxsw_sp_rif *rif;
a1107487
IS
6530 struct mlxsw_sp_vr *vr;
6531 u16 rif_index;
9742f866 6532 int i, err;
4724ba56 6533
e4f3c1c1 6534 type = mlxsw_sp_dev_rif_type(mlxsw_sp, params->dev);
1f5b2303 6535 ops = mlxsw_sp->rif_ops_arr[type];
e4f3c1c1 6536
f8fa9b4e 6537 vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id ? : RT_TABLE_MAIN, extack);
c9ec53f0
IS
6538 if (IS_ERR(vr))
6539 return ERR_CAST(vr);
28a04c7b 6540 vr->rif_count++;
c9ec53f0 6541
de5ed99e 6542 err = mlxsw_sp_rif_index_alloc(mlxsw_sp, &rif_index);
f8fa9b4e 6543 if (err) {
6c677750 6544 NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported router interfaces");
de5ed99e 6545 goto err_rif_index_alloc;
f8fa9b4e 6546 }
4724ba56 6547
e4f3c1c1 6548 rif = mlxsw_sp_rif_alloc(ops->rif_size, rif_index, vr->id, params->dev);
a13a594d
IS
6549 if (!rif) {
6550 err = -ENOMEM;
6551 goto err_rif_alloc;
6552 }
b61cd7c6 6553 dev_hold(rif->dev);
a04563e4 6554 mlxsw_sp->router->rifs[rif_index] = rif;
e4f3c1c1
IS
6555 rif->mlxsw_sp = mlxsw_sp;
6556 rif->ops = ops;
a13a594d 6557
010cadf9 6558 if (ops->fid_get) {
5f15e257 6559 fid = ops->fid_get(rif, extack);
010cadf9
PM
6560 if (IS_ERR(fid)) {
6561 err = PTR_ERR(fid);
6562 goto err_fid_get;
6563 }
6564 rif->fid = fid;
4d93ceeb
IS
6565 }
6566
e4f3c1c1
IS
6567 if (ops->setup)
6568 ops->setup(rif, params);
6569
6570 err = ops->configure(rif);
4724ba56 6571 if (err)
e4f3c1c1 6572 goto err_configure;
4724ba56 6573
9742f866
YM
6574 for (i = 0; i < MLXSW_SP_L3_PROTO_MAX; i++) {
6575 err = mlxsw_sp_mr_rif_add(vr->mr_table[i], rif);
6576 if (err)
6577 goto err_mr_rif_add;
6578 }
d42b0965 6579
e4f3c1c1 6580 mlxsw_sp_rif_counters_alloc(rif);
4724ba56 6581
bf95233e 6582 return rif;
4724ba56 6583
d42b0965 6584err_mr_rif_add:
9742f866
YM
6585 for (i--; i >= 0; i--)
6586 mlxsw_sp_mr_rif_del(vr->mr_table[i], rif);
d42b0965 6587 ops->deconfigure(rif);
e4f3c1c1 6588err_configure:
010cadf9
PM
6589 if (fid)
6590 mlxsw_sp_fid_put(fid);
a1107487 6591err_fid_get:
a04563e4 6592 mlxsw_sp->router->rifs[rif_index] = NULL;
b61cd7c6 6593 dev_put(rif->dev);
e4f3c1c1
IS
6594 kfree(rif);
6595err_rif_alloc:
de5ed99e 6596err_rif_index_alloc:
28a04c7b 6597 vr->rif_count--;
2b52ce02 6598 mlxsw_sp_vr_put(mlxsw_sp, vr);
4724ba56
IS
6599 return ERR_PTR(err);
6600}
6601
32fd4b49 6602static void mlxsw_sp_rif_destroy(struct mlxsw_sp_rif *rif)
4724ba56 6603{
e4f3c1c1
IS
6604 const struct mlxsw_sp_rif_ops *ops = rif->ops;
6605 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
a1107487 6606 struct mlxsw_sp_fid *fid = rif->fid;
e4f3c1c1 6607 struct mlxsw_sp_vr *vr;
9742f866 6608 int i;
4724ba56 6609
bf95233e 6610 mlxsw_sp_router_rif_gone_sync(mlxsw_sp, rif);
e4f3c1c1 6611 vr = &mlxsw_sp->router->vrs[rif->vr_id];
e0c0afd8 6612
e4f3c1c1 6613 mlxsw_sp_rif_counters_free(rif);
9742f866
YM
6614 for (i = 0; i < MLXSW_SP_L3_PROTO_MAX; i++)
6615 mlxsw_sp_mr_rif_del(vr->mr_table[i], rif);
e4f3c1c1 6616 ops->deconfigure(rif);
010cadf9
PM
6617 if (fid)
6618 /* Loopback RIFs are not associated with a FID. */
6619 mlxsw_sp_fid_put(fid);
a04563e4 6620 mlxsw_sp->router->rifs[rif->rif_index] = NULL;
b61cd7c6 6621 dev_put(rif->dev);
e4f3c1c1 6622 kfree(rif);
28a04c7b 6623 vr->rif_count--;
2b52ce02 6624 mlxsw_sp_vr_put(mlxsw_sp, vr);
4724ba56
IS
6625}
6626
602b74ed
IS
/* Destroy the RIF attached to @dev, if there is one. */
void mlxsw_sp_rif_destroy_by_dev(struct mlxsw_sp *mlxsw_sp,
				 struct net_device *dev)
{
	struct mlxsw_sp_rif *victim = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);

	if (victim)
		mlxsw_sp_rif_destroy(victim);
}
6637
e4f3c1c1
IS
6638static void
6639mlxsw_sp_rif_subport_params_init(struct mlxsw_sp_rif_params *params,
6640 struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan)
6641{
6642 struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port;
6643
6644 params->vid = mlxsw_sp_port_vlan->vid;
6645 params->lag = mlxsw_sp_port->lagged;
6646 if (params->lag)
6647 params->lag_id = mlxsw_sp_port->lag_id;
6648 else
6649 params->system_port = mlxsw_sp_port->local_port;
6650}
6651
32fd4b49
IS
6652static struct mlxsw_sp_rif_subport *
6653mlxsw_sp_rif_subport_rif(const struct mlxsw_sp_rif *rif)
6654{
6655 return container_of(rif, struct mlxsw_sp_rif_subport, common);
6656}
6657
6658static struct mlxsw_sp_rif *
6659mlxsw_sp_rif_subport_get(struct mlxsw_sp *mlxsw_sp,
6660 const struct mlxsw_sp_rif_params *params,
6661 struct netlink_ext_ack *extack)
6662{
6663 struct mlxsw_sp_rif_subport *rif_subport;
6664 struct mlxsw_sp_rif *rif;
6665
6666 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, params->dev);
6667 if (!rif)
6668 return mlxsw_sp_rif_create(mlxsw_sp, params, extack);
6669
6670 rif_subport = mlxsw_sp_rif_subport_rif(rif);
6671 refcount_inc(&rif_subport->ref_count);
6672 return rif;
6673}
6674
6675static void mlxsw_sp_rif_subport_put(struct mlxsw_sp_rif *rif)
6676{
6677 struct mlxsw_sp_rif_subport *rif_subport;
6678
6679 rif_subport = mlxsw_sp_rif_subport_rif(rif);
6680 if (!refcount_dec_and_test(&rif_subport->ref_count))
6681 return;
6682
6683 mlxsw_sp_rif_destroy(rif);
6684}
6685
7cbecf24 6686static int
a1107487 6687mlxsw_sp_port_vlan_router_join(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan,
f8fa9b4e
DA
6688 struct net_device *l3_dev,
6689 struct netlink_ext_ack *extack)
4724ba56 6690{
7cbecf24 6691 struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port;
1b8f09a0 6692 struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
32fd4b49
IS
6693 struct mlxsw_sp_rif_params params = {
6694 .dev = l3_dev,
6695 };
7cbecf24 6696 u16 vid = mlxsw_sp_port_vlan->vid;
bf95233e 6697 struct mlxsw_sp_rif *rif;
a1107487 6698 struct mlxsw_sp_fid *fid;
03ea01e9 6699 int err;
4724ba56 6700
32fd4b49
IS
6701 mlxsw_sp_rif_subport_params_init(&params, mlxsw_sp_port_vlan);
6702 rif = mlxsw_sp_rif_subport_get(mlxsw_sp, &params, extack);
6703 if (IS_ERR(rif))
6704 return PTR_ERR(rif);
4724ba56 6705
a1107487 6706 /* FID was already created, just take a reference */
5f15e257 6707 fid = rif->ops->fid_get(rif, extack);
a1107487
IS
6708 err = mlxsw_sp_fid_port_vid_map(fid, mlxsw_sp_port, vid);
6709 if (err)
6710 goto err_fid_port_vid_map;
6711
7cbecf24 6712 err = mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, false);
03ea01e9
IS
6713 if (err)
6714 goto err_port_vid_learning_set;
6715
7cbecf24 6716 err = mlxsw_sp_port_vid_stp_set(mlxsw_sp_port, vid,
03ea01e9
IS
6717 BR_STATE_FORWARDING);
6718 if (err)
6719 goto err_port_vid_stp_set;
6720
a1107487 6721 mlxsw_sp_port_vlan->fid = fid;
4724ba56 6722
4724ba56 6723 return 0;
03ea01e9
IS
6724
6725err_port_vid_stp_set:
7cbecf24 6726 mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, true);
03ea01e9 6727err_port_vid_learning_set:
a1107487
IS
6728 mlxsw_sp_fid_port_vid_unmap(fid, mlxsw_sp_port, vid);
6729err_fid_port_vid_map:
6730 mlxsw_sp_fid_put(fid);
32fd4b49 6731 mlxsw_sp_rif_subport_put(rif);
03ea01e9 6732 return err;
4724ba56
IS
6733}
6734
a1107487
IS
6735void
6736mlxsw_sp_port_vlan_router_leave(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan)
4724ba56 6737{
ce95e154 6738 struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port;
7cbecf24 6739 struct mlxsw_sp_fid *fid = mlxsw_sp_port_vlan->fid;
32fd4b49 6740 struct mlxsw_sp_rif *rif = mlxsw_sp_fid_rif(fid);
ce95e154 6741 u16 vid = mlxsw_sp_port_vlan->vid;
ce95e154 6742
a1107487
IS
6743 if (WARN_ON(mlxsw_sp_fid_type(fid) != MLXSW_SP_FID_TYPE_RFID))
6744 return;
4aafc368 6745
a1107487 6746 mlxsw_sp_port_vlan->fid = NULL;
7cbecf24
IS
6747 mlxsw_sp_port_vid_stp_set(mlxsw_sp_port, vid, BR_STATE_BLOCKING);
6748 mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, true);
a1107487 6749 mlxsw_sp_fid_port_vid_unmap(fid, mlxsw_sp_port, vid);
a1107487 6750 mlxsw_sp_fid_put(fid);
32fd4b49 6751 mlxsw_sp_rif_subport_put(rif);
4724ba56
IS
6752}
6753
7cbecf24
IS
6754static int mlxsw_sp_inetaddr_port_vlan_event(struct net_device *l3_dev,
6755 struct net_device *port_dev,
f8fa9b4e
DA
6756 unsigned long event, u16 vid,
6757 struct netlink_ext_ack *extack)
4724ba56
IS
6758{
6759 struct mlxsw_sp_port *mlxsw_sp_port = netdev_priv(port_dev);
ce95e154 6760 struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan;
4724ba56 6761
ce95e154 6762 mlxsw_sp_port_vlan = mlxsw_sp_port_vlan_find_by_vid(mlxsw_sp_port, vid);
7cbecf24
IS
6763 if (WARN_ON(!mlxsw_sp_port_vlan))
6764 return -EINVAL;
4724ba56
IS
6765
6766 switch (event) {
6767 case NETDEV_UP:
a1107487 6768 return mlxsw_sp_port_vlan_router_join(mlxsw_sp_port_vlan,
f8fa9b4e 6769 l3_dev, extack);
4724ba56 6770 case NETDEV_DOWN:
a1107487 6771 mlxsw_sp_port_vlan_router_leave(mlxsw_sp_port_vlan);
4724ba56
IS
6772 break;
6773 }
6774
6775 return 0;
6776}
6777
6778static int mlxsw_sp_inetaddr_port_event(struct net_device *port_dev,
f8fa9b4e
DA
6779 unsigned long event,
6780 struct netlink_ext_ack *extack)
4724ba56 6781{
2b94e58d
JP
6782 if (netif_is_bridge_port(port_dev) ||
6783 netif_is_lag_port(port_dev) ||
6784 netif_is_ovs_port(port_dev))
4724ba56
IS
6785 return 0;
6786
a2d2a205
IS
6787 return mlxsw_sp_inetaddr_port_vlan_event(port_dev, port_dev, event,
6788 MLXSW_SP_DEFAULT_VID, extack);
4724ba56
IS
6789}
6790
6791static int __mlxsw_sp_inetaddr_lag_event(struct net_device *l3_dev,
6792 struct net_device *lag_dev,
f8fa9b4e
DA
6793 unsigned long event, u16 vid,
6794 struct netlink_ext_ack *extack)
4724ba56
IS
6795{
6796 struct net_device *port_dev;
6797 struct list_head *iter;
6798 int err;
6799
6800 netdev_for_each_lower_dev(lag_dev, port_dev, iter) {
6801 if (mlxsw_sp_port_dev_check(port_dev)) {
7cbecf24
IS
6802 err = mlxsw_sp_inetaddr_port_vlan_event(l3_dev,
6803 port_dev,
f8fa9b4e
DA
6804 event, vid,
6805 extack);
4724ba56
IS
6806 if (err)
6807 return err;
6808 }
6809 }
6810
6811 return 0;
6812}
6813
6814static int mlxsw_sp_inetaddr_lag_event(struct net_device *lag_dev,
f8fa9b4e
DA
6815 unsigned long event,
6816 struct netlink_ext_ack *extack)
4724ba56
IS
6817{
6818 if (netif_is_bridge_port(lag_dev))
6819 return 0;
6820
a2d2a205
IS
6821 return __mlxsw_sp_inetaddr_lag_event(lag_dev, lag_dev, event,
6822 MLXSW_SP_DEFAULT_VID, extack);
4724ba56
IS
6823}
6824
21ffedb6
IS
6825static int mlxsw_sp_inetaddr_bridge_event(struct mlxsw_sp *mlxsw_sp,
6826 struct net_device *l3_dev,
f8fa9b4e
DA
6827 unsigned long event,
6828 struct netlink_ext_ack *extack)
4724ba56 6829{
e4f3c1c1
IS
6830 struct mlxsw_sp_rif_params params = {
6831 .dev = l3_dev,
6832 };
a1107487 6833 struct mlxsw_sp_rif *rif;
4724ba56
IS
6834
6835 switch (event) {
6836 case NETDEV_UP:
f8fa9b4e 6837 rif = mlxsw_sp_rif_create(mlxsw_sp, &params, extack);
e4f3c1c1
IS
6838 if (IS_ERR(rif))
6839 return PTR_ERR(rif);
6840 break;
4724ba56 6841 case NETDEV_DOWN:
a1107487 6842 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
e4f3c1c1 6843 mlxsw_sp_rif_destroy(rif);
4724ba56
IS
6844 break;
6845 }
6846
6847 return 0;
6848}
6849
21ffedb6
IS
6850static int mlxsw_sp_inetaddr_vlan_event(struct mlxsw_sp *mlxsw_sp,
6851 struct net_device *vlan_dev,
f8fa9b4e
DA
6852 unsigned long event,
6853 struct netlink_ext_ack *extack)
4724ba56
IS
6854{
6855 struct net_device *real_dev = vlan_dev_real_dev(vlan_dev);
4724ba56
IS
6856 u16 vid = vlan_dev_vlan_id(vlan_dev);
6857
6b27c8ad
IS
6858 if (netif_is_bridge_port(vlan_dev))
6859 return 0;
6860
4724ba56 6861 if (mlxsw_sp_port_dev_check(real_dev))
7cbecf24 6862 return mlxsw_sp_inetaddr_port_vlan_event(vlan_dev, real_dev,
f8fa9b4e 6863 event, vid, extack);
4724ba56
IS
6864 else if (netif_is_lag_master(real_dev))
6865 return __mlxsw_sp_inetaddr_lag_event(vlan_dev, real_dev, event,
f8fa9b4e 6866 vid, extack);
c57529e1 6867 else if (netif_is_bridge_master(real_dev) && br_vlan_enabled(real_dev))
21ffedb6
IS
6868 return mlxsw_sp_inetaddr_bridge_event(mlxsw_sp, vlan_dev, event,
6869 extack);
4724ba56
IS
6870
6871 return 0;
6872}
6873
c3a49540
IS
6874static bool mlxsw_sp_rif_macvlan_is_vrrp4(const u8 *mac)
6875{
6876 u8 vrrp4[ETH_ALEN] = { 0x00, 0x00, 0x5e, 0x00, 0x01, 0x00 };
6877 u8 mask[ETH_ALEN] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0x00 };
6878
6879 return ether_addr_equal_masked(mac, vrrp4, mask);
6880}
6881
6882static bool mlxsw_sp_rif_macvlan_is_vrrp6(const u8 *mac)
6883{
6884 u8 vrrp6[ETH_ALEN] = { 0x00, 0x00, 0x5e, 0x00, 0x02, 0x00 };
6885 u8 mask[ETH_ALEN] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0x00 };
6886
6887 return ether_addr_equal_masked(mac, vrrp6, mask);
6888}
6889
6890static int mlxsw_sp_rif_vrrp_op(struct mlxsw_sp *mlxsw_sp, u16 rif_index,
6891 const u8 *mac, bool adding)
6892{
6893 char ritr_pl[MLXSW_REG_RITR_LEN];
6894 u8 vrrp_id = adding ? mac[5] : 0;
6895 int err;
6896
6897 if (!mlxsw_sp_rif_macvlan_is_vrrp4(mac) &&
6898 !mlxsw_sp_rif_macvlan_is_vrrp6(mac))
6899 return 0;
6900
6901 mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index);
6902 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
6903 if (err)
6904 return err;
6905
6906 if (mlxsw_sp_rif_macvlan_is_vrrp4(mac))
6907 mlxsw_reg_ritr_if_vrrp_id_ipv4_set(ritr_pl, vrrp_id);
6908 else
6909 mlxsw_reg_ritr_if_vrrp_id_ipv6_set(ritr_pl, vrrp_id);
6910
6911 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
6912}
6913
2db99378
IS
6914static int mlxsw_sp_rif_macvlan_add(struct mlxsw_sp *mlxsw_sp,
6915 const struct net_device *macvlan_dev,
6916 struct netlink_ext_ack *extack)
6917{
6918 struct macvlan_dev *vlan = netdev_priv(macvlan_dev);
6919 struct mlxsw_sp_rif *rif;
6920 int err;
6921
6922 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, vlan->lowerdev);
6923 if (!rif) {
6924 NL_SET_ERR_MSG_MOD(extack, "macvlan is only supported on top of router interfaces");
6925 return -EOPNOTSUPP;
6926 }
6927
6928 err = mlxsw_sp_rif_fdb_op(mlxsw_sp, macvlan_dev->dev_addr,
6929 mlxsw_sp_fid_index(rif->fid), true);
6930 if (err)
6931 return err;
6932
c3a49540
IS
6933 err = mlxsw_sp_rif_vrrp_op(mlxsw_sp, rif->rif_index,
6934 macvlan_dev->dev_addr, true);
6935 if (err)
6936 goto err_rif_vrrp_add;
6937
2db99378
IS
6938 /* Make sure the bridge driver does not have this MAC pointing at
6939 * some other port.
6940 */
6941 if (rif->ops->fdb_del)
6942 rif->ops->fdb_del(rif, macvlan_dev->dev_addr);
6943
6944 return 0;
c3a49540
IS
6945
6946err_rif_vrrp_add:
6947 mlxsw_sp_rif_fdb_op(mlxsw_sp, macvlan_dev->dev_addr,
6948 mlxsw_sp_fid_index(rif->fid), false);
6949 return err;
2db99378
IS
6950}
6951
6952void mlxsw_sp_rif_macvlan_del(struct mlxsw_sp *mlxsw_sp,
6953 const struct net_device *macvlan_dev)
6954{
6955 struct macvlan_dev *vlan = netdev_priv(macvlan_dev);
6956 struct mlxsw_sp_rif *rif;
6957
6958 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, vlan->lowerdev);
6959 /* If we do not have a RIF, then we already took care of
6960 * removing the macvlan's MAC during RIF deletion.
6961 */
6962 if (!rif)
6963 return;
c3a49540
IS
6964 mlxsw_sp_rif_vrrp_op(mlxsw_sp, rif->rif_index, macvlan_dev->dev_addr,
6965 false);
2db99378
IS
6966 mlxsw_sp_rif_fdb_op(mlxsw_sp, macvlan_dev->dev_addr,
6967 mlxsw_sp_fid_index(rif->fid), false);
6968}
6969
21ffedb6
IS
6970static int mlxsw_sp_inetaddr_macvlan_event(struct mlxsw_sp *mlxsw_sp,
6971 struct net_device *macvlan_dev,
2db99378
IS
6972 unsigned long event,
6973 struct netlink_ext_ack *extack)
6974{
2db99378
IS
6975 switch (event) {
6976 case NETDEV_UP:
6977 return mlxsw_sp_rif_macvlan_add(mlxsw_sp, macvlan_dev, extack);
6978 case NETDEV_DOWN:
6979 mlxsw_sp_rif_macvlan_del(mlxsw_sp, macvlan_dev);
6980 break;
6981 }
6982
6983 return 0;
6984}
6985
74bc9939
PM
6986static int mlxsw_sp_router_port_check_rif_addr(struct mlxsw_sp *mlxsw_sp,
6987 struct net_device *dev,
6988 const unsigned char *dev_addr,
6989 struct netlink_ext_ack *extack)
6990{
6991 struct mlxsw_sp_rif *rif;
6992 int i;
6993
6994 /* A RIF is not created for macvlan netdevs. Their MAC is used to
6995 * populate the FDB
6996 */
972fae68 6997 if (netif_is_macvlan(dev) || netif_is_l3_master(dev))
74bc9939
PM
6998 return 0;
6999
7000 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++) {
7001 rif = mlxsw_sp->router->rifs[i];
73b8f493 7002 if (rif && rif->dev && rif->dev != dev &&
74bc9939
PM
7003 !ether_addr_equal_masked(rif->dev->dev_addr, dev_addr,
7004 mlxsw_sp->mac_mask)) {
7005 NL_SET_ERR_MSG_MOD(extack, "All router interface MAC addresses must have the same prefix");
7006 return -EINVAL;
7007 }
7008 }
7009
7010 return 0;
7011}
7012
21ffedb6
IS
/* Dispatch an address event to the handler matching the kind of @dev:
 * switch port, LAG master, bridge master, VLAN device or macvlan, tested in
 * that order. Devices of any other kind are ignored and 0 is returned.
 */
static int __mlxsw_sp_inetaddr_event(struct mlxsw_sp *mlxsw_sp,
				     struct net_device *dev,
				     unsigned long event,
				     struct netlink_ext_ack *extack)
{
	if (mlxsw_sp_port_dev_check(dev))
		return mlxsw_sp_inetaddr_port_event(dev, event, extack);

	if (netif_is_lag_master(dev))
		return mlxsw_sp_inetaddr_lag_event(dev, event, extack);

	if (netif_is_bridge_master(dev))
		return mlxsw_sp_inetaddr_bridge_event(mlxsw_sp, dev, event,
						      extack);

	if (is_vlan_dev(dev))
		return mlxsw_sp_inetaddr_vlan_event(mlxsw_sp, dev, event,
						    extack);

	if (netif_is_macvlan(dev))
		return mlxsw_sp_inetaddr_macvlan_event(mlxsw_sp, dev, event,
						       extack);

	return 0;
}
7034
965fa8e6
IS
7035static int mlxsw_sp_inetaddr_event(struct notifier_block *nb,
7036 unsigned long event, void *ptr)
4724ba56
IS
7037{
7038 struct in_ifaddr *ifa = (struct in_ifaddr *) ptr;
7039 struct net_device *dev = ifa->ifa_dev->dev;
965fa8e6 7040 struct mlxsw_sp_router *router;
bf95233e 7041 struct mlxsw_sp_rif *rif;
4724ba56
IS
7042 int err = 0;
7043
89d5dd2e
DA
7044 /* NETDEV_UP event is handled by mlxsw_sp_inetaddr_valid_event */
7045 if (event == NETDEV_UP)
7046 goto out;
7047
965fa8e6
IS
7048 router = container_of(nb, struct mlxsw_sp_router, inetaddr_nb);
7049 rif = mlxsw_sp_rif_find_by_dev(router->mlxsw_sp, dev);
89d5dd2e
DA
7050 if (!mlxsw_sp_rif_should_config(rif, dev, event))
7051 goto out;
7052
965fa8e6 7053 err = __mlxsw_sp_inetaddr_event(router->mlxsw_sp, dev, event, NULL);
89d5dd2e
DA
7054out:
7055 return notifier_from_errno(err);
7056}
7057
7058int mlxsw_sp_inetaddr_valid_event(struct notifier_block *unused,
7059 unsigned long event, void *ptr)
7060{
7061 struct in_validator_info *ivi = (struct in_validator_info *) ptr;
7062 struct net_device *dev = ivi->ivi_dev->dev;
7063 struct mlxsw_sp *mlxsw_sp;
7064 struct mlxsw_sp_rif *rif;
7065 int err = 0;
7066
4724ba56
IS
7067 mlxsw_sp = mlxsw_sp_lower_get(dev);
7068 if (!mlxsw_sp)
7069 goto out;
7070
bf95233e 7071 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
5ea1237f 7072 if (!mlxsw_sp_rif_should_config(rif, dev, event))
4724ba56
IS
7073 goto out;
7074
74bc9939
PM
7075 err = mlxsw_sp_router_port_check_rif_addr(mlxsw_sp, dev, dev->dev_addr,
7076 ivi->extack);
7077 if (err)
7078 goto out;
7079
21ffedb6 7080 err = __mlxsw_sp_inetaddr_event(mlxsw_sp, dev, event, ivi->extack);
4724ba56
IS
7081out:
7082 return notifier_from_errno(err);
7083}
7084
5ea1237f
AS
7085struct mlxsw_sp_inet6addr_event_work {
7086 struct work_struct work;
965fa8e6 7087 struct mlxsw_sp *mlxsw_sp;
5ea1237f
AS
7088 struct net_device *dev;
7089 unsigned long event;
7090};
7091
7092static void mlxsw_sp_inet6addr_event_work(struct work_struct *work)
7093{
7094 struct mlxsw_sp_inet6addr_event_work *inet6addr_work =
7095 container_of(work, struct mlxsw_sp_inet6addr_event_work, work);
965fa8e6 7096 struct mlxsw_sp *mlxsw_sp = inet6addr_work->mlxsw_sp;
5ea1237f
AS
7097 struct net_device *dev = inet6addr_work->dev;
7098 unsigned long event = inet6addr_work->event;
5ea1237f
AS
7099 struct mlxsw_sp_rif *rif;
7100
7101 rtnl_lock();
5ea1237f
AS
7102
7103 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
7104 if (!mlxsw_sp_rif_should_config(rif, dev, event))
7105 goto out;
7106
21ffedb6 7107 __mlxsw_sp_inetaddr_event(mlxsw_sp, dev, event, NULL);
5ea1237f
AS
7108out:
7109 rtnl_unlock();
7110 dev_put(dev);
7111 kfree(inet6addr_work);
7112}
7113
7114/* Called with rcu_read_lock() */
965fa8e6
IS
7115static int mlxsw_sp_inet6addr_event(struct notifier_block *nb,
7116 unsigned long event, void *ptr)
5ea1237f
AS
7117{
7118 struct inet6_ifaddr *if6 = (struct inet6_ifaddr *) ptr;
7119 struct mlxsw_sp_inet6addr_event_work *inet6addr_work;
7120 struct net_device *dev = if6->idev->dev;
965fa8e6 7121 struct mlxsw_sp_router *router;
5ea1237f 7122
89d5dd2e
DA
7123 /* NETDEV_UP event is handled by mlxsw_sp_inet6addr_valid_event */
7124 if (event == NETDEV_UP)
7125 return NOTIFY_DONE;
7126
5ea1237f
AS
7127 inet6addr_work = kzalloc(sizeof(*inet6addr_work), GFP_ATOMIC);
7128 if (!inet6addr_work)
7129 return NOTIFY_BAD;
7130
965fa8e6 7131 router = container_of(nb, struct mlxsw_sp_router, inet6addr_nb);
5ea1237f 7132 INIT_WORK(&inet6addr_work->work, mlxsw_sp_inet6addr_event_work);
965fa8e6 7133 inet6addr_work->mlxsw_sp = router->mlxsw_sp;
5ea1237f
AS
7134 inet6addr_work->dev = dev;
7135 inet6addr_work->event = event;
7136 dev_hold(dev);
7137 mlxsw_core_schedule_work(&inet6addr_work->work);
7138
7139 return NOTIFY_DONE;
7140}
7141
89d5dd2e
DA
7142int mlxsw_sp_inet6addr_valid_event(struct notifier_block *unused,
7143 unsigned long event, void *ptr)
7144{
7145 struct in6_validator_info *i6vi = (struct in6_validator_info *) ptr;
7146 struct net_device *dev = i6vi->i6vi_dev->dev;
7147 struct mlxsw_sp *mlxsw_sp;
7148 struct mlxsw_sp_rif *rif;
7149 int err = 0;
7150
7151 mlxsw_sp = mlxsw_sp_lower_get(dev);
7152 if (!mlxsw_sp)
7153 goto out;
7154
7155 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
7156 if (!mlxsw_sp_rif_should_config(rif, dev, event))
7157 goto out;
7158
74bc9939
PM
7159 err = mlxsw_sp_router_port_check_rif_addr(mlxsw_sp, dev, dev->dev_addr,
7160 i6vi->extack);
7161 if (err)
7162 goto out;
7163
21ffedb6 7164 err = __mlxsw_sp_inetaddr_event(mlxsw_sp, dev, event, i6vi->extack);
89d5dd2e
DA
7165out:
7166 return notifier_from_errno(err);
7167}
7168
bf95233e 7169static int mlxsw_sp_rif_edit(struct mlxsw_sp *mlxsw_sp, u16 rif_index,
4724ba56
IS
7170 const char *mac, int mtu)
7171{
7172 char ritr_pl[MLXSW_REG_RITR_LEN];
7173 int err;
7174
bf95233e 7175 mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index);
4724ba56
IS
7176 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
7177 if (err)
7178 return err;
7179
7180 mlxsw_reg_ritr_mtu_set(ritr_pl, mtu);
7181 mlxsw_reg_ritr_if_mac_memcpy_to(ritr_pl, mac);
7182 mlxsw_reg_ritr_op_set(ritr_pl, MLXSW_REG_RITR_RIF_CREATE);
7183 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
7184}
7185
9735f2d2
PM
7186static int
7187mlxsw_sp_router_port_change_event(struct mlxsw_sp *mlxsw_sp,
7188 struct mlxsw_sp_rif *rif)
4724ba56 7189{
9735f2d2 7190 struct net_device *dev = rif->dev;
a1107487 7191 u16 fid_index;
4724ba56
IS
7192 int err;
7193
a1107487 7194 fid_index = mlxsw_sp_fid_index(rif->fid);
4724ba56 7195
a1107487 7196 err = mlxsw_sp_rif_fdb_op(mlxsw_sp, rif->addr, fid_index, false);
4724ba56
IS
7197 if (err)
7198 return err;
7199
bf95233e
AS
7200 err = mlxsw_sp_rif_edit(mlxsw_sp, rif->rif_index, dev->dev_addr,
7201 dev->mtu);
4724ba56
IS
7202 if (err)
7203 goto err_rif_edit;
7204
a1107487 7205 err = mlxsw_sp_rif_fdb_op(mlxsw_sp, dev->dev_addr, fid_index, true);
4724ba56
IS
7206 if (err)
7207 goto err_rif_fdb_op;
7208
fd890fe9
YG
7209 if (rif->mtu != dev->mtu) {
7210 struct mlxsw_sp_vr *vr;
9742f866 7211 int i;
fd890fe9
YG
7212
7213 /* The RIF is relevant only to its mr_table instance, as unlike
7214 * unicast routing, in multicast routing a RIF cannot be shared
7215 * between several multicast routing tables.
7216 */
7217 vr = &mlxsw_sp->router->vrs[rif->vr_id];
9742f866
YM
7218 for (i = 0; i < MLXSW_SP_L3_PROTO_MAX; i++)
7219 mlxsw_sp_mr_rif_mtu_update(vr->mr_table[i],
7220 rif, dev->mtu);
fd890fe9
YG
7221 }
7222
bf95233e
AS
7223 ether_addr_copy(rif->addr, dev->dev_addr);
7224 rif->mtu = dev->mtu;
4724ba56 7225
bf95233e 7226 netdev_dbg(dev, "Updated RIF=%d\n", rif->rif_index);
4724ba56
IS
7227
7228 return 0;
7229
7230err_rif_fdb_op:
bf95233e 7231 mlxsw_sp_rif_edit(mlxsw_sp, rif->rif_index, rif->addr, rif->mtu);
4724ba56 7232err_rif_edit:
a1107487 7233 mlxsw_sp_rif_fdb_op(mlxsw_sp, rif->addr, fid_index, true);
4724ba56
IS
7234 return err;
7235}
7236
74bc9939
PM
7237static int mlxsw_sp_router_port_pre_changeaddr_event(struct mlxsw_sp_rif *rif,
7238 struct netdev_notifier_pre_changeaddr_info *info)
7239{
7240 struct netlink_ext_ack *extack;
7241
7242 extack = netdev_notifier_info_to_extack(&info->info);
7243 return mlxsw_sp_router_port_check_rif_addr(rif->mlxsw_sp, rif->dev,
7244 info->dev_addr, extack);
7245}
7246
9735f2d2
PM
7247int mlxsw_sp_netdevice_router_port_event(struct net_device *dev,
7248 unsigned long event, void *ptr)
7249{
7250 struct mlxsw_sp *mlxsw_sp;
7251 struct mlxsw_sp_rif *rif;
7252
7253 mlxsw_sp = mlxsw_sp_lower_get(dev);
7254 if (!mlxsw_sp)
7255 return 0;
7256
7257 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev);
7258 if (!rif)
7259 return 0;
7260
7261 switch (event) {
7262 case NETDEV_CHANGEMTU: /* fall through */
7263 case NETDEV_CHANGEADDR:
7264 return mlxsw_sp_router_port_change_event(mlxsw_sp, rif);
74bc9939
PM
7265 case NETDEV_PRE_CHANGEADDR:
7266 return mlxsw_sp_router_port_pre_changeaddr_event(rif, ptr);
9735f2d2
PM
7267 }
7268
7269 return 0;
7270}
7271
b1e45526 7272static int mlxsw_sp_port_vrf_join(struct mlxsw_sp *mlxsw_sp,
f8fa9b4e
DA
7273 struct net_device *l3_dev,
7274 struct netlink_ext_ack *extack)
7179eb5a 7275{
b1e45526 7276 struct mlxsw_sp_rif *rif;
7179eb5a 7277
b1e45526
IS
7278 /* If netdev is already associated with a RIF, then we need to
7279 * destroy it and create a new one with the new virtual router ID.
7179eb5a 7280 */
b1e45526
IS
7281 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
7282 if (rif)
21ffedb6
IS
7283 __mlxsw_sp_inetaddr_event(mlxsw_sp, l3_dev, NETDEV_DOWN,
7284 extack);
7179eb5a 7285
21ffedb6 7286 return __mlxsw_sp_inetaddr_event(mlxsw_sp, l3_dev, NETDEV_UP, extack);
7179eb5a
IS
7287}
7288
b1e45526
IS
7289static void mlxsw_sp_port_vrf_leave(struct mlxsw_sp *mlxsw_sp,
7290 struct net_device *l3_dev)
7179eb5a 7291{
b1e45526 7292 struct mlxsw_sp_rif *rif;
7179eb5a 7293
b1e45526
IS
7294 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev);
7295 if (!rif)
7179eb5a 7296 return;
21ffedb6 7297 __mlxsw_sp_inetaddr_event(mlxsw_sp, l3_dev, NETDEV_DOWN, NULL);
7179eb5a
IS
7298}
7299
b1e45526
IS
7300int mlxsw_sp_netdevice_vrf_event(struct net_device *l3_dev, unsigned long event,
7301 struct netdev_notifier_changeupper_info *info)
3d70e458 7302{
b1e45526
IS
7303 struct mlxsw_sp *mlxsw_sp = mlxsw_sp_lower_get(l3_dev);
7304 int err = 0;
3d70e458 7305
c5516185
IS
7306 /* We do not create a RIF for a macvlan, but only use it to
7307 * direct more MAC addresses to the router.
7308 */
7309 if (!mlxsw_sp || netif_is_macvlan(l3_dev))
b1e45526 7310 return 0;
3d70e458 7311
b1e45526
IS
7312 switch (event) {
7313 case NETDEV_PRECHANGEUPPER:
7314 return 0;
7315 case NETDEV_CHANGEUPPER:
f8fa9b4e
DA
7316 if (info->linking) {
7317 struct netlink_ext_ack *extack;
7318
7319 extack = netdev_notifier_info_to_extack(&info->info);
7320 err = mlxsw_sp_port_vrf_join(mlxsw_sp, l3_dev, extack);
7321 } else {
b1e45526 7322 mlxsw_sp_port_vrf_leave(mlxsw_sp, l3_dev);
f8fa9b4e 7323 }
b1e45526
IS
7324 break;
7325 }
3d70e458 7326
b1e45526 7327 return err;
3d70e458
IS
7328}
7329
2db99378
IS
7330static int __mlxsw_sp_rif_macvlan_flush(struct net_device *dev, void *data)
7331{
7332 struct mlxsw_sp_rif *rif = data;
7333
7334 if (!netif_is_macvlan(dev))
7335 return 0;
7336
7337 return mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, dev->dev_addr,
7338 mlxsw_sp_fid_index(rif->fid), false);
7339}
7340
7341static int mlxsw_sp_rif_macvlan_flush(struct mlxsw_sp_rif *rif)
7342{
7343 if (!netif_is_macvlan_port(rif->dev))
7344 return 0;
7345
7346 netdev_warn(rif->dev, "Router interface is deleted. Upper macvlans will not work\n");
7347 return netdev_walk_all_upper_dev_rcu(rif->dev,
7348 __mlxsw_sp_rif_macvlan_flush, rif);
7349}
7350
e4f3c1c1
IS
7351static void mlxsw_sp_rif_subport_setup(struct mlxsw_sp_rif *rif,
7352 const struct mlxsw_sp_rif_params *params)
7353{
7354 struct mlxsw_sp_rif_subport *rif_subport;
7355
7356 rif_subport = mlxsw_sp_rif_subport_rif(rif);
32fd4b49 7357 refcount_set(&rif_subport->ref_count, 1);
e4f3c1c1
IS
7358 rif_subport->vid = params->vid;
7359 rif_subport->lag = params->lag;
7360 if (params->lag)
7361 rif_subport->lag_id = params->lag_id;
a1107487 7362 else
e4f3c1c1
IS
7363 rif_subport->system_port = params->system_port;
7364}
7365
7366static int mlxsw_sp_rif_subport_op(struct mlxsw_sp_rif *rif, bool enable)
7367{
7368 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7369 struct mlxsw_sp_rif_subport *rif_subport;
7370 char ritr_pl[MLXSW_REG_RITR_LEN];
7371
7372 rif_subport = mlxsw_sp_rif_subport_rif(rif);
7373 mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_SP_IF,
9571e828
PM
7374 rif->rif_index, rif->vr_id, rif->dev->mtu);
7375 mlxsw_reg_ritr_mac_pack(ritr_pl, rif->dev->dev_addr);
e4f3c1c1
IS
7376 mlxsw_reg_ritr_sp_if_pack(ritr_pl, rif_subport->lag,
7377 rif_subport->lag ? rif_subport->lag_id :
7378 rif_subport->system_port,
7379 rif_subport->vid);
7380
7381 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
7382}
7383
7384static int mlxsw_sp_rif_subport_configure(struct mlxsw_sp_rif *rif)
7385{
010cadf9
PM
7386 int err;
7387
7388 err = mlxsw_sp_rif_subport_op(rif, true);
7389 if (err)
7390 return err;
7391
7392 err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
7393 mlxsw_sp_fid_index(rif->fid), true);
7394 if (err)
7395 goto err_rif_fdb_op;
7396
7397 mlxsw_sp_fid_rif_set(rif->fid, rif);
7398 return 0;
7399
7400err_rif_fdb_op:
7401 mlxsw_sp_rif_subport_op(rif, false);
7402 return err;
a1107487
IS
7403}
7404
e4f3c1c1
IS
7405static void mlxsw_sp_rif_subport_deconfigure(struct mlxsw_sp_rif *rif)
7406{
010cadf9
PM
7407 struct mlxsw_sp_fid *fid = rif->fid;
7408
7409 mlxsw_sp_fid_rif_set(fid, NULL);
7410 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
7411 mlxsw_sp_fid_index(fid), false);
2db99378 7412 mlxsw_sp_rif_macvlan_flush(rif);
e4f3c1c1
IS
7413 mlxsw_sp_rif_subport_op(rif, false);
7414}
7415
7416static struct mlxsw_sp_fid *
5f15e257
PM
7417mlxsw_sp_rif_subport_fid_get(struct mlxsw_sp_rif *rif,
7418 struct netlink_ext_ack *extack)
e4f3c1c1
IS
7419{
7420 return mlxsw_sp_fid_rfid_get(rif->mlxsw_sp, rif->rif_index);
7421}
7422
7423static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_subport_ops = {
7424 .type = MLXSW_SP_RIF_TYPE_SUBPORT,
7425 .rif_size = sizeof(struct mlxsw_sp_rif_subport),
7426 .setup = mlxsw_sp_rif_subport_setup,
7427 .configure = mlxsw_sp_rif_subport_configure,
7428 .deconfigure = mlxsw_sp_rif_subport_deconfigure,
7429 .fid_get = mlxsw_sp_rif_subport_fid_get,
7430};
7431
7432static int mlxsw_sp_rif_vlan_fid_op(struct mlxsw_sp_rif *rif,
7433 enum mlxsw_reg_ritr_if_type type,
7434 u16 vid_fid, bool enable)
7435{
7436 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7437 char ritr_pl[MLXSW_REG_RITR_LEN];
7438
7439 mlxsw_reg_ritr_pack(ritr_pl, enable, type, rif->rif_index, rif->vr_id,
9571e828
PM
7440 rif->dev->mtu);
7441 mlxsw_reg_ritr_mac_pack(ritr_pl, rif->dev->dev_addr);
e4f3c1c1
IS
7442 mlxsw_reg_ritr_fid_set(ritr_pl, type, vid_fid);
7443
7444 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
7445}
7446
b35750f1 7447u8 mlxsw_sp_router_port(const struct mlxsw_sp *mlxsw_sp)
e4f3c1c1
IS
7448{
7449 return mlxsw_core_max_ports(mlxsw_sp->core) + 1;
7450}
7451
7452static int mlxsw_sp_rif_vlan_configure(struct mlxsw_sp_rif *rif)
7453{
7454 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7455 u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid);
7456 int err;
7457
7458 err = mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_VLAN_IF, vid, true);
7459 if (err)
7460 return err;
7461
0d284818
IS
7462 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
7463 mlxsw_sp_router_port(mlxsw_sp), true);
7464 if (err)
7465 goto err_fid_mc_flood_set;
7466
e4f3c1c1
IS
7467 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
7468 mlxsw_sp_router_port(mlxsw_sp), true);
7469 if (err)
7470 goto err_fid_bc_flood_set;
7471
010cadf9
PM
7472 err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
7473 mlxsw_sp_fid_index(rif->fid), true);
7474 if (err)
7475 goto err_rif_fdb_op;
7476
7477 mlxsw_sp_fid_rif_set(rif->fid, rif);
e4f3c1c1
IS
7478 return 0;
7479
010cadf9
PM
7480err_rif_fdb_op:
7481 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
7482 mlxsw_sp_router_port(mlxsw_sp), false);
e4f3c1c1 7483err_fid_bc_flood_set:
0d284818
IS
7484 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
7485 mlxsw_sp_router_port(mlxsw_sp), false);
7486err_fid_mc_flood_set:
e4f3c1c1
IS
7487 mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_VLAN_IF, vid, false);
7488 return err;
7489}
7490
7491static void mlxsw_sp_rif_vlan_deconfigure(struct mlxsw_sp_rif *rif)
7492{
e4f3c1c1 7493 u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid);
010cadf9
PM
7494 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7495 struct mlxsw_sp_fid *fid = rif->fid;
e4f3c1c1 7496
010cadf9
PM
7497 mlxsw_sp_fid_rif_set(fid, NULL);
7498 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
7499 mlxsw_sp_fid_index(fid), false);
2db99378 7500 mlxsw_sp_rif_macvlan_flush(rif);
e4f3c1c1
IS
7501 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
7502 mlxsw_sp_router_port(mlxsw_sp), false);
0d284818
IS
7503 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
7504 mlxsw_sp_router_port(mlxsw_sp), false);
e4f3c1c1
IS
7505 mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_VLAN_IF, vid, false);
7506}
7507
7508static struct mlxsw_sp_fid *
5f15e257
PM
7509mlxsw_sp_rif_vlan_fid_get(struct mlxsw_sp_rif *rif,
7510 struct netlink_ext_ack *extack)
e4f3c1c1 7511{
f40be47a 7512 struct net_device *br_dev = rif->dev;
e6f1960a
PM
7513 u16 vid;
7514 int err;
7515
7516 if (is_vlan_dev(rif->dev)) {
7517 vid = vlan_dev_vlan_id(rif->dev);
f40be47a
IS
7518 br_dev = vlan_dev_real_dev(rif->dev);
7519 if (WARN_ON(!netif_is_bridge_master(br_dev)))
7520 return ERR_PTR(-EINVAL);
e6f1960a
PM
7521 } else {
7522 err = br_vlan_get_pvid(rif->dev, &vid);
be9c64b1 7523 if (err < 0 || !vid) {
e6f1960a 7524 NL_SET_ERR_MSG_MOD(extack, "Couldn't determine bridge PVID");
be9c64b1 7525 return ERR_PTR(-EINVAL);
e6f1960a
PM
7526 }
7527 }
e4f3c1c1 7528
f40be47a 7529 return mlxsw_sp_bridge_fid_get(rif->mlxsw_sp, br_dev, vid, extack);
e4f3c1c1
IS
7530}
7531
2db99378
IS
7532static void mlxsw_sp_rif_vlan_fdb_del(struct mlxsw_sp_rif *rif, const char *mac)
7533{
7534 u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid);
7535 struct switchdev_notifier_fdb_info info;
7536 struct net_device *br_dev;
7537 struct net_device *dev;
7538
7539 br_dev = is_vlan_dev(rif->dev) ? vlan_dev_real_dev(rif->dev) : rif->dev;
7540 dev = br_fdb_find_port(br_dev, mac, vid);
7541 if (!dev)
7542 return;
7543
7544 info.addr = mac;
7545 info.vid = vid;
6685987c
PM
7546 call_switchdev_notifiers(SWITCHDEV_FDB_DEL_TO_BRIDGE, dev, &info.info,
7547 NULL);
2db99378
IS
7548}
7549
e4f3c1c1
IS
7550static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_vlan_ops = {
7551 .type = MLXSW_SP_RIF_TYPE_VLAN,
7552 .rif_size = sizeof(struct mlxsw_sp_rif),
7553 .configure = mlxsw_sp_rif_vlan_configure,
7554 .deconfigure = mlxsw_sp_rif_vlan_deconfigure,
7555 .fid_get = mlxsw_sp_rif_vlan_fid_get,
2db99378 7556 .fdb_del = mlxsw_sp_rif_vlan_fdb_del,
e4f3c1c1
IS
7557};
7558
7559static int mlxsw_sp_rif_fid_configure(struct mlxsw_sp_rif *rif)
7560{
7561 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7562 u16 fid_index = mlxsw_sp_fid_index(rif->fid);
7563 int err;
7564
7565 err = mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_FID_IF, fid_index,
7566 true);
7567 if (err)
7568 return err;
7569
0d284818
IS
7570 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
7571 mlxsw_sp_router_port(mlxsw_sp), true);
7572 if (err)
7573 goto err_fid_mc_flood_set;
7574
e4f3c1c1
IS
7575 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
7576 mlxsw_sp_router_port(mlxsw_sp), true);
7577 if (err)
7578 goto err_fid_bc_flood_set;
7579
010cadf9
PM
7580 err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
7581 mlxsw_sp_fid_index(rif->fid), true);
7582 if (err)
7583 goto err_rif_fdb_op;
7584
7585 mlxsw_sp_fid_rif_set(rif->fid, rif);
e4f3c1c1
IS
7586 return 0;
7587
010cadf9
PM
7588err_rif_fdb_op:
7589 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
7590 mlxsw_sp_router_port(mlxsw_sp), false);
e4f3c1c1 7591err_fid_bc_flood_set:
0d284818
IS
7592 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
7593 mlxsw_sp_router_port(mlxsw_sp), false);
7594err_fid_mc_flood_set:
e4f3c1c1
IS
7595 mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_FID_IF, fid_index, false);
7596 return err;
7597}
7598
7599static void mlxsw_sp_rif_fid_deconfigure(struct mlxsw_sp_rif *rif)
7600{
e4f3c1c1 7601 u16 fid_index = mlxsw_sp_fid_index(rif->fid);
010cadf9
PM
7602 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7603 struct mlxsw_sp_fid *fid = rif->fid;
e4f3c1c1 7604
010cadf9
PM
7605 mlxsw_sp_fid_rif_set(fid, NULL);
7606 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr,
7607 mlxsw_sp_fid_index(fid), false);
2db99378 7608 mlxsw_sp_rif_macvlan_flush(rif);
e4f3c1c1
IS
7609 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC,
7610 mlxsw_sp_router_port(mlxsw_sp), false);
0d284818
IS
7611 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC,
7612 mlxsw_sp_router_port(mlxsw_sp), false);
e4f3c1c1
IS
7613 mlxsw_sp_rif_vlan_fid_op(rif, MLXSW_REG_RITR_FID_IF, fid_index, false);
7614}
7615
7616static struct mlxsw_sp_fid *
5f15e257
PM
7617mlxsw_sp_rif_fid_fid_get(struct mlxsw_sp_rif *rif,
7618 struct netlink_ext_ack *extack)
e4f3c1c1 7619{
f40be47a 7620 return mlxsw_sp_bridge_fid_get(rif->mlxsw_sp, rif->dev, 0, extack);
e4f3c1c1
IS
7621}
7622
2db99378
IS
7623static void mlxsw_sp_rif_fid_fdb_del(struct mlxsw_sp_rif *rif, const char *mac)
7624{
7625 struct switchdev_notifier_fdb_info info;
7626 struct net_device *dev;
7627
7628 dev = br_fdb_find_port(rif->dev, mac, 0);
7629 if (!dev)
7630 return;
7631
7632 info.addr = mac;
7633 info.vid = 0;
6685987c
PM
7634 call_switchdev_notifiers(SWITCHDEV_FDB_DEL_TO_BRIDGE, dev, &info.info,
7635 NULL);
2db99378
IS
7636}
7637
e4f3c1c1
IS
7638static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_fid_ops = {
7639 .type = MLXSW_SP_RIF_TYPE_FID,
7640 .rif_size = sizeof(struct mlxsw_sp_rif),
7641 .configure = mlxsw_sp_rif_fid_configure,
7642 .deconfigure = mlxsw_sp_rif_fid_deconfigure,
7643 .fid_get = mlxsw_sp_rif_fid_fid_get,
2db99378 7644 .fdb_del = mlxsw_sp_rif_fid_fdb_del,
e4f3c1c1
IS
7645};
7646
ba6da02a
IS
7647static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_vlan_emu_ops = {
7648 .type = MLXSW_SP_RIF_TYPE_VLAN,
7649 .rif_size = sizeof(struct mlxsw_sp_rif),
7650 .configure = mlxsw_sp_rif_fid_configure,
7651 .deconfigure = mlxsw_sp_rif_fid_deconfigure,
7652 .fid_get = mlxsw_sp_rif_vlan_fid_get,
7653 .fdb_del = mlxsw_sp_rif_vlan_fdb_del,
7654};
7655
6ddb7426
PM
7656static struct mlxsw_sp_rif_ipip_lb *
7657mlxsw_sp_rif_ipip_lb_rif(struct mlxsw_sp_rif *rif)
7658{
7659 return container_of(rif, struct mlxsw_sp_rif_ipip_lb, common);
7660}
7661
7662static void
7663mlxsw_sp_rif_ipip_lb_setup(struct mlxsw_sp_rif *rif,
7664 const struct mlxsw_sp_rif_params *params)
7665{
7666 struct mlxsw_sp_rif_params_ipip_lb *params_lb;
7667 struct mlxsw_sp_rif_ipip_lb *rif_lb;
7668
7669 params_lb = container_of(params, struct mlxsw_sp_rif_params_ipip_lb,
7670 common);
7671 rif_lb = mlxsw_sp_rif_ipip_lb_rif(rif);
7672 rif_lb->lb_config = params_lb->lb_config;
7673}
7674
6ddb7426 7675static int
99974468 7676mlxsw_sp1_rif_ipip_lb_configure(struct mlxsw_sp_rif *rif)
6ddb7426
PM
7677{
7678 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
7679 u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(rif->dev);
7680 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7681 struct mlxsw_sp_vr *ul_vr;
7682 int err;
7683
f8fa9b4e 7684 ul_vr = mlxsw_sp_vr_get(mlxsw_sp, ul_tb_id, NULL);
6ddb7426
PM
7685 if (IS_ERR(ul_vr))
7686 return PTR_ERR(ul_vr);
7687
3c747500 7688 err = mlxsw_sp_rif_ipip_lb_op(lb_rif, ul_vr->id, 0, true);
6ddb7426
PM
7689 if (err)
7690 goto err_loopback_op;
7691
7692 lb_rif->ul_vr_id = ul_vr->id;
25f844dd 7693 lb_rif->ul_rif_id = 0;
6ddb7426
PM
7694 ++ul_vr->rif_count;
7695 return 0;
7696
7697err_loopback_op:
2b52ce02 7698 mlxsw_sp_vr_put(mlxsw_sp, ul_vr);
6ddb7426
PM
7699 return err;
7700}
7701
99974468 7702static void mlxsw_sp1_rif_ipip_lb_deconfigure(struct mlxsw_sp_rif *rif)
6ddb7426
PM
7703{
7704 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
7705 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7706 struct mlxsw_sp_vr *ul_vr;
7707
7708 ul_vr = &mlxsw_sp->router->vrs[lb_rif->ul_vr_id];
3c747500 7709 mlxsw_sp_rif_ipip_lb_op(lb_rif, ul_vr->id, 0, false);
6ddb7426
PM
7710
7711 --ul_vr->rif_count;
2b52ce02 7712 mlxsw_sp_vr_put(mlxsw_sp, ul_vr);
6ddb7426
PM
7713}
7714
99974468 7715static const struct mlxsw_sp_rif_ops mlxsw_sp1_rif_ipip_lb_ops = {
6ddb7426
PM
7716 .type = MLXSW_SP_RIF_TYPE_IPIP_LB,
7717 .rif_size = sizeof(struct mlxsw_sp_rif_ipip_lb),
7718 .setup = mlxsw_sp_rif_ipip_lb_setup,
99974468
ND
7719 .configure = mlxsw_sp1_rif_ipip_lb_configure,
7720 .deconfigure = mlxsw_sp1_rif_ipip_lb_deconfigure,
6ddb7426
PM
7721};
7722
99974468 7723const struct mlxsw_sp_rif_ops *mlxsw_sp1_rif_ops_arr[] = {
e4f3c1c1 7724 [MLXSW_SP_RIF_TYPE_SUBPORT] = &mlxsw_sp_rif_subport_ops,
c2e7490c 7725 [MLXSW_SP_RIF_TYPE_VLAN] = &mlxsw_sp_rif_vlan_emu_ops,
e4f3c1c1 7726 [MLXSW_SP_RIF_TYPE_FID] = &mlxsw_sp_rif_fid_ops,
99974468
ND
7727 [MLXSW_SP_RIF_TYPE_IPIP_LB] = &mlxsw_sp1_rif_ipip_lb_ops,
7728};
7729
a5040a90
ND
7730static int
7731mlxsw_sp_rif_ipip_lb_ul_rif_op(struct mlxsw_sp_rif *ul_rif, bool enable)
7732{
7733 struct mlxsw_sp *mlxsw_sp = ul_rif->mlxsw_sp;
7734 char ritr_pl[MLXSW_REG_RITR_LEN];
7735
7736 mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_LOOPBACK_IF,
7737 ul_rif->rif_index, ul_rif->vr_id, IP_MAX_MTU);
7738 mlxsw_reg_ritr_loopback_protocol_set(ritr_pl,
7739 MLXSW_REG_RITR_LOOPBACK_GENERIC);
7740
7741 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
7742}
7743
7744static struct mlxsw_sp_rif *
7745mlxsw_sp_ul_rif_create(struct mlxsw_sp *mlxsw_sp, struct mlxsw_sp_vr *vr,
7746 struct netlink_ext_ack *extack)
7747{
7748 struct mlxsw_sp_rif *ul_rif;
7749 u16 rif_index;
7750 int err;
7751
7752 err = mlxsw_sp_rif_index_alloc(mlxsw_sp, &rif_index);
7753 if (err) {
7754 NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported router interfaces");
7755 return ERR_PTR(err);
7756 }
7757
7758 ul_rif = mlxsw_sp_rif_alloc(sizeof(*ul_rif), rif_index, vr->id, NULL);
7759 if (!ul_rif)
7760 return ERR_PTR(-ENOMEM);
7761
7762 mlxsw_sp->router->rifs[rif_index] = ul_rif;
7763 ul_rif->mlxsw_sp = mlxsw_sp;
7764 err = mlxsw_sp_rif_ipip_lb_ul_rif_op(ul_rif, true);
7765 if (err)
7766 goto ul_rif_op_err;
7767
7768 return ul_rif;
7769
7770ul_rif_op_err:
7771 mlxsw_sp->router->rifs[rif_index] = NULL;
7772 kfree(ul_rif);
7773 return ERR_PTR(err);
7774}
7775
7776static void mlxsw_sp_ul_rif_destroy(struct mlxsw_sp_rif *ul_rif)
7777{
7778 struct mlxsw_sp *mlxsw_sp = ul_rif->mlxsw_sp;
7779
7780 mlxsw_sp_rif_ipip_lb_ul_rif_op(ul_rif, false);
7781 mlxsw_sp->router->rifs[ul_rif->rif_index] = NULL;
7782 kfree(ul_rif);
7783}
7784
7785static struct mlxsw_sp_rif *
7786mlxsw_sp_ul_rif_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
7787 struct netlink_ext_ack *extack)
7788{
7789 struct mlxsw_sp_vr *vr;
7790 int err;
7791
7792 vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id, extack);
7793 if (IS_ERR(vr))
7794 return ERR_CAST(vr);
7795
7796 if (refcount_inc_not_zero(&vr->ul_rif_refcnt))
7797 return vr->ul_rif;
7798
7799 vr->ul_rif = mlxsw_sp_ul_rif_create(mlxsw_sp, vr, extack);
7800 if (IS_ERR(vr->ul_rif)) {
7801 err = PTR_ERR(vr->ul_rif);
7802 goto err_ul_rif_create;
7803 }
7804
7805 vr->rif_count++;
7806 refcount_set(&vr->ul_rif_refcnt, 1);
7807
7808 return vr->ul_rif;
7809
7810err_ul_rif_create:
7811 mlxsw_sp_vr_put(mlxsw_sp, vr);
7812 return ERR_PTR(err);
7813}
7814
7815static void mlxsw_sp_ul_rif_put(struct mlxsw_sp_rif *ul_rif)
7816{
7817 struct mlxsw_sp *mlxsw_sp = ul_rif->mlxsw_sp;
7818 struct mlxsw_sp_vr *vr;
7819
7820 vr = &mlxsw_sp->router->vrs[ul_rif->vr_id];
7821
7822 if (!refcount_dec_and_test(&vr->ul_rif_refcnt))
7823 return;
7824
7825 vr->rif_count--;
7826 mlxsw_sp_ul_rif_destroy(ul_rif);
7827 mlxsw_sp_vr_put(mlxsw_sp, vr);
7828}
7829
eff42aa9
IS
7830int mlxsw_sp_router_ul_rif_get(struct mlxsw_sp *mlxsw_sp, u32 ul_tb_id,
7831 u16 *ul_rif_index)
7832{
7833 struct mlxsw_sp_rif *ul_rif;
7834
7835 ASSERT_RTNL();
7836
7837 ul_rif = mlxsw_sp_ul_rif_get(mlxsw_sp, ul_tb_id, NULL);
7838 if (IS_ERR(ul_rif))
7839 return PTR_ERR(ul_rif);
7840 *ul_rif_index = ul_rif->rif_index;
7841
7842 return 0;
7843}
7844
7845void mlxsw_sp_router_ul_rif_put(struct mlxsw_sp *mlxsw_sp, u16 ul_rif_index)
7846{
7847 struct mlxsw_sp_rif *ul_rif;
7848
7849 ASSERT_RTNL();
7850
7851 ul_rif = mlxsw_sp->router->rifs[ul_rif_index];
7852 if (WARN_ON(!ul_rif))
7853 return;
7854
7855 mlxsw_sp_ul_rif_put(ul_rif);
7856}
7857
99974468
ND
7858static int
7859mlxsw_sp2_rif_ipip_lb_configure(struct mlxsw_sp_rif *rif)
7860{
a5040a90
ND
7861 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
7862 u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(rif->dev);
7863 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7864 struct mlxsw_sp_rif *ul_rif;
7865 int err;
7866
7867 ul_rif = mlxsw_sp_ul_rif_get(mlxsw_sp, ul_tb_id, NULL);
7868 if (IS_ERR(ul_rif))
7869 return PTR_ERR(ul_rif);
7870
7871 err = mlxsw_sp_rif_ipip_lb_op(lb_rif, 0, ul_rif->rif_index, true);
7872 if (err)
7873 goto err_loopback_op;
7874
7875 lb_rif->ul_vr_id = 0;
7876 lb_rif->ul_rif_id = ul_rif->rif_index;
7877
99974468 7878 return 0;
a5040a90
ND
7879
7880err_loopback_op:
7881 mlxsw_sp_ul_rif_put(ul_rif);
7882 return err;
99974468
ND
7883}
7884
7885static void mlxsw_sp2_rif_ipip_lb_deconfigure(struct mlxsw_sp_rif *rif)
7886{
a5040a90
ND
7887 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif);
7888 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
7889 struct mlxsw_sp_rif *ul_rif;
7890
7891 ul_rif = mlxsw_sp_rif_by_index(mlxsw_sp, lb_rif->ul_rif_id);
7892 mlxsw_sp_rif_ipip_lb_op(lb_rif, 0, lb_rif->ul_rif_id, false);
7893 mlxsw_sp_ul_rif_put(ul_rif);
99974468
ND
7894}
7895
7896static const struct mlxsw_sp_rif_ops mlxsw_sp2_rif_ipip_lb_ops = {
7897 .type = MLXSW_SP_RIF_TYPE_IPIP_LB,
7898 .rif_size = sizeof(struct mlxsw_sp_rif_ipip_lb),
7899 .setup = mlxsw_sp_rif_ipip_lb_setup,
7900 .configure = mlxsw_sp2_rif_ipip_lb_configure,
7901 .deconfigure = mlxsw_sp2_rif_ipip_lb_deconfigure,
7902};
7903
7904const struct mlxsw_sp_rif_ops *mlxsw_sp2_rif_ops_arr[] = {
7905 [MLXSW_SP_RIF_TYPE_SUBPORT] = &mlxsw_sp_rif_subport_ops,
7906 [MLXSW_SP_RIF_TYPE_VLAN] = &mlxsw_sp_rif_vlan_emu_ops,
7907 [MLXSW_SP_RIF_TYPE_FID] = &mlxsw_sp_rif_fid_ops,
7908 [MLXSW_SP_RIF_TYPE_IPIP_LB] = &mlxsw_sp2_rif_ipip_lb_ops,
e4f3c1c1
IS
7909};
7910
348b8fc3
IS
7911static int mlxsw_sp_rifs_init(struct mlxsw_sp *mlxsw_sp)
7912{
7913 u64 max_rifs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS);
7914
7915 mlxsw_sp->router->rifs = kcalloc(max_rifs,
7916 sizeof(struct mlxsw_sp_rif *),
7917 GFP_KERNEL);
7918 if (!mlxsw_sp->router->rifs)
7919 return -ENOMEM;
e4f3c1c1 7920
348b8fc3
IS
7921 return 0;
7922}
7923
7924static void mlxsw_sp_rifs_fini(struct mlxsw_sp *mlxsw_sp)
7925{
7926 int i;
7927
7928 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++)
7929 WARN_ON_ONCE(mlxsw_sp->router->rifs[i]);
7930
7931 kfree(mlxsw_sp->router->rifs);
7932}
7933
dcbda282
PM
7934static int
7935mlxsw_sp_ipip_config_tigcr(struct mlxsw_sp *mlxsw_sp)
7936{
7937 char tigcr_pl[MLXSW_REG_TIGCR_LEN];
7938
7939 mlxsw_reg_tigcr_pack(tigcr_pl, true, 0);
7940 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(tigcr), tigcr_pl);
7941}
7942
38ebc0f4
PM
7943static int mlxsw_sp_ipips_init(struct mlxsw_sp *mlxsw_sp)
7944{
7945 mlxsw_sp->router->ipip_ops_arr = mlxsw_sp_ipip_ops_arr;
1012b9ac 7946 INIT_LIST_HEAD(&mlxsw_sp->router->ipip_list);
dcbda282 7947 return mlxsw_sp_ipip_config_tigcr(mlxsw_sp);
38ebc0f4
PM
7948}
7949
7950static void mlxsw_sp_ipips_fini(struct mlxsw_sp *mlxsw_sp)
7951{
1012b9ac 7952 WARN_ON(!list_empty(&mlxsw_sp->router->ipip_list));
38ebc0f4
PM
7953}
7954
c3852ef7
IS
7955static void mlxsw_sp_router_fib_dump_flush(struct notifier_block *nb)
7956{
7e39d115 7957 struct mlxsw_sp_router *router;
c3852ef7
IS
7958
7959 /* Flush pending FIB notifications and then flush the device's
7960 * table before requesting another dump. The FIB notification
7961 * block is unregistered, so no need to take RTNL.
7962 */
7963 mlxsw_core_flush_owq();
7e39d115
IS
7964 router = container_of(nb, struct mlxsw_sp_router, fib_nb);
7965 mlxsw_sp_router_fib_flush(router->mlxsw_sp);
c3852ef7
IS
7966}
7967
af658b6a
IS
7968#ifdef CONFIG_IP_ROUTE_MULTIPATH
7969static void mlxsw_sp_mp_hash_header_set(char *recr2_pl, int header)
7970{
7971 mlxsw_reg_recr2_outer_header_enables_set(recr2_pl, header, true);
7972}
7973
7974static void mlxsw_sp_mp_hash_field_set(char *recr2_pl, int field)
7975{
7976 mlxsw_reg_recr2_outer_header_fields_enable_set(recr2_pl, field, true);
7977}
7978
7979static void mlxsw_sp_mp4_hash_init(char *recr2_pl)
7980{
7981 bool only_l3 = !init_net.ipv4.sysctl_fib_multipath_hash_policy;
7982
7983 mlxsw_sp_mp_hash_header_set(recr2_pl,
7984 MLXSW_REG_RECR2_IPV4_EN_NOT_TCP_NOT_UDP);
7985 mlxsw_sp_mp_hash_header_set(recr2_pl, MLXSW_REG_RECR2_IPV4_EN_TCP_UDP);
7986 mlxsw_reg_recr2_ipv4_sip_enable(recr2_pl);
7987 mlxsw_reg_recr2_ipv4_dip_enable(recr2_pl);
7988 if (only_l3)
7989 return;
7990 mlxsw_sp_mp_hash_header_set(recr2_pl, MLXSW_REG_RECR2_TCP_UDP_EN_IPV4);
7991 mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_IPV4_PROTOCOL);
7992 mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_TCP_UDP_SPORT);
7993 mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_TCP_UDP_DPORT);
7994}
7995
7996static void mlxsw_sp_mp6_hash_init(char *recr2_pl)
7997{
918ee507 7998 bool only_l3 = !ip6_multipath_hash_policy(&init_net);
5e18b9c5 7999
af658b6a
IS
8000 mlxsw_sp_mp_hash_header_set(recr2_pl,
8001 MLXSW_REG_RECR2_IPV6_EN_NOT_TCP_NOT_UDP);
8002 mlxsw_sp_mp_hash_header_set(recr2_pl, MLXSW_REG_RECR2_IPV6_EN_TCP_UDP);
8003 mlxsw_reg_recr2_ipv6_sip_enable(recr2_pl);
8004 mlxsw_reg_recr2_ipv6_dip_enable(recr2_pl);
af658b6a 8005 mlxsw_sp_mp_hash_field_set(recr2_pl, MLXSW_REG_RECR2_IPV6_NEXT_HEADER);
5e18b9c5
DA
8006 if (only_l3) {
8007 mlxsw_sp_mp_hash_field_set(recr2_pl,
8008 MLXSW_REG_RECR2_IPV6_FLOW_LABEL);
8009 } else {
8010 mlxsw_sp_mp_hash_header_set(recr2_pl,
8011 MLXSW_REG_RECR2_TCP_UDP_EN_IPV6);
8012 mlxsw_sp_mp_hash_field_set(recr2_pl,
8013 MLXSW_REG_RECR2_TCP_UDP_SPORT);
8014 mlxsw_sp_mp_hash_field_set(recr2_pl,
8015 MLXSW_REG_RECR2_TCP_UDP_DPORT);
8016 }
af658b6a
IS
8017}
8018
8019static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp)
8020{
8021 char recr2_pl[MLXSW_REG_RECR2_LEN];
8022 u32 seed;
8023
fa73989f 8024 seed = jhash(mlxsw_sp->base_mac, sizeof(mlxsw_sp->base_mac), 0);
af658b6a
IS
8025 mlxsw_reg_recr2_pack(recr2_pl, seed);
8026 mlxsw_sp_mp4_hash_init(recr2_pl);
8027 mlxsw_sp_mp6_hash_init(recr2_pl);
8028
8029 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(recr2), recr2_pl);
8030}
8031#else
/* Stub used when CONFIG_IP_ROUTE_MULTIPATH is not set: nothing to program,
 * always succeeds.
 */
static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp)
{
	return 0;
}
8036#endif
8037
48276a29
YM
8038static int mlxsw_sp_dscp_init(struct mlxsw_sp *mlxsw_sp)
8039{
8040 char rdpm_pl[MLXSW_REG_RDPM_LEN];
8041 unsigned int i;
8042
8043 MLXSW_REG_ZERO(rdpm, rdpm_pl);
8044
8045 /* HW is determining switch priority based on DSCP-bits, but the
8046 * kernel is still doing that based on the ToS. Since there's a
8047 * mismatch in bits we need to make sure to translate the right
8048 * value ToS would observe, skipping the 2 least-significant ECN bits.
8049 */
8050 for (i = 0; i < MLXSW_REG_RDPM_DSCP_ENTRY_REC_MAX_COUNT; i++)
8051 mlxsw_reg_rdpm_pack(rdpm_pl, i, rt_tos2priority(i << 2));
8052
8053 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rdpm), rdpm_pl);
8054}
8055
4724ba56
IS
8056static int __mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp)
8057{
64953423 8058 bool usp = init_net.ipv4.sysctl_ip_fwd_update_priority;
4724ba56
IS
8059 char rgcr_pl[MLXSW_REG_RGCR_LEN];
8060 u64 max_rifs;
8061 int err;
8062
8063 if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_RIFS))
8064 return -EIO;
4724ba56 8065 max_rifs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS);
4724ba56 8066
e29237e7 8067 mlxsw_reg_rgcr_pack(rgcr_pl, true, true);
4724ba56 8068 mlxsw_reg_rgcr_max_router_interfaces_set(rgcr_pl, max_rifs);
64953423 8069 mlxsw_reg_rgcr_usp_set(rgcr_pl, usp);
4724ba56
IS
8070 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rgcr), rgcr_pl);
8071 if (err)
348b8fc3 8072 return err;
4724ba56 8073 return 0;
4724ba56
IS
8074}
8075
8076static void __mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp)
8077{
8078 char rgcr_pl[MLXSW_REG_RGCR_LEN];
4724ba56 8079
e29237e7 8080 mlxsw_reg_rgcr_pack(rgcr_pl, false, false);
4724ba56 8081 mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rgcr), rgcr_pl);
4724ba56
IS
8082}
8083
b45f64d1
JP
8084int mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp)
8085{
9011b677 8086 struct mlxsw_sp_router *router;
b45f64d1
JP
8087 int err;
8088
9011b677
IS
8089 router = kzalloc(sizeof(*mlxsw_sp->router), GFP_KERNEL);
8090 if (!router)
8091 return -ENOMEM;
8092 mlxsw_sp->router = router;
8093 router->mlxsw_sp = mlxsw_sp;
8094
965fa8e6
IS
8095 router->inetaddr_nb.notifier_call = mlxsw_sp_inetaddr_event;
8096 err = register_inetaddr_notifier(&router->inetaddr_nb);
8097 if (err)
8098 goto err_register_inetaddr_notifier;
8099
8100 router->inet6addr_nb.notifier_call = mlxsw_sp_inet6addr_event;
8101 err = register_inet6addr_notifier(&router->inet6addr_nb);
8102 if (err)
8103 goto err_register_inet6addr_notifier;
8104
9011b677 8105 INIT_LIST_HEAD(&mlxsw_sp->router->nexthop_neighs_list);
b45f64d1
JP
8106 err = __mlxsw_sp_router_init(mlxsw_sp);
8107 if (err)
9011b677 8108 goto err_router_init;
b45f64d1 8109
348b8fc3
IS
8110 err = mlxsw_sp_rifs_init(mlxsw_sp);
8111 if (err)
8112 goto err_rifs_init;
8113
38ebc0f4
PM
8114 err = mlxsw_sp_ipips_init(mlxsw_sp);
8115 if (err)
8116 goto err_ipips_init;
8117
9011b677 8118 err = rhashtable_init(&mlxsw_sp->router->nexthop_ht,
c53b8e1b
IS
8119 &mlxsw_sp_nexthop_ht_params);
8120 if (err)
8121 goto err_nexthop_ht_init;
8122
9011b677 8123 err = rhashtable_init(&mlxsw_sp->router->nexthop_group_ht,
e9ad5e7d
IS
8124 &mlxsw_sp_nexthop_group_ht_params);
8125 if (err)
8126 goto err_nexthop_group_ht_init;
8127
dbe4598c 8128 INIT_LIST_HEAD(&mlxsw_sp->router->nexthop_list);
8494ab06
IS
8129 err = mlxsw_sp_lpm_init(mlxsw_sp);
8130 if (err)
8131 goto err_lpm_init;
8132
d42b0965
YG
8133 err = mlxsw_sp_mr_init(mlxsw_sp, &mlxsw_sp_mr_tcam_ops);
8134 if (err)
8135 goto err_mr_init;
8136
b45f64d1
JP
8137 err = mlxsw_sp_vrs_init(mlxsw_sp);
8138 if (err)
8139 goto err_vrs_init;
8140
8c9583a8 8141 err = mlxsw_sp_neigh_init(mlxsw_sp);
b45f64d1
JP
8142 if (err)
8143 goto err_neigh_init;
8144
48fac885
IS
8145 mlxsw_sp->router->netevent_nb.notifier_call =
8146 mlxsw_sp_router_netevent_event;
8147 err = register_netevent_notifier(&mlxsw_sp->router->netevent_nb);
8148 if (err)
8149 goto err_register_netevent_notifier;
8150
af658b6a
IS
8151 err = mlxsw_sp_mp_hash_init(mlxsw_sp);
8152 if (err)
8153 goto err_mp_hash_init;
8154
48276a29
YM
8155 err = mlxsw_sp_dscp_init(mlxsw_sp);
8156 if (err)
8157 goto err_dscp_init;
8158
7e39d115
IS
8159 mlxsw_sp->router->fib_nb.notifier_call = mlxsw_sp_router_fib_event;
8160 err = register_fib_notifier(&mlxsw_sp->router->fib_nb,
c3852ef7
IS
8161 mlxsw_sp_router_fib_dump_flush);
8162 if (err)
8163 goto err_register_fib_notifier;
8164
b45f64d1
JP
8165 return 0;
8166
c3852ef7 8167err_register_fib_notifier:
48276a29 8168err_dscp_init:
af658b6a 8169err_mp_hash_init:
48fac885
IS
8170 unregister_netevent_notifier(&mlxsw_sp->router->netevent_nb);
8171err_register_netevent_notifier:
c3852ef7 8172 mlxsw_sp_neigh_fini(mlxsw_sp);
b45f64d1
JP
8173err_neigh_init:
8174 mlxsw_sp_vrs_fini(mlxsw_sp);
8175err_vrs_init:
d42b0965
YG
8176 mlxsw_sp_mr_fini(mlxsw_sp);
8177err_mr_init:
8494ab06
IS
8178 mlxsw_sp_lpm_fini(mlxsw_sp);
8179err_lpm_init:
9011b677 8180 rhashtable_destroy(&mlxsw_sp->router->nexthop_group_ht);
e9ad5e7d 8181err_nexthop_group_ht_init:
9011b677 8182 rhashtable_destroy(&mlxsw_sp->router->nexthop_ht);
c53b8e1b 8183err_nexthop_ht_init:
38ebc0f4
PM
8184 mlxsw_sp_ipips_fini(mlxsw_sp);
8185err_ipips_init:
348b8fc3
IS
8186 mlxsw_sp_rifs_fini(mlxsw_sp);
8187err_rifs_init:
b45f64d1 8188 __mlxsw_sp_router_fini(mlxsw_sp);
9011b677 8189err_router_init:
965fa8e6
IS
8190 unregister_inet6addr_notifier(&router->inet6addr_nb);
8191err_register_inet6addr_notifier:
8192 unregister_inetaddr_notifier(&router->inetaddr_nb);
8193err_register_inetaddr_notifier:
9011b677 8194 kfree(mlxsw_sp->router);
b45f64d1
JP
8195 return err;
8196}
8197
8198void mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp)
8199{
7e39d115 8200 unregister_fib_notifier(&mlxsw_sp->router->fib_nb);
48fac885 8201 unregister_netevent_notifier(&mlxsw_sp->router->netevent_nb);
b45f64d1
JP
8202 mlxsw_sp_neigh_fini(mlxsw_sp);
8203 mlxsw_sp_vrs_fini(mlxsw_sp);
d42b0965 8204 mlxsw_sp_mr_fini(mlxsw_sp);
8494ab06 8205 mlxsw_sp_lpm_fini(mlxsw_sp);
9011b677
IS
8206 rhashtable_destroy(&mlxsw_sp->router->nexthop_group_ht);
8207 rhashtable_destroy(&mlxsw_sp->router->nexthop_ht);
38ebc0f4 8208 mlxsw_sp_ipips_fini(mlxsw_sp);
348b8fc3 8209 mlxsw_sp_rifs_fini(mlxsw_sp);
b45f64d1 8210 __mlxsw_sp_router_fini(mlxsw_sp);
965fa8e6
IS
8211 unregister_inet6addr_notifier(&mlxsw_sp->router->inet6addr_nb);
8212 unregister_inetaddr_notifier(&mlxsw_sp->router->inetaddr_nb);
9011b677 8213 kfree(mlxsw_sp->router);
b45f64d1 8214}