// SPDX-License-Identifier: BSD-3-Clause OR GPL-2.0
/* Copyright (c) 2017-2018 Mellanox Technologies. All rights reserved */
3
#include <linux/string.h>
#include <net/ip_tunnels.h>
#include <net/ip6_tunnel.h>

#include "spectrum_ipip.h"
8
9 struct ip_tunnel_parm
mlxsw_sp_ipip_netdev_parms4(const struct net_device * ol_dev)10 mlxsw_sp_ipip_netdev_parms4(const struct net_device *ol_dev)
11 {
12 struct ip_tunnel *tun = netdev_priv(ol_dev);
13
14 return tun->parms;
15 }
16
17 struct __ip6_tnl_parm
mlxsw_sp_ipip_netdev_parms6(const struct net_device * ol_dev)18 mlxsw_sp_ipip_netdev_parms6(const struct net_device *ol_dev)
19 {
20 struct ip6_tnl *tun = netdev_priv(ol_dev);
21
22 return tun->parms;
23 }
24
mlxsw_sp_ipip_parms4_has_ikey(struct ip_tunnel_parm parms)25 static bool mlxsw_sp_ipip_parms4_has_ikey(struct ip_tunnel_parm parms)
26 {
27 return !!(parms.i_flags & TUNNEL_KEY);
28 }
29
mlxsw_sp_ipip_parms4_has_okey(struct ip_tunnel_parm parms)30 static bool mlxsw_sp_ipip_parms4_has_okey(struct ip_tunnel_parm parms)
31 {
32 return !!(parms.o_flags & TUNNEL_KEY);
33 }
34
mlxsw_sp_ipip_parms4_ikey(struct ip_tunnel_parm parms)35 static u32 mlxsw_sp_ipip_parms4_ikey(struct ip_tunnel_parm parms)
36 {
37 return mlxsw_sp_ipip_parms4_has_ikey(parms) ?
38 be32_to_cpu(parms.i_key) : 0;
39 }
40
mlxsw_sp_ipip_parms4_okey(struct ip_tunnel_parm parms)41 static u32 mlxsw_sp_ipip_parms4_okey(struct ip_tunnel_parm parms)
42 {
43 return mlxsw_sp_ipip_parms4_has_okey(parms) ?
44 be32_to_cpu(parms.o_key) : 0;
45 }
46
47 static union mlxsw_sp_l3addr
mlxsw_sp_ipip_parms4_saddr(struct ip_tunnel_parm parms)48 mlxsw_sp_ipip_parms4_saddr(struct ip_tunnel_parm parms)
49 {
50 return (union mlxsw_sp_l3addr) { .addr4 = parms.iph.saddr };
51 }
52
53 static union mlxsw_sp_l3addr
mlxsw_sp_ipip_parms6_saddr(struct __ip6_tnl_parm parms)54 mlxsw_sp_ipip_parms6_saddr(struct __ip6_tnl_parm parms)
55 {
56 return (union mlxsw_sp_l3addr) { .addr6 = parms.laddr };
57 }
58
59 static union mlxsw_sp_l3addr
mlxsw_sp_ipip_parms4_daddr(struct ip_tunnel_parm parms)60 mlxsw_sp_ipip_parms4_daddr(struct ip_tunnel_parm parms)
61 {
62 return (union mlxsw_sp_l3addr) { .addr4 = parms.iph.daddr };
63 }
64
65 static union mlxsw_sp_l3addr
mlxsw_sp_ipip_parms6_daddr(struct __ip6_tnl_parm parms)66 mlxsw_sp_ipip_parms6_daddr(struct __ip6_tnl_parm parms)
67 {
68 return (union mlxsw_sp_l3addr) { .addr6 = parms.raddr };
69 }
70
71 union mlxsw_sp_l3addr
mlxsw_sp_ipip_netdev_saddr(enum mlxsw_sp_l3proto proto,const struct net_device * ol_dev)72 mlxsw_sp_ipip_netdev_saddr(enum mlxsw_sp_l3proto proto,
73 const struct net_device *ol_dev)
74 {
75 struct ip_tunnel_parm parms4;
76 struct __ip6_tnl_parm parms6;
77
78 switch (proto) {
79 case MLXSW_SP_L3_PROTO_IPV4:
80 parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev);
81 return mlxsw_sp_ipip_parms4_saddr(parms4);
82 case MLXSW_SP_L3_PROTO_IPV6:
83 parms6 = mlxsw_sp_ipip_netdev_parms6(ol_dev);
84 return mlxsw_sp_ipip_parms6_saddr(parms6);
85 }
86
87 WARN_ON(1);
88 return (union mlxsw_sp_l3addr) {0};
89 }
90
mlxsw_sp_ipip_netdev_daddr4(const struct net_device * ol_dev)91 static __be32 mlxsw_sp_ipip_netdev_daddr4(const struct net_device *ol_dev)
92 {
93
94 struct ip_tunnel_parm parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev);
95
96 return mlxsw_sp_ipip_parms4_daddr(parms4).addr4;
97 }
98
99 static union mlxsw_sp_l3addr
mlxsw_sp_ipip_netdev_daddr(enum mlxsw_sp_l3proto proto,const struct net_device * ol_dev)100 mlxsw_sp_ipip_netdev_daddr(enum mlxsw_sp_l3proto proto,
101 const struct net_device *ol_dev)
102 {
103 struct ip_tunnel_parm parms4;
104 struct __ip6_tnl_parm parms6;
105
106 switch (proto) {
107 case MLXSW_SP_L3_PROTO_IPV4:
108 parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev);
109 return mlxsw_sp_ipip_parms4_daddr(parms4);
110 case MLXSW_SP_L3_PROTO_IPV6:
111 parms6 = mlxsw_sp_ipip_netdev_parms6(ol_dev);
112 return mlxsw_sp_ipip_parms6_daddr(parms6);
113 }
114
115 WARN_ON(1);
116 return (union mlxsw_sp_l3addr) {0};
117 }
118
mlxsw_sp_l3addr_is_zero(union mlxsw_sp_l3addr addr)119 bool mlxsw_sp_l3addr_is_zero(union mlxsw_sp_l3addr addr)
120 {
121 union mlxsw_sp_l3addr naddr = {0};
122
123 return !memcmp(&addr, &naddr, sizeof(naddr));
124 }
125
126 static int
mlxsw_sp_ipip_nexthop_update_gre4(struct mlxsw_sp * mlxsw_sp,u32 adj_index,struct mlxsw_sp_ipip_entry * ipip_entry)127 mlxsw_sp_ipip_nexthop_update_gre4(struct mlxsw_sp *mlxsw_sp, u32 adj_index,
128 struct mlxsw_sp_ipip_entry *ipip_entry)
129 {
130 u16 rif_index = mlxsw_sp_ipip_lb_rif_index(ipip_entry->ol_lb);
131 __be32 daddr4 = mlxsw_sp_ipip_netdev_daddr4(ipip_entry->ol_dev);
132 char ratr_pl[MLXSW_REG_RATR_LEN];
133
134 mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY,
135 true, MLXSW_REG_RATR_TYPE_IPIP,
136 adj_index, rif_index);
137 mlxsw_reg_ratr_ipip4_entry_pack(ratr_pl, be32_to_cpu(daddr4));
138
139 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl);
140 }
141
142 static int
mlxsw_sp_ipip_fib_entry_op_gre4_rtdp(struct mlxsw_sp * mlxsw_sp,u32 tunnel_index,struct mlxsw_sp_ipip_entry * ipip_entry)143 mlxsw_sp_ipip_fib_entry_op_gre4_rtdp(struct mlxsw_sp *mlxsw_sp,
144 u32 tunnel_index,
145 struct mlxsw_sp_ipip_entry *ipip_entry)
146 {
147 u16 rif_index = mlxsw_sp_ipip_lb_rif_index(ipip_entry->ol_lb);
148 u16 ul_rif_id = mlxsw_sp_ipip_lb_ul_rif_id(ipip_entry->ol_lb);
149 char rtdp_pl[MLXSW_REG_RTDP_LEN];
150 struct ip_tunnel_parm parms;
151 unsigned int type_check;
152 bool has_ikey;
153 u32 daddr4;
154 u32 ikey;
155
156 parms = mlxsw_sp_ipip_netdev_parms4(ipip_entry->ol_dev);
157 has_ikey = mlxsw_sp_ipip_parms4_has_ikey(parms);
158 ikey = mlxsw_sp_ipip_parms4_ikey(parms);
159
160 mlxsw_reg_rtdp_pack(rtdp_pl, MLXSW_REG_RTDP_TYPE_IPIP, tunnel_index);
161 mlxsw_reg_rtdp_egress_router_interface_set(rtdp_pl, ul_rif_id);
162
163 type_check = has_ikey ?
164 MLXSW_REG_RTDP_IPIP_TYPE_CHECK_ALLOW_GRE_KEY :
165 MLXSW_REG_RTDP_IPIP_TYPE_CHECK_ALLOW_GRE;
166
167 /* Linux demuxes tunnels based on packet SIP (which must match tunnel
168 * remote IP). Thus configure decap so that it filters out packets that
169 * are not IPv4 or have the wrong SIP. IPIP_DECAP_ERROR trap is
170 * generated for packets that fail this criterion. Linux then handles
171 * such packets in slow path and generates ICMP destination unreachable.
172 */
173 daddr4 = be32_to_cpu(mlxsw_sp_ipip_netdev_daddr4(ipip_entry->ol_dev));
174 mlxsw_reg_rtdp_ipip4_pack(rtdp_pl, rif_index,
175 MLXSW_REG_RTDP_IPIP_SIP_CHECK_FILTER_IPV4,
176 type_check, has_ikey, daddr4, ikey);
177
178 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rtdp), rtdp_pl);
179 }
180
181 static int
mlxsw_sp_ipip_fib_entry_op_gre4_ralue(struct mlxsw_sp * mlxsw_sp,u32 dip,u8 prefix_len,u16 ul_vr_id,enum mlxsw_reg_ralue_op op,u32 tunnel_index)182 mlxsw_sp_ipip_fib_entry_op_gre4_ralue(struct mlxsw_sp *mlxsw_sp,
183 u32 dip, u8 prefix_len, u16 ul_vr_id,
184 enum mlxsw_reg_ralue_op op,
185 u32 tunnel_index)
186 {
187 char ralue_pl[MLXSW_REG_RALUE_LEN];
188
189 mlxsw_reg_ralue_pack4(ralue_pl, MLXSW_REG_RALXX_PROTOCOL_IPV4, op,
190 ul_vr_id, prefix_len, dip);
191 mlxsw_reg_ralue_act_ip2me_tun_pack(ralue_pl, tunnel_index);
192 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
193 }
194
/* Program the decap state of @ipip_entry in two steps.
 *
 * First the RTDP entry at @tunnel_index is written. If that succeeds, a
 * /32 RALUE entry for the tunnel's IPv4 source address is written with
 * operation @op, pointing at @tunnel_index.
 *
 * Return: 0 on success, otherwise the error of the step that failed.
 */
static int mlxsw_sp_ipip_fib_entry_op_gre4(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_ipip_entry *ipip_entry,
					enum mlxsw_reg_ralue_op op,
					u32 tunnel_index)
{
	u16 ul_vr_id = mlxsw_sp_ipip_lb_ul_vr_id(ipip_entry->ol_lb);
	union mlxsw_sp_l3addr saddr;
	int err;

	err = mlxsw_sp_ipip_fib_entry_op_gre4_rtdp(mlxsw_sp, tunnel_index,
						   ipip_entry);
	if (err)
		return err;

	saddr = mlxsw_sp_ipip_netdev_saddr(MLXSW_SP_L3_PROTO_IPV4,
					   ipip_entry->ol_dev);

	return mlxsw_sp_ipip_fib_entry_op_gre4_ralue(mlxsw_sp,
						     be32_to_cpu(saddr.addr4),
						     32, ul_vr_id, op,
						     tunnel_index);
}
215
mlxsw_sp_ipip_tunnel_complete(enum mlxsw_sp_l3proto proto,const struct net_device * ol_dev)216 static bool mlxsw_sp_ipip_tunnel_complete(enum mlxsw_sp_l3proto proto,
217 const struct net_device *ol_dev)
218 {
219 union mlxsw_sp_l3addr saddr = mlxsw_sp_ipip_netdev_saddr(proto, ol_dev);
220 union mlxsw_sp_l3addr daddr = mlxsw_sp_ipip_netdev_daddr(proto, ol_dev);
221
222 /* Tunnels with unset local or remote address are valid in Linux and
223 * used for lightweight tunnels (LWT) and Non-Broadcast Multi-Access
224 * (NBMA) tunnels. In principle these can be offloaded, but the driver
225 * currently doesn't support this. So punt.
226 */
227 return !mlxsw_sp_l3addr_is_zero(saddr) &&
228 !mlxsw_sp_l3addr_is_zero(daddr);
229 }
230
mlxsw_sp_ipip_can_offload_gre4(const struct mlxsw_sp * mlxsw_sp,const struct net_device * ol_dev,enum mlxsw_sp_l3proto ol_proto)231 static bool mlxsw_sp_ipip_can_offload_gre4(const struct mlxsw_sp *mlxsw_sp,
232 const struct net_device *ol_dev,
233 enum mlxsw_sp_l3proto ol_proto)
234 {
235 struct ip_tunnel *tunnel = netdev_priv(ol_dev);
236 __be16 okflags = TUNNEL_KEY; /* We can't offload any other features. */
237 bool inherit_ttl = tunnel->parms.iph.ttl == 0;
238 bool inherit_tos = tunnel->parms.iph.tos & 0x1;
239
240 return (tunnel->parms.i_flags & ~okflags) == 0 &&
241 (tunnel->parms.o_flags & ~okflags) == 0 &&
242 inherit_ttl && inherit_tos &&
243 mlxsw_sp_ipip_tunnel_complete(MLXSW_SP_L3_PROTO_IPV4, ol_dev);
244 }
245
246 static struct mlxsw_sp_rif_ipip_lb_config
mlxsw_sp_ipip_ol_loopback_config_gre4(struct mlxsw_sp * mlxsw_sp,const struct net_device * ol_dev)247 mlxsw_sp_ipip_ol_loopback_config_gre4(struct mlxsw_sp *mlxsw_sp,
248 const struct net_device *ol_dev)
249 {
250 struct ip_tunnel_parm parms = mlxsw_sp_ipip_netdev_parms4(ol_dev);
251 enum mlxsw_reg_ritr_loopback_ipip_type lb_ipipt;
252
253 lb_ipipt = mlxsw_sp_ipip_parms4_has_okey(parms) ?
254 MLXSW_REG_RITR_LOOPBACK_IPIP_TYPE_IP_IN_GRE_KEY_IN_IP :
255 MLXSW_REG_RITR_LOOPBACK_IPIP_TYPE_IP_IN_GRE_IN_IP;
256 return (struct mlxsw_sp_rif_ipip_lb_config){
257 .lb_ipipt = lb_ipipt,
258 .okey = mlxsw_sp_ipip_parms4_okey(parms),
259 .ul_protocol = MLXSW_SP_L3_PROTO_IPV4,
260 .saddr = mlxsw_sp_ipip_netdev_saddr(MLXSW_SP_L3_PROTO_IPV4,
261 ol_dev),
262 };
263 }
264
265 static int
mlxsw_sp_ipip_ol_netdev_change_gre4(struct mlxsw_sp * mlxsw_sp,struct mlxsw_sp_ipip_entry * ipip_entry,struct netlink_ext_ack * extack)266 mlxsw_sp_ipip_ol_netdev_change_gre4(struct mlxsw_sp *mlxsw_sp,
267 struct mlxsw_sp_ipip_entry *ipip_entry,
268 struct netlink_ext_ack *extack)
269 {
270 union mlxsw_sp_l3addr old_saddr, new_saddr;
271 union mlxsw_sp_l3addr old_daddr, new_daddr;
272 struct ip_tunnel_parm new_parms;
273 bool update_tunnel = false;
274 bool update_decap = false;
275 bool update_nhs = false;
276 int err = 0;
277
278 new_parms = mlxsw_sp_ipip_netdev_parms4(ipip_entry->ol_dev);
279
280 new_saddr = mlxsw_sp_ipip_parms4_saddr(new_parms);
281 old_saddr = mlxsw_sp_ipip_parms4_saddr(ipip_entry->parms4);
282 new_daddr = mlxsw_sp_ipip_parms4_daddr(new_parms);
283 old_daddr = mlxsw_sp_ipip_parms4_daddr(ipip_entry->parms4);
284
285 if (!mlxsw_sp_l3addr_eq(&new_saddr, &old_saddr)) {
286 u16 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
287
288 /* Since the local address has changed, if there is another
289 * tunnel with a matching saddr, both need to be demoted.
290 */
291 if (mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp,
292 MLXSW_SP_L3_PROTO_IPV4,
293 new_saddr, ul_tb_id,
294 ipip_entry)) {
295 mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
296 return 0;
297 }
298
299 update_tunnel = true;
300 } else if ((mlxsw_sp_ipip_parms4_okey(ipip_entry->parms4) !=
301 mlxsw_sp_ipip_parms4_okey(new_parms)) ||
302 ipip_entry->parms4.link != new_parms.link) {
303 update_tunnel = true;
304 } else if (!mlxsw_sp_l3addr_eq(&new_daddr, &old_daddr)) {
305 update_nhs = true;
306 } else if (mlxsw_sp_ipip_parms4_ikey(ipip_entry->parms4) !=
307 mlxsw_sp_ipip_parms4_ikey(new_parms)) {
308 update_decap = true;
309 }
310
311 if (update_tunnel)
312 err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
313 true, true, true,
314 extack);
315 else if (update_nhs)
316 err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
317 false, false, true,
318 extack);
319 else if (update_decap)
320 err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
321 false, false, false,
322 extack);
323
324 ipip_entry->parms4 = new_parms;
325 return err;
326 }
327
328 static const struct mlxsw_sp_ipip_ops mlxsw_sp_ipip_gre4_ops = {
329 .dev_type = ARPHRD_IPGRE,
330 .ul_proto = MLXSW_SP_L3_PROTO_IPV4,
331 .nexthop_update = mlxsw_sp_ipip_nexthop_update_gre4,
332 .fib_entry_op = mlxsw_sp_ipip_fib_entry_op_gre4,
333 .can_offload = mlxsw_sp_ipip_can_offload_gre4,
334 .ol_loopback_config = mlxsw_sp_ipip_ol_loopback_config_gre4,
335 .ol_netdev_change = mlxsw_sp_ipip_ol_netdev_change_gre4,
336 };
337
338 const struct mlxsw_sp_ipip_ops *mlxsw_sp_ipip_ops_arr[] = {
339 [MLXSW_SP_IPIP_TYPE_GRE4] = &mlxsw_sp_ipip_gre4_ops,
340 };
341