a1c4b1e63f8ddd58808021e7e28cc373402bda8e
[linux-2.6-microblaze.git] / drivers / net / ethernet / mellanox / mlxsw / spectrum_ipip.c
1 /*
2  * drivers/net/ethernet/mellanox/mlxsw/spectrum_ipip.c
3  * Copyright (c) 2017 Mellanox Technologies. All rights reserved.
4  * Copyright (c) 2017 Petr Machata <petrm@mellanox.com>
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions are met:
8  *
9  * 1. Redistributions of source code must retain the above copyright
10  *    notice, this list of conditions and the following disclaimer.
11  * 2. Redistributions in binary form must reproduce the above copyright
12  *    notice, this list of conditions and the following disclaimer in the
13  *    documentation and/or other materials provided with the distribution.
14  * 3. Neither the names of the copyright holders nor the names of its
15  *    contributors may be used to endorse or promote products derived from
16  *    this software without specific prior written permission.
17  *
18  * Alternatively, this software may be distributed under the terms of the
19  * GNU General Public License ("GPL") version 2 as published by the Free
20  * Software Foundation.
21  *
22  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
23  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
26  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
27  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
28  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
29  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
30  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
31  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
32  * POSSIBILITY OF SUCH DAMAGE.
33  */
34
35 #include <net/ip_tunnels.h>
36
37 #include "spectrum_ipip.h"
38
39 struct ip_tunnel_parm
40 mlxsw_sp_ipip_netdev_parms4(const struct net_device *ol_dev)
41 {
42         struct ip_tunnel *tun = netdev_priv(ol_dev);
43
44         return tun->parms;
45 }
46
47 static bool mlxsw_sp_ipip_parms4_has_ikey(struct ip_tunnel_parm parms)
48 {
49         return !!(parms.i_flags & TUNNEL_KEY);
50 }
51
52 static bool mlxsw_sp_ipip_parms4_has_okey(struct ip_tunnel_parm parms)
53 {
54         return !!(parms.o_flags & TUNNEL_KEY);
55 }
56
57 static u32 mlxsw_sp_ipip_parms4_ikey(struct ip_tunnel_parm parms)
58 {
59         return mlxsw_sp_ipip_parms4_has_ikey(parms) ?
60                 be32_to_cpu(parms.i_key) : 0;
61 }
62
63 static u32 mlxsw_sp_ipip_parms4_okey(struct ip_tunnel_parm parms)
64 {
65         return mlxsw_sp_ipip_parms4_has_okey(parms) ?
66                 be32_to_cpu(parms.o_key) : 0;
67 }
68
69 static union mlxsw_sp_l3addr
70 mlxsw_sp_ipip_parms4_saddr(struct ip_tunnel_parm parms)
71 {
72         return (union mlxsw_sp_l3addr) { .addr4 = parms.iph.saddr };
73 }
74
75 static union mlxsw_sp_l3addr
76 mlxsw_sp_ipip_parms4_daddr(struct ip_tunnel_parm parms)
77 {
78         return (union mlxsw_sp_l3addr) { .addr4 = parms.iph.daddr };
79 }
80
81 union mlxsw_sp_l3addr
82 mlxsw_sp_ipip_netdev_saddr(enum mlxsw_sp_l3proto proto,
83                            const struct net_device *ol_dev)
84 {
85         struct ip_tunnel_parm parms4;
86
87         switch (proto) {
88         case MLXSW_SP_L3_PROTO_IPV4:
89                 parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev);
90                 return mlxsw_sp_ipip_parms4_saddr(parms4);
91         case MLXSW_SP_L3_PROTO_IPV6:
92                 break;
93         }
94
95         WARN_ON(1);
96         return (union mlxsw_sp_l3addr) {0};
97 }
98
99 static __be32 mlxsw_sp_ipip_netdev_daddr4(const struct net_device *ol_dev)
100 {
101
102         struct ip_tunnel_parm parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev);
103
104         return mlxsw_sp_ipip_parms4_daddr(parms4).addr4;
105 }
106
107 static union mlxsw_sp_l3addr
108 mlxsw_sp_ipip_netdev_daddr(enum mlxsw_sp_l3proto proto,
109                            const struct net_device *ol_dev)
110 {
111         struct ip_tunnel_parm parms4;
112
113         switch (proto) {
114         case MLXSW_SP_L3_PROTO_IPV4:
115                 parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev);
116                 return mlxsw_sp_ipip_parms4_daddr(parms4);
117         case MLXSW_SP_L3_PROTO_IPV6:
118                 break;
119         }
120
121         WARN_ON(1);
122         return (union mlxsw_sp_l3addr) {0};
123 }
124
125 static int
126 mlxsw_sp_ipip_nexthop_update_gre4(struct mlxsw_sp *mlxsw_sp, u32 adj_index,
127                                   struct mlxsw_sp_ipip_entry *ipip_entry)
128 {
129         u16 rif_index = mlxsw_sp_ipip_lb_rif_index(ipip_entry->ol_lb);
130         __be32 daddr4 = mlxsw_sp_ipip_netdev_daddr4(ipip_entry->ol_dev);
131         char ratr_pl[MLXSW_REG_RATR_LEN];
132
133         mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY,
134                             true, MLXSW_REG_RATR_TYPE_IPIP,
135                             adj_index, rif_index);
136         mlxsw_reg_ratr_ipip4_entry_pack(ratr_pl, be32_to_cpu(daddr4));
137
138         return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl);
139 }
140
141 static int
142 mlxsw_sp_ipip_fib_entry_op_gre4_rtdp(struct mlxsw_sp *mlxsw_sp,
143                                      u32 tunnel_index,
144                                      struct mlxsw_sp_ipip_entry *ipip_entry)
145 {
146         u16 rif_index = mlxsw_sp_ipip_lb_rif_index(ipip_entry->ol_lb);
147         char rtdp_pl[MLXSW_REG_RTDP_LEN];
148         struct ip_tunnel_parm parms;
149         unsigned int type_check;
150         bool has_ikey;
151         u32 daddr4;
152         u32 ikey;
153
154         parms = mlxsw_sp_ipip_netdev_parms4(ipip_entry->ol_dev);
155         has_ikey = mlxsw_sp_ipip_parms4_has_ikey(parms);
156         ikey = mlxsw_sp_ipip_parms4_ikey(parms);
157
158         mlxsw_reg_rtdp_pack(rtdp_pl, MLXSW_REG_RTDP_TYPE_IPIP, tunnel_index);
159
160         type_check = has_ikey ?
161                 MLXSW_REG_RTDP_IPIP_TYPE_CHECK_ALLOW_GRE_KEY :
162                 MLXSW_REG_RTDP_IPIP_TYPE_CHECK_ALLOW_GRE;
163
164         /* Linux demuxes tunnels based on packet SIP (which must match tunnel
165          * remote IP). Thus configure decap so that it filters out packets that
166          * are not IPv4 or have the wrong SIP. IPIP_DECAP_ERROR trap is
167          * generated for packets that fail this criterion. Linux then handles
168          * such packets in slow path and generates ICMP destination unreachable.
169          */
170         daddr4 = be32_to_cpu(mlxsw_sp_ipip_netdev_daddr4(ipip_entry->ol_dev));
171         mlxsw_reg_rtdp_ipip4_pack(rtdp_pl, rif_index,
172                                   MLXSW_REG_RTDP_IPIP_SIP_CHECK_FILTER_IPV4,
173                                   type_check, has_ikey, daddr4, ikey);
174
175         return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rtdp), rtdp_pl);
176 }
177
178 static int
179 mlxsw_sp_ipip_fib_entry_op_gre4_ralue(struct mlxsw_sp *mlxsw_sp,
180                                       u32 dip, u8 prefix_len, u16 ul_vr_id,
181                                       enum mlxsw_reg_ralue_op op,
182                                       u32 tunnel_index)
183 {
184         char ralue_pl[MLXSW_REG_RALUE_LEN];
185
186         mlxsw_reg_ralue_pack4(ralue_pl, MLXSW_REG_RALXX_PROTOCOL_IPV4, op,
187                               ul_vr_id, prefix_len, dip);
188         mlxsw_reg_ralue_act_ip2me_tun_pack(ralue_pl, tunnel_index);
189         return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl);
190 }
191
192 static int mlxsw_sp_ipip_fib_entry_op_gre4(struct mlxsw_sp *mlxsw_sp,
193                                         struct mlxsw_sp_ipip_entry *ipip_entry,
194                                         enum mlxsw_reg_ralue_op op,
195                                         u32 tunnel_index)
196 {
197         u16 ul_vr_id = mlxsw_sp_ipip_lb_ul_vr_id(ipip_entry->ol_lb);
198         __be32 dip;
199         int err;
200
201         err = mlxsw_sp_ipip_fib_entry_op_gre4_rtdp(mlxsw_sp, tunnel_index,
202                                                    ipip_entry);
203         if (err)
204                 return err;
205
206         dip = mlxsw_sp_ipip_netdev_saddr(MLXSW_SP_L3_PROTO_IPV4,
207                                          ipip_entry->ol_dev).addr4;
208         return mlxsw_sp_ipip_fib_entry_op_gre4_ralue(mlxsw_sp, be32_to_cpu(dip),
209                                                      32, ul_vr_id, op,
210                                                      tunnel_index);
211 }
212
213 static bool mlxsw_sp_ipip_tunnel_complete(enum mlxsw_sp_l3proto proto,
214                                           const struct net_device *ol_dev)
215 {
216         union mlxsw_sp_l3addr saddr = mlxsw_sp_ipip_netdev_saddr(proto, ol_dev);
217         union mlxsw_sp_l3addr daddr = mlxsw_sp_ipip_netdev_daddr(proto, ol_dev);
218         union mlxsw_sp_l3addr naddr = {0};
219
220         /* Tunnels with unset local or remote address are valid in Linux and
221          * used for lightweight tunnels (LWT) and Non-Broadcast Multi-Access
222          * (NBMA) tunnels. In principle these can be offloaded, but the driver
223          * currently doesn't support this. So punt.
224          */
225         return memcmp(&saddr, &naddr, sizeof(naddr)) &&
226                memcmp(&daddr, &naddr, sizeof(naddr));
227 }
228
229 static bool mlxsw_sp_ipip_can_offload_gre4(const struct mlxsw_sp *mlxsw_sp,
230                                            const struct net_device *ol_dev,
231                                            enum mlxsw_sp_l3proto ol_proto)
232 {
233         struct ip_tunnel *tunnel = netdev_priv(ol_dev);
234         __be16 okflags = TUNNEL_KEY; /* We can't offload any other features. */
235         bool inherit_ttl = tunnel->parms.iph.ttl == 0;
236         bool inherit_tos = tunnel->parms.iph.tos & 0x1;
237
238         return (tunnel->parms.i_flags & ~okflags) == 0 &&
239                (tunnel->parms.o_flags & ~okflags) == 0 &&
240                inherit_ttl && inherit_tos &&
241                mlxsw_sp_ipip_tunnel_complete(MLXSW_SP_L3_PROTO_IPV4, ol_dev);
242 }
243
244 static struct mlxsw_sp_rif_ipip_lb_config
245 mlxsw_sp_ipip_ol_loopback_config_gre4(struct mlxsw_sp *mlxsw_sp,
246                                       const struct net_device *ol_dev)
247 {
248         struct ip_tunnel_parm parms = mlxsw_sp_ipip_netdev_parms4(ol_dev);
249         enum mlxsw_reg_ritr_loopback_ipip_type lb_ipipt;
250
251         lb_ipipt = mlxsw_sp_ipip_parms4_has_okey(parms) ?
252                 MLXSW_REG_RITR_LOOPBACK_IPIP_TYPE_IP_IN_GRE_KEY_IN_IP :
253                 MLXSW_REG_RITR_LOOPBACK_IPIP_TYPE_IP_IN_GRE_IN_IP;
254         return (struct mlxsw_sp_rif_ipip_lb_config){
255                 .lb_ipipt = lb_ipipt,
256                 .okey = mlxsw_sp_ipip_parms4_okey(parms),
257                 .ul_protocol = MLXSW_SP_L3_PROTO_IPV4,
258                 .saddr = mlxsw_sp_ipip_netdev_saddr(MLXSW_SP_L3_PROTO_IPV4,
259                                                     ol_dev),
260         };
261 }
262
263 static int
264 mlxsw_sp_ipip_ol_netdev_change_gre4(struct mlxsw_sp *mlxsw_sp,
265                                     struct mlxsw_sp_ipip_entry *ipip_entry,
266                                     struct netlink_ext_ack *extack)
267 {
268         union mlxsw_sp_l3addr old_saddr, new_saddr;
269         union mlxsw_sp_l3addr old_daddr, new_daddr;
270         struct ip_tunnel_parm new_parms;
271         bool update_tunnel = false;
272         bool update_decap = false;
273         bool update_nhs = false;
274         int err = 0;
275
276         new_parms = mlxsw_sp_ipip_netdev_parms4(ipip_entry->ol_dev);
277
278         new_saddr = mlxsw_sp_ipip_parms4_saddr(new_parms);
279         old_saddr = mlxsw_sp_ipip_parms4_saddr(ipip_entry->parms4);
280         new_daddr = mlxsw_sp_ipip_parms4_daddr(new_parms);
281         old_daddr = mlxsw_sp_ipip_parms4_daddr(ipip_entry->parms4);
282
283         if (!mlxsw_sp_l3addr_eq(&new_saddr, &old_saddr)) {
284                 u16 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
285
286                 /* Since the local address has changed, if there is another
287                  * tunnel with a matching saddr, both need to be demoted.
288                  */
289                 if (mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp,
290                                                          MLXSW_SP_L3_PROTO_IPV4,
291                                                          new_saddr, ul_tb_id,
292                                                          ipip_entry)) {
293                         mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
294                         return 0;
295                 }
296
297                 update_tunnel = true;
298         } else if ((mlxsw_sp_ipip_parms4_okey(ipip_entry->parms4) !=
299                     mlxsw_sp_ipip_parms4_okey(new_parms)) ||
300                    ipip_entry->parms4.link != new_parms.link) {
301                 update_tunnel = true;
302         } else if (!mlxsw_sp_l3addr_eq(&new_daddr, &old_daddr)) {
303                 update_nhs = true;
304         } else if (mlxsw_sp_ipip_parms4_ikey(ipip_entry->parms4) !=
305                    mlxsw_sp_ipip_parms4_ikey(new_parms)) {
306                 update_decap = true;
307         }
308
309         if (update_tunnel)
310                 err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
311                                                           true, true, true,
312                                                           extack);
313         else if (update_nhs)
314                 err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
315                                                           false, false, true,
316                                                           extack);
317         else if (update_decap)
318                 err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
319                                                           false, false, false,
320                                                           extack);
321
322         ipip_entry->parms4 = new_parms;
323         return err;
324 }
325
326 static const struct mlxsw_sp_ipip_ops mlxsw_sp_ipip_gre4_ops = {
327         .dev_type = ARPHRD_IPGRE,
328         .ul_proto = MLXSW_SP_L3_PROTO_IPV4,
329         .nexthop_update = mlxsw_sp_ipip_nexthop_update_gre4,
330         .fib_entry_op = mlxsw_sp_ipip_fib_entry_op_gre4,
331         .can_offload = mlxsw_sp_ipip_can_offload_gre4,
332         .ol_loopback_config = mlxsw_sp_ipip_ol_loopback_config_gre4,
333         .ol_netdev_change = mlxsw_sp_ipip_ol_netdev_change_gre4,
334 };
335
336 const struct mlxsw_sp_ipip_ops *mlxsw_sp_ipip_ops_arr[] = {
337         [MLXSW_SP_IPIP_TYPE_GRE4] = &mlxsw_sp_ipip_gre4_ops,
338 };