| // SPDX-License-Identifier: BSD-3-Clause OR GPL-2.0 |
| /* Copyright (c) 2017-2018 Mellanox Technologies. All rights reserved */ |
| |
| #include <net/ip_tunnels.h> |
| #include <net/ip6_tunnel.h> |
| #include <net/inet_ecn.h> |
| |
| #include "spectrum_ipip.h" |
| #include "reg.h" |
| |
| struct ip_tunnel_parm |
| mlxsw_sp_ipip_netdev_parms4(const struct net_device *ol_dev) |
| { |
| struct ip_tunnel *tun = netdev_priv(ol_dev); |
| |
| return tun->parms; |
| } |
| |
| struct __ip6_tnl_parm |
| mlxsw_sp_ipip_netdev_parms6(const struct net_device *ol_dev) |
| { |
| struct ip6_tnl *tun = netdev_priv(ol_dev); |
| |
| return tun->parms; |
| } |
| |
| static bool mlxsw_sp_ipip_parms4_has_ikey(struct ip_tunnel_parm parms) |
| { |
| return !!(parms.i_flags & TUNNEL_KEY); |
| } |
| |
| static bool mlxsw_sp_ipip_parms4_has_okey(struct ip_tunnel_parm parms) |
| { |
| return !!(parms.o_flags & TUNNEL_KEY); |
| } |
| |
| static u32 mlxsw_sp_ipip_parms4_ikey(struct ip_tunnel_parm parms) |
| { |
| return mlxsw_sp_ipip_parms4_has_ikey(parms) ? |
| be32_to_cpu(parms.i_key) : 0; |
| } |
| |
| static u32 mlxsw_sp_ipip_parms4_okey(struct ip_tunnel_parm parms) |
| { |
| return mlxsw_sp_ipip_parms4_has_okey(parms) ? |
| be32_to_cpu(parms.o_key) : 0; |
| } |
| |
| static union mlxsw_sp_l3addr |
| mlxsw_sp_ipip_parms4_saddr(struct ip_tunnel_parm parms) |
| { |
| return (union mlxsw_sp_l3addr) { .addr4 = parms.iph.saddr }; |
| } |
| |
| static union mlxsw_sp_l3addr |
| mlxsw_sp_ipip_parms6_saddr(struct __ip6_tnl_parm parms) |
| { |
| return (union mlxsw_sp_l3addr) { .addr6 = parms.laddr }; |
| } |
| |
| static union mlxsw_sp_l3addr |
| mlxsw_sp_ipip_parms4_daddr(struct ip_tunnel_parm parms) |
| { |
| return (union mlxsw_sp_l3addr) { .addr4 = parms.iph.daddr }; |
| } |
| |
| static union mlxsw_sp_l3addr |
| mlxsw_sp_ipip_parms6_daddr(struct __ip6_tnl_parm parms) |
| { |
| return (union mlxsw_sp_l3addr) { .addr6 = parms.raddr }; |
| } |
| |
| union mlxsw_sp_l3addr |
| mlxsw_sp_ipip_netdev_saddr(enum mlxsw_sp_l3proto proto, |
| const struct net_device *ol_dev) |
| { |
| struct ip_tunnel_parm parms4; |
| struct __ip6_tnl_parm parms6; |
| |
| switch (proto) { |
| case MLXSW_SP_L3_PROTO_IPV4: |
| parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev); |
| return mlxsw_sp_ipip_parms4_saddr(parms4); |
| case MLXSW_SP_L3_PROTO_IPV6: |
| parms6 = mlxsw_sp_ipip_netdev_parms6(ol_dev); |
| return mlxsw_sp_ipip_parms6_saddr(parms6); |
| } |
| |
| WARN_ON(1); |
| return (union mlxsw_sp_l3addr) {0}; |
| } |
| |
| static __be32 mlxsw_sp_ipip_netdev_daddr4(const struct net_device *ol_dev) |
| { |
| |
| struct ip_tunnel_parm parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev); |
| |
| return mlxsw_sp_ipip_parms4_daddr(parms4).addr4; |
| } |
| |
| static union mlxsw_sp_l3addr |
| mlxsw_sp_ipip_netdev_daddr(enum mlxsw_sp_l3proto proto, |
| const struct net_device *ol_dev) |
| { |
| struct ip_tunnel_parm parms4; |
| struct __ip6_tnl_parm parms6; |
| |
| switch (proto) { |
| case MLXSW_SP_L3_PROTO_IPV4: |
| parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev); |
| return mlxsw_sp_ipip_parms4_daddr(parms4); |
| case MLXSW_SP_L3_PROTO_IPV6: |
| parms6 = mlxsw_sp_ipip_netdev_parms6(ol_dev); |
| return mlxsw_sp_ipip_parms6_daddr(parms6); |
| } |
| |
| WARN_ON(1); |
| return (union mlxsw_sp_l3addr) {0}; |
| } |
| |
| bool mlxsw_sp_l3addr_is_zero(union mlxsw_sp_l3addr addr) |
| { |
| union mlxsw_sp_l3addr naddr = {0}; |
| |
| return !memcmp(&addr, &naddr, sizeof(naddr)); |
| } |
| |
| static int |
| mlxsw_sp_ipip_nexthop_update_gre4(struct mlxsw_sp *mlxsw_sp, u32 adj_index, |
| struct mlxsw_sp_ipip_entry *ipip_entry) |
| { |
| u16 rif_index = mlxsw_sp_ipip_lb_rif_index(ipip_entry->ol_lb); |
| __be32 daddr4 = mlxsw_sp_ipip_netdev_daddr4(ipip_entry->ol_dev); |
| char ratr_pl[MLXSW_REG_RATR_LEN]; |
| |
| mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY, |
| true, MLXSW_REG_RATR_TYPE_IPIP, |
| adj_index, rif_index); |
| mlxsw_reg_ratr_ipip4_entry_pack(ratr_pl, be32_to_cpu(daddr4)); |
| |
| return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl); |
| } |
| |
| static int |
| mlxsw_sp_ipip_fib_entry_op_gre4_rtdp(struct mlxsw_sp *mlxsw_sp, |
| u32 tunnel_index, |
| struct mlxsw_sp_ipip_entry *ipip_entry) |
| { |
| u16 rif_index = mlxsw_sp_ipip_lb_rif_index(ipip_entry->ol_lb); |
| u16 ul_rif_id = mlxsw_sp_ipip_lb_ul_rif_id(ipip_entry->ol_lb); |
| char rtdp_pl[MLXSW_REG_RTDP_LEN]; |
| struct ip_tunnel_parm parms; |
| unsigned int type_check; |
| bool has_ikey; |
| u32 daddr4; |
| u32 ikey; |
| |
| parms = mlxsw_sp_ipip_netdev_parms4(ipip_entry->ol_dev); |
| has_ikey = mlxsw_sp_ipip_parms4_has_ikey(parms); |
| ikey = mlxsw_sp_ipip_parms4_ikey(parms); |
| |
| mlxsw_reg_rtdp_pack(rtdp_pl, MLXSW_REG_RTDP_TYPE_IPIP, tunnel_index); |
| mlxsw_reg_rtdp_egress_router_interface_set(rtdp_pl, ul_rif_id); |
| |
| type_check = has_ikey ? |
| MLXSW_REG_RTDP_IPIP_TYPE_CHECK_ALLOW_GRE_KEY : |
| MLXSW_REG_RTDP_IPIP_TYPE_CHECK_ALLOW_GRE; |
| |
| /* Linux demuxes tunnels based on packet SIP (which must match tunnel |
| * remote IP). Thus configure decap so that it filters out packets that |
| * are not IPv4 or have the wrong SIP. IPIP_DECAP_ERROR trap is |
| * generated for packets that fail this criterion. Linux then handles |
| * such packets in slow path and generates ICMP destination unreachable. |
| */ |
| daddr4 = be32_to_cpu(mlxsw_sp_ipip_netdev_daddr4(ipip_entry->ol_dev)); |
| mlxsw_reg_rtdp_ipip4_pack(rtdp_pl, rif_index, |
| MLXSW_REG_RTDP_IPIP_SIP_CHECK_FILTER_IPV4, |
| type_check, has_ikey, daddr4, ikey); |
| |
| return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rtdp), rtdp_pl); |
| } |
| |
| static int |
| mlxsw_sp_ipip_fib_entry_op_gre4_ralue(struct mlxsw_sp *mlxsw_sp, |
| u32 dip, u8 prefix_len, u16 ul_vr_id, |
| enum mlxsw_reg_ralue_op op, |
| u32 tunnel_index) |
| { |
| char ralue_pl[MLXSW_REG_RALUE_LEN]; |
| |
| mlxsw_reg_ralue_pack4(ralue_pl, MLXSW_REG_RALXX_PROTOCOL_IPV4, op, |
| ul_vr_id, prefix_len, dip); |
| mlxsw_reg_ralue_act_ip2me_tun_pack(ralue_pl, tunnel_index); |
| return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); |
| } |
| |
| static int mlxsw_sp_ipip_fib_entry_op_gre4(struct mlxsw_sp *mlxsw_sp, |
| struct mlxsw_sp_ipip_entry *ipip_entry, |
| enum mlxsw_reg_ralue_op op, |
| u32 tunnel_index) |
| { |
| u16 ul_vr_id = mlxsw_sp_ipip_lb_ul_vr_id(ipip_entry->ol_lb); |
| __be32 dip; |
| int err; |
| |
| err = mlxsw_sp_ipip_fib_entry_op_gre4_rtdp(mlxsw_sp, tunnel_index, |
| ipip_entry); |
| if (err) |
| return err; |
| |
| dip = mlxsw_sp_ipip_netdev_saddr(MLXSW_SP_L3_PROTO_IPV4, |
| ipip_entry->ol_dev).addr4; |
| return mlxsw_sp_ipip_fib_entry_op_gre4_ralue(mlxsw_sp, be32_to_cpu(dip), |
| 32, ul_vr_id, op, |
| tunnel_index); |
| } |
| |
| static bool mlxsw_sp_ipip_tunnel_complete(enum mlxsw_sp_l3proto proto, |
| const struct net_device *ol_dev) |
| { |
| union mlxsw_sp_l3addr saddr = mlxsw_sp_ipip_netdev_saddr(proto, ol_dev); |
| union mlxsw_sp_l3addr daddr = mlxsw_sp_ipip_netdev_daddr(proto, ol_dev); |
| |
| /* Tunnels with unset local or remote address are valid in Linux and |
| * used for lightweight tunnels (LWT) and Non-Broadcast Multi-Access |
| * (NBMA) tunnels. In principle these can be offloaded, but the driver |
| * currently doesn't support this. So punt. |
| */ |
| return !mlxsw_sp_l3addr_is_zero(saddr) && |
| !mlxsw_sp_l3addr_is_zero(daddr); |
| } |
| |
| static bool mlxsw_sp_ipip_can_offload_gre4(const struct mlxsw_sp *mlxsw_sp, |
| const struct net_device *ol_dev, |
| enum mlxsw_sp_l3proto ol_proto) |
| { |
| struct ip_tunnel *tunnel = netdev_priv(ol_dev); |
| __be16 okflags = TUNNEL_KEY; /* We can't offload any other features. */ |
| bool inherit_ttl = tunnel->parms.iph.ttl == 0; |
| bool inherit_tos = tunnel->parms.iph.tos & 0x1; |
| |
| return (tunnel->parms.i_flags & ~okflags) == 0 && |
| (tunnel->parms.o_flags & ~okflags) == 0 && |
| inherit_ttl && inherit_tos && |
| mlxsw_sp_ipip_tunnel_complete(MLXSW_SP_L3_PROTO_IPV4, ol_dev); |
| } |
| |
| static struct mlxsw_sp_rif_ipip_lb_config |
| mlxsw_sp_ipip_ol_loopback_config_gre4(struct mlxsw_sp *mlxsw_sp, |
| const struct net_device *ol_dev) |
| { |
| struct ip_tunnel_parm parms = mlxsw_sp_ipip_netdev_parms4(ol_dev); |
| enum mlxsw_reg_ritr_loopback_ipip_type lb_ipipt; |
| |
| lb_ipipt = mlxsw_sp_ipip_parms4_has_okey(parms) ? |
| MLXSW_REG_RITR_LOOPBACK_IPIP_TYPE_IP_IN_GRE_KEY_IN_IP : |
| MLXSW_REG_RITR_LOOPBACK_IPIP_TYPE_IP_IN_GRE_IN_IP; |
| return (struct mlxsw_sp_rif_ipip_lb_config){ |
| .lb_ipipt = lb_ipipt, |
| .okey = mlxsw_sp_ipip_parms4_okey(parms), |
| .ul_protocol = MLXSW_SP_L3_PROTO_IPV4, |
| .saddr = mlxsw_sp_ipip_netdev_saddr(MLXSW_SP_L3_PROTO_IPV4, |
| ol_dev), |
| }; |
| } |
| |
| static int |
| mlxsw_sp_ipip_ol_netdev_change_gre4(struct mlxsw_sp *mlxsw_sp, |
| struct mlxsw_sp_ipip_entry *ipip_entry, |
| struct netlink_ext_ack *extack) |
| { |
| union mlxsw_sp_l3addr old_saddr, new_saddr; |
| union mlxsw_sp_l3addr old_daddr, new_daddr; |
| struct ip_tunnel_parm new_parms; |
| bool update_tunnel = false; |
| bool update_decap = false; |
| bool update_nhs = false; |
| int err = 0; |
| |
| new_parms = mlxsw_sp_ipip_netdev_parms4(ipip_entry->ol_dev); |
| |
| new_saddr = mlxsw_sp_ipip_parms4_saddr(new_parms); |
| old_saddr = mlxsw_sp_ipip_parms4_saddr(ipip_entry->parms4); |
| new_daddr = mlxsw_sp_ipip_parms4_daddr(new_parms); |
| old_daddr = mlxsw_sp_ipip_parms4_daddr(ipip_entry->parms4); |
| |
| if (!mlxsw_sp_l3addr_eq(&new_saddr, &old_saddr)) { |
| u16 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev); |
| |
| /* Since the local address has changed, if there is another |
| * tunnel with a matching saddr, both need to be demoted. |
| */ |
| if (mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp, |
| MLXSW_SP_L3_PROTO_IPV4, |
| new_saddr, ul_tb_id, |
| ipip_entry)) { |
| mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry); |
| return 0; |
| } |
| |
| update_tunnel = true; |
| } else if ((mlxsw_sp_ipip_parms4_okey(ipip_entry->parms4) != |
| mlxsw_sp_ipip_parms4_okey(new_parms)) || |
| ipip_entry->parms4.link != new_parms.link) { |
| update_tunnel = true; |
| } else if (!mlxsw_sp_l3addr_eq(&new_daddr, &old_daddr)) { |
| update_nhs = true; |
| } else if (mlxsw_sp_ipip_parms4_ikey(ipip_entry->parms4) != |
| mlxsw_sp_ipip_parms4_ikey(new_parms)) { |
| update_decap = true; |
| } |
| |
| if (update_tunnel) |
| err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry, |
| true, true, true, |
| extack); |
| else if (update_nhs) |
| err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry, |
| false, false, true, |
| extack); |
| else if (update_decap) |
| err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry, |
| false, false, false, |
| extack); |
| |
| ipip_entry->parms4 = new_parms; |
| return err; |
| } |
| |
| static const struct mlxsw_sp_ipip_ops mlxsw_sp_ipip_gre4_ops = { |
| .dev_type = ARPHRD_IPGRE, |
| .ul_proto = MLXSW_SP_L3_PROTO_IPV4, |
| .nexthop_update = mlxsw_sp_ipip_nexthop_update_gre4, |
| .fib_entry_op = mlxsw_sp_ipip_fib_entry_op_gre4, |
| .can_offload = mlxsw_sp_ipip_can_offload_gre4, |
| .ol_loopback_config = mlxsw_sp_ipip_ol_loopback_config_gre4, |
| .ol_netdev_change = mlxsw_sp_ipip_ol_netdev_change_gre4, |
| }; |
| |
| const struct mlxsw_sp_ipip_ops *mlxsw_sp_ipip_ops_arr[] = { |
| [MLXSW_SP_IPIP_TYPE_GRE4] = &mlxsw_sp_ipip_gre4_ops, |
| }; |
| |
| static int mlxsw_sp_ipip_ecn_encap_init_one(struct mlxsw_sp *mlxsw_sp, |
| u8 inner_ecn, u8 outer_ecn) |
| { |
| char tieem_pl[MLXSW_REG_TIEEM_LEN]; |
| |
| mlxsw_reg_tieem_pack(tieem_pl, inner_ecn, outer_ecn); |
| return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(tieem), tieem_pl); |
| } |
| |
| int mlxsw_sp_ipip_ecn_encap_init(struct mlxsw_sp *mlxsw_sp) |
| { |
| int i; |
| |
| /* Iterate over inner ECN values */ |
| for (i = INET_ECN_NOT_ECT; i <= INET_ECN_CE; i++) { |
| u8 outer_ecn = INET_ECN_encapsulate(0, i); |
| int err; |
| |
| err = mlxsw_sp_ipip_ecn_encap_init_one(mlxsw_sp, i, outer_ecn); |
| if (err) |
| return err; |
| } |
| |
| return 0; |
| } |
| |
| static int mlxsw_sp_ipip_ecn_decap_init_one(struct mlxsw_sp *mlxsw_sp, |
| u8 inner_ecn, u8 outer_ecn) |
| { |
| char tidem_pl[MLXSW_REG_TIDEM_LEN]; |
| bool trap_en, set_ce = false; |
| u8 new_inner_ecn; |
| |
| trap_en = __INET_ECN_decapsulate(outer_ecn, inner_ecn, &set_ce); |
| new_inner_ecn = set_ce ? INET_ECN_CE : inner_ecn; |
| |
| mlxsw_reg_tidem_pack(tidem_pl, outer_ecn, inner_ecn, new_inner_ecn, |
| trap_en, trap_en ? MLXSW_TRAP_ID_DECAP_ECN0 : 0); |
| return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(tidem), tidem_pl); |
| } |
| |
| int mlxsw_sp_ipip_ecn_decap_init(struct mlxsw_sp *mlxsw_sp) |
| { |
| int i, j, err; |
| |
| /* Iterate over inner ECN values */ |
| for (i = INET_ECN_NOT_ECT; i <= INET_ECN_CE; i++) { |
| /* Iterate over outer ECN values */ |
| for (j = INET_ECN_NOT_ECT; j <= INET_ECN_CE; j++) { |
| err = mlxsw_sp_ipip_ecn_decap_init_one(mlxsw_sp, i, j); |
| if (err) |
| return err; |
| } |
| } |
| |
| return 0; |
| } |