// SPDX-License-Identifier: BSD-3-Clause OR GPL-2.0 /* Copyright (c) 2017-2018 Mellanox Technologies. All rights reserved */ #include #include #include #include "spectrum_ipip.h" #include "reg.h" struct ip_tunnel_parm mlxsw_sp_ipip_netdev_parms4(const struct net_device *ol_dev) { struct ip_tunnel *tun = netdev_priv(ol_dev); return tun->parms; } struct __ip6_tnl_parm mlxsw_sp_ipip_netdev_parms6(const struct net_device *ol_dev) { struct ip6_tnl *tun = netdev_priv(ol_dev); return tun->parms; } static bool mlxsw_sp_ipip_parms4_has_ikey(struct ip_tunnel_parm parms) { return !!(parms.i_flags & TUNNEL_KEY); } static bool mlxsw_sp_ipip_parms4_has_okey(struct ip_tunnel_parm parms) { return !!(parms.o_flags & TUNNEL_KEY); } static u32 mlxsw_sp_ipip_parms4_ikey(struct ip_tunnel_parm parms) { return mlxsw_sp_ipip_parms4_has_ikey(parms) ? be32_to_cpu(parms.i_key) : 0; } static u32 mlxsw_sp_ipip_parms4_okey(struct ip_tunnel_parm parms) { return mlxsw_sp_ipip_parms4_has_okey(parms) ? be32_to_cpu(parms.o_key) : 0; } static union mlxsw_sp_l3addr mlxsw_sp_ipip_parms4_saddr(struct ip_tunnel_parm parms) { return (union mlxsw_sp_l3addr) { .addr4 = parms.iph.saddr }; } static union mlxsw_sp_l3addr mlxsw_sp_ipip_parms6_saddr(struct __ip6_tnl_parm parms) { return (union mlxsw_sp_l3addr) { .addr6 = parms.laddr }; } static union mlxsw_sp_l3addr mlxsw_sp_ipip_parms4_daddr(struct ip_tunnel_parm parms) { return (union mlxsw_sp_l3addr) { .addr4 = parms.iph.daddr }; } static union mlxsw_sp_l3addr mlxsw_sp_ipip_parms6_daddr(struct __ip6_tnl_parm parms) { return (union mlxsw_sp_l3addr) { .addr6 = parms.raddr }; } union mlxsw_sp_l3addr mlxsw_sp_ipip_netdev_saddr(enum mlxsw_sp_l3proto proto, const struct net_device *ol_dev) { struct ip_tunnel_parm parms4; struct __ip6_tnl_parm parms6; switch (proto) { case MLXSW_SP_L3_PROTO_IPV4: parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev); return mlxsw_sp_ipip_parms4_saddr(parms4); case MLXSW_SP_L3_PROTO_IPV6: parms6 = mlxsw_sp_ipip_netdev_parms6(ol_dev); return mlxsw_sp_ipip_parms6_saddr(parms6); } WARN_ON(1); return (union mlxsw_sp_l3addr) {0}; } static __be32 mlxsw_sp_ipip_netdev_daddr4(const struct net_device *ol_dev) { struct ip_tunnel_parm parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev); return mlxsw_sp_ipip_parms4_daddr(parms4).addr4; } static union mlxsw_sp_l3addr mlxsw_sp_ipip_netdev_daddr(enum mlxsw_sp_l3proto proto, const struct net_device *ol_dev) { struct ip_tunnel_parm parms4; struct __ip6_tnl_parm parms6; switch (proto) { case MLXSW_SP_L3_PROTO_IPV4: parms4 = mlxsw_sp_ipip_netdev_parms4(ol_dev); return mlxsw_sp_ipip_parms4_daddr(parms4); case MLXSW_SP_L3_PROTO_IPV6: parms6 = mlxsw_sp_ipip_netdev_parms6(ol_dev); return mlxsw_sp_ipip_parms6_daddr(parms6); } WARN_ON(1); return (union mlxsw_sp_l3addr) {0}; } bool mlxsw_sp_l3addr_is_zero(union mlxsw_sp_l3addr addr) { union mlxsw_sp_l3addr naddr = {0}; return !memcmp(&addr, &naddr, sizeof(naddr)); } static int mlxsw_sp_ipip_nexthop_update_gre4(struct mlxsw_sp *mlxsw_sp, u32 adj_index, struct mlxsw_sp_ipip_entry *ipip_entry) { u16 rif_index = mlxsw_sp_ipip_lb_rif_index(ipip_entry->ol_lb); __be32 daddr4 = mlxsw_sp_ipip_netdev_daddr4(ipip_entry->ol_dev); char ratr_pl[MLXSW_REG_RATR_LEN]; mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY, true, MLXSW_REG_RATR_TYPE_IPIP, adj_index, rif_index); mlxsw_reg_ratr_ipip4_entry_pack(ratr_pl, be32_to_cpu(daddr4)); return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl); } static int mlxsw_sp_ipip_fib_entry_op_gre4_rtdp(struct mlxsw_sp *mlxsw_sp, u32 tunnel_index, struct mlxsw_sp_ipip_entry *ipip_entry) { u16 rif_index = mlxsw_sp_ipip_lb_rif_index(ipip_entry->ol_lb); u16 ul_rif_id = mlxsw_sp_ipip_lb_ul_rif_id(ipip_entry->ol_lb); char rtdp_pl[MLXSW_REG_RTDP_LEN]; struct ip_tunnel_parm parms; unsigned int type_check; bool has_ikey; u32 daddr4; u32 ikey; parms = mlxsw_sp_ipip_netdev_parms4(ipip_entry->ol_dev); has_ikey = mlxsw_sp_ipip_parms4_has_ikey(parms); ikey = mlxsw_sp_ipip_parms4_ikey(parms); mlxsw_reg_rtdp_pack(rtdp_pl, MLXSW_REG_RTDP_TYPE_IPIP, tunnel_index); mlxsw_reg_rtdp_egress_router_interface_set(rtdp_pl, ul_rif_id); type_check = has_ikey ? MLXSW_REG_RTDP_IPIP_TYPE_CHECK_ALLOW_GRE_KEY : MLXSW_REG_RTDP_IPIP_TYPE_CHECK_ALLOW_GRE; /* Linux demuxes tunnels based on packet SIP (which must match tunnel * remote IP). Thus configure decap so that it filters out packets that * are not IPv4 or have the wrong SIP. IPIP_DECAP_ERROR trap is * generated for packets that fail this criterion. Linux then handles * such packets in slow path and generates ICMP destination unreachable. */ daddr4 = be32_to_cpu(mlxsw_sp_ipip_netdev_daddr4(ipip_entry->ol_dev)); mlxsw_reg_rtdp_ipip4_pack(rtdp_pl, rif_index, MLXSW_REG_RTDP_IPIP_SIP_CHECK_FILTER_IPV4, type_check, has_ikey, daddr4, ikey); return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rtdp), rtdp_pl); } static int mlxsw_sp_ipip_fib_entry_op_gre4_ralue(struct mlxsw_sp *mlxsw_sp, u32 dip, u8 prefix_len, u16 ul_vr_id, enum mlxsw_reg_ralue_op op, u32 tunnel_index) { char ralue_pl[MLXSW_REG_RALUE_LEN]; mlxsw_reg_ralue_pack4(ralue_pl, MLXSW_REG_RALXX_PROTOCOL_IPV4, op, ul_vr_id, prefix_len, dip); mlxsw_reg_ralue_act_ip2me_tun_pack(ralue_pl, tunnel_index); return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); } static int mlxsw_sp_ipip_fib_entry_op_gre4(struct mlxsw_sp *mlxsw_sp, struct mlxsw_sp_ipip_entry *ipip_entry, enum mlxsw_reg_ralue_op op, u32 tunnel_index) { u16 ul_vr_id = mlxsw_sp_ipip_lb_ul_vr_id(ipip_entry->ol_lb); __be32 dip; int err; err = mlxsw_sp_ipip_fib_entry_op_gre4_rtdp(mlxsw_sp, tunnel_index, ipip_entry); if (err) return err; dip = mlxsw_sp_ipip_netdev_saddr(MLXSW_SP_L3_PROTO_IPV4, ipip_entry->ol_dev).addr4; return mlxsw_sp_ipip_fib_entry_op_gre4_ralue(mlxsw_sp, be32_to_cpu(dip), 32, ul_vr_id, op, tunnel_index); } static bool mlxsw_sp_ipip_tunnel_complete(enum mlxsw_sp_l3proto proto, const struct net_device *ol_dev) { union mlxsw_sp_l3addr saddr = mlxsw_sp_ipip_netdev_saddr(proto, ol_dev); union mlxsw_sp_l3addr daddr = mlxsw_sp_ipip_netdev_daddr(proto, ol_dev); /* Tunnels with unset local or remote address are valid in Linux and * used for lightweight tunnels (LWT) and Non-Broadcast Multi-Access * (NBMA) tunnels. In principle these can be offloaded, but the driver * currently doesn't support this. So punt. */ return !mlxsw_sp_l3addr_is_zero(saddr) && !mlxsw_sp_l3addr_is_zero(daddr); } static bool mlxsw_sp_ipip_can_offload_gre4(const struct mlxsw_sp *mlxsw_sp, const struct net_device *ol_dev, enum mlxsw_sp_l3proto ol_proto) { struct ip_tunnel *tunnel = netdev_priv(ol_dev); __be16 okflags = TUNNEL_KEY; /* We can't offload any other features. */ bool inherit_ttl = tunnel->parms.iph.ttl == 0; bool inherit_tos = tunnel->parms.iph.tos & 0x1; return (tunnel->parms.i_flags & ~okflags) == 0 && (tunnel->parms.o_flags & ~okflags) == 0 && inherit_ttl && inherit_tos && mlxsw_sp_ipip_tunnel_complete(MLXSW_SP_L3_PROTO_IPV4, ol_dev); } static struct mlxsw_sp_rif_ipip_lb_config mlxsw_sp_ipip_ol_loopback_config_gre4(struct mlxsw_sp *mlxsw_sp, const struct net_device *ol_dev) { struct ip_tunnel_parm parms = mlxsw_sp_ipip_netdev_parms4(ol_dev); enum mlxsw_reg_ritr_loopback_ipip_type lb_ipipt; lb_ipipt = mlxsw_sp_ipip_parms4_has_okey(parms) ? MLXSW_REG_RITR_LOOPBACK_IPIP_TYPE_IP_IN_GRE_KEY_IN_IP : MLXSW_REG_RITR_LOOPBACK_IPIP_TYPE_IP_IN_GRE_IN_IP; return (struct mlxsw_sp_rif_ipip_lb_config){ .lb_ipipt = lb_ipipt, .okey = mlxsw_sp_ipip_parms4_okey(parms), .ul_protocol = MLXSW_SP_L3_PROTO_IPV4, .saddr = mlxsw_sp_ipip_netdev_saddr(MLXSW_SP_L3_PROTO_IPV4, ol_dev), }; } static int mlxsw_sp_ipip_ol_netdev_change_gre4(struct mlxsw_sp *mlxsw_sp, struct mlxsw_sp_ipip_entry *ipip_entry, struct netlink_ext_ack *extack) { union mlxsw_sp_l3addr old_saddr, new_saddr; union mlxsw_sp_l3addr old_daddr, new_daddr; struct ip_tunnel_parm new_parms; bool update_tunnel = false; bool update_decap = false; bool update_nhs = false; int err = 0; new_parms = mlxsw_sp_ipip_netdev_parms4(ipip_entry->ol_dev); new_saddr = mlxsw_sp_ipip_parms4_saddr(new_parms); old_saddr = mlxsw_sp_ipip_parms4_saddr(ipip_entry->parms4); new_daddr = mlxsw_sp_ipip_parms4_daddr(new_parms); old_daddr = mlxsw_sp_ipip_parms4_daddr(ipip_entry->parms4); if (!mlxsw_sp_l3addr_eq(&new_saddr, &old_saddr)) { u16 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev); /* Since the local address has changed, if there is another * tunnel with a matching saddr, both need to be demoted. */ if (mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp, MLXSW_SP_L3_PROTO_IPV4, new_saddr, ul_tb_id, ipip_entry)) { mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry); return 0; } update_tunnel = true; } else if ((mlxsw_sp_ipip_parms4_okey(ipip_entry->parms4) != mlxsw_sp_ipip_parms4_okey(new_parms)) || ipip_entry->parms4.link != new_parms.link) { update_tunnel = true; } else if (!mlxsw_sp_l3addr_eq(&new_daddr, &old_daddr)) { update_nhs = true; } else if (mlxsw_sp_ipip_parms4_ikey(ipip_entry->parms4) != mlxsw_sp_ipip_parms4_ikey(new_parms)) { update_decap = true; } if (update_tunnel) err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry, true, true, true, extack); else if (update_nhs) err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry, false, false, true, extack); else if (update_decap) err = __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry, false, false, false, extack); ipip_entry->parms4 = new_parms; return err; } static const struct mlxsw_sp_ipip_ops mlxsw_sp_ipip_gre4_ops = { .dev_type = ARPHRD_IPGRE, .ul_proto = MLXSW_SP_L3_PROTO_IPV4, .nexthop_update = mlxsw_sp_ipip_nexthop_update_gre4, .fib_entry_op = mlxsw_sp_ipip_fib_entry_op_gre4, .can_offload = mlxsw_sp_ipip_can_offload_gre4, .ol_loopback_config = mlxsw_sp_ipip_ol_loopback_config_gre4, .ol_netdev_change = mlxsw_sp_ipip_ol_netdev_change_gre4, }; const struct mlxsw_sp_ipip_ops *mlxsw_sp_ipip_ops_arr[] = { [MLXSW_SP_IPIP_TYPE_GRE4] = &mlxsw_sp_ipip_gre4_ops, }; static int mlxsw_sp_ipip_ecn_encap_init_one(struct mlxsw_sp *mlxsw_sp, u8 inner_ecn, u8 outer_ecn) { char tieem_pl[MLXSW_REG_TIEEM_LEN]; mlxsw_reg_tieem_pack(tieem_pl, inner_ecn, outer_ecn); return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(tieem), tieem_pl); } int mlxsw_sp_ipip_ecn_encap_init(struct mlxsw_sp *mlxsw_sp) { int i; /* Iterate over inner ECN values */ for (i = INET_ECN_NOT_ECT; i <= INET_ECN_CE; i++) { u8 outer_ecn = INET_ECN_encapsulate(0, i); int err; err = mlxsw_sp_ipip_ecn_encap_init_one(mlxsw_sp, i, outer_ecn); if (err) return err; } return 0; } static int mlxsw_sp_ipip_ecn_decap_init_one(struct mlxsw_sp *mlxsw_sp, u8 inner_ecn, u8 outer_ecn) { char tidem_pl[MLXSW_REG_TIDEM_LEN]; u8 new_inner_ecn; bool trap_en; new_inner_ecn = mlxsw_sp_tunnel_ecn_decap(outer_ecn, inner_ecn, &trap_en); mlxsw_reg_tidem_pack(tidem_pl, outer_ecn, inner_ecn, new_inner_ecn, trap_en, trap_en ? MLXSW_TRAP_ID_DECAP_ECN0 : 0); return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(tidem), tidem_pl); } int mlxsw_sp_ipip_ecn_decap_init(struct mlxsw_sp *mlxsw_sp) { int i, j, err; /* Iterate over inner ECN values */ for (i = INET_ECN_NOT_ECT; i <= INET_ECN_CE; i++) { /* Iterate over outer ECN values */ for (j = INET_ECN_NOT_ECT; j <= INET_ECN_CE; j++) { err = mlxsw_sp_ipip_ecn_decap_init_one(mlxsw_sp, i, j); if (err) return err; } } return 0; }