mirror of
https://mirrors.bfsu.edu.cn/git/linux.git
synced 2024-11-16 16:54:20 +08:00
dab4e1f06c
Extend the bpf_fib_lookup() helper by making it to return the source IPv4/IPv6 address if the BPF_FIB_LOOKUP_SRC flag is set. For example, the following snippet can be used to derive the desired source IP address: struct bpf_fib_lookup p = { .ipv4_dst = ip4->daddr }; ret = bpf_skb_fib_lookup(skb, p, sizeof(p), BPF_FIB_LOOKUP_SRC | BPF_FIB_LOOKUP_SKIP_NEIGH); if (ret != BPF_FIB_LKUP_RET_SUCCESS) return TC_ACT_SHOT; /* the p.ipv4_src now contains the source address */ The inability to derive the proper source address may cause malfunctions in BPF-based dataplanes for hosts containing netdevs with more than one routable IP address or for multi-homed hosts. For example, Cilium implements packet masquerading in BPF. If an egressing netdev to which the Cilium's BPF prog is attached has multiple IP addresses, then only one [hardcoded] IP address can be used for masquerading. This breaks connectivity if any other IP address should have been selected instead, for example, when a public and private addresses are attached to the same egress interface. The change was tested with Cilium [1]. Nikolay Aleksandrov helped to figure out the IPv6 addr selection. [1]: https://github.com/cilium/cilium/pull/28283 Signed-off-by: Martynas Pumputis <m@lambda.lt> Link: https://lore.kernel.org/r/20231007081415.33502-2-m@lambda.lt Signed-off-by: Martin KaFai Lau <martin.lau@kernel.org>
97 lines
3.6 KiB
C
97 lines
3.6 KiB
C
/* SPDX-License-Identifier: GPL-2.0 */
|
|
#ifndef _IPV6_STUBS_H
|
|
#define _IPV6_STUBS_H
|
|
|
|
#include <linux/in6.h>
|
|
#include <linux/netdevice.h>
|
|
#include <linux/skbuff.h>
|
|
#include <net/dst.h>
|
|
#include <net/flow.h>
|
|
#include <net/neighbour.h>
|
|
#include <net/sock.h>
|
|
|
|
/* structs from net/ip6_fib.h */
|
|
struct fib6_info;
|
|
struct fib6_nh;
|
|
struct fib6_config;
|
|
struct fib6_result;
|
|
|
|
/* This is ugly, ideally these symbols should be built
|
|
* into the core kernel.
|
|
*/
|
|
struct ipv6_stub {
|
|
int (*ipv6_sock_mc_join)(struct sock *sk, int ifindex,
|
|
const struct in6_addr *addr);
|
|
int (*ipv6_sock_mc_drop)(struct sock *sk, int ifindex,
|
|
const struct in6_addr *addr);
|
|
struct dst_entry *(*ipv6_dst_lookup_flow)(struct net *net,
|
|
const struct sock *sk,
|
|
struct flowi6 *fl6,
|
|
const struct in6_addr *final_dst);
|
|
int (*ipv6_route_input)(struct sk_buff *skb);
|
|
|
|
struct fib6_table *(*fib6_get_table)(struct net *net, u32 id);
|
|
int (*fib6_lookup)(struct net *net, int oif, struct flowi6 *fl6,
|
|
struct fib6_result *res, int flags);
|
|
int (*fib6_table_lookup)(struct net *net, struct fib6_table *table,
|
|
int oif, struct flowi6 *fl6,
|
|
struct fib6_result *res, int flags);
|
|
void (*fib6_select_path)(const struct net *net, struct fib6_result *res,
|
|
struct flowi6 *fl6, int oif, bool oif_match,
|
|
const struct sk_buff *skb, int strict);
|
|
u32 (*ip6_mtu_from_fib6)(const struct fib6_result *res,
|
|
const struct in6_addr *daddr,
|
|
const struct in6_addr *saddr);
|
|
|
|
int (*fib6_nh_init)(struct net *net, struct fib6_nh *fib6_nh,
|
|
struct fib6_config *cfg, gfp_t gfp_flags,
|
|
struct netlink_ext_ack *extack);
|
|
void (*fib6_nh_release)(struct fib6_nh *fib6_nh);
|
|
void (*fib6_nh_release_dsts)(struct fib6_nh *fib6_nh);
|
|
void (*fib6_update_sernum)(struct net *net, struct fib6_info *rt);
|
|
int (*ip6_del_rt)(struct net *net, struct fib6_info *rt, bool skip_notify);
|
|
void (*fib6_rt_update)(struct net *net, struct fib6_info *rt,
|
|
struct nl_info *info);
|
|
|
|
void (*udpv6_encap_enable)(void);
|
|
void (*ndisc_send_na)(struct net_device *dev, const struct in6_addr *daddr,
|
|
const struct in6_addr *solicited_addr,
|
|
bool router, bool solicited, bool override, bool inc_opt);
|
|
#if IS_ENABLED(CONFIG_XFRM)
|
|
void (*xfrm6_local_rxpmtu)(struct sk_buff *skb, u32 mtu);
|
|
int (*xfrm6_udp_encap_rcv)(struct sock *sk, struct sk_buff *skb);
|
|
int (*xfrm6_rcv_encap)(struct sk_buff *skb, int nexthdr, __be32 spi,
|
|
int encap_type);
|
|
#endif
|
|
struct neigh_table *nd_tbl;
|
|
|
|
int (*ipv6_fragment)(struct net *net, struct sock *sk, struct sk_buff *skb,
|
|
int (*output)(struct net *, struct sock *, struct sk_buff *));
|
|
struct net_device *(*ipv6_dev_find)(struct net *net, const struct in6_addr *addr,
|
|
struct net_device *dev);
|
|
};
|
|
extern const struct ipv6_stub *ipv6_stub __read_mostly;
|
|
|
|
/* A stub used by bpf helpers. Similarly ugly as ipv6_stub */
|
|
struct ipv6_bpf_stub {
|
|
int (*inet6_bind)(struct sock *sk, struct sockaddr *uaddr, int addr_len,
|
|
u32 flags);
|
|
struct sock *(*udp6_lib_lookup)(struct net *net,
|
|
const struct in6_addr *saddr, __be16 sport,
|
|
const struct in6_addr *daddr, __be16 dport,
|
|
int dif, int sdif, struct udp_table *tbl,
|
|
struct sk_buff *skb);
|
|
int (*ipv6_setsockopt)(struct sock *sk, int level, int optname,
|
|
sockptr_t optval, unsigned int optlen);
|
|
int (*ipv6_getsockopt)(struct sock *sk, int level, int optname,
|
|
sockptr_t optval, sockptr_t optlen);
|
|
int (*ipv6_dev_get_saddr)(struct net *net,
|
|
const struct net_device *dst_dev,
|
|
const struct in6_addr *daddr,
|
|
unsigned int prefs,
|
|
struct in6_addr *saddr);
|
|
};
|
|
extern const struct ipv6_bpf_stub *ipv6_bpf_stub __read_mostly;
|
|
|
|
#endif
|