📄 br_netfilter.c

📁 linux 内核源代码
💻 C
📖 第 1 页 / 共 2 页
字号:
12 下一页
/* *	Handle firewalling *	Linux ethernet bridge * *	Authors: *	Lennert Buytenhek               <buytenh@gnu.org> *	Bart De Schuymer (maintainer)	<bdschuym@pandora.be> * *	Changes: *	Apr 29 2003: physdev module support (bdschuym) *	Jun 19 2003: let arptables see bridged ARP traffic (bdschuym) *	Oct 06 2003: filter encapsulated IP/ARP VLAN traffic on untagged bridge *	             (bdschuym) *	Sep 01 2004: add IPv6 filtering (bdschuym) * *	This program is free software; you can redistribute it and/or *	modify it under the terms of the GNU General Public License *	as published by the Free Software Foundation; either version *	2 of the License, or (at your option) any later version. * *	Lennert dedicates this file to Kerstin Wurdinger. */#include <linux/module.h>#include <linux/kernel.h>#include <linux/ip.h>#include <linux/netdevice.h>#include <linux/skbuff.h>#include <linux/if_arp.h>#include <linux/if_ether.h>#include <linux/if_vlan.h>#include <linux/if_pppox.h>#include <linux/ppp_defs.h>#include <linux/netfilter_bridge.h>#include <linux/netfilter_ipv4.h>#include <linux/netfilter_ipv6.h>#include <linux/netfilter_arp.h>#include <linux/in_route.h>#include <linux/inetdevice.h>#include <net/ip.h>#include <net/ipv6.h>#include <net/route.h>#include <asm/uaccess.h>#include "br_private.h"#ifdef CONFIG_SYSCTL#include <linux/sysctl.h>#endif#define skb_origaddr(skb)	 (((struct bridge_skb_cb *) \				 (skb->nf_bridge->data))->daddr.ipv4)#define store_orig_dstaddr(skb)	 (skb_origaddr(skb) = ip_hdr(skb)->daddr)#define dnat_took_place(skb)	 (skb_origaddr(skb) != ip_hdr(skb)->daddr)#ifdef CONFIG_SYSCTLstatic struct ctl_table_header *brnf_sysctl_header;static int brnf_call_iptables __read_mostly = 1;static int brnf_call_ip6tables __read_mostly = 1;static int brnf_call_arptables __read_mostly = 1;static int brnf_filter_vlan_tagged __read_mostly = 1;static int brnf_filter_pppoe_tagged __read_mostly = 1;#else#define brnf_filter_vlan_tagged 1#define brnf_filter_pppoe_tagged 1#endifstatic inline __be16 vlan_proto(const struct sk_buff *skb){	return vlan_eth_hdr(skb)->h_vlan_encapsulated_proto;}#define IS_VLAN_IP(skb) \	(skb->protocol == htons(ETH_P_8021Q) && \	 vlan_proto(skb) == htons(ETH_P_IP) && 	\	 brnf_filter_vlan_tagged)#define IS_VLAN_IPV6(skb) \	(skb->protocol == htons(ETH_P_8021Q) && \	 vlan_proto(skb) == htons(ETH_P_IPV6) &&\	 brnf_filter_vlan_tagged)#define IS_VLAN_ARP(skb) \	(skb->protocol == htons(ETH_P_8021Q) &&	\	 vlan_proto(skb) == htons(ETH_P_ARP) &&	\	 brnf_filter_vlan_tagged)static inline __be16 pppoe_proto(const struct sk_buff *skb){	return *((__be16 *)(skb_mac_header(skb) + ETH_HLEN +			    sizeof(struct pppoe_hdr)));}#define IS_PPPOE_IP(skb) \	(skb->protocol == htons(ETH_P_PPP_SES) && \	 pppoe_proto(skb) == htons(PPP_IP) && \	 brnf_filter_pppoe_tagged)#define IS_PPPOE_IPV6(skb) \	(skb->protocol == htons(ETH_P_PPP_SES) && \	 pppoe_proto(skb) == htons(PPP_IPV6) && \	 brnf_filter_pppoe_tagged)/* We need these fake structures to make netfilter happy -- * lots of places assume that skb->dst != NULL, which isn't * all that unreasonable. * * Currently, we fill in the PMTU entry because netfilter * refragmentation needs it, and the rt_flags entry because * ipt_REJECT needs it.  Future netfilter modules might * require us to fill additional fields. */static struct net_device __fake_net_device = {	.hard_header_len	= ETH_HLEN};static struct rtable __fake_rtable = {	.u = {		.dst = {			.__refcnt		= ATOMIC_INIT(1),			.dev			= &__fake_net_device,			.path			= &__fake_rtable.u.dst,			.metrics		= {[RTAX_MTU - 1] = 1500},			.flags			= DST_NOXFRM,		}	},	.rt_flags	= 0,};static inline struct net_device *bridge_parent(const struct net_device *dev){	struct net_bridge_port *port = rcu_dereference(dev->br_port);	return port ? port->br->dev : NULL;}static inline struct nf_bridge_info *nf_bridge_alloc(struct sk_buff *skb){	skb->nf_bridge = kzalloc(sizeof(struct nf_bridge_info), GFP_ATOMIC);	if (likely(skb->nf_bridge))		atomic_set(&(skb->nf_bridge->use), 1);	return skb->nf_bridge;}static inline struct nf_bridge_info *nf_bridge_unshare(struct sk_buff *skb){	struct nf_bridge_info *nf_bridge = skb->nf_bridge;	if (atomic_read(&nf_bridge->use) > 1) {		struct nf_bridge_info *tmp = nf_bridge_alloc(skb);		if (tmp) {			memcpy(tmp, nf_bridge, sizeof(struct nf_bridge_info));			atomic_set(&tmp->use, 1);			nf_bridge_put(nf_bridge);		}		nf_bridge = tmp;	}	return nf_bridge;}static inline void nf_bridge_push_encap_header(struct sk_buff *skb){	unsigned int len = nf_bridge_encap_header_len(skb);	skb_push(skb, len);	skb->network_header -= len;}static inline void nf_bridge_pull_encap_header(struct sk_buff *skb){	unsigned int len = nf_bridge_encap_header_len(skb);	skb_pull(skb, len);	skb->network_header += len;}static inline void nf_bridge_pull_encap_header_rcsum(struct sk_buff *skb){	unsigned int len = nf_bridge_encap_header_len(skb);	skb_pull_rcsum(skb, len);	skb->network_header += len;}static inline void nf_bridge_save_header(struct sk_buff *skb){	int header_size = ETH_HLEN + nf_bridge_encap_header_len(skb);	skb_copy_from_linear_data_offset(skb, -header_size,					 skb->nf_bridge->data, header_size);}/* * When forwarding bridge frames, we save a copy of the original * header before processing. */int nf_bridge_copy_header(struct sk_buff *skb){	int err;	int header_size = ETH_HLEN + nf_bridge_encap_header_len(skb);	err = skb_cow_head(skb, header_size);	if (err)		return err;	skb_copy_to_linear_data_offset(skb, -header_size,				       skb->nf_bridge->data, header_size);	__skb_push(skb, nf_bridge_encap_header_len(skb));	return 0;}/* PF_BRIDGE/PRE_ROUTING *********************************************//* Undo the changes made for ip6tables PREROUTING and continue the * bridge PRE_ROUTING hook. */static int br_nf_pre_routing_finish_ipv6(struct sk_buff *skb){	struct nf_bridge_info *nf_bridge = skb->nf_bridge;	if (nf_bridge->mask & BRNF_PKT_TYPE) {		skb->pkt_type = PACKET_OTHERHOST;		nf_bridge->mask ^= BRNF_PKT_TYPE;	}	nf_bridge->mask ^= BRNF_NF_BRIDGE_PREROUTING;	skb->dst = (struct dst_entry *)&__fake_rtable;	dst_hold(skb->dst);	skb->dev = nf_bridge->physindev;	nf_bridge_push_encap_header(skb);	NF_HOOK_THRESH(PF_BRIDGE, NF_BR_PRE_ROUTING, skb, skb->dev, NULL,		       br_handle_frame_finish, 1);	return 0;}static void __br_dnat_complain(void){	static unsigned long last_complaint;	if (jiffies - last_complaint >= 5 * HZ) {		printk(KERN_WARNING "Performing cross-bridge DNAT requires IP "		       "forwarding to be enabled\n");		last_complaint = jiffies;	}}/* This requires some explaining. If DNAT has taken place, * we will need to fix up the destination Ethernet address, * and this is a tricky process. * * There are two cases to consider: * 1. The packet was DNAT'ed to a device in the same bridge *    port group as it was received on. We can still bridge *    the packet. * 2. The packet was DNAT'ed to a different device, either *    a non-bridged device or another bridge port group. *    The packet will need to be routed. * * The correct way of distinguishing between these two cases is to * call ip_route_input() and to look at skb->dst->dev, which is * changed to the destination device if ip_route_input() succeeds. * * Let us first consider the case that ip_route_input() succeeds: * * If skb->dst->dev equals the logical bridge device the packet * came in on, we can consider this bridging. The packet is passed * through the neighbour output function to build a new destination * MAC address, which will make the packet enter br_nf_local_out() * not much later. In that function it is assured that the iptables * FORWARD chain is traversed for the packet. * * Otherwise, the packet is considered to be routed and we just * change the destination MAC address so that the packet will * later be passed up to the IP stack to be routed. For a redirected * packet, ip_route_input() will give back the localhost as output device, * which differs from the bridge device. * * Let us now consider the case that ip_route_input() fails: * * This can be because the destination address is martian, in which case * the packet will be dropped. * After a "echo '0' > /proc/sys/net/ipv4/ip_forward" ip_route_input() * will fail, while __ip_route_output_key() will return success. The source * address for __ip_route_output_key() is set to zero, so __ip_route_output_key * thinks we're handling a locally generated packet and won't care * if IP forwarding is allowed. We send a warning message to the users's * log telling her to put IP forwarding on. * * ip_route_input() will also fail if there is no route available. * In that case we just drop the packet. * * --Lennert, 20020411 * --Bart, 20020416 (updated) * --Bart, 20021007 (updated) * --Bart, 20062711 (updated) */static int br_nf_pre_routing_finish_bridge(struct sk_buff *skb){	if (skb->pkt_type == PACKET_OTHERHOST) {		skb->pkt_type = PACKET_HOST;		skb->nf_bridge->mask |= BRNF_PKT_TYPE;	}	skb->nf_bridge->mask ^= BRNF_NF_BRIDGE_PREROUTING;	skb->dev = bridge_parent(skb->dev);	if (skb->dev) {		struct dst_entry *dst = skb->dst;		nf_bridge_pull_encap_header(skb);		if (dst->hh)			return neigh_hh_output(dst->hh, skb);		else if (dst->neighbour)			return dst->neighbour->output(skb);	}	kfree_skb(skb);	return 0;}static int br_nf_pre_routing_finish(struct sk_buff *skb){	struct net_device *dev = skb->dev;	struct iphdr *iph = ip_hdr(skb);	struct nf_bridge_info *nf_bridge = skb->nf_bridge;	int err;	if (nf_bridge->mask & BRNF_PKT_TYPE) {		skb->pkt_type = PACKET_OTHERHOST;		nf_bridge->mask ^= BRNF_PKT_TYPE;	}	nf_bridge->mask ^= BRNF_NF_BRIDGE_PREROUTING;	if (dnat_took_place(skb)) {		if ((err = ip_route_input(skb, iph->daddr, iph->saddr, iph->tos, dev))) {			struct rtable *rt;			struct flowi fl = {				.nl_u = {					.ip4_u = {						 .daddr = iph->daddr,						 .saddr = 0,						 .tos = RT_TOS(iph->tos) },				},				.proto = 0,			};			struct in_device *in_dev = in_dev_get(dev);			/* If err equals -EHOSTUNREACH the error is due to a			 * martian destination or due to the fact that			 * forwarding is disabled. For most martian packets,			 * ip_route_output_key() will fail. It won't fail for 2 types of			 * martian destinations: loopback destinations and destination			 * 0.0.0.0. In both cases the packet will be dropped because the			 * destination is the loopback device and not the bridge. */			if (err != -EHOSTUNREACH || !in_dev || IN_DEV_FORWARD(in_dev))				goto free_skb;			if (!ip_route_output_key(&rt, &fl)) {				/* - Bridged-and-DNAT'ed traffic doesn't				 *   require ip_forwarding. */				if (((struct dst_entry *)rt)->dev == dev) {					skb->dst = (struct dst_entry *)rt;					goto bridged_dnat;				}				/* we are sure that forwarding is disabled, so printing				 * this message is no problem. Note that the packet could				 * still have a martian destination address, in which case				 * the packet could be dropped even if forwarding were enabled */				__br_dnat_complain();				dst_release((struct dst_entry *)rt);			}free_skb:			kfree_skb(skb);			return 0;		} else {			if (skb->dst->dev == dev) {bridged_dnat:				/* Tell br_nf_local_out this is a				 * bridged frame */				nf_bridge->mask |= BRNF_BRIDGED_DNAT;				skb->dev = nf_bridge->physindev;				nf_bridge_push_encap_header(skb);				NF_HOOK_THRESH(PF_BRIDGE, NF_BR_PRE_ROUTING,					       skb, skb->dev, NULL,					       br_nf_pre_routing_finish_bridge,					       1);				return 0;			}			memcpy(eth_hdr(skb)->h_dest, dev->dev_addr, ETH_ALEN);			skb->pkt_type = PACKET_HOST;		}	} else {		skb->dst = (struct dst_entry *)&__fake_rtable;		dst_hold(skb->dst);	}	skb->dev = nf_bridge->physindev;	nf_bridge_push_encap_header(skb);	NF_HOOK_THRESH(PF_BRIDGE, NF_BR_PRE_ROUTING, skb, skb->dev, NULL,		       br_handle_frame_finish, 1);	return 0;}/* Some common code for IPv4/IPv6 */static struct net_device *setup_pre_routing(struct sk_buff *skb){	struct nf_bridge_info *nf_bridge = skb->nf_bridge;	if (skb->pkt_type == PACKET_OTHERHOST) {		skb->pkt_type = PACKET_HOST;		nf_bridge->mask |= BRNF_PKT_TYPE;	}	nf_bridge->mask |= BRNF_NF_BRIDGE_PREROUTING;	nf_bridge->physindev = skb->dev;	skb->dev = bridge_parent(skb->dev);	return skb->dev;}/* We only check the length. A bridge shouldn't do any hop-by-hop stuff anyway */static int check_hbh_len(struct sk_buff *skb){	unsigned char *raw = (u8 *)(ipv6_hdr(skb) + 1);	u32 pkt_len;	const unsigned char *nh = skb_network_header(skb);	int off = raw - nh;	int len = (raw[1] + 1) << 3;	if ((raw + len) - skb->data > skb_headlen(skb))		goto bad;	off += 2;	len -= 2;	while (len > 0) {		int optlen = nh[off + 1] + 2;		switch (nh[off]) {		case IPV6_TLV_PAD0:			optlen = 1;			break;		case IPV6_TLV_PADN:			break;		case IPV6_TLV_JUMBO:			if (nh[off + 1] != 4 || (off & 3) != 2)				goto bad;			pkt_len = ntohl(*(__be32 *) (nh + off + 2));			if (pkt_len <= IPV6_MAXPLEN ||			    ipv6_hdr(skb)->payload_len)				goto bad;			if (pkt_len > skb->len - sizeof(struct ipv6hdr))				goto bad;			if (pskb_trim_rcsum(skb,					    pkt_len + sizeof(struct ipv6hdr)))				goto bad;			nh = skb_network_header(skb);			break;		default:			if (optlen > len)				goto bad;			break;		}		off += optlen;		len -= optlen;	}	if (len == 0)		return 0;bad:	return -1;}/* Replicate the checks that IPv6 does on packet reception and pass the packet * to ip6tables, which doesn't support NAT, so things are fairly simple. */static unsigned int br_nf_pre_routing_ipv6(unsigned int hook,					   struct sk_buff *skb,					   const struct net_device *in,					   const struct net_device *out,					   int (*okfn)(struct sk_buff *)){	struct ipv6hdr *hdr;	u32 pkt_len;	if (skb->len < sizeof(struct ipv6hdr))		goto inhdr_error;	if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))		goto inhdr_error;	hdr = ipv6_hdr(skb);	if (hdr->version != 6)		goto inhdr_error;	pkt_len = ntohs(hdr->payload_len);	if (pkt_len || hdr->nexthdr != NEXTHDR_HOP) {		if (pkt_len + sizeof(struct ipv6hdr) > skb->len)			goto inhdr_error;		if (pskb_trim_rcsum(skb, pkt_len + sizeof(struct ipv6hdr)))			goto inhdr_error;	}	if (hdr->nexthdr == NEXTHDR_HOP && check_hbh_len(skb))		goto inhdr_error;	nf_bridge_put(skb->nf_bridge);	if (!nf_bridge_alloc(skb))
12 下一页
💿 文件大小 57701 K
👤 上传用户 huanzhudev
📂 所属分类网络
🏷️ 相关标签

#linux #内核 #源代码
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -