2 * IPv6 specific functions of netfilter core
4 * Rusty Russell (C) 2000 -- This code is GPL.
5 * Patrick McHardy (C) 2006-2012
7 #include <linux/kernel.h>
8 #include <linux/init.h>
9 #include <linux/ipv6.h>
10 #include <linux/netfilter.h>
11 #include <linux/netfilter_ipv6.h>
12 #include <linux/export.h>
13 #include <net/addrconf.h>
16 #include <net/ip6_route.h>
18 #include <net/netfilter/nf_queue.h>
19 #include <net/netfilter/nf_conntrack_bridge.h>
20 #include <net/netfilter/ipv6/nf_defrag_ipv6.h>
21 #include "../bridge/br_private.h"
/*
 * ip6_route_me_harder - redo the IPv6 output route lookup for @skb.
 *
 * NOTE(review): this excerpt omits several original lines (braces, some
 * declarations, else/return statements and error paths), so only the steps
 * that are visible here are described.
 *
 * Visible steps:
 *  - seed a flow key (fl6) with the packet mark and the socket's uid;
 *  - pick the output interface used for the lookup;
 *  - call ip6_route_output() and attach the result with skb_dst_set();
 *  - for packets not yet marked IP6SKB_XFRM_TRANSFORMED, run the route
 *    through xfrm_lookup() and attach that result instead;
 *  - expand the skb head when the headroom is smaller than the
 *    hard_header_len of the (possibly new) output device.
 */
23 int ip6_route_me_harder(struct net *net, struct sock *sk_partial, struct sk_buff *skb)
25 const struct ipv6hdr *iph = ipv6_hdr(skb);
/* The rest of the function works on the sk_to_full_sk() result, not on sk_partial. */
26 struct sock *sk = sk_to_full_sk(sk_partial);
27 struct net_device *dev = skb_dst(skb)->dev;
28 struct flow_keys flkeys;
30 struct dst_entry *dst;
/* Non-zero when the destination address is multicast or link-local. */
31 int strict = (ipv6_addr_type(&iph->daddr) &
32 (IPV6_ADDR_MULTICAST | IPV6_ADDR_LINKLOCAL));
34 .flowi6_mark = skb->mark,
35 .flowi6_uid = sock_net_uid(net, sk),
/* A socket bound to a device dictates the output interface. */
41 if (sk && sk->sk_bound_dev_if)
42 fl6.flowi6_oif = sk->sk_bound_dev_if;
/*
 * NOTE(review): the conditions selecting between the next two assignments
 * are not visible in this excerpt -- confirm against the full source.
 */
44 fl6.flowi6_oif = dev->ifindex;
46 fl6.flowi6_oif = l3mdev_master_ifindex(dev);
48 fib6_rules_early_flow_dissect(net, skb, &fl6, &flkeys);
49 dst = ip6_route_output(net, sk, &fl6);
/*
 * Counts an OUTNOROUTES event and emits a rate-limited debug message;
 * presumably reached only when the lookup above failed (the guarding
 * condition is not visible here).
 */
52 IP6_INC_STATS(net, ip6_dst_idev(dst), IPSTATS_MIB_OUTNOROUTES);
53 net_dbg_ratelimited("ip6_route_me_harder: No more route\n");
61 skb_dst_set(skb, dst);
/*
 * Only consult xfrm when the packet has not already been transformed and
 * its flow could be decoded (xfrm_decode_session() returned 0).  The skb's
 * dst pointer is cleared first; the route itself is handed to
 * xfrm_lookup() and whatever it returns is attached afterwards.
 */
64 if (!(IP6CB(skb)->flags & IP6SKB_XFRM_TRANSFORMED) &&
65 xfrm_decode_session(skb, flowi6_to_flowi(&fl6), AF_INET6) == 0) {
66 skb_dst_set(skb, NULL);
67 dst = xfrm_lookup(net, dst, flowi6_to_flowi(&fl6), sk, 0);
70 skb_dst_set(skb, dst);
74 /* Change in oif may mean change in hh_len. */
75 hh_len = skb_dst(skb)->dev->hard_header_len;
76 if (skb_headroom(skb) < hh_len &&
77 pskb_expand_head(skb, HH_DATA_ALIGN(hh_len - skb_headroom(skb)),
83 EXPORT_SYMBOL(ip6_route_me_harder);
/*
 * nf_ip6_reroute - re-route a queued packet if its routing key changed.
 *
 * Only entries whose hook is NF_INET_LOCAL_OUT are examined.  The packet's
 * current destination address, source address and mark are compared with
 * the values held in the entry's ip6_rt_info; if any of them differs,
 * ip6_route_me_harder() is called and its result is returned.
 *
 * NOTE(review): the return for the "nothing changed" / other-hook case is
 * not visible in this excerpt.
 */
85 static int nf_ip6_reroute(struct sk_buff *skb,
86 const struct nf_queue_entry *entry)
88 struct ip6_rt_info *rt_info = nf_queue_entry_reroute(entry);
90 if (entry->state.hook == NF_INET_LOCAL_OUT) {
91 const struct ipv6hdr *iph = ipv6_hdr(skb);
/* Any difference in daddr, saddr or mark triggers a fresh route lookup. */
92 if (!ipv6_addr_equal(&iph->daddr, &rt_info->daddr) ||
93 !ipv6_addr_equal(&iph->saddr, &rt_info->saddr) ||
94 skb->mark != rt_info->mark)
95 return ip6_route_me_harder(entry->state.net, entry->state.sk, skb);
/*
 * __nf_ip6_route - IPv6 output route lookup on behalf of netfilter.
 *
 * Calls ip6_route_output() with the IPv6 part of @fl.  When @strict is
 * true, a static dummy socket whose sk_bound_dev_if is 1 is passed as the
 * socket argument; otherwise NULL is passed.
 *
 * NOTE(review): how the lookup result is validated and stored through @dst,
 * and the value returned, are not visible in this excerpt.
 */
100 int __nf_ip6_route(struct net *net, struct dst_entry **dst,
101 struct flowi *fl, bool strict)
/* Zero-initialised placeholder that the dummy socket's pinet6 points at. */
103 static const struct ipv6_pinfo fake_pinfo;
104 static const struct inet_sock fake_sk = {
105 /* makes ip6_route_output set RT6_LOOKUP_F_IFACE: */
106 .sk.sk_bound_dev_if = 1,
107 .pinet6 = (struct ipv6_pinfo *) &fake_pinfo,
/* The dummy socket is only used for strict lookups. */
109 const void *sk = strict ? &fake_sk : NULL;
110 struct dst_entry *result;
113 result = ip6_route_output(net, sk, &fl->u.ip6);
121 EXPORT_SYMBOL_GPL(__nf_ip6_route);
/*
 * br_ip6_fragment - split @skb into IPv6 fragments and pass each one to
 * @output together with @data.
 *
 * NOTE(review): this excerpt omits labels, gotos, some declarations and
 * comment terminators, so the outcome of each failed check is not visible
 * here; only the checks themselves are described.
 *
 * Visible steps:
 *  - ip6_find_1stfragopt() locates the fragmentation point (prevhdr);
 *  - frag_max_size (taken from BR_INPUT_SKB_CB) is tested against mtu and
 *    IPV6_MIN_MTU; mtu's assignment is not visible in this excerpt;
 *  - mtu must leave room for hlen, a fragment header and 8 more bytes;
 *    hlen and the fragment header are then subtracted from mtu;
 *  - a fragment id is chosen with ipv6_select_ident();
 *  - a CHECKSUM_PARTIAL skb is run through skb_checksum_help();
 *  - if the skb has a frag list, the first buffer and every list member are
 *    size/headroom checked and the ip6_fraglist_* helpers emit the pieces;
 *  - otherwise ip6_frag_init()/ip6_frag_next() generate the pieces in a
 *    loop while state.left > 0.
 * In both paths the skb->tstamp value saved on entry is written to each
 * fragment before @output is called.
 */
123 int br_ip6_fragment(struct net *net, struct sock *sk, struct sk_buff *skb,
124 struct nf_bridge_frag_data *data,
125 int (*output)(struct net *, struct sock *sk,
126 const struct nf_bridge_frag_data *data,
129 int frag_max_size = BR_INPUT_SKB_CB(skb)->frag_max_size;
/* Saved so it can be copied onto every fragment before output. */
130 ktime_t tstamp = skb->tstamp;
131 struct ip6_frag_state state;
132 u8 *prevhdr, nexthdr = 0;
133 unsigned int mtu, hlen;
137 err = ip6_find_1stfragopt(skb, &prevhdr);
/* frag_max_size must lie within [IPV6_MIN_MTU, mtu]. */
144 if (frag_max_size > mtu ||
145 frag_max_size < IPV6_MIN_MTU)
/* Need room for the headers, a fragment header and at least 8 more bytes. */
149 if (mtu < hlen + sizeof(struct frag_hdr) + 8)
/* From here on mtu excludes the headers and the fragment header. */
151 mtu -= hlen + sizeof(struct frag_hdr);
153 frag_id = ipv6_select_ident(net, &ipv6_hdr(skb)->daddr,
154 &ipv6_hdr(skb)->saddr);
/* A pending partial checksum is resolved via skb_checksum_help(). */
156 if (skb->ip_summed == CHECKSUM_PARTIAL &&
157 (err = skb_checksum_help(skb)))
160 hroom = LL_RESERVED_SPACE(skb->dev);
161 if (skb_has_frag_list(skb)) {
162 unsigned int first_len = skb_pagelen(skb);
163 struct ip6_fraglist_iter iter;
164 struct sk_buff *frag2;
/*
 * First buffer: payload beyond hlen must fit in mtu, and headroom must
 * cover the link-layer reserve plus a fragment header.
 */
166 if (first_len - hlen > mtu ||
167 skb_headroom(skb) < (hroom + sizeof(struct frag_hdr)))
/*
 * Every list member must fit in mtu and have headroom for hlen, the
 * link-layer reserve and a fragment header.
 */
173 skb_walk_frags(skb, frag2) {
174 if (frag2->len > mtu ||
175 skb_headroom(frag2) < (hlen + hroom + sizeof(struct frag_hdr)))
178 /* Partially cloned skb? */
179 if (skb_shared(frag2))
183 err = ip6_fraglist_init(skb, hlen, prevhdr, nexthdr, frag_id,
189 /* Prepare header of the next frame,
190 * before previous one went down.
193 ip6_fraglist_prepare(skb, &iter);
195 skb->tstamp = tstamp;
196 err = output(net, sk, data, skb);
197 if (err || !iter.frag)
200 skb = ip6_fraglist_next(&iter);
207 kfree_skb_list(iter.frag);
211 /* This is a linearized skbuff, the original geometry is lost for us.
212 * This may also be a clone skbuff, we could preserve the geometry for
213 * the copies but probably not worth the effort.
215 ip6_frag_init(skb, hlen, mtu, skb->dev->needed_tailroom,
216 LL_RESERVED_SPACE(skb->dev), prevhdr, nexthdr, frag_id,
219 while (state.left > 0) {
220 struct sk_buff *skb2;
222 skb2 = ip6_frag_next(skb, &state);
228 skb2->tstamp = tstamp;
229 err = output(net, sk, data, skb2);
240 EXPORT_SYMBOL_GPL(br_ip6_fragment);
/*
 * IPv6 callback table; ipv6_netfilter_init() installs its address in
 * nf_ipv6_ops.
 *
 * Members listed after an "#if IS_MODULE(CONFIG_IPV6)" line are compiled in
 * only when IPv6 is built as a module; the two cookie callbacks additionally
 * depend on CONFIG_SYN_COOKIES being enabled.  route_input, fragment and
 * reroute appear after the cookie entries and before the second IS_MODULE
 * guard.
 *
 * NOTE(review): the matching #endif lines are missing from this excerpt, so
 * the exact extent and nesting of each conditional region should be
 * confirmed against the full source.
 */
242 static const struct nf_ipv6_ops ipv6ops = {
243 #if IS_MODULE(CONFIG_IPV6)
244 .chk_addr = ipv6_chk_addr,
245 .route_me_harder = ip6_route_me_harder,
246 .dev_get_saddr = ipv6_dev_get_saddr,
247 .route = __nf_ip6_route,
248 #if IS_ENABLED(CONFIG_SYN_COOKIES)
249 .cookie_init_sequence = __cookie_v6_init_sequence,
250 .cookie_v6_check = __cookie_v6_check,
253 .route_input = ip6_route_input,
254 .fragment = ip6_fragment,
255 .reroute = nf_ip6_reroute,
256 #if IS_MODULE(CONFIG_IPV6)
257 .br_fragment = br_ip6_fragment,
/*
 * ipv6_netfilter_init - install ipv6ops as the nf_ipv6_ops table.
 *
 * NOTE(review): the return statement is not visible in this excerpt.
 */
261 int __init ipv6_netfilter_init(void)
263 RCU_INIT_POINTER(nf_ipv6_ops, &ipv6ops);
/* ipv6_netfilter_fini - reset nf_ipv6_ops to NULL via RCU_INIT_POINTER(). */
267 /* This can be called from inet6_init() on errors, so it cannot
268 * be marked __exit. -DaveM
270 void ipv6_netfilter_fini(void)
272 RCU_INIT_POINTER(nf_ipv6_ops, NULL);