1 /*
2  * Rusty Russell (C)2000 -- This code is GPL.
3  * Patrick McHardy (c) 2006-2012
4  */
5 
6 #include <linux/kernel.h>
7 #include <linux/slab.h>
8 #include <linux/init.h>
9 #include <linux/module.h>
10 #include <linux/proc_fs.h>
11 #include <linux/skbuff.h>
12 #include <linux/netfilter.h>
13 #include <linux/netfilter_ipv4.h>
14 #include <linux/netfilter_ipv6.h>
15 #include <linux/netfilter_bridge.h>
16 #include <linux/seq_file.h>
17 #include <linux/rcupdate.h>
18 #include <net/protocol.h>
19 #include <net/netfilter/nf_queue.h>
20 #include <net/dst.h>
21 
22 #include "nf_internals.h"
23 
24 static const struct nf_queue_handler __rcu *nf_queue_handler;
25 
26 /*
27  * Hook for nfnetlink_queue to register its queue handler.
28  * We do this so that most of the NFQUEUE code can be modular.
29  *
30  * Once the queue is registered it must reinject all packets it
31  * receives, no matter what.
32  */
33 
nf_register_queue_handler(const struct nf_queue_handler * qh)34 void nf_register_queue_handler(const struct nf_queue_handler *qh)
35 {
36 	/* should never happen, we only have one queueing backend in kernel */
37 	WARN_ON(rcu_access_pointer(nf_queue_handler));
38 	rcu_assign_pointer(nf_queue_handler, qh);
39 }
40 EXPORT_SYMBOL(nf_register_queue_handler);
41 
42 /* The caller must flush their queue before this */
nf_unregister_queue_handler(void)43 void nf_unregister_queue_handler(void)
44 {
45 	RCU_INIT_POINTER(nf_queue_handler, NULL);
46 }
47 EXPORT_SYMBOL(nf_unregister_queue_handler);
48 
nf_queue_sock_put(struct sock * sk)49 static void nf_queue_sock_put(struct sock *sk)
50 {
51 #ifdef CONFIG_INET
52 	sock_gen_put(sk);
53 #else
54 	sock_put(sk);
55 #endif
56 }
57 
nf_queue_entry_release_refs(struct nf_queue_entry * entry)58 static void nf_queue_entry_release_refs(struct nf_queue_entry *entry)
59 {
60 	struct nf_hook_state *state = &entry->state;
61 
62 	/* Release those devices we held, or Alexey will kill me. */
63 	dev_put(state->in);
64 	dev_put(state->out);
65 	if (state->sk)
66 		nf_queue_sock_put(state->sk);
67 
68 #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER)
69 	dev_put(entry->physin);
70 	dev_put(entry->physout);
71 #endif
72 }
73 
nf_queue_entry_free(struct nf_queue_entry * entry)74 void nf_queue_entry_free(struct nf_queue_entry *entry)
75 {
76 	nf_queue_entry_release_refs(entry);
77 	kfree(entry);
78 }
79 EXPORT_SYMBOL_GPL(nf_queue_entry_free);
80 
__nf_queue_entry_init_physdevs(struct nf_queue_entry * entry)81 static void __nf_queue_entry_init_physdevs(struct nf_queue_entry *entry)
82 {
83 #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER)
84 	const struct sk_buff *skb = entry->skb;
85 
86 	if (nf_bridge_info_exists(skb)) {
87 		entry->physin = nf_bridge_get_physindev(skb, entry->state.net);
88 		entry->physout = nf_bridge_get_physoutdev(skb);
89 	} else {
90 		entry->physin = NULL;
91 		entry->physout = NULL;
92 	}
93 #endif
94 }
95 
96 /* Bump dev refs so they don't vanish while packet is out */
nf_queue_entry_get_refs(struct nf_queue_entry * entry)97 bool nf_queue_entry_get_refs(struct nf_queue_entry *entry)
98 {
99 	struct nf_hook_state *state = &entry->state;
100 
101 	if (state->sk && !refcount_inc_not_zero(&state->sk->sk_refcnt))
102 		return false;
103 
104 	dev_hold(state->in);
105 	dev_hold(state->out);
106 
107 #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER)
108 	dev_hold(entry->physin);
109 	dev_hold(entry->physout);
110 #endif
111 	return true;
112 }
113 EXPORT_SYMBOL_GPL(nf_queue_entry_get_refs);
114 
nf_queue_nf_hook_drop(struct net * net)115 void nf_queue_nf_hook_drop(struct net *net)
116 {
117 	const struct nf_queue_handler *qh;
118 
119 	rcu_read_lock();
120 	qh = rcu_dereference(nf_queue_handler);
121 	if (qh)
122 		qh->nf_hook_drop(net);
123 	rcu_read_unlock();
124 }
125 EXPORT_SYMBOL_GPL(nf_queue_nf_hook_drop);
126 
nf_ip_saveroute(const struct sk_buff * skb,struct nf_queue_entry * entry)127 static void nf_ip_saveroute(const struct sk_buff *skb,
128 			    struct nf_queue_entry *entry)
129 {
130 	struct ip_rt_info *rt_info = nf_queue_entry_reroute(entry);
131 
132 	if (entry->state.hook == NF_INET_LOCAL_OUT) {
133 		const struct iphdr *iph = ip_hdr(skb);
134 
135 		rt_info->tos = iph->tos;
136 		rt_info->daddr = iph->daddr;
137 		rt_info->saddr = iph->saddr;
138 		rt_info->mark = skb->mark;
139 	}
140 }
141 
nf_ip6_saveroute(const struct sk_buff * skb,struct nf_queue_entry * entry)142 static void nf_ip6_saveroute(const struct sk_buff *skb,
143 			     struct nf_queue_entry *entry)
144 {
145 	struct ip6_rt_info *rt_info = nf_queue_entry_reroute(entry);
146 
147 	if (entry->state.hook == NF_INET_LOCAL_OUT) {
148 		const struct ipv6hdr *iph = ipv6_hdr(skb);
149 
150 		rt_info->daddr = iph->daddr;
151 		rt_info->saddr = iph->saddr;
152 		rt_info->mark = skb->mark;
153 	}
154 }
155 
__nf_queue(struct sk_buff * skb,const struct nf_hook_state * state,unsigned int index,unsigned int queuenum)156 static int __nf_queue(struct sk_buff *skb, const struct nf_hook_state *state,
157 		      unsigned int index, unsigned int queuenum)
158 {
159 	struct nf_queue_entry *entry = NULL;
160 	const struct nf_queue_handler *qh;
161 	unsigned int route_key_size;
162 	int status;
163 
164 	/* QUEUE == DROP if no one is waiting, to be safe. */
165 	qh = rcu_dereference(nf_queue_handler);
166 	if (!qh)
167 		return -ESRCH;
168 
169 	switch (state->pf) {
170 	case AF_INET:
171 		route_key_size = sizeof(struct ip_rt_info);
172 		break;
173 	case AF_INET6:
174 		route_key_size = sizeof(struct ip6_rt_info);
175 		break;
176 	default:
177 		route_key_size = 0;
178 		break;
179 	}
180 
181 	if (skb_sk_is_prefetched(skb)) {
182 		struct sock *sk = skb->sk;
183 
184 		if (!sk_is_refcounted(sk)) {
185 			if (!refcount_inc_not_zero(&sk->sk_refcnt))
186 				return -ENOTCONN;
187 
188 			/* drop refcount on skb_orphan */
189 			skb->destructor = sock_edemux;
190 		}
191 	}
192 
193 	entry = kmalloc(sizeof(*entry) + route_key_size, GFP_ATOMIC);
194 	if (!entry)
195 		return -ENOMEM;
196 
197 	if (skb_dst(skb) && !skb_dst_force(skb)) {
198 		kfree(entry);
199 		return -ENETDOWN;
200 	}
201 
202 	*entry = (struct nf_queue_entry) {
203 		.skb	= skb,
204 		.state	= *state,
205 		.hook_index = index,
206 		.size	= sizeof(*entry) + route_key_size,
207 	};
208 
209 	__nf_queue_entry_init_physdevs(entry);
210 
211 	if (!nf_queue_entry_get_refs(entry)) {
212 		kfree(entry);
213 		return -ENOTCONN;
214 	}
215 
216 	switch (entry->state.pf) {
217 	case AF_INET:
218 		nf_ip_saveroute(skb, entry);
219 		break;
220 	case AF_INET6:
221 		nf_ip6_saveroute(skb, entry);
222 		break;
223 	}
224 
225 	status = qh->outfn(entry, queuenum);
226 	if (status < 0) {
227 		nf_queue_entry_free(entry);
228 		return status;
229 	}
230 
231 	return 0;
232 }
233 
234 /* Packets leaving via this function must come back through nf_reinject(). */
nf_queue(struct sk_buff * skb,struct nf_hook_state * state,unsigned int index,unsigned int verdict)235 int nf_queue(struct sk_buff *skb, struct nf_hook_state *state,
236 	     unsigned int index, unsigned int verdict)
237 {
238 	int ret;
239 
240 	ret = __nf_queue(skb, state, index, verdict >> NF_VERDICT_QBITS);
241 	if (ret < 0) {
242 		if (ret == -ESRCH &&
243 		    (verdict & NF_VERDICT_FLAG_QUEUE_BYPASS))
244 			return 1;
245 		kfree_skb(skb);
246 	}
247 
248 	return 0;
249 }
250 EXPORT_SYMBOL_GPL(nf_queue);
251 
nf_iterate(struct sk_buff * skb,struct nf_hook_state * state,const struct nf_hook_entries * hooks,unsigned int * index)252 static unsigned int nf_iterate(struct sk_buff *skb,
253 			       struct nf_hook_state *state,
254 			       const struct nf_hook_entries *hooks,
255 			       unsigned int *index)
256 {
257 	const struct nf_hook_entry *hook;
258 	unsigned int verdict, i = *index;
259 
260 	while (i < hooks->num_hook_entries) {
261 		hook = &hooks->hooks[i];
262 repeat:
263 		verdict = nf_hook_entry_hookfn(hook, skb, state);
264 		if (verdict != NF_ACCEPT) {
265 			*index = i;
266 			if (verdict != NF_REPEAT)
267 				return verdict;
268 			goto repeat;
269 		}
270 		i++;
271 	}
272 
273 	*index = i;
274 	return NF_ACCEPT;
275 }
276 
nf_hook_entries_head(const struct net * net,u8 pf,u8 hooknum)277 static struct nf_hook_entries *nf_hook_entries_head(const struct net *net, u8 pf, u8 hooknum)
278 {
279 	switch (pf) {
280 #ifdef CONFIG_NETFILTER_FAMILY_BRIDGE
281 	case NFPROTO_BRIDGE:
282 		return rcu_dereference(net->nf.hooks_bridge[hooknum]);
283 #endif
284 	case NFPROTO_IPV4:
285 		return rcu_dereference(net->nf.hooks_ipv4[hooknum]);
286 	case NFPROTO_IPV6:
287 		return rcu_dereference(net->nf.hooks_ipv6[hooknum]);
288 	default:
289 		WARN_ON_ONCE(1);
290 		return NULL;
291 	}
292 
293 	return NULL;
294 }
295 
296 /* Caller must hold rcu read-side lock */
nf_reinject(struct nf_queue_entry * entry,unsigned int verdict)297 void nf_reinject(struct nf_queue_entry *entry, unsigned int verdict)
298 {
299 	const struct nf_hook_entry *hook_entry;
300 	const struct nf_hook_entries *hooks;
301 	struct sk_buff *skb = entry->skb;
302 	const struct net *net;
303 	unsigned int i;
304 	int err;
305 	u8 pf;
306 
307 	net = entry->state.net;
308 	pf = entry->state.pf;
309 
310 	hooks = nf_hook_entries_head(net, pf, entry->state.hook);
311 
312 	i = entry->hook_index;
313 	if (WARN_ON_ONCE(!hooks || i >= hooks->num_hook_entries)) {
314 		kfree_skb(skb);
315 		nf_queue_entry_free(entry);
316 		return;
317 	}
318 
319 	hook_entry = &hooks->hooks[i];
320 
321 	/* Continue traversal iff userspace said ok... */
322 	if (verdict == NF_REPEAT)
323 		verdict = nf_hook_entry_hookfn(hook_entry, skb, &entry->state);
324 
325 	if (verdict == NF_ACCEPT) {
326 		if (nf_reroute(skb, entry) < 0)
327 			verdict = NF_DROP;
328 	}
329 
330 	if (verdict == NF_ACCEPT) {
331 next_hook:
332 		++i;
333 		verdict = nf_iterate(skb, &entry->state, hooks, &i);
334 	}
335 
336 	switch (verdict & NF_VERDICT_MASK) {
337 	case NF_ACCEPT:
338 	case NF_STOP:
339 		local_bh_disable();
340 		entry->state.okfn(entry->state.net, entry->state.sk, skb);
341 		local_bh_enable();
342 		break;
343 	case NF_QUEUE:
344 		err = nf_queue(skb, &entry->state, i, verdict);
345 		if (err == 1)
346 			goto next_hook;
347 		break;
348 	case NF_STOLEN:
349 		break;
350 	default:
351 		kfree_skb(skb);
352 	}
353 
354 	nf_queue_entry_free(entry);
355 }
356 EXPORT_SYMBOL(nf_reinject);
357