Commit | Line | Data |
---|---|---|
f6ebe77f | 1 | #include <linux/kernel.h> |
5a0e3ad6 | 2 | #include <linux/slab.h> |
f6ebe77f HW |
3 | #include <linux/init.h> |
4 | #include <linux/module.h> | |
5 | #include <linux/proc_fs.h> | |
6 | #include <linux/skbuff.h> | |
7 | #include <linux/netfilter.h> | |
bbd86b9f | 8 | #include <linux/seq_file.h> |
7a11b984 | 9 | #include <linux/rcupdate.h> |
f6ebe77f | 10 | #include <net/protocol.h> |
c01cd429 | 11 | #include <net/netfilter/nf_queue.h> |
f6ebe77f HW |
12 | |
13 | #include "nf_internals.h" | |
14 | ||
/*
 * A queue handler may be registered for each protocol.  Each is protected by
 * a long term mutex.  The handler must provide an outfn() to accept packets
 * for queueing and must reinject all packets it receives, no matter what.
 */
/*
 * Per-protocol-family handler table, indexed by pf.  Slots are written with
 * rcu_assign_pointer() while holding queue_handler_mutex and read with
 * rcu_dereference() inside rcu_read_lock() sections.  A NULL slot means no
 * handler is registered for that family.
 */
static const struct nf_queue_handler *queue_handler[NFPROTO_NUMPROTO] __read_mostly;

/* Serialises every update of queue_handler[]. */
static DEFINE_MUTEX(queue_handler_mutex);
f6ebe77f | 23 | |
d72367b6 HW |
24 | /* return EBUSY when somebody else is registered, return EEXIST if the |
25 | * same handler is registered, return 0 in case of success. */ | |
76108cea | 26 | int nf_register_queue_handler(u_int8_t pf, const struct nf_queue_handler *qh) |
601e68e1 | 27 | { |
f6ebe77f HW |
28 | int ret; |
29 | ||
7e9c6eeb | 30 | if (pf >= ARRAY_SIZE(queue_handler)) |
f6ebe77f HW |
31 | return -EINVAL; |
32 | ||
585426fd | 33 | mutex_lock(&queue_handler_mutex); |
d72367b6 HW |
34 | if (queue_handler[pf] == qh) |
35 | ret = -EEXIST; | |
36 | else if (queue_handler[pf]) | |
f6ebe77f HW |
37 | ret = -EBUSY; |
38 | else { | |
585426fd | 39 | rcu_assign_pointer(queue_handler[pf], qh); |
f6ebe77f HW |
40 | ret = 0; |
41 | } | |
585426fd | 42 | mutex_unlock(&queue_handler_mutex); |
f6ebe77f HW |
43 | |
44 | return ret; | |
45 | } | |
46 | EXPORT_SYMBOL(nf_register_queue_handler); | |
47 | ||
48 | /* The caller must flush their queue before this */ | |
76108cea | 49 | int nf_unregister_queue_handler(u_int8_t pf, const struct nf_queue_handler *qh) |
f6ebe77f | 50 | { |
7e9c6eeb | 51 | if (pf >= ARRAY_SIZE(queue_handler)) |
f6ebe77f HW |
52 | return -EINVAL; |
53 | ||
585426fd | 54 | mutex_lock(&queue_handler_mutex); |
94be1a3f | 55 | if (queue_handler[pf] && queue_handler[pf] != qh) { |
585426fd | 56 | mutex_unlock(&queue_handler_mutex); |
ce7663d8 YK |
57 | return -EINVAL; |
58 | } | |
59 | ||
585426fd YK |
60 | rcu_assign_pointer(queue_handler[pf], NULL); |
61 | mutex_unlock(&queue_handler_mutex); | |
62 | ||
63 | synchronize_rcu(); | |
601e68e1 | 64 | |
f6ebe77f HW |
65 | return 0; |
66 | } | |
67 | EXPORT_SYMBOL(nf_unregister_queue_handler); | |
68 | ||
e3ac5298 | 69 | void nf_unregister_queue_handlers(const struct nf_queue_handler *qh) |
f6ebe77f | 70 | { |
76108cea | 71 | u_int8_t pf; |
f6ebe77f | 72 | |
585426fd | 73 | mutex_lock(&queue_handler_mutex); |
7e9c6eeb | 74 | for (pf = 0; pf < ARRAY_SIZE(queue_handler); pf++) { |
bbd86b9f | 75 | if (queue_handler[pf] == qh) |
585426fd | 76 | rcu_assign_pointer(queue_handler[pf], NULL); |
f6ebe77f | 77 | } |
585426fd YK |
78 | mutex_unlock(&queue_handler_mutex); |
79 | ||
80 | synchronize_rcu(); | |
f6ebe77f HW |
81 | } |
82 | EXPORT_SYMBOL_GPL(nf_unregister_queue_handlers); | |
83 | ||
daaa8be2 PM |
84 | static void nf_queue_entry_release_refs(struct nf_queue_entry *entry) |
85 | { | |
86 | /* Release those devices we held, or Alexey will kill me. */ | |
87 | if (entry->indev) | |
88 | dev_put(entry->indev); | |
89 | if (entry->outdev) | |
90 | dev_put(entry->outdev); | |
91 | #ifdef CONFIG_BRIDGE_NETFILTER | |
92 | if (entry->skb->nf_bridge) { | |
93 | struct nf_bridge_info *nf_bridge = entry->skb->nf_bridge; | |
94 | ||
95 | if (nf_bridge->physindev) | |
96 | dev_put(nf_bridge->physindev); | |
97 | if (nf_bridge->physoutdev) | |
98 | dev_put(nf_bridge->physoutdev); | |
99 | } | |
100 | #endif | |
101 | /* Drop reference to owner of hook which queued us. */ | |
102 | module_put(entry->elem->owner); | |
103 | } | |
104 | ||
/*
 * Any packet that leaves via this function must come back
 * through nf_reinject().
 *
 * Builds an nf_queue_entry describing @skb and the hook it was queued from
 * and passes it to the outfn() of the handler registered for @pf, using
 * queue number @queuenum.
 *
 * Returns 0 only when the module owning the hook is going away; in that
 * case the entry is freed and @skb is left untouched for the caller.
 * Returns 1 in every other case: either the handler accepted the entry, or
 * @skb (and the entry, if one was allocated) was freed here because no
 * handler or afinfo was available, the allocation failed, or outfn()
 * returned a negative status.
 */
static int __nf_queue(struct sk_buff *skb,
		      struct list_head *elem,
		      u_int8_t pf, unsigned int hook,
		      struct net_device *indev,
		      struct net_device *outdev,
		      int (*okfn)(struct sk_buff *),
		      unsigned int queuenum)
{
	int status;
	/* Stays NULL on the early error paths so kfree(entry) below is a no-op. */
	struct nf_queue_entry *entry = NULL;
#ifdef CONFIG_BRIDGE_NETFILTER
	struct net_device *physindev;
	struct net_device *physoutdev;
#endif
	const struct nf_afinfo *afinfo;
	const struct nf_queue_handler *qh;

	/* QUEUE == DROP if no one is waiting, to be safe. */
	rcu_read_lock();

	qh = rcu_dereference(queue_handler[pf]);
	if (!qh)
		goto err_unlock;

	afinfo = nf_get_afinfo(pf);
	if (!afinfo)
		goto err_unlock;

	/* The entry is followed by route_key_size extra bytes for saveroute(). */
	entry = kmalloc(sizeof(*entry) + afinfo->route_key_size, GFP_ATOMIC);
	if (!entry)
		goto err_unlock;

	*entry = (struct nf_queue_entry) {
		.skb = skb,
		.elem = list_entry(elem, struct nf_hook_ops, list),
		.pf = pf,
		.hook = hook,
		.indev = indev,
		.outdev = outdev,
		.okfn = okfn,
	};

	/* If it's going away, ignore hook. */
	if (!try_module_get(entry->elem->owner)) {
		rcu_read_unlock();
		kfree(entry);
		return 0;
	}

	/* Bump dev refs so they don't vanish while packet is out */
	if (indev)
		dev_hold(indev);
	if (outdev)
		dev_hold(outdev);
#ifdef CONFIG_BRIDGE_NETFILTER
	if (skb->nf_bridge) {
		physindev = skb->nf_bridge->physindev;
		if (physindev)
			dev_hold(physindev);
		physoutdev = skb->nf_bridge->physoutdev;
		if (physoutdev)
			dev_hold(physoutdev);
	}
#endif
	afinfo->saveroute(skb, entry);
	/* Hand the entry to the handler while still inside the RCU section. */
	status = qh->outfn(entry, queuenum);

	rcu_read_unlock();

	if (status < 0) {
		/* Handler refused the entry: undo the references taken above. */
		nf_queue_entry_release_refs(entry);
		goto err;
	}

	return 1;

err_unlock:
	rcu_read_unlock();
err:
	kfree_skb(skb);
	kfree(entry);
	return 1;
}
192 | ||
394f545d PM |
193 | int nf_queue(struct sk_buff *skb, |
194 | struct list_head *elem, | |
76108cea | 195 | u_int8_t pf, unsigned int hook, |
394f545d PM |
196 | struct net_device *indev, |
197 | struct net_device *outdev, | |
198 | int (*okfn)(struct sk_buff *), | |
199 | unsigned int queuenum) | |
200 | { | |
201 | struct sk_buff *segs; | |
202 | ||
203 | if (!skb_is_gso(skb)) | |
204 | return __nf_queue(skb, elem, pf, hook, indev, outdev, okfn, | |
205 | queuenum); | |
206 | ||
207 | switch (pf) { | |
4b1e27e9 | 208 | case NFPROTO_IPV4: |
394f545d PM |
209 | skb->protocol = htons(ETH_P_IP); |
210 | break; | |
4b1e27e9 | 211 | case NFPROTO_IPV6: |
394f545d PM |
212 | skb->protocol = htons(ETH_P_IPV6); |
213 | break; | |
214 | } | |
215 | ||
216 | segs = skb_gso_segment(skb, 0); | |
217 | kfree_skb(skb); | |
801678c5 | 218 | if (IS_ERR(segs)) |
394f545d PM |
219 | return 1; |
220 | ||
221 | do { | |
222 | struct sk_buff *nskb = segs->next; | |
223 | ||
224 | segs->next = NULL; | |
225 | if (!__nf_queue(segs, elem, pf, hook, indev, outdev, okfn, | |
226 | queuenum)) | |
227 | kfree_skb(segs); | |
228 | segs = nskb; | |
229 | } while (segs); | |
230 | return 1; | |
231 | } | |
232 | ||
02f014d8 | 233 | void nf_reinject(struct nf_queue_entry *entry, unsigned int verdict) |
f6ebe77f | 234 | { |
02f014d8 PM |
235 | struct sk_buff *skb = entry->skb; |
236 | struct list_head *elem = &entry->elem->list; | |
1e796fda | 237 | const struct nf_afinfo *afinfo; |
f6ebe77f HW |
238 | |
239 | rcu_read_lock(); | |
240 | ||
daaa8be2 | 241 | nf_queue_entry_release_refs(entry); |
f6ebe77f | 242 | |
f6ebe77f HW |
243 | /* Continue traversal iff userspace said ok... */ |
244 | if (verdict == NF_REPEAT) { | |
245 | elem = elem->prev; | |
246 | verdict = NF_ACCEPT; | |
247 | } | |
248 | ||
7a11b984 | 249 | if (verdict == NF_ACCEPT) { |
02f014d8 PM |
250 | afinfo = nf_get_afinfo(entry->pf); |
251 | if (!afinfo || afinfo->reroute(skb, entry) < 0) | |
7a11b984 PM |
252 | verdict = NF_DROP; |
253 | } | |
254 | ||
f6ebe77f HW |
255 | if (verdict == NF_ACCEPT) { |
256 | next_hook: | |
02f014d8 PM |
257 | verdict = nf_iterate(&nf_hooks[entry->pf][entry->hook], |
258 | skb, entry->hook, | |
259 | entry->indev, entry->outdev, &elem, | |
260 | entry->okfn, INT_MIN); | |
f6ebe77f HW |
261 | } |
262 | ||
263 | switch (verdict & NF_VERDICT_MASK) { | |
264 | case NF_ACCEPT: | |
3bc38712 | 265 | case NF_STOP: |
4b3d15ef | 266 | local_bh_disable(); |
02f014d8 | 267 | entry->okfn(skb); |
4b3d15ef | 268 | local_bh_enable(); |
f6ebe77f | 269 | break; |
f6ebe77f | 270 | case NF_QUEUE: |
02f014d8 PM |
271 | if (!__nf_queue(skb, elem, entry->pf, entry->hook, |
272 | entry->indev, entry->outdev, entry->okfn, | |
394f545d | 273 | verdict >> NF_VERDICT_BITS)) |
f6ebe77f HW |
274 | goto next_hook; |
275 | break; | |
64507fdb | 276 | case NF_STOLEN: |
3bc38712 PM |
277 | default: |
278 | kfree_skb(skb); | |
f6ebe77f HW |
279 | } |
280 | rcu_read_unlock(); | |
02f014d8 | 281 | kfree(entry); |
f6ebe77f HW |
282 | } |
283 | EXPORT_SYMBOL(nf_reinject); | |
284 | ||
bbd86b9f HW |
285 | #ifdef CONFIG_PROC_FS |
286 | static void *seq_start(struct seq_file *seq, loff_t *pos) | |
287 | { | |
7e9c6eeb | 288 | if (*pos >= ARRAY_SIZE(queue_handler)) |
bbd86b9f HW |
289 | return NULL; |
290 | ||
291 | return pos; | |
292 | } | |
293 | ||
294 | static void *seq_next(struct seq_file *s, void *v, loff_t *pos) | |
295 | { | |
296 | (*pos)++; | |
297 | ||
7e9c6eeb | 298 | if (*pos >= ARRAY_SIZE(queue_handler)) |
bbd86b9f HW |
299 | return NULL; |
300 | ||
301 | return pos; | |
302 | } | |
303 | ||
/* seq_file stop callback: intentionally empty, the iterator holds nothing. */
static void seq_stop(struct seq_file *s, void *v)
{

}
308 | ||
309 | static int seq_show(struct seq_file *s, void *v) | |
310 | { | |
311 | int ret; | |
312 | loff_t *pos = v; | |
e3ac5298 | 313 | const struct nf_queue_handler *qh; |
bbd86b9f | 314 | |
585426fd YK |
315 | rcu_read_lock(); |
316 | qh = rcu_dereference(queue_handler[*pos]); | |
bbd86b9f HW |
317 | if (!qh) |
318 | ret = seq_printf(s, "%2lld NONE\n", *pos); | |
319 | else | |
320 | ret = seq_printf(s, "%2lld %s\n", *pos, qh->name); | |
585426fd | 321 | rcu_read_unlock(); |
bbd86b9f HW |
322 | |
323 | return ret; | |
324 | } | |
325 | ||
56b3d975 | 326 | static const struct seq_operations nfqueue_seq_ops = { |
bbd86b9f HW |
327 | .start = seq_start, |
328 | .next = seq_next, | |
329 | .stop = seq_stop, | |
330 | .show = seq_show, | |
331 | }; | |
332 | ||
333 | static int nfqueue_open(struct inode *inode, struct file *file) | |
334 | { | |
335 | return seq_open(file, &nfqueue_seq_ops); | |
336 | } | |
337 | ||
da7071d7 | 338 | static const struct file_operations nfqueue_file_ops = { |
bbd86b9f HW |
339 | .owner = THIS_MODULE, |
340 | .open = nfqueue_open, | |
341 | .read = seq_read, | |
342 | .llseek = seq_lseek, | |
343 | .release = seq_release, | |
344 | }; | |
345 | #endif /* PROC_FS */ | |
346 | ||
347 | ||
f6ebe77f HW |
348 | int __init netfilter_queue_init(void) |
349 | { | |
bbd86b9f | 350 | #ifdef CONFIG_PROC_FS |
8eeee8b1 DL |
351 | if (!proc_create("nf_queue", S_IRUGO, |
352 | proc_net_netfilter, &nfqueue_file_ops)) | |
bbd86b9f | 353 | return -1; |
bbd86b9f | 354 | #endif |
f6ebe77f HW |
355 | return 0; |
356 | } | |
357 |