[IPV6] Remove three method declarations in include/net/ndisc.h.
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / net / core / filter.c
CommitLineData
1da177e4
LT
1/*
2 * Linux Socket Filter - Kernel level socket filtering
3 *
4 * Author:
5 * Jay Schulist <jschlst@samba.org>
6 *
7 * Based on the design of:
8 * - The Berkeley Packet Filter
9 *
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
14 *
15 * Andi Kleen - Fix a few bad bugs and races.
93699863 16 * Kris Katterjohn - Added many additional checks in sk_chk_filter()
1da177e4
LT
17 */
18
19#include <linux/module.h>
20#include <linux/types.h>
1da177e4
LT
21#include <linux/mm.h>
22#include <linux/fcntl.h>
23#include <linux/socket.h>
24#include <linux/in.h>
25#include <linux/inet.h>
26#include <linux/netdevice.h>
27#include <linux/if_packet.h>
28#include <net/ip.h>
29#include <net/protocol.h>
30#include <linux/skbuff.h>
31#include <net/sock.h>
32#include <linux/errno.h>
33#include <linux/timer.h>
34#include <asm/system.h>
35#include <asm/uaccess.h>
40daafc8 36#include <asm/unaligned.h>
1da177e4
LT
37#include <linux/filter.h>
38
39/* No hurry in this branch */
0b05b2a4 40static void *__load_pointer(struct sk_buff *skb, int k)
1da177e4
LT
41{
42 u8 *ptr = NULL;
43
44 if (k >= SKF_NET_OFF)
d56f90a7 45 ptr = skb_network_header(skb) + k - SKF_NET_OFF;
1da177e4 46 else if (k >= SKF_LL_OFF)
98e399f8 47 ptr = skb_mac_header(skb) + k - SKF_LL_OFF;
1da177e4 48
27a884dc 49 if (ptr >= skb->head && ptr < skb_tail_pointer(skb))
1da177e4
LT
50 return ptr;
51 return NULL;
52}
53
0b05b2a4 54static inline void *load_pointer(struct sk_buff *skb, int k,
4ec93edb 55 unsigned int size, void *buffer)
0b05b2a4
PM
56{
57 if (k >= 0)
58 return skb_header_pointer(skb, k, size, buffer);
59 else {
60 if (k >= SKF_AD_OFF)
61 return NULL;
62 return __load_pointer(skb, k);
63 }
64}
65
43db6d65
SH
66/**
67 * sk_filter - run a packet through a socket filter
68 * @sk: sock associated with &sk_buff
69 * @skb: buffer to filter
70 * @needlock: set to 1 if the sock is not locked by caller.
71 *
72 * Run the filter code and then cut skb->data to correct size returned by
73 * sk_run_filter. If pkt_len is 0 we toss packet. If skb->len is smaller
74 * than pkt_len we keep whole skb->data. This is the socket level
75 * wrapper to sk_run_filter. It returns 0 if the packet should
76 * be accepted or -EPERM if the packet should be tossed.
77 *
78 */
79int sk_filter(struct sock *sk, struct sk_buff *skb)
80{
81 int err;
82 struct sk_filter *filter;
83
84 err = security_sock_rcv_skb(sk, skb);
85 if (err)
86 return err;
87
88 rcu_read_lock_bh();
89 filter = rcu_dereference(sk->sk_filter);
90 if (filter) {
91 unsigned int pkt_len = sk_run_filter(skb, filter->insns,
92 filter->len);
93 err = pkt_len ? pskb_trim(skb, pkt_len) : -EPERM;
94 }
95 rcu_read_unlock_bh();
96
97 return err;
98}
99EXPORT_SYMBOL(sk_filter);
100
1da177e4 101/**
2966b66c 102 * sk_run_filter - run a filter on a socket
1da177e4
LT
103 * @skb: buffer to run the filter on
104 * @filter: filter to apply
105 * @flen: length of filter
106 *
107 * Decode and apply filter instructions to the skb->data.
108 * Return length to keep, 0 for none. skb is the data we are
109 * filtering, filter is the array of filter instructions, and
110 * len is the number of filter blocks in the array.
111 */
4bad4dc9 112unsigned int sk_run_filter(struct sk_buff *skb, struct sock_filter *filter, int flen)
1da177e4 113{
1da177e4 114 struct sock_filter *fentry; /* We walk down these */
0b05b2a4 115 void *ptr;
2966b66c
KK
116 u32 A = 0; /* Accumulator */
117 u32 X = 0; /* Index Register */
1da177e4 118 u32 mem[BPF_MEMWORDS]; /* Scratch Memory Store */
0b05b2a4 119 u32 tmp;
1da177e4
LT
120 int k;
121 int pc;
122
123 /*
124 * Process array of filter instructions.
125 */
126 for (pc = 0; pc < flen; pc++) {
127 fentry = &filter[pc];
4ec93edb 128
1da177e4
LT
129 switch (fentry->code) {
130 case BPF_ALU|BPF_ADD|BPF_X:
131 A += X;
132 continue;
133 case BPF_ALU|BPF_ADD|BPF_K:
134 A += fentry->k;
135 continue;
136 case BPF_ALU|BPF_SUB|BPF_X:
137 A -= X;
138 continue;
139 case BPF_ALU|BPF_SUB|BPF_K:
140 A -= fentry->k;
141 continue;
142 case BPF_ALU|BPF_MUL|BPF_X:
143 A *= X;
144 continue;
145 case BPF_ALU|BPF_MUL|BPF_K:
146 A *= fentry->k;
147 continue;
148 case BPF_ALU|BPF_DIV|BPF_X:
149 if (X == 0)
150 return 0;
151 A /= X;
152 continue;
153 case BPF_ALU|BPF_DIV|BPF_K:
1da177e4
LT
154 A /= fentry->k;
155 continue;
156 case BPF_ALU|BPF_AND|BPF_X:
157 A &= X;
158 continue;
159 case BPF_ALU|BPF_AND|BPF_K:
160 A &= fentry->k;
161 continue;
162 case BPF_ALU|BPF_OR|BPF_X:
163 A |= X;
164 continue;
165 case BPF_ALU|BPF_OR|BPF_K:
166 A |= fentry->k;
167 continue;
168 case BPF_ALU|BPF_LSH|BPF_X:
169 A <<= X;
170 continue;
171 case BPF_ALU|BPF_LSH|BPF_K:
172 A <<= fentry->k;
173 continue;
174 case BPF_ALU|BPF_RSH|BPF_X:
175 A >>= X;
176 continue;
177 case BPF_ALU|BPF_RSH|BPF_K:
178 A >>= fentry->k;
179 continue;
180 case BPF_ALU|BPF_NEG:
181 A = -A;
182 continue;
183 case BPF_JMP|BPF_JA:
184 pc += fentry->k;
185 continue;
186 case BPF_JMP|BPF_JGT|BPF_K:
187 pc += (A > fentry->k) ? fentry->jt : fentry->jf;
188 continue;
189 case BPF_JMP|BPF_JGE|BPF_K:
190 pc += (A >= fentry->k) ? fentry->jt : fentry->jf;
191 continue;
192 case BPF_JMP|BPF_JEQ|BPF_K:
193 pc += (A == fentry->k) ? fentry->jt : fentry->jf;
194 continue;
195 case BPF_JMP|BPF_JSET|BPF_K:
196 pc += (A & fentry->k) ? fentry->jt : fentry->jf;
197 continue;
198 case BPF_JMP|BPF_JGT|BPF_X:
199 pc += (A > X) ? fentry->jt : fentry->jf;
200 continue;
201 case BPF_JMP|BPF_JGE|BPF_X:
202 pc += (A >= X) ? fentry->jt : fentry->jf;
203 continue;
204 case BPF_JMP|BPF_JEQ|BPF_X:
205 pc += (A == X) ? fentry->jt : fentry->jf;
206 continue;
207 case BPF_JMP|BPF_JSET|BPF_X:
208 pc += (A & X) ? fentry->jt : fentry->jf;
209 continue;
210 case BPF_LD|BPF_W|BPF_ABS:
211 k = fentry->k;
e35bedf3 212load_w:
0b05b2a4
PM
213 ptr = load_pointer(skb, k, 4, &tmp);
214 if (ptr != NULL) {
252e3346 215 A = ntohl(get_unaligned((__be32 *)ptr));
0b05b2a4 216 continue;
1da177e4 217 }
1198ad00 218 break;
1da177e4
LT
219 case BPF_LD|BPF_H|BPF_ABS:
220 k = fentry->k;
e35bedf3 221load_h:
0b05b2a4
PM
222 ptr = load_pointer(skb, k, 2, &tmp);
223 if (ptr != NULL) {
252e3346 224 A = ntohs(get_unaligned((__be16 *)ptr));
0b05b2a4 225 continue;
1da177e4 226 }
1198ad00 227 break;
1da177e4
LT
228 case BPF_LD|BPF_B|BPF_ABS:
229 k = fentry->k;
230load_b:
0b05b2a4
PM
231 ptr = load_pointer(skb, k, 1, &tmp);
232 if (ptr != NULL) {
233 A = *(u8 *)ptr;
234 continue;
1da177e4 235 }
1198ad00 236 break;
1da177e4 237 case BPF_LD|BPF_W|BPF_LEN:
3154e540 238 A = skb->len;
1da177e4
LT
239 continue;
240 case BPF_LDX|BPF_W|BPF_LEN:
3154e540 241 X = skb->len;
1da177e4
LT
242 continue;
243 case BPF_LD|BPF_W|BPF_IND:
244 k = X + fentry->k;
245 goto load_w;
246 case BPF_LD|BPF_H|BPF_IND:
247 k = X + fentry->k;
248 goto load_h;
249 case BPF_LD|BPF_B|BPF_IND:
250 k = X + fentry->k;
251 goto load_b;
252 case BPF_LDX|BPF_B|BPF_MSH:
0b05b2a4
PM
253 ptr = load_pointer(skb, fentry->k, 1, &tmp);
254 if (ptr != NULL) {
255 X = (*(u8 *)ptr & 0xf) << 2;
256 continue;
257 }
258 return 0;
1da177e4
LT
259 case BPF_LD|BPF_IMM:
260 A = fentry->k;
261 continue;
262 case BPF_LDX|BPF_IMM:
263 X = fentry->k;
264 continue;
265 case BPF_LD|BPF_MEM:
266 A = mem[fentry->k];
267 continue;
268 case BPF_LDX|BPF_MEM:
269 X = mem[fentry->k];
270 continue;
271 case BPF_MISC|BPF_TAX:
272 X = A;
273 continue;
274 case BPF_MISC|BPF_TXA:
275 A = X;
276 continue;
277 case BPF_RET|BPF_K:
4bad4dc9 278 return fentry->k;
1da177e4 279 case BPF_RET|BPF_A:
4bad4dc9 280 return A;
1da177e4
LT
281 case BPF_ST:
282 mem[fentry->k] = A;
283 continue;
284 case BPF_STX:
285 mem[fentry->k] = X;
286 continue;
287 default:
93699863 288 WARN_ON(1);
1da177e4
LT
289 return 0;
290 }
291
292 /*
293 * Handle ancillary data, which are impossible
294 * (or very difficult) to get parsing packet contents.
295 */
296 switch (k-SKF_AD_OFF) {
297 case SKF_AD_PROTOCOL:
252e3346 298 A = ntohs(skb->protocol);
1da177e4
LT
299 continue;
300 case SKF_AD_PKTTYPE:
301 A = skb->pkt_type;
302 continue;
303 case SKF_AD_IFINDEX:
304 A = skb->dev->ifindex;
305 continue;
306 default:
307 return 0;
308 }
309 }
310
311 return 0;
312}
b715631f 313EXPORT_SYMBOL(sk_run_filter);
1da177e4
LT
314
315/**
316 * sk_chk_filter - verify socket filter code
317 * @filter: filter to verify
318 * @flen: length of filter
319 *
320 * Check the user's filter code. If we let some ugly
321 * filter code slip through kaboom! The filter must contain
93699863
KK
322 * no references or jumps that are out of range, no illegal
323 * instructions, and must end with a RET instruction.
1da177e4 324 *
7b11f69f
KK
325 * All jumps are forward as they are not signed.
326 *
327 * Returns 0 if the rule set is legal or -EINVAL if not.
1da177e4
LT
328 */
329int sk_chk_filter(struct sock_filter *filter, int flen)
330{
331 struct sock_filter *ftest;
332 int pc;
333
1b93ae64 334 if (flen == 0 || flen > BPF_MAXINSNS)
1da177e4
LT
335 return -EINVAL;
336
337 /* check the filter code now */
338 for (pc = 0; pc < flen; pc++) {
1da177e4 339 ftest = &filter[pc];
1da177e4 340
93699863
KK
341 /* Only allow valid instructions */
342 switch (ftest->code) {
343 case BPF_ALU|BPF_ADD|BPF_K:
344 case BPF_ALU|BPF_ADD|BPF_X:
345 case BPF_ALU|BPF_SUB|BPF_K:
346 case BPF_ALU|BPF_SUB|BPF_X:
347 case BPF_ALU|BPF_MUL|BPF_K:
348 case BPF_ALU|BPF_MUL|BPF_X:
349 case BPF_ALU|BPF_DIV|BPF_X:
350 case BPF_ALU|BPF_AND|BPF_K:
351 case BPF_ALU|BPF_AND|BPF_X:
352 case BPF_ALU|BPF_OR|BPF_K:
353 case BPF_ALU|BPF_OR|BPF_X:
354 case BPF_ALU|BPF_LSH|BPF_K:
355 case BPF_ALU|BPF_LSH|BPF_X:
356 case BPF_ALU|BPF_RSH|BPF_K:
357 case BPF_ALU|BPF_RSH|BPF_X:
358 case BPF_ALU|BPF_NEG:
359 case BPF_LD|BPF_W|BPF_ABS:
360 case BPF_LD|BPF_H|BPF_ABS:
361 case BPF_LD|BPF_B|BPF_ABS:
362 case BPF_LD|BPF_W|BPF_LEN:
363 case BPF_LD|BPF_W|BPF_IND:
364 case BPF_LD|BPF_H|BPF_IND:
365 case BPF_LD|BPF_B|BPF_IND:
366 case BPF_LD|BPF_IMM:
367 case BPF_LDX|BPF_W|BPF_LEN:
368 case BPF_LDX|BPF_B|BPF_MSH:
369 case BPF_LDX|BPF_IMM:
370 case BPF_MISC|BPF_TAX:
371 case BPF_MISC|BPF_TXA:
372 case BPF_RET|BPF_K:
373 case BPF_RET|BPF_A:
374 break;
375
376 /* Some instructions need special checks */
fb0d366b 377
93699863
KK
378 case BPF_ALU|BPF_DIV|BPF_K:
379 /* check for division by zero */
380 if (ftest->k == 0)
1da177e4 381 return -EINVAL;
93699863
KK
382 break;
383
384 case BPF_LD|BPF_MEM:
385 case BPF_LDX|BPF_MEM:
386 case BPF_ST:
387 case BPF_STX:
388 /* check for invalid memory addresses */
389 if (ftest->k >= BPF_MEMWORDS)
390 return -EINVAL;
391 break;
392
393 case BPF_JMP|BPF_JA:
394 /*
395 * Note, the large ftest->k might cause loops.
396 * Compare this with conditional jumps below,
397 * where offsets are limited. --ANK (981016)
398 */
399 if (ftest->k >= (unsigned)(flen-pc-1))
400 return -EINVAL;
401 break;
402
403 case BPF_JMP|BPF_JEQ|BPF_K:
404 case BPF_JMP|BPF_JEQ|BPF_X:
405 case BPF_JMP|BPF_JGE|BPF_K:
406 case BPF_JMP|BPF_JGE|BPF_X:
407 case BPF_JMP|BPF_JGT|BPF_K:
408 case BPF_JMP|BPF_JGT|BPF_X:
409 case BPF_JMP|BPF_JSET|BPF_K:
410 case BPF_JMP|BPF_JSET|BPF_X:
411 /* for conditionals both must be safe */
e35bedf3 412 if (pc + ftest->jt + 1 >= flen ||
93699863
KK
413 pc + ftest->jf + 1 >= flen)
414 return -EINVAL;
415 break;
416
417 default:
418 return -EINVAL;
1da177e4
LT
419 }
420 }
421
e35bedf3 422 return (BPF_CLASS(filter[flen - 1].code) == BPF_RET) ? 0 : -EINVAL;
1da177e4 423}
b715631f 424EXPORT_SYMBOL(sk_chk_filter);
1da177e4 425
47e958ea
PE
426/**
427 * sk_filter_rcu_release: Release a socket filter by rcu_head
428 * @rcu: rcu_head that contains the sk_filter to free
429 */
430static void sk_filter_rcu_release(struct rcu_head *rcu)
431{
432 struct sk_filter *fp = container_of(rcu, struct sk_filter, rcu);
433
434 sk_filter_release(fp);
435}
436
437static void sk_filter_delayed_uncharge(struct sock *sk, struct sk_filter *fp)
438{
439 unsigned int size = sk_filter_len(fp);
440
441 atomic_sub(size, &sk->sk_omem_alloc);
442 call_rcu_bh(&fp->rcu, sk_filter_rcu_release);
443}
444
1da177e4
LT
445/**
446 * sk_attach_filter - attach a socket filter
447 * @fprog: the filter program
448 * @sk: the socket to use
449 *
450 * Attach the user's filter code. We first run some sanity checks on
451 * it to make sure it does not explode on us later. If an error
452 * occurs or there is insufficient memory for the filter a negative
453 * errno code is returned. On success the return is zero.
454 */
455int sk_attach_filter(struct sock_fprog *fprog, struct sock *sk)
456{
d3904b73 457 struct sk_filter *fp, *old_fp;
1da177e4
LT
458 unsigned int fsize = sizeof(struct sock_filter) * fprog->len;
459 int err;
460
461 /* Make sure new filter is there and in the right amounts. */
e35bedf3
KK
462 if (fprog->filter == NULL)
463 return -EINVAL;
1da177e4
LT
464
465 fp = sock_kmalloc(sk, fsize+sizeof(*fp), GFP_KERNEL);
466 if (!fp)
467 return -ENOMEM;
468 if (copy_from_user(fp->insns, fprog->filter, fsize)) {
4ec93edb 469 sock_kfree_s(sk, fp, fsize+sizeof(*fp));
1da177e4
LT
470 return -EFAULT;
471 }
472
473 atomic_set(&fp->refcnt, 1);
474 fp->len = fprog->len;
475
476 err = sk_chk_filter(fp->insns, fp->len);
d3904b73
PE
477 if (err) {
478 sk_filter_uncharge(sk, fp);
479 return err;
1da177e4
LT
480 }
481
d3904b73
PE
482 rcu_read_lock_bh();
483 old_fp = rcu_dereference(sk->sk_filter);
484 rcu_assign_pointer(sk->sk_filter, fp);
485 rcu_read_unlock_bh();
486
9b013e05
OJ
487 if (old_fp)
488 sk_filter_delayed_uncharge(sk, old_fp);
d3904b73 489 return 0;
1da177e4
LT
490}
491
55b33325
PE
492int sk_detach_filter(struct sock *sk)
493{
494 int ret = -ENOENT;
495 struct sk_filter *filter;
496
497 rcu_read_lock_bh();
498 filter = rcu_dereference(sk->sk_filter);
499 if (filter) {
500 rcu_assign_pointer(sk->sk_filter, NULL);
47e958ea 501 sk_filter_delayed_uncharge(sk, filter);
55b33325
PE
502 ret = 0;
503 }
504 rcu_read_unlock_bh();
505 return ret;
506}