upgrade to linux 2.6.10-1.12_FC2
[linux-2.6.git] / net / ipv4 / netfilter / ipt_REJECT.c
1 /*
2  * This is a module which is used for rejecting packets.
3  * Added support for customized reject packets (Jozsef Kadlecsik).
4  * Added support for ICMP type-3-code-13 (Maciej Soltysiak). [RFC 1812]
5  */
6
7 /* (C) 1999-2001 Paul `Rusty' Russell
8  * (C) 2002-2004 Netfilter Core Team <coreteam@netfilter.org>
9  *
10  * This program is free software; you can redistribute it and/or modify
11  * it under the terms of the GNU General Public License version 2 as
12  * published by the Free Software Foundation.
13  */
14
15 #include <linux/config.h>
16 #include <linux/module.h>
17 #include <linux/skbuff.h>
18 #include <linux/ip.h>
19 #include <linux/udp.h>
20 #include <linux/icmp.h>
21 #include <net/icmp.h>
22 #include <net/ip.h>
23 #include <net/tcp.h>
24 #include <net/route.h>
25 #include <net/dst.h>
26 #include <linux/netfilter_ipv4/ip_tables.h>
27 #include <linux/netfilter_ipv4/ipt_REJECT.h>
28 #ifdef CONFIG_BRIDGE_NETFILTER
29 #include <linux/netfilter_bridge.h>
30 #endif
31
32 MODULE_LICENSE("GPL");
33 MODULE_AUTHOR("Netfilter Core Team <coreteam@netfilter.org>");
34 MODULE_DESCRIPTION("iptables REJECT target module");
35
36 #if 0
37 #define DEBUGP printk
38 #else
39 #define DEBUGP(format, args...)
40 #endif
41
42 static inline struct rtable *route_reverse(struct sk_buff *skb, 
43                                            struct tcphdr *tcph, int hook)
44 {
45         struct iphdr *iph = skb->nh.iph;
46         struct dst_entry *odst;
47         struct flowi fl = {};
48         struct rtable *rt;
49
50         /* We don't require ip forwarding to be enabled to be able to
51          * send a RST reply for bridged traffic. */
52         if (hook != NF_IP_FORWARD
53 #ifdef CONFIG_BRIDGE_NETFILTER
54             || (skb->nf_bridge && skb->nf_bridge->mask & BRNF_BRIDGED)
55 #endif
56            ) {
57                 fl.nl_u.ip4_u.daddr = iph->saddr;
58                 if (hook == NF_IP_LOCAL_IN)
59                         fl.nl_u.ip4_u.saddr = iph->daddr;
60                 fl.nl_u.ip4_u.tos = RT_TOS(iph->tos);
61
62                 if (ip_route_output_key(&rt, &fl) != 0)
63                         return NULL;
64         } else {
65                 /* non-local src, find valid iif to satisfy
66                  * rp-filter when calling ip_route_input. */
67                 fl.nl_u.ip4_u.daddr = iph->daddr;
68                 if (ip_route_output_key(&rt, &fl) != 0)
69                         return NULL;
70
71                 odst = skb->dst;
72                 if (ip_route_input(skb, iph->saddr, iph->daddr,
73                                    RT_TOS(iph->tos), rt->u.dst.dev) != 0) {
74                         dst_release(&rt->u.dst);
75                         return NULL;
76                 }
77                 dst_release(&rt->u.dst);
78                 rt = (struct rtable *)skb->dst;
79                 skb->dst = odst;
80
81                 fl.nl_u.ip4_u.daddr = iph->saddr;
82                 fl.nl_u.ip4_u.saddr = iph->daddr;
83                 fl.nl_u.ip4_u.tos = RT_TOS(iph->tos);
84         }
85
86         if (rt->u.dst.error) {
87                 dst_release(&rt->u.dst);
88                 return NULL;
89         }
90
91         fl.proto = IPPROTO_TCP;
92         fl.fl_ip_sport = tcph->dest;
93         fl.fl_ip_dport = tcph->source;
94
95         if (xfrm_lookup((struct dst_entry **)&rt, &fl, NULL, 0)) {
96                 dst_release(&rt->u.dst);
97                 rt = NULL;
98         }
99
100         return rt;
101 }
102
103 /* Send RST reply */
104 static void send_reset(struct sk_buff *oldskb, int hook)
105 {
106         struct sk_buff *nskb;
107         struct tcphdr _otcph, *oth, *tcph;
108         struct rtable *rt;
109         u_int16_t tmp_port;
110         u_int32_t tmp_addr;
111         int needs_ack;
112         int hh_len;
113
114         /* IP header checks: fragment. */
115         if (oldskb->nh.iph->frag_off & htons(IP_OFFSET))
116                 return;
117
118         oth = skb_header_pointer(oldskb, oldskb->nh.iph->ihl * 4,
119                                  sizeof(_otcph), &_otcph);
120         if (oth == NULL)
121                 return;
122
123         /* No RST for RST. */
124         if (oth->rst)
125                 return;
126
127         /* FIXME: Check checksum --RR */
128         if ((rt = route_reverse(oldskb, oth, hook)) == NULL)
129                 return;
130
131         hh_len = LL_RESERVED_SPACE(rt->u.dst.dev);
132
133         /* We need a linear, writeable skb.  We also need to expand
134            headroom in case hh_len of incoming interface < hh_len of
135            outgoing interface */
136         nskb = skb_copy_expand(oldskb, hh_len, skb_tailroom(oldskb),
137                                GFP_ATOMIC);
138         if (!nskb) {
139                 dst_release(&rt->u.dst);
140                 return;
141         }
142
143         dst_release(nskb->dst);
144         nskb->dst = &rt->u.dst;
145
146         /* This packet will not be the same as the other: clear nf fields */
147         nf_reset(nskb);
148         nskb->nfcache = 0;
149         nskb->nfmark = 0;
150 #ifdef CONFIG_BRIDGE_NETFILTER
151         nf_bridge_put(nskb->nf_bridge);
152         nskb->nf_bridge = NULL;
153 #endif
154
155         tcph = (struct tcphdr *)((u_int32_t*)nskb->nh.iph + nskb->nh.iph->ihl);
156
157         /* Swap source and dest */
158         tmp_addr = nskb->nh.iph->saddr;
159         nskb->nh.iph->saddr = nskb->nh.iph->daddr;
160         nskb->nh.iph->daddr = tmp_addr;
161         tmp_port = tcph->source;
162         tcph->source = tcph->dest;
163         tcph->dest = tmp_port;
164
165         /* Truncate to length (no data) */
166         tcph->doff = sizeof(struct tcphdr)/4;
167         skb_trim(nskb, nskb->nh.iph->ihl*4 + sizeof(struct tcphdr));
168         nskb->nh.iph->tot_len = htons(nskb->len);
169
170         if (tcph->ack) {
171                 needs_ack = 0;
172                 tcph->seq = oth->ack_seq;
173                 tcph->ack_seq = 0;
174         } else {
175                 needs_ack = 1;
176                 tcph->ack_seq = htonl(ntohl(oth->seq) + oth->syn + oth->fin
177                                       + oldskb->len - oldskb->nh.iph->ihl*4
178                                       - (oth->doff<<2));
179                 tcph->seq = 0;
180         }
181
182         /* Reset flags */
183         ((u_int8_t *)tcph)[13] = 0;
184         tcph->rst = 1;
185         tcph->ack = needs_ack;
186
187         tcph->window = 0;
188         tcph->urg_ptr = 0;
189
190         /* Adjust TCP checksum */
191         tcph->check = 0;
192         tcph->check = tcp_v4_check(tcph, sizeof(struct tcphdr),
193                                    nskb->nh.iph->saddr,
194                                    nskb->nh.iph->daddr,
195                                    csum_partial((char *)tcph,
196                                                 sizeof(struct tcphdr), 0));
197
198         /* Adjust IP TTL, DF */
199         nskb->nh.iph->ttl = MAXTTL;
200         /* Set DF, id = 0 */
201         nskb->nh.iph->frag_off = htons(IP_DF);
202         nskb->nh.iph->id = 0;
203
204         /* Adjust IP checksum */
205         nskb->nh.iph->check = 0;
206         nskb->nh.iph->check = ip_fast_csum((unsigned char *)nskb->nh.iph, 
207                                            nskb->nh.iph->ihl);
208
209         /* "Never happens" */
210         if (nskb->len > dst_pmtu(nskb->dst))
211                 goto free_nskb;
212
213         nf_ct_attach(nskb, oldskb);
214
215         NF_HOOK(PF_INET, NF_IP_LOCAL_OUT, nskb, NULL, nskb->dst->dev,
216                 ip_finish_output);
217         return;
218
219  free_nskb:
220         kfree_skb(nskb);
221 }
222
223 static void send_unreach(struct sk_buff *skb_in, int code)
224 {
225         struct iphdr *iph;
226         struct udphdr *udph;
227         struct icmphdr *icmph;
228         struct sk_buff *nskb;
229         u32 saddr;
230         u8 tos;
231         int hh_len, length;
232         struct rtable *rt = (struct rtable*)skb_in->dst;
233         unsigned char *data;
234
235         if (!rt)
236                 return;
237
238         /* FIXME: Use sysctl number. --RR */
239         if (!xrlim_allow(&rt->u.dst, 1*HZ))
240                 return;
241
242         iph = skb_in->nh.iph;
243
244         /* No replies to physical multicast/broadcast */
245         if (skb_in->pkt_type!=PACKET_HOST)
246                 return;
247
248         /* Now check at the protocol level */
249         if (rt->rt_flags&(RTCF_BROADCAST|RTCF_MULTICAST))
250                 return;
251
252         /* Only reply to fragment 0. */
253         if (iph->frag_off&htons(IP_OFFSET))
254                 return;
255
256         /* Ensure we have at least 8 bytes of proto header. */
257         if (skb_in->len < skb_in->nh.iph->ihl*4 + 8)
258                 return;
259
260         /* if UDP checksum is set, verify it's correct */
261         if (iph->protocol == IPPROTO_UDP
262             && skb_in->tail-(u8*)iph >= sizeof(struct udphdr)) {
263                 int datalen = skb_in->len - (iph->ihl<<2);
264                 udph = (struct udphdr *)((char *)iph + (iph->ihl<<2));
265                 if (udph->check
266                     && csum_tcpudp_magic(iph->saddr, iph->daddr,
267                                          datalen, IPPROTO_UDP,
268                                          csum_partial((char *)udph, datalen,
269                                                       0)) != 0)
270                         return;
271         }
272
273         /* If we send an ICMP error to an ICMP error a mess would result.. */
274         if (iph->protocol == IPPROTO_ICMP
275             && skb_in->tail-(u8*)iph >= sizeof(struct icmphdr)) {
276                 icmph = (struct icmphdr *)((char *)iph + (iph->ihl<<2));
277
278                 if (skb_copy_bits(skb_in, skb_in->nh.iph->ihl*4,
279                                   icmph, sizeof(*icmph)) < 0)
280                         return;
281
282                 /* Between echo-reply (0) and timestamp (13),
283                    everything except echo-request (8) is an error.
284                    Also, anything greater than NR_ICMP_TYPES is
285                    unknown, and hence should be treated as an error... */
286                 if ((icmph->type < ICMP_TIMESTAMP
287                      && icmph->type != ICMP_ECHOREPLY
288                      && icmph->type != ICMP_ECHO)
289                     || icmph->type > NR_ICMP_TYPES)
290                         return;
291         }
292
293         saddr = iph->daddr;
294         if (!(rt->rt_flags & RTCF_LOCAL))
295                 saddr = 0;
296
297         tos = (iph->tos & IPTOS_TOS_MASK) | IPTOS_PREC_INTERNETCONTROL;
298
299         {
300                 struct flowi fl = {
301                         .nl_u = {
302                                 .ip4_u = {
303                                         .daddr = skb_in->nh.iph->saddr,
304                                         .saddr = saddr,
305                                         .tos = RT_TOS(tos)
306                                 }
307                         },
308                         .proto = IPPROTO_ICMP,
309                         .uli_u = {
310                                 .icmpt = {
311                                         .type = ICMP_DEST_UNREACH,
312                                         .code = code
313                                 }
314                         }
315                 };
316
317                 if (ip_route_output_key(&rt, &fl))
318                         return;
319         }
320         /* RFC says return as much as we can without exceeding 576 bytes. */
321         length = skb_in->len + sizeof(struct iphdr) + sizeof(struct icmphdr);
322
323         if (length > dst_pmtu(&rt->u.dst))
324                 length = dst_pmtu(&rt->u.dst);
325         if (length > 576)
326                 length = 576;
327
328         hh_len = LL_RESERVED_SPACE(rt->u.dst.dev);
329
330         nskb = alloc_skb(hh_len + length, GFP_ATOMIC);
331         if (!nskb) {
332                 ip_rt_put(rt);
333                 return;
334         }
335
336         nskb->priority = 0;
337         nskb->dst = &rt->u.dst;
338         skb_reserve(nskb, hh_len);
339
340         /* Set up IP header */
341         iph = nskb->nh.iph
342                 = (struct iphdr *)skb_put(nskb, sizeof(struct iphdr));
343         iph->version=4;
344         iph->ihl=5;
345         iph->tos=tos;
346         iph->tot_len = htons(length);
347
348         /* PMTU discovery never applies to ICMP packets. */
349         iph->frag_off = 0;
350
351         iph->ttl = MAXTTL;
352         ip_select_ident(iph, &rt->u.dst, NULL);
353         iph->protocol=IPPROTO_ICMP;
354         iph->saddr=rt->rt_src;
355         iph->daddr=rt->rt_dst;
356         iph->check=0;
357         iph->check = ip_fast_csum((unsigned char *)iph, iph->ihl);
358
359         /* Set up ICMP header. */
360         icmph = nskb->h.icmph
361                 = (struct icmphdr *)skb_put(nskb, sizeof(struct icmphdr));
362         icmph->type = ICMP_DEST_UNREACH;
363         icmph->code = code;     
364         icmph->un.gateway = 0;
365         icmph->checksum = 0;
366         
367         /* Copy as much of original packet as will fit */
368         data = skb_put(nskb,
369                        length - sizeof(struct iphdr) - sizeof(struct icmphdr));
370
371         skb_copy_bits(skb_in, 0, data,
372                       length - sizeof(struct iphdr) - sizeof(struct icmphdr));
373
374         icmph->checksum = ip_compute_csum((unsigned char *)icmph,
375                                           length - sizeof(struct iphdr));
376
377         nf_ct_attach(nskb, skb_in);
378
379         NF_HOOK(PF_INET, NF_IP_LOCAL_OUT, nskb, NULL, nskb->dst->dev,
380                 ip_finish_output);
381 }       
382
383 static unsigned int reject(struct sk_buff **pskb,
384                            const struct net_device *in,
385                            const struct net_device *out,
386                            unsigned int hooknum,
387                            const void *targinfo,
388                            void *userinfo)
389 {
390         const struct ipt_reject_info *reject = targinfo;
391
392         /* Our naive response construction doesn't deal with IP
393            options, and probably shouldn't try. */
394         if ((*pskb)->nh.iph->ihl<<2 != sizeof(struct iphdr))
395                 return NF_DROP;
396
397         /* WARNING: This code causes reentry within iptables.
398            This means that the iptables jump stack is now crap.  We
399            must return an absolute verdict. --RR */
400         switch (reject->with) {
401         case IPT_ICMP_NET_UNREACHABLE:
402                 send_unreach(*pskb, ICMP_NET_UNREACH);
403                 break;
404         case IPT_ICMP_HOST_UNREACHABLE:
405                 send_unreach(*pskb, ICMP_HOST_UNREACH);
406                 break;
407         case IPT_ICMP_PROT_UNREACHABLE:
408                 send_unreach(*pskb, ICMP_PROT_UNREACH);
409                 break;
410         case IPT_ICMP_PORT_UNREACHABLE:
411                 send_unreach(*pskb, ICMP_PORT_UNREACH);
412                 break;
413         case IPT_ICMP_NET_PROHIBITED:
414                 send_unreach(*pskb, ICMP_NET_ANO);
415                 break;
416         case IPT_ICMP_HOST_PROHIBITED:
417                 send_unreach(*pskb, ICMP_HOST_ANO);
418                 break;
419         case IPT_ICMP_ADMIN_PROHIBITED:
420                 send_unreach(*pskb, ICMP_PKT_FILTERED);
421                 break;
422         case IPT_TCP_RESET:
423                 send_reset(*pskb, hooknum);
424         case IPT_ICMP_ECHOREPLY:
425                 /* Doesn't happen. */
426                 break;
427         }
428
429         return NF_DROP;
430 }
431
432 static int check(const char *tablename,
433                  const struct ipt_entry *e,
434                  void *targinfo,
435                  unsigned int targinfosize,
436                  unsigned int hook_mask)
437 {
438         const struct ipt_reject_info *rejinfo = targinfo;
439
440         if (targinfosize != IPT_ALIGN(sizeof(struct ipt_reject_info))) {
441                 DEBUGP("REJECT: targinfosize %u != 0\n", targinfosize);
442                 return 0;
443         }
444
445         /* Only allow these for packet filtering. */
446         if (strcmp(tablename, "filter") != 0) {
447                 DEBUGP("REJECT: bad table `%s'.\n", tablename);
448                 return 0;
449         }
450         if ((hook_mask & ~((1 << NF_IP_LOCAL_IN)
451                            | (1 << NF_IP_FORWARD)
452                            | (1 << NF_IP_LOCAL_OUT))) != 0) {
453                 DEBUGP("REJECT: bad hook mask %X\n", hook_mask);
454                 return 0;
455         }
456
457         if (rejinfo->with == IPT_ICMP_ECHOREPLY) {
458                 printk("REJECT: ECHOREPLY no longer supported.\n");
459                 return 0;
460         } else if (rejinfo->with == IPT_TCP_RESET) {
461                 /* Must specify that it's a TCP packet */
462                 if (e->ip.proto != IPPROTO_TCP
463                     || (e->ip.invflags & IPT_INV_PROTO)) {
464                         DEBUGP("REJECT: TCP_RESET invalid for non-tcp\n");
465                         return 0;
466                 }
467         }
468
469         return 1;
470 }
471
472 static struct ipt_target ipt_reject_reg = {
473         .name           = "REJECT",
474         .target         = reject,
475         .checkentry     = check,
476         .me             = THIS_MODULE,
477 };
478
479 static int __init init(void)
480 {
481         return ipt_register_target(&ipt_reject_reg);
482 }
483
484 static void __exit fini(void)
485 {
486         ipt_unregister_target(&ipt_reject_reg);
487 }
488
489 module_init(init);
490 module_exit(fini);