1 /* Cluster IP hashmark target
2  * (C) 2003-2004 by Harald Welte <laforge@netfilter.org>
3  * based on ideas of Fabio Olive Leite <olive@unixforge.org>
4  *
5  * Development of this code funded by SuSE Linux AG, http://www.suse.com/
6  *
7  * This program is free software; you can redistribute it and/or modify
8  * it under the terms of the GNU General Public License version 2 as
9  * published by the Free Software Foundation.
10  *
11  */
12 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
13 #include <linux/module.h>
14 #include <linux/proc_fs.h>
15 #include <linux/jhash.h>
16 #include <linux/bitops.h>
17 #include <linux/skbuff.h>
18 #include <linux/slab.h>
19 #include <linux/ip.h>
20 #include <linux/tcp.h>
21 #include <linux/udp.h>
22 #include <linux/icmp.h>
23 #include <linux/if_arp.h>
24 #include <linux/seq_file.h>
25 #include <linux/netfilter_arp.h>
26 #include <linux/netfilter/x_tables.h>
27 #include <linux/netfilter_ipv4/ip_tables.h>
28 #include <linux/netfilter_ipv4/ipt_CLUSTERIP.h>
29 #include <net/netfilter/nf_conntrack.h>
30 #include <net/net_namespace.h>
31 #include <net/checksum.h>
32 #include <net/ip.h>
33 
34 #define CLUSTERIP_VERSION "0.8"
35 
36 MODULE_LICENSE("GPL");
37 MODULE_AUTHOR("Harald Welte <laforge@netfilter.org>");
38 MODULE_DESCRIPTION("Xtables: CLUSTERIP target");
39 
40 struct clusterip_config {
41 	struct list_head list;			/* list of all configs */
42 	atomic_t refcount;			/* reference count */
43 	atomic_t entries;			/* number of entries/rules
44 						 * referencing us */
45 
46 	__be32 clusterip;			/* the IP address */
47 	u_int8_t clustermac[ETH_ALEN];		/* the MAC address */
48 	struct net_device *dev;			/* device */
49 	u_int16_t num_total_nodes;		/* total number of nodes */
50 	unsigned long local_nodes;		/* node number array */
51 
52 #ifdef CONFIG_PROC_FS
53 	struct proc_dir_entry *pde;		/* proc dir entry */
54 #endif
55 	enum clusterip_hashmode hash_mode;	/* which hashing mode */
56 	u_int32_t hash_initval;			/* hash initialization */
57 	struct rcu_head rcu;
58 };
59 
/* List of all cluster IP configs. */
static LIST_HEAD(clusterip_configs);

/* clusterip_lock protects the clusterip_configs list */
static DEFINE_SPINLOCK(clusterip_lock);

#ifdef CONFIG_PROC_FS
/* Directory that holds one proc file per config; created at module init. */
static struct proc_dir_entry *clusterip_procdir;
/* Forward declaration; the operations are defined further down. */
static const struct file_operations clusterip_proc_fops;
#endif
69 
70 static inline void
clusterip_config_get(struct clusterip_config * c)71 clusterip_config_get(struct clusterip_config *c)
72 {
73 	atomic_inc(&c->refcount);
74 }
75 
76 
clusterip_config_rcu_free(struct rcu_head * head)77 static void clusterip_config_rcu_free(struct rcu_head *head)
78 {
79 	kfree(container_of(head, struct clusterip_config, rcu));
80 }
81 
82 static inline void
clusterip_config_put(struct clusterip_config * c)83 clusterip_config_put(struct clusterip_config *c)
84 {
85 	if (atomic_dec_and_test(&c->refcount))
86 		call_rcu_bh(&c->rcu, clusterip_config_rcu_free);
87 }
88 
89 /* decrease the count of entries using/referencing this config.  If last
90  * entry(rule) is removed, remove the config from lists, but don't free it
91  * yet, since proc-files could still be holding references */
92 static inline void
clusterip_config_entry_put(struct clusterip_config * c)93 clusterip_config_entry_put(struct clusterip_config *c)
94 {
95 	local_bh_disable();
96 	if (atomic_dec_and_lock(&c->entries, &clusterip_lock)) {
97 		list_del_rcu(&c->list);
98 		spin_unlock(&clusterip_lock);
99 		local_bh_enable();
100 
101 		dev_mc_del(c->dev, c->clustermac);
102 		dev_put(c->dev);
103 
104 		/* In case anyone still accesses the file, the open/close
105 		 * functions are also incrementing the refcount on their own,
106 		 * so it's safe to remove the entry even if it's in use. */
107 #ifdef CONFIG_PROC_FS
108 		remove_proc_entry(c->pde->name, c->pde->parent);
109 #endif
110 		return;
111 	}
112 	local_bh_enable();
113 }
114 
115 static struct clusterip_config *
__clusterip_config_find(__be32 clusterip)116 __clusterip_config_find(__be32 clusterip)
117 {
118 	struct clusterip_config *c;
119 
120 	list_for_each_entry_rcu(c, &clusterip_configs, list) {
121 		if (c->clusterip == clusterip)
122 			return c;
123 	}
124 
125 	return NULL;
126 }
127 
128 static inline struct clusterip_config *
clusterip_config_find_get(__be32 clusterip,int entry)129 clusterip_config_find_get(__be32 clusterip, int entry)
130 {
131 	struct clusterip_config *c;
132 
133 	rcu_read_lock_bh();
134 	c = __clusterip_config_find(clusterip);
135 	if (c) {
136 		if (unlikely(!atomic_inc_not_zero(&c->refcount)))
137 			c = NULL;
138 		else if (entry)
139 			atomic_inc(&c->entries);
140 	}
141 	rcu_read_unlock_bh();
142 
143 	return c;
144 }
145 
146 static void
clusterip_config_init_nodelist(struct clusterip_config * c,const struct ipt_clusterip_tgt_info * i)147 clusterip_config_init_nodelist(struct clusterip_config *c,
148 			       const struct ipt_clusterip_tgt_info *i)
149 {
150 	int n;
151 
152 	for (n = 0; n < i->num_local_nodes; n++)
153 		set_bit(i->local_nodes[n] - 1, &c->local_nodes);
154 }
155 
156 static struct clusterip_config *
clusterip_config_init(const struct ipt_clusterip_tgt_info * i,__be32 ip,struct net_device * dev)157 clusterip_config_init(const struct ipt_clusterip_tgt_info *i, __be32 ip,
158 			struct net_device *dev)
159 {
160 	struct clusterip_config *c;
161 
162 	c = kzalloc(sizeof(*c), GFP_ATOMIC);
163 	if (!c)
164 		return NULL;
165 
166 	c->dev = dev;
167 	c->clusterip = ip;
168 	memcpy(&c->clustermac, &i->clustermac, ETH_ALEN);
169 	c->num_total_nodes = i->num_total_nodes;
170 	clusterip_config_init_nodelist(c, i);
171 	c->hash_mode = i->hash_mode;
172 	c->hash_initval = i->hash_initval;
173 	atomic_set(&c->refcount, 1);
174 	atomic_set(&c->entries, 1);
175 
176 #ifdef CONFIG_PROC_FS
177 	{
178 		char buffer[16];
179 
180 		/* create proc dir entry */
181 		sprintf(buffer, "%pI4", &ip);
182 		c->pde = proc_create_data(buffer, S_IWUSR|S_IRUSR,
183 					  clusterip_procdir,
184 					  &clusterip_proc_fops, c);
185 		if (!c->pde) {
186 			kfree(c);
187 			return NULL;
188 		}
189 	}
190 #endif
191 
192 	spin_lock_bh(&clusterip_lock);
193 	list_add_rcu(&c->list, &clusterip_configs);
194 	spin_unlock_bh(&clusterip_lock);
195 
196 	return c;
197 }
198 
199 #ifdef CONFIG_PROC_FS
200 static int
clusterip_add_node(struct clusterip_config * c,u_int16_t nodenum)201 clusterip_add_node(struct clusterip_config *c, u_int16_t nodenum)
202 {
203 
204 	if (nodenum == 0 ||
205 	    nodenum > c->num_total_nodes)
206 		return 1;
207 
208 	/* check if we already have this number in our bitfield */
209 	if (test_and_set_bit(nodenum - 1, &c->local_nodes))
210 		return 1;
211 
212 	return 0;
213 }
214 
215 static bool
clusterip_del_node(struct clusterip_config * c,u_int16_t nodenum)216 clusterip_del_node(struct clusterip_config *c, u_int16_t nodenum)
217 {
218 	if (nodenum == 0 ||
219 	    nodenum > c->num_total_nodes)
220 		return true;
221 
222 	if (test_and_clear_bit(nodenum - 1, &c->local_nodes))
223 		return false;
224 
225 	return true;
226 }
227 #endif
228 
229 static inline u_int32_t
clusterip_hashfn(const struct sk_buff * skb,const struct clusterip_config * config)230 clusterip_hashfn(const struct sk_buff *skb,
231 		 const struct clusterip_config *config)
232 {
233 	const struct iphdr *iph = ip_hdr(skb);
234 	unsigned long hashval;
235 	u_int16_t sport = 0, dport = 0;
236 	int poff;
237 
238 	poff = proto_ports_offset(iph->protocol);
239 	if (poff >= 0) {
240 		const u_int16_t *ports;
241 		u16 _ports[2];
242 
243 		ports = skb_header_pointer(skb, iph->ihl * 4 + poff, 4, _ports);
244 		if (ports) {
245 			sport = ports[0];
246 			dport = ports[1];
247 		}
248 	} else {
249 		if (net_ratelimit())
250 			pr_info("unknown protocol %u\n", iph->protocol);
251 	}
252 
253 	switch (config->hash_mode) {
254 	case CLUSTERIP_HASHMODE_SIP:
255 		hashval = jhash_1word(ntohl(iph->saddr),
256 				      config->hash_initval);
257 		break;
258 	case CLUSTERIP_HASHMODE_SIP_SPT:
259 		hashval = jhash_2words(ntohl(iph->saddr), sport,
260 				       config->hash_initval);
261 		break;
262 	case CLUSTERIP_HASHMODE_SIP_SPT_DPT:
263 		hashval = jhash_3words(ntohl(iph->saddr), sport, dport,
264 				       config->hash_initval);
265 		break;
266 	default:
267 		/* to make gcc happy */
268 		hashval = 0;
269 		/* This cannot happen, unless the check function wasn't called
270 		 * at rule load time */
271 		pr_info("unknown mode %u\n", config->hash_mode);
272 		BUG();
273 		break;
274 	}
275 
276 	/* node numbers are 1..n, not 0..n */
277 	return (((u64)hashval * config->num_total_nodes) >> 32) + 1;
278 }
279 
280 static inline int
clusterip_responsible(const struct clusterip_config * config,u_int32_t hash)281 clusterip_responsible(const struct clusterip_config *config, u_int32_t hash)
282 {
283 	return test_bit(hash - 1, &config->local_nodes);
284 }
285 
286 /***********************************************************************
287  * IPTABLES TARGET
288  ***********************************************************************/
289 
290 static unsigned int
clusterip_tg(struct sk_buff * skb,const struct xt_action_param * par)291 clusterip_tg(struct sk_buff *skb, const struct xt_action_param *par)
292 {
293 	const struct ipt_clusterip_tgt_info *cipinfo = par->targinfo;
294 	struct nf_conn *ct;
295 	enum ip_conntrack_info ctinfo;
296 	u_int32_t hash;
297 
298 	/* don't need to clusterip_config_get() here, since refcount
299 	 * is only decremented by destroy() - and ip_tables guarantees
300 	 * that the ->target() function isn't called after ->destroy() */
301 
302 	ct = nf_ct_get(skb, &ctinfo);
303 	if (ct == NULL)
304 		return NF_DROP;
305 
306 	/* special case: ICMP error handling. conntrack distinguishes between
307 	 * error messages (RELATED) and information requests (see below) */
308 	if (ip_hdr(skb)->protocol == IPPROTO_ICMP &&
309 	    (ctinfo == IP_CT_RELATED ||
310 	     ctinfo == IP_CT_RELATED_REPLY))
311 		return XT_CONTINUE;
312 
313 	/* ip_conntrack_icmp guarantees us that we only have ICMP_ECHO,
314 	 * TIMESTAMP, INFO_REQUEST or ADDRESS type icmp packets from here
315 	 * on, which all have an ID field [relevant for hashing]. */
316 
317 	hash = clusterip_hashfn(skb, cipinfo->config);
318 
319 	switch (ctinfo) {
320 	case IP_CT_NEW:
321 		ct->mark = hash;
322 		break;
323 	case IP_CT_RELATED:
324 	case IP_CT_RELATED_REPLY:
325 		/* FIXME: we don't handle expectations at the moment.
326 		 * They can arrive on a different node than
327 		 * the master connection (e.g. FTP passive mode) */
328 	case IP_CT_ESTABLISHED:
329 	case IP_CT_ESTABLISHED_REPLY:
330 		break;
331 	default:			/* Prevent gcc warnings */
332 		break;
333 	}
334 
335 #ifdef DEBUG
336 	nf_ct_dump_tuple_ip(&ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple);
337 #endif
338 	pr_debug("hash=%u ct_hash=%u ", hash, ct->mark);
339 	if (!clusterip_responsible(cipinfo->config, hash)) {
340 		pr_debug("not responsible\n");
341 		return NF_DROP;
342 	}
343 	pr_debug("responsible\n");
344 
345 	/* despite being received via linklayer multicast, this is
346 	 * actually a unicast IP packet. TCP doesn't like PACKET_MULTICAST */
347 	skb->pkt_type = PACKET_HOST;
348 
349 	return XT_CONTINUE;
350 }
351 
clusterip_tg_check(const struct xt_tgchk_param * par)352 static int clusterip_tg_check(const struct xt_tgchk_param *par)
353 {
354 	struct ipt_clusterip_tgt_info *cipinfo = par->targinfo;
355 	const struct ipt_entry *e = par->entryinfo;
356 	struct clusterip_config *config;
357 	int ret;
358 
359 	if (cipinfo->hash_mode != CLUSTERIP_HASHMODE_SIP &&
360 	    cipinfo->hash_mode != CLUSTERIP_HASHMODE_SIP_SPT &&
361 	    cipinfo->hash_mode != CLUSTERIP_HASHMODE_SIP_SPT_DPT) {
362 		pr_info("unknown mode %u\n", cipinfo->hash_mode);
363 		return -EINVAL;
364 
365 	}
366 	if (e->ip.dmsk.s_addr != htonl(0xffffffff) ||
367 	    e->ip.dst.s_addr == 0) {
368 		pr_info("Please specify destination IP\n");
369 		return -EINVAL;
370 	}
371 
372 	/* FIXME: further sanity checks */
373 
374 	config = clusterip_config_find_get(e->ip.dst.s_addr, 1);
375 	if (!config) {
376 		if (!(cipinfo->flags & CLUSTERIP_FLAG_NEW)) {
377 			pr_info("no config found for %pI4, need 'new'\n",
378 				&e->ip.dst.s_addr);
379 			return -EINVAL;
380 		} else {
381 			struct net_device *dev;
382 
383 			if (e->ip.iniface[0] == '\0') {
384 				pr_info("Please specify an interface name\n");
385 				return -EINVAL;
386 			}
387 
388 			dev = dev_get_by_name(&init_net, e->ip.iniface);
389 			if (!dev) {
390 				pr_info("no such interface %s\n",
391 					e->ip.iniface);
392 				return -ENOENT;
393 			}
394 
395 			config = clusterip_config_init(cipinfo,
396 							e->ip.dst.s_addr, dev);
397 			if (!config) {
398 				dev_put(dev);
399 				return -ENOMEM;
400 			}
401 			dev_mc_add(config->dev, config->clustermac);
402 		}
403 	}
404 	cipinfo->config = config;
405 
406 	ret = nf_ct_l3proto_try_module_get(par->family);
407 	if (ret < 0)
408 		pr_info("cannot load conntrack support for proto=%u\n",
409 			par->family);
410 	return ret;
411 }
412 
413 /* drop reference count of cluster config when rule is deleted */
clusterip_tg_destroy(const struct xt_tgdtor_param * par)414 static void clusterip_tg_destroy(const struct xt_tgdtor_param *par)
415 {
416 	const struct ipt_clusterip_tgt_info *cipinfo = par->targinfo;
417 
418 	/* if no more entries are referencing the config, remove it
419 	 * from the list and destroy the proc entry */
420 	clusterip_config_entry_put(cipinfo->config);
421 
422 	clusterip_config_put(cipinfo->config);
423 
424 	nf_ct_l3proto_module_put(par->family);
425 }
426 
#ifdef CONFIG_COMPAT
/*
 * Compat variant of the target info; its size is registered as .compatsize
 * of the target.  The config pointer is a compat_uptr_t here.
 */
struct compat_ipt_clusterip_tgt_info {
	u_int32_t	flags;
	u_int8_t	clustermac[6];
	u_int16_t	num_total_nodes;
	u_int16_t	num_local_nodes;
	u_int16_t	local_nodes[CLUSTERIP_MAX_NODES];
	u_int32_t	hash_mode;
	u_int32_t	hash_initval;
	compat_uptr_t	config;
};
#endif /* CONFIG_COMPAT */
440 
441 static struct xt_target clusterip_tg_reg __read_mostly = {
442 	.name		= "CLUSTERIP",
443 	.family		= NFPROTO_IPV4,
444 	.target		= clusterip_tg,
445 	.checkentry	= clusterip_tg_check,
446 	.destroy	= clusterip_tg_destroy,
447 	.targetsize	= sizeof(struct ipt_clusterip_tgt_info),
448 #ifdef CONFIG_COMPAT
449 	.compatsize	= sizeof(struct compat_ipt_clusterip_tgt_info),
450 #endif /* CONFIG_COMPAT */
451 	.me		= THIS_MODULE
452 };
453 
454 
455 /***********************************************************************
456  * ARP MANGLING CODE
457  ***********************************************************************/
458 
459 /* hardcoded for 48bit ethernet and 32bit ipv4 addresses */
460 struct arp_payload {
461 	u_int8_t src_hw[ETH_ALEN];
462 	__be32 src_ip;
463 	u_int8_t dst_hw[ETH_ALEN];
464 	__be32 dst_ip;
465 } __packed;
466 
#ifdef DEBUG
/*
 * Debug helper: print the source IP, the source hardware address (as
 * colon-separated hex bytes) and the destination IP of @payload.
 */
static void arp_print(struct arp_payload *payload)
{
#define HBUFFERLEN 30
	char hbuffer[HBUFFERLEN];
	int byte = 0;
	int len = 0;

	while (len < HBUFFERLEN-3 && byte < ETH_ALEN) {
		hbuffer[len++] = hex_asc_hi(payload->src_hw[byte]);
		hbuffer[len++] = hex_asc_lo(payload->src_hw[byte]);
		hbuffer[len++] = ':';
		byte++;
	}
	/* overwrite the trailing ':' with the string terminator */
	len--;
	hbuffer[len] = '\0';

	pr_debug("src %pI4@%s, dst %pI4\n",
		 &payload->src_ip, hbuffer, &payload->dst_ip);
}
#endif
485 
486 static unsigned int
arp_mangle(unsigned int hook,struct sk_buff * skb,const struct net_device * in,const struct net_device * out,int (* okfn)(struct sk_buff *))487 arp_mangle(unsigned int hook,
488 	   struct sk_buff *skb,
489 	   const struct net_device *in,
490 	   const struct net_device *out,
491 	   int (*okfn)(struct sk_buff *))
492 {
493 	struct arphdr *arp = arp_hdr(skb);
494 	struct arp_payload *payload;
495 	struct clusterip_config *c;
496 
497 	/* we don't care about non-ethernet and non-ipv4 ARP */
498 	if (arp->ar_hrd != htons(ARPHRD_ETHER) ||
499 	    arp->ar_pro != htons(ETH_P_IP) ||
500 	    arp->ar_pln != 4 || arp->ar_hln != ETH_ALEN)
501 		return NF_ACCEPT;
502 
503 	/* we only want to mangle arp requests and replies */
504 	if (arp->ar_op != htons(ARPOP_REPLY) &&
505 	    arp->ar_op != htons(ARPOP_REQUEST))
506 		return NF_ACCEPT;
507 
508 	payload = (void *)(arp+1);
509 
510 	/* if there is no clusterip configuration for the arp reply's
511 	 * source ip, we don't want to mangle it */
512 	c = clusterip_config_find_get(payload->src_ip, 0);
513 	if (!c)
514 		return NF_ACCEPT;
515 
516 	/* normally the linux kernel always replies to arp queries of
517 	 * addresses on different interfacs.  However, in the CLUSTERIP case
518 	 * this wouldn't work, since we didn't subscribe the mcast group on
519 	 * other interfaces */
520 	if (c->dev != out) {
521 		pr_debug("not mangling arp reply on different "
522 			 "interface: cip'%s'-skb'%s'\n",
523 			 c->dev->name, out->name);
524 		clusterip_config_put(c);
525 		return NF_ACCEPT;
526 	}
527 
528 	/* mangle reply hardware address */
529 	memcpy(payload->src_hw, c->clustermac, arp->ar_hln);
530 
531 #ifdef DEBUG
532 	pr_debug("mangled arp reply: ");
533 	arp_print(payload);
534 #endif
535 
536 	clusterip_config_put(c);
537 
538 	return NF_ACCEPT;
539 }
540 
541 static struct nf_hook_ops cip_arp_ops __read_mostly = {
542 	.hook = arp_mangle,
543 	.pf = NFPROTO_ARP,
544 	.hooknum = NF_ARP_OUT,
545 	.priority = -1
546 };
547 
548 /***********************************************************************
549  * PROC DIR HANDLING
550  ***********************************************************************/
551 
552 #ifdef CONFIG_PROC_FS
553 
554 struct clusterip_seq_position {
555 	unsigned int pos;	/* position */
556 	unsigned int weight;	/* number of bits set == size */
557 	unsigned int bit;	/* current bit */
558 	unsigned long val;	/* current value */
559 };
560 
/*
 * seq_file ->start(): set up the iterator for the element at *pos.
 *
 * Takes a snapshot of the local node bitmap and returns NULL when *pos is
 * at or beyond the number of set bits, ERR_PTR(-ENOMEM) when the iterator
 * cannot be allocated, and the iterator otherwise.
 *
 * The iterator is positioned on the (*pos + 1)-th set bit of the snapshot.
 * seq_file may call ->start() with a non-zero *pos, e.g. when the output
 * is read in several small chunks; always starting at the first set bit
 * would print the first node again in that case.
 */
static void *clusterip_seq_start(struct seq_file *s, loff_t *pos)
{
	struct clusterip_config *c = s->private;
	struct clusterip_seq_position *idx;
	unsigned int weight;
	u_int32_t local_nodes;
	loff_t skip;

	/* FIXME: possible race */
	local_nodes = c->local_nodes;
	weight = hweight32(local_nodes);
	if (*pos >= weight)
		return NULL;

	idx = kmalloc(sizeof(*idx), GFP_KERNEL);
	if (!idx)
		return ERR_PTR(-ENOMEM);

	idx->pos = *pos;
	idx->weight = weight;
	idx->val = local_nodes;

	/* Consume set bits up to and including the one at *pos.  *pos is
	 * below weight here, so enough set bits are available. */
	skip = *pos;
	do {
		idx->bit = ffs(idx->val);
		clear_bit(idx->bit - 1, &idx->val);
	} while (skip-- > 0);

	return idx;
}
586 
/*
 * seq_file ->next(): advance the iterator @v to the next set bit and store
 * the new position in *pos.  Frees the iterator and returns NULL once all
 * elements have been visited.
 */
static void *clusterip_seq_next(struct seq_file *s, void *v, loff_t *pos)
{
	struct clusterip_seq_position *idx = v;

	idx->pos++;
	*pos = idx->pos;
	if (*pos < idx->weight) {
		/* pick the lowest bit that has not been visited yet */
		idx->bit = ffs(idx->val);
		clear_bit(idx->bit - 1, &idx->val);
		return idx;
	}

	kfree(v);
	return NULL;
}
600 
/*
 * seq_file ->stop(): free the iterator @v unless it is an error pointer
 * (->start() returns ERR_PTR(-ENOMEM) when its allocation fails).
 */
static void clusterip_seq_stop(struct seq_file *s, void *v)
{
	if (IS_ERR(v))
		return;

	kfree(v);
}
606 
clusterip_seq_show(struct seq_file * s,void * v)607 static int clusterip_seq_show(struct seq_file *s, void *v)
608 {
609 	struct clusterip_seq_position *idx = v;
610 
611 	if (idx->pos != 0)
612 		seq_putc(s, ',');
613 
614 	seq_printf(s, "%u", idx->bit);
615 
616 	if (idx->pos == idx->weight - 1)
617 		seq_putc(s, '\n');
618 
619 	return 0;
620 }
621 
622 static const struct seq_operations clusterip_seq_ops = {
623 	.start	= clusterip_seq_start,
624 	.next	= clusterip_seq_next,
625 	.stop	= clusterip_seq_stop,
626 	.show	= clusterip_seq_show,
627 };
628 
clusterip_proc_open(struct inode * inode,struct file * file)629 static int clusterip_proc_open(struct inode *inode, struct file *file)
630 {
631 	int ret = seq_open(file, &clusterip_seq_ops);
632 
633 	if (!ret) {
634 		struct seq_file *sf = file->private_data;
635 		struct clusterip_config *c = PDE(inode)->data;
636 
637 		sf->private = c;
638 
639 		clusterip_config_get(c);
640 	}
641 
642 	return ret;
643 }
644 
clusterip_proc_release(struct inode * inode,struct file * file)645 static int clusterip_proc_release(struct inode *inode, struct file *file)
646 {
647 	struct clusterip_config *c = PDE(inode)->data;
648 	int ret;
649 
650 	ret = seq_release(inode, file);
651 
652 	if (!ret)
653 		clusterip_config_put(c);
654 
655 	return ret;
656 }
657 
clusterip_proc_write(struct file * file,const char __user * input,size_t size,loff_t * ofs)658 static ssize_t clusterip_proc_write(struct file *file, const char __user *input,
659 				size_t size, loff_t *ofs)
660 {
661 	struct clusterip_config *c = PDE(file->f_path.dentry->d_inode)->data;
662 #define PROC_WRITELEN	10
663 	char buffer[PROC_WRITELEN+1];
664 	unsigned long nodenum;
665 
666 	if (size > PROC_WRITELEN)
667 		return -EIO;
668 	if (copy_from_user(buffer, input, size))
669 		return -EFAULT;
670 	buffer[size] = 0;
671 
672 	if (*buffer == '+') {
673 		nodenum = simple_strtoul(buffer+1, NULL, 10);
674 		if (clusterip_add_node(c, nodenum))
675 			return -ENOMEM;
676 	} else if (*buffer == '-') {
677 		nodenum = simple_strtoul(buffer+1, NULL,10);
678 		if (clusterip_del_node(c, nodenum))
679 			return -ENOENT;
680 	} else
681 		return -EIO;
682 
683 	return size;
684 }
685 
686 static const struct file_operations clusterip_proc_fops = {
687 	.owner	 = THIS_MODULE,
688 	.open	 = clusterip_proc_open,
689 	.read	 = seq_read,
690 	.write	 = clusterip_proc_write,
691 	.llseek	 = seq_lseek,
692 	.release = clusterip_proc_release,
693 };
694 
695 #endif /* CONFIG_PROC_FS */
696 
clusterip_tg_init(void)697 static int __init clusterip_tg_init(void)
698 {
699 	int ret;
700 
701 	ret = xt_register_target(&clusterip_tg_reg);
702 	if (ret < 0)
703 		return ret;
704 
705 	ret = nf_register_hook(&cip_arp_ops);
706 	if (ret < 0)
707 		goto cleanup_target;
708 
709 #ifdef CONFIG_PROC_FS
710 	clusterip_procdir = proc_mkdir("ipt_CLUSTERIP", init_net.proc_net);
711 	if (!clusterip_procdir) {
712 		pr_err("Unable to proc dir entry\n");
713 		ret = -ENOMEM;
714 		goto cleanup_hook;
715 	}
716 #endif /* CONFIG_PROC_FS */
717 
718 	pr_info("ClusterIP Version %s loaded successfully\n",
719 		CLUSTERIP_VERSION);
720 	return 0;
721 
722 #ifdef CONFIG_PROC_FS
723 cleanup_hook:
724 	nf_unregister_hook(&cip_arp_ops);
725 #endif /* CONFIG_PROC_FS */
726 cleanup_target:
727 	xt_unregister_target(&clusterip_tg_reg);
728 	return ret;
729 }
730 
clusterip_tg_exit(void)731 static void __exit clusterip_tg_exit(void)
732 {
733 	pr_info("ClusterIP Version %s unloading\n", CLUSTERIP_VERSION);
734 #ifdef CONFIG_PROC_FS
735 	remove_proc_entry(clusterip_procdir->name, clusterip_procdir->parent);
736 #endif
737 	nf_unregister_hook(&cip_arp_ops);
738 	xt_unregister_target(&clusterip_tg_reg);
739 
740 	/* Wait for completion of call_rcu_bh()'s (clusterip_config_rcu_free) */
741 	rcu_barrier_bh();
742 }
743 
744 module_init(clusterip_tg_init);
745 module_exit(clusterip_tg_exit);
746