| 
									
										
											  
											
												rcu: Introduce hlist_nulls variant of hlist
hlist uses NULL value to finish a chain.
hlist_nulls variant uses the low order bit set to 1 to signal an end-of-list marker.
This allows storing many different end markers, so that some RCU lockless
algos (used in TCP/UDP stack for example) can save some memory barriers in
fast paths.
Two new files are added :
include/linux/list_nulls.h
  - mimics hlist part of include/linux/list.h, derived to hlist_nulls variant
include/linux/rculist_nulls.h
  - mimics hlist part of include/linux/rculist.h, derived to hlist_nulls variant
   Only four helpers are declared for the moment :
     hlist_nulls_del_init_rcu(), hlist_nulls_del_rcu(),
     hlist_nulls_add_head_rcu() and hlist_nulls_for_each_entry_rcu()
prefetches() were removed, since the end of a list is no longer a NULL value.
prefetches() could trigger useless (and possibly dangerous) memory transactions.
Example of use (extracted from __udp4_lib_lookup())
	struct sock *sk, *result;
        struct hlist_nulls_node *node;
        unsigned short hnum = ntohs(dport);
        unsigned int hash = udp_hashfn(net, hnum);
        struct udp_hslot *hslot = &udptable->hash[hash];
        int score, badness;
        rcu_read_lock();
begin:
        result = NULL;
        badness = -1;
        sk_nulls_for_each_rcu(sk, node, &hslot->head) {
                score = compute_score(sk, net, saddr, hnum, sport,
                                      daddr, dport, dif);
                if (score > badness) {
                        result = sk;
                        badness = score;
                }
        }
        /*
         * if the nulls value we got at the end of this lookup is
         * not the expected one, we must restart lookup.
         * We probably met an item that was moved to another chain.
         */
        if (get_nulls_value(node) != hash)
                goto begin;
        if (result) {
                if (unlikely(!atomic_inc_not_zero(&result->sk_refcnt)))
                        result = NULL;
                else if (unlikely(compute_score(result, net, saddr, hnum, sport,
                                  daddr, dport, dif) < badness)) {
                        sock_put(result);
                        goto begin;
                }
        }
        rcu_read_unlock();
        return result;
Signed-off-by: Eric Dumazet <dada1@cosmosbay.com>
Acked-by: Peter Zijlstra <a.p.zijlstra@chello.nl>
Signed-off-by: David S. Miller <davem@davemloft.net>
											
										 
											2008-11-16 19:37:55 -08:00
										 |  |  | #ifndef _LINUX_LIST_NULLS_H
 | 
					
						
							|  |  |  | #define _LINUX_LIST_NULLS_H
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /*
 | 
					
						
							|  |  |  |  * Special version of lists, where end of list is not a NULL pointer, | 
					
						
							|  |  |  |  * but a 'nulls' marker, which can have many different values. | 
					
						
							|  |  |  |  * (up to 2^31 different values guaranteed on all platforms) | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * In the standard hlist, termination of a list is the NULL pointer. | 
					
						
							|  |  |  |  * In this special 'nulls' variant, we use the fact that objects stored in | 
					
						
							|  |  |  |  * a list are aligned on a word (4 or 8 bytes alignment). | 
					
						
							|  |  |  |  * We therefore use the least significant bit of 'ptr' : | 
					
						
							|  |  |  |  * Set to 1 : This is a 'nulls' end-of-list marker (ptr >> 1) | 
					
						
							|  |  |  |  * Set to 0 : This is a pointer to some object (ptr) | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | struct hlist_nulls_head { | 
					
						
							|  |  |  | 	struct hlist_nulls_node *first; | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | struct hlist_nulls_node { | 
					
						
							|  |  |  | 	struct hlist_nulls_node *next, **pprev; | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | #define INIT_HLIST_NULLS_HEAD(ptr, nulls) \
 | 
					
						
							|  |  |  | 	((ptr)->first = (struct hlist_nulls_node *) (1UL | (((long)nulls) << 1))) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #define hlist_nulls_entry(ptr, type, member) container_of(ptr,type,member)
 | 
					
						
							|  |  |  | /**
 | 
					
						
							|  |  |  |  * ptr_is_a_nulls - Test if a ptr is a nulls | 
					
						
							|  |  |  |  * @ptr: ptr to be tested | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | static inline int is_a_nulls(const struct hlist_nulls_node *ptr) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return ((unsigned long)ptr & 1); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /**
 | 
					
						
							|  |  |  |  * get_nulls_value - Get the 'nulls' value of the end of chain | 
					
						
							|  |  |  |  * @ptr: end of chain | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Should be called only if is_a_nulls(ptr); | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | static inline unsigned long get_nulls_value(const struct hlist_nulls_node *ptr) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return ((unsigned long)ptr) >> 1; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static inline int hlist_nulls_unhashed(const struct hlist_nulls_node *h) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return !h->pprev; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static inline int hlist_nulls_empty(const struct hlist_nulls_head *h) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return is_a_nulls(h->first); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2009-06-13 12:28:57 +02:00
										 |  |  | static inline void hlist_nulls_add_head(struct hlist_nulls_node *n, | 
					
						
							|  |  |  | 					struct hlist_nulls_head *h) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	struct hlist_nulls_node *first = h->first; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	n->next = first; | 
					
						
							|  |  |  | 	n->pprev = &h->first; | 
					
						
							|  |  |  | 	h->first = n; | 
					
						
							|  |  |  | 	if (!is_a_nulls(first)) | 
					
						
							|  |  |  | 		first->pprev = &n->next; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
											  
											
												rcu: Introduce hlist_nulls variant of hlist
hlist uses NULL value to finish a chain.
hlist_nulls variant uses the low order bit set to 1 to signal an end-of-list marker.
This allows storing many different end markers, so that some RCU lockless
algos (used in TCP/UDP stack for example) can save some memory barriers in
fast paths.
Two new files are added :
include/linux/list_nulls.h
  - mimics hlist part of include/linux/list.h, derived to hlist_nulls variant
include/linux/rculist_nulls.h
  - mimics hlist part of include/linux/rculist.h, derived to hlist_nulls variant
   Only four helpers are declared for the moment :
     hlist_nulls_del_init_rcu(), hlist_nulls_del_rcu(),
     hlist_nulls_add_head_rcu() and hlist_nulls_for_each_entry_rcu()
prefetches() were removed, since the end of a list is no longer a NULL value.
prefetches() could trigger useless (and possibly dangerous) memory transactions.
Example of use (extracted from __udp4_lib_lookup())
	struct sock *sk, *result;
        struct hlist_nulls_node *node;
        unsigned short hnum = ntohs(dport);
        unsigned int hash = udp_hashfn(net, hnum);
        struct udp_hslot *hslot = &udptable->hash[hash];
        int score, badness;
        rcu_read_lock();
begin:
        result = NULL;
        badness = -1;
        sk_nulls_for_each_rcu(sk, node, &hslot->head) {
                score = compute_score(sk, net, saddr, hnum, sport,
                                      daddr, dport, dif);
                if (score > badness) {
                        result = sk;
                        badness = score;
                }
        }
        /*
         * if the nulls value we got at the end of this lookup is
         * not the expected one, we must restart lookup.
         * We probably met an item that was moved to another chain.
         */
        if (get_nulls_value(node) != hash)
                goto begin;
        if (result) {
                if (unlikely(!atomic_inc_not_zero(&result->sk_refcnt)))
                        result = NULL;
                else if (unlikely(compute_score(result, net, saddr, hnum, sport,
                                  daddr, dport, dif) < badness)) {
                        sock_put(result);
                        goto begin;
                }
        }
        rcu_read_unlock();
        return result;
Signed-off-by: Eric Dumazet <dada1@cosmosbay.com>
Acked-by: Peter Zijlstra <a.p.zijlstra@chello.nl>
Signed-off-by: David S. Miller <davem@davemloft.net>
											
										 
											2008-11-16 19:37:55 -08:00
										 |  |  | static inline void __hlist_nulls_del(struct hlist_nulls_node *n) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	struct hlist_nulls_node *next = n->next; | 
					
						
							|  |  |  | 	struct hlist_nulls_node **pprev = n->pprev; | 
					
						
							|  |  |  | 	*pprev = next; | 
					
						
							|  |  |  | 	if (!is_a_nulls(next)) | 
					
						
							|  |  |  | 		next->pprev = pprev; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2009-06-13 12:28:57 +02:00
										 |  |  | static inline void hlist_nulls_del(struct hlist_nulls_node *n) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	__hlist_nulls_del(n); | 
					
						
							|  |  |  | 	n->pprev = LIST_POISON2; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
											  
											
												rcu: Introduce hlist_nulls variant of hlist
hlist uses NULL value to finish a chain.
hlist_nulls variant uses the low order bit set to 1 to signal an end-of-list marker.
This allows storing many different end markers, so that some RCU lockless
algos (used in TCP/UDP stack for example) can save some memory barriers in
fast paths.
Two new files are added :
include/linux/list_nulls.h
  - mimics hlist part of include/linux/list.h, derived to hlist_nulls variant
include/linux/rculist_nulls.h
  - mimics hlist part of include/linux/rculist.h, derived to hlist_nulls variant
   Only four helpers are declared for the moment :
     hlist_nulls_del_init_rcu(), hlist_nulls_del_rcu(),
     hlist_nulls_add_head_rcu() and hlist_nulls_for_each_entry_rcu()
prefetches() were removed, since the end of a list is no longer a NULL value.
prefetches() could trigger useless (and possibly dangerous) memory transactions.
Example of use (extracted from __udp4_lib_lookup())
	struct sock *sk, *result;
        struct hlist_nulls_node *node;
        unsigned short hnum = ntohs(dport);
        unsigned int hash = udp_hashfn(net, hnum);
        struct udp_hslot *hslot = &udptable->hash[hash];
        int score, badness;
        rcu_read_lock();
begin:
        result = NULL;
        badness = -1;
        sk_nulls_for_each_rcu(sk, node, &hslot->head) {
                score = compute_score(sk, net, saddr, hnum, sport,
                                      daddr, dport, dif);
                if (score > badness) {
                        result = sk;
                        badness = score;
                }
        }
        /*
         * if the nulls value we got at the end of this lookup is
         * not the expected one, we must restart lookup.
         * We probably met an item that was moved to another chain.
         */
        if (get_nulls_value(node) != hash)
                goto begin;
        if (result) {
                if (unlikely(!atomic_inc_not_zero(&result->sk_refcnt)))
                        result = NULL;
                else if (unlikely(compute_score(result, net, saddr, hnum, sport,
                                  daddr, dport, dif) < badness)) {
                        sock_put(result);
                        goto begin;
                }
        }
        rcu_read_unlock();
        return result;
Signed-off-by: Eric Dumazet <dada1@cosmosbay.com>
Acked-by: Peter Zijlstra <a.p.zijlstra@chello.nl>
Signed-off-by: David S. Miller <davem@davemloft.net>
											
										 
											2008-11-16 19:37:55 -08:00
										 |  |  | /**
 | 
					
						
							|  |  |  |  * hlist_nulls_for_each_entry	- iterate over list of given type | 
					
						
							|  |  |  |  * @tpos:	the type * to use as a loop cursor. | 
					
						
							|  |  |  |  * @pos:	the &struct hlist_node to use as a loop cursor. | 
					
						
							|  |  |  |  * @head:	the head for your list. | 
					
						
							|  |  |  |  * @member:	the name of the hlist_node within the struct. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | #define hlist_nulls_for_each_entry(tpos, pos, head, member)		       \
 | 
					
						
							|  |  |  | 	for (pos = (head)->first;					       \ | 
					
						
							|  |  |  | 	     (!is_a_nulls(pos)) &&					       \ | 
					
						
							|  |  |  | 		({ tpos = hlist_nulls_entry(pos, typeof(*tpos), member); 1;}); \ | 
					
						
							|  |  |  | 	     pos = pos->next) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /**
 | 
					
						
							|  |  |  |  * hlist_nulls_for_each_entry_from - iterate over a hlist continuing from current point | 
					
						
							|  |  |  |  * @tpos:	the type * to use as a loop cursor. | 
					
						
							|  |  |  |  * @pos:	the &struct hlist_node to use as a loop cursor. | 
					
						
							|  |  |  |  * @member:	the name of the hlist_node within the struct. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | #define hlist_nulls_for_each_entry_from(tpos, pos, member)	\
 | 
					
						
							|  |  |  | 	for (; (!is_a_nulls(pos)) && 				\ | 
					
						
							|  |  |  | 		({ tpos = hlist_nulls_entry(pos, typeof(*tpos), member); 1;}); \ | 
					
						
							|  |  |  | 	     pos = pos->next) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #endif
 |