b.a.t.m.a.n.lists.open-mesh.org archive mirror
 help / color / mirror / Atom feed
From: "Linus Lüssing" <linus.luessing@web.de>
To: The list for a Better Approach To Mobile Ad-hoc Networking
	<b.a.t.m.a.n@lists.open-mesh.org>
Subject: Re: [B.A.T.M.A.N.] slowpath warning
Date: Sun, 31 Jan 2010 20:37:29 +0100	[thread overview]
Message-ID: <20100131193729.GA20988@Linus-Debian> (raw)
In-Reply-To: <20100130165059.GV24649@lunn.ch>


[-- Warning: decoded text below may be mangled, UTF-8 assumed --]
[-- Attachment #1.1: Type: text/plain; charset=utf-8, Size: 14179 bytes --]

Hi Andrew,

Yes, ehm it does indeed cause a kernel panic on the server side
immediately :). See the attachment for the full call trace.

Cheers, Linus

On Sat, Jan 30, 2010 at 05:50:59PM +0100, Andrew Lunn wrote:
> Hi Linus
> 
> Please could you try this patch and see if it fixes the vis problem.
> It compiles cleanly with 2.6.32. It is checkpatch clean, it is sparse
> clean. However, since i've not actually tried running the code i would
> not be too surprised if it deadlocked, leaked memory, oopsed, ...
> 
>     Andrew
> 
> Staging: batman-adv: Don't have interrupts disabled while sending.
> 
> send_vis_packets() would disable interrupts before calling
> dev_queue_xmit() which resulting in a backtrace in local_bh_enable().
> Fix this by using kref on the vis_info object so that we can call
> send_vis_packets() without holding vis_hash_lock. vis_hash_lock also
> used to protect recv_list, so we now need a new lock to protect that
> instead of vis_hash_lock.
> 
> Also a few checkpatch cleanups.
> 
> Reported-by: Linus Lüssing <linus.luessing@web.de>
> Signed-off-by: Andrew Lunn <andrew@lunn.ch>
> 
> Index: vis.c
> ===================================================================
> --- vis.c	(revision 1568)
> +++ vis.c	(working copy)
> @@ -30,22 +30,26 @@
>  
>  struct hashtable_t *vis_hash;
>  DEFINE_SPINLOCK(vis_hash_lock);
> +static DEFINE_SPINLOCK(recv_list_lock);
>  static struct vis_info *my_vis_info;
>  static struct list_head send_list;	/* always locked with vis_hash_lock */
>  
>  static void start_vis_timer(void);
>  
>  /* free the info */
> -static void free_info(void *data)
> +static void free_info(struct kref *ref)
>  {
> -	struct vis_info *info = data;
> +	struct vis_info *info = container_of(ref, struct vis_info, refcount);
>  	struct recvlist_node *entry, *tmp;
> +	unsigned long flags;
>  
>  	list_del_init(&info->send_list);
> +	spin_lock_irqsave(&recv_list_lock, flags);
>  	list_for_each_entry_safe(entry, tmp, &info->recv_list, list) {
>  		list_del(&entry->list);
>  		kfree(entry);
>  	}
> +	spin_unlock_irqrestore(&recv_list_lock, flags);
>  	kfree(info);
>  }
>  
> @@ -147,32 +151,41 @@
>  static void recv_list_add(struct list_head *recv_list, char *mac)
>  {
>  	struct recvlist_node *entry;
> +	unsigned long flags;
> +
>  	entry = kmalloc(sizeof(struct recvlist_node), GFP_ATOMIC);
>  	if (!entry)
>  		return;
>  
>  	memcpy(entry->mac, mac, ETH_ALEN);
> +	spin_lock_irqsave(&recv_list_lock, flags);
>  	list_add_tail(&entry->list, recv_list);
> +	spin_unlock_irqrestore(&recv_list_lock, flags);
>  }
>  
>  /* returns 1 if this mac is in the recv_list */
>  static int recv_list_is_in(struct list_head *recv_list, char *mac)
>  {
>  	struct recvlist_node *entry;
> +	unsigned long flags;
>  
> +	spin_lock_irqsave(&recv_list_lock, flags);
>  	list_for_each_entry(entry, recv_list, list) {
> -		if (memcmp(entry->mac, mac, ETH_ALEN) == 0)
> +		if (memcmp(entry->mac, mac, ETH_ALEN) == 0) {
> +			spin_unlock_irqrestore(&recv_list_lock, flags);
>  			return 1;
> +		}
>  	}
> -
> +	spin_unlock_irqrestore(&recv_list_lock, flags);
>  	return 0;
>  }
>  
>  /* try to add the packet to the vis_hash. return NULL if invalid (e.g. too old,
> - * broken.. ).  vis hash must be locked outside.  is_new is set when the packet
> + * broken.. ).	vis hash must be locked outside.  is_new is set when the packet
>   * is newer than old entries in the hash. */
>  static struct vis_info *add_packet(struct vis_packet *vis_packet,
> -				   int vis_info_len, int *is_new)
> +				   int vis_info_len, int *is_new,
> +				   int make_broadcast)
>  {
>  	struct vis_info *info, *old_info;
>  	struct vis_info search_elem;
> @@ -199,7 +212,7 @@
>  		}
>  		/* remove old entry */
>  		hash_remove(vis_hash, old_info);
> -		free_info(old_info);
> +		kref_put(&old_info->refcount, free_info);
>  	}
>  
>  	info = kmalloc(sizeof(struct vis_info) + vis_info_len, GFP_ATOMIC);
> @@ -208,6 +221,7 @@
>  
>  	INIT_LIST_HEAD(&info->send_list);
>  	INIT_LIST_HEAD(&info->recv_list);
> +	kref_init(&info->refcount);
>  	info->first_seen = jiffies;
>  	memcpy(&info->packet, vis_packet,
>  	       sizeof(struct vis_packet) + vis_info_len);
> @@ -215,16 +229,21 @@
>  	/* initialize and add new packet. */
>  	*is_new = 1;
>  
> +	/* Make it a broadcast packet, if required */
> +	if (make_broadcast)
> +		memcpy(info->packet.target_orig, broadcastAddr, ETH_ALEN);
> +
>  	/* repair if entries is longer than packet. */
>  	if (info->packet.entries * sizeof(struct vis_info_entry) > vis_info_len)
> -		info->packet.entries = vis_info_len / sizeof(struct vis_info_entry);
> +		info->packet.entries = vis_info_len /
> +			sizeof(struct vis_info_entry);
>  
>  	recv_list_add(&info->recv_list, info->packet.sender_orig);
>  
>  	/* try to add it */
>  	if (hash_add(vis_hash, info) < 0) {
>  		/* did not work (for some reason) */
> -		free_info(info);
> +		kref_put(&old_info->refcount, free_info);
>  		info = NULL;
>  	}
>  
> @@ -235,19 +254,20 @@
>  void receive_server_sync_packet(struct vis_packet *vis_packet, int vis_info_len)
>  {
>  	struct vis_info *info;
> -	int is_new;
> +	int is_new, make_broadcast;
>  	unsigned long flags;
>  	int vis_server = atomic_read(&vis_mode);
>  
> +	make_broadcast = (vis_server == VIS_TYPE_SERVER_SYNC);
> +
>  	spin_lock_irqsave(&vis_hash_lock, flags);
> -	info = add_packet(vis_packet, vis_info_len, &is_new);
> +	info = add_packet(vis_packet, vis_info_len, &is_new, make_broadcast);
>  	if (info == NULL)
>  		goto end;
>  
>  	/* only if we are server ourselves and packet is newer than the one in
>  	 * hash.*/
>  	if (vis_server == VIS_TYPE_SERVER_SYNC && is_new) {
> -		memcpy(info->packet.target_orig, broadcastAddr, ETH_ALEN);
>  		if (list_empty(&info->send_list))
>  			list_add_tail(&info->send_list, &send_list);
>  	}
> @@ -263,24 +283,27 @@
>  	int is_new;
>  	unsigned long flags;
>  	int vis_server = atomic_read(&vis_mode);
> +	int are_target = 0;
>  
>  	/* clients shall not broadcast. */
>  	if (is_bcast(vis_packet->target_orig))
>  		return;
>  
> +	/* Are we the target for this VIS packet? */
> +	if (vis_server == VIS_TYPE_SERVER_SYNC	&&
> +	    is_my_mac(info->packet.target_orig))
> +		are_target = 1;
> +
>  	spin_lock_irqsave(&vis_hash_lock, flags);
> -	info = add_packet(vis_packet, vis_info_len, &is_new);
> +	info = add_packet(vis_packet, vis_info_len, &is_new, are_target);
>  	if (info == NULL)
>  		goto end;
>  	/* note that outdated packets will be dropped at this point. */
>  
>  
>  	/* send only if we're the target server or ... */
> -	if (vis_server == VIS_TYPE_SERVER_SYNC  &&
> -	    is_my_mac(info->packet.target_orig) &&
> -	    is_new) {
> +	if (are_target && is_new) {
>  		info->packet.vis_type = VIS_TYPE_SERVER_SYNC;	/* upgrade! */
> -		memcpy(info->packet.target_orig, broadcastAddr, ETH_ALEN);
>  		if (list_empty(&info->send_list))
>  			list_add_tail(&info->send_list, &send_list);
>  
> @@ -362,14 +385,17 @@
>  	while (hash_iterate(orig_hash, &hashit_global)) {
>  		orig_node = hashit_global.bucket->data;
>  		if (orig_node->router != NULL
> -			&& compare_orig(orig_node->router->addr, orig_node->orig)
> +			&& compare_orig(orig_node->router->addr,
> +					orig_node->orig)
>  			&& orig_node->batman_if
>  			&& (orig_node->batman_if->if_active == IF_ACTIVE)
>  		    && orig_node->router->tq_avg > 0) {
>  
>  			/* fill one entry into buffer. */
>  			entry = &entry_array[info->packet.entries];
> -			memcpy(entry->src, orig_node->batman_if->net_dev->dev_addr, ETH_ALEN);
> +			memcpy(entry->src,
> +			       orig_node->batman_if->net_dev->dev_addr,
> +			       ETH_ALEN);
>  			memcpy(entry->dest, orig_node->orig, ETH_ALEN);
>  			entry->quality = orig_node->router->tq_avg;
>  			info->packet.entries++;
> @@ -401,6 +427,8 @@
>  	return 0;
>  }
>  
> +/* free old vis packets. Must be called with this vis_hash_lock
> + * held */
>  static void purge_vis_packets(void)
>  {
>  	HASHIT(hashit);
> @@ -413,7 +441,7 @@
>  		if (time_after(jiffies,
>  			       info->first_seen + (VIS_TIMEOUT*HZ)/1000)) {
>  			hash_remove_bucket(vis_hash, &hashit);
> -			free_info(info);
> +			kref_put(&info->refcount, free_info);
>  		}
>  	}
>  }
> @@ -423,6 +451,8 @@
>  	HASHIT(hashit);
>  	struct orig_node *orig_node;
>  	unsigned long flags;
> +	struct batman_if *batman_if;
> +	uint8_t dstaddr[ETH_ALEN];
>  
>  	spin_lock_irqsave(&orig_hash_lock, flags);
>  
> @@ -431,46 +461,57 @@
>  		orig_node = hashit.bucket->data;
>  
>  		/* if it's a vis server and reachable, send it. */
> -		if (orig_node &&
> -		    (orig_node->flags & VIS_SERVER) &&
> -		    orig_node->batman_if &&
> -		    orig_node->router) {
> +		if ((!orig_node) || (!orig_node->batman_if) ||
> +		    (!orig_node->router))
> +			continue;
> +		if (!(orig_node->flags & VIS_SERVER))
> +			continue;
> +		/* don't send it if we already received the packet from
> +		 * this node. */
> +		if (recv_list_is_in(&info->recv_list, orig_node->orig))
> +			continue;
>  
> -			/* don't send it if we already received the packet from
> -			 * this node. */
> -			if (recv_list_is_in(&info->recv_list, orig_node->orig))
> -				continue;
> +		memcpy(info->packet.target_orig, orig_node->orig, ETH_ALEN);
> +		batman_if = orig_node->batman_if;
> +		memcpy(dstaddr, orig_node->router->addr, ETH_ALEN);
> +		spin_unlock_irqrestore(&orig_hash_lock, flags);
>  
> -			memcpy(info->packet.target_orig,
> -			       orig_node->orig, ETH_ALEN);
> +		send_raw_packet((unsigned char *)&info->packet,
> +				packet_length, batman_if, dstaddr);
>  
> -			send_raw_packet((unsigned char *) &info->packet,
> -					packet_length,
> -					orig_node->batman_if,
> -					orig_node->router->addr);
> -		}
> +		spin_lock_irqsave(&orig_hash_lock, flags);
> +
>  	}
> +	spin_unlock_irqrestore(&orig_hash_lock, flags);
>  	memcpy(info->packet.target_orig, broadcastAddr, ETH_ALEN);
> -	spin_unlock_irqrestore(&orig_hash_lock, flags);
>  }
>  
>  static void unicast_vis_packet(struct vis_info *info, int packet_length)
>  {
>  	struct orig_node *orig_node;
>  	unsigned long flags;
> +	struct batman_if *batman_if;
> +	uint8_t dstaddr[ETH_ALEN];
>  
>  	spin_lock_irqsave(&orig_hash_lock, flags);
>  	orig_node = ((struct orig_node *)
>  		     hash_find(orig_hash, info->packet.target_orig));
>  
> -	if ((orig_node != NULL) &&
> -	    (orig_node->batman_if != NULL) &&
> -	    (orig_node->router != NULL)) {
> -		send_raw_packet((unsigned char *) &info->packet, packet_length,
> -				orig_node->batman_if,
> -				orig_node->router->addr);
> -	}
> +	if ((!orig_node) || (!orig_node->batman_if) || (!orig_node->router))
> +		goto out;
> +
> +	/* don't lock while sending the packets ... we therefore
> +	 * copy the required data before sending */
> +	batman_if = orig_node->batman_if;
> +	memcpy(dstaddr, orig_node->router->addr, ETH_ALEN);
>  	spin_unlock_irqrestore(&orig_hash_lock, flags);
> +
> +	send_raw_packet((unsigned char *)&info->packet,
> +			packet_length, batman_if, dstaddr);
> +	return;
> +
> +out:
> +	spin_unlock_irqrestore(&orig_hash_lock, flags);
>  }
>  
>  /* only send one vis packet. called from send_vis_packets() */
> @@ -503,6 +544,7 @@
>  	unsigned long flags;
>  
>  	spin_lock_irqsave(&vis_hash_lock, flags);
> +
>  	purge_vis_packets();
>  
>  	if (generate_vis_packet() == 0)
> @@ -511,7 +553,11 @@
>  
>  	list_for_each_entry_safe(info, temp, &send_list, send_list) {
>  		list_del_init(&info->send_list);
> +		kref_get(&info->refcount);
> +		spin_unlock_irqrestore(&vis_hash_lock, flags);
>  		send_vis_packet(info);
> +		spin_lock_irqsave(&vis_hash_lock, flags);
> +		kref_put(&info->refcount, free_info);
>  	}
>  	spin_unlock_irqrestore(&vis_hash_lock, flags);
>  	start_vis_timer();
> @@ -544,6 +590,7 @@
>  	my_vis_info->first_seen = jiffies - atomic_read(&vis_interval);
>  	INIT_LIST_HEAD(&my_vis_info->recv_list);
>  	INIT_LIST_HEAD(&my_vis_info->send_list);
> +	kref_init(&my_vis_info->refcount);
>  	my_vis_info->packet.version = COMPAT_VERSION;
>  	my_vis_info->packet.packet_type = BAT_VIS;
>  	my_vis_info->packet.ttl = TTL;
> @@ -557,9 +604,9 @@
>  
>  	if (hash_add(vis_hash, my_vis_info) < 0) {
>  		printk(KERN_ERR
> -			  "batman-adv:Can't add own vis packet into hash\n");
> -		free_info(my_vis_info);	/* not in hash, need to remove it
> -					 * manually. */
> +		       "batman-adv:Can't add own vis packet into hash\n");
> +		/* not in hash, need to remove it manually. */
> +		kref_put(&my_vis_info->refcount, free_info);
>  		goto err;
>  	}
>  
> @@ -573,6 +620,13 @@
>  	return 0;
>  }
>  
> +/* Decrease the reference count on a hash item info */
> +static void free_info_ref(void *data)
> +{
> +	struct vis_info *info = data;
> +	kref_put(&info->refcount, free_info);
> +}
> +
>  /* shutdown vis-server */
>  void vis_quit(void)
>  {
> @@ -584,7 +638,7 @@
>  
>  	spin_lock_irqsave(&vis_hash_lock, flags);
>  	/* properly remove, kill timers ... */
> -	hash_delete(vis_hash, free_info);
> +	hash_delete(vis_hash, free_info_ref);
>  	vis_hash = NULL;
>  	my_vis_info = NULL;
>  	spin_unlock_irqrestore(&vis_hash_lock, flags);
> @@ -594,5 +648,5 @@
>  static void start_vis_timer(void)
>  {
>  	queue_delayed_work(bat_event_workqueue, &vis_timer_wq,
> -			   (atomic_read(&vis_interval) * HZ ) / 1000);
> +			   (atomic_read(&vis_interval) * HZ) / 1000);
>  }
> Index: vis.h
> ===================================================================
> --- vis.h	(revision 1568)
> +++ vis.h	(working copy)
> @@ -29,6 +29,7 @@
>  			    /* list of server-neighbors we received a vis-packet
>  			     * from.  we should not reply to them. */
>  	struct list_head send_list;
> +	struct kref refcount;
>  	/* this packet might be part of the vis send queue. */
>  	struct vis_packet packet;
>  	/* vis_info may follow here*/
> 

[-- Attachment #1.2: 2010-01-31-2030-vis-patch-kernelpanic.log --]
[-- Type: text/plain, Size: 2279 bytes --]

root@OpenWrt:/# batctl vs
[ ] client mode (server disabled)
[x] server mode (server enabled)
root@OpenWrt:/# CPU 0 Unable to handle kernel paging request at virtual address 00000024, epc == 8014d58c, ra == 80410154
Oops[#1]:
Cpu 0
$ 0   : 00000000 10009c00 8070e140 00000006
$ 4   : 8070e140 00000024 00000006 00000001
$ 8   : 00000024 00000000 00000000 00000000
$12   : 00000000 7fd89ed8 00000413 00430000
$16   : 80fef500 8041cdc0 00000024 8070e000
$20   : 0000004c 80d63000 00004305 80c05040
$24   : 00000002 8061c874
$28   : 80290000 80291ca8 00000000 80410154
Hi    : 000000f5
Lo    : 15a32180
epc   : 8014d58c memcmp+0xc/0x38
    Tainted: P
ra    : 80410154 is_my_mac+0x3c/0x78 [batman_adv]
Status: 10009c03    KERNEL EXL IE
Cause : 10800008
BadVA : 00000024
PrId  : 00019064 (MIPS 4KEc)
Modules linked in: ath_ahb ath_hal(P) batman_adv ip6t_REJECT ip6t_LOG ip6t_rt ip6t_hbh ip6t_mh ip6t_ipv6header ip6t_frag ip6t_eui64 ip6t_ah ip6table_raw ip6_queue ip6table_mangle ip6table_filter ip6_tables ebt_redirect ebt_mark ebt_vlan ebt_stp ebt_pkttype ebt_mark_m ebt_limit ebt_among ebt_802_3 ebtable_nat ebtable_filter ebtable_broute ebtables xt_quota xt_pkttype xt_physdev ipt_REJECT xt_TCPMSS ipt_LOG xt_multiport xt_mac xt_limit iptable_mangle iptable_filter ip_tables xt_tcpudp x_tables tun ipv6
Process swapper (pid: 0, threadinfo=80290000, task=80292170, tls=00000000)
Stack : 80225540 00000000 80a11c00 8022b330 00000000 00000000 80c05060 80417264
        00000000 8022a728 80000000 806c0052 c02e4000 c02e7000 80f49a40 80c05060
        80c05052 8070e000 80d63000 804124e4 80225540 00000000 80a11c00 00000000
        80c14e40 80fef500 80f49a40 80417bf4 8070e2c0 80c05052 8070e000 80d63000
        80d63000 80f49a40 8070e2c0 806215c4 00000000 80292170 80291db0 000332b6
        ...
Call Trace:
[<8014d58c>] memcmp+0xc/0x38
[<80410154>] is_my_mac+0x3c/0x78 [batman_adv]
[<80417264>] receive_client_update_packet+0x4c/0x154 [batman_adv]
[<804124e4>] recv_vis_packet+0xa4/0xbc [batman_adv]
[<80417bf4>] batman_skb_recv+0x168/0x1dc [batman_adv]
[<806215c4>] ieee80211_saveath+0xb24/0xb80 [ath_ahb]


Code: 08053567  00003821  90430000 <91020000> 00621023  14400006  24c6ffff  00871021  00a74021
Kernel panic - not syncing: Fatal exception in interrupt
Rebooting in 3 seconds..+

[-- Attachment #2: Digital signature --]
[-- Type: application/pgp-signature, Size: 836 bytes --]

  reply	other threads:[~2010-01-31 19:37 UTC|newest]

Thread overview: 37+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2010-01-23 17:46 [B.A.T.M.A.N.] bat_events: page allocation failure (batman-adv maint) Linus Lüssing
2010-01-23 18:10 ` Andrew Lunn
2010-01-23 23:30   ` Linus Lüssing
2010-01-24 20:42   ` Linus Lüssing
2010-01-24 21:00     ` Andrew Lunn
2010-01-25  6:46       ` Andrew Lunn
2010-01-25  6:47     ` Andrew Lunn
2010-01-25  8:21       ` Marek Lindner
2010-01-26  1:48       ` Linus Lüssing
2010-01-24  4:24 ` Linus Lüssing
2010-01-26  6:13 ` [B.A.T.M.A.N.] slowpath warning Linus Lüssing
2010-01-26  7:16   ` Marek Lindner
2010-01-27  0:10     ` Linus Lüssing
2010-01-28  0:09       ` Marek Lindner
2010-01-28  6:29         ` Andrew Lunn
2010-01-29  8:25   ` Andrew Lunn
2010-01-29  8:59     ` Marek Lindner
2010-01-30 16:50       ` Andrew Lunn
2010-01-31 19:37         ` Linus Lüssing [this message]
2010-01-31 20:56           ` Andrew Lunn
2010-02-11  9:46         ` Andrew Lunn
2010-02-11 10:01           ` Andrew Lunn
2010-02-19 17:19             ` Linus Lüssing
2010-02-20 18:04               ` Andrew Lunn
2010-02-21 13:10                 ` Linus Lüssing
2010-02-28 16:34             ` Simon Wunderlich
2010-03-01  5:59               ` Andrew Lunn
2010-03-01 16:57                 ` Simon Wunderlich
2010-03-02  6:43                   ` Andrew Lunn
2010-03-02 21:13                     ` Simon Wunderlich
2010-03-02 21:26                       ` elektra
2010-03-02 21:44                       ` Linus Lüssing
2010-03-04  0:26                         ` Linus Lüssing
2010-03-04  8:57                           ` Andrew Lunn
2010-03-04  9:19                             ` Marek Lindner
2010-03-04  9:49                               ` Andrew Lunn
2010-03-04 10:00                                 ` Marek Lindner

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=20100131193729.GA20988@Linus-Debian \
    --to=linus.luessing@web.de \
    --cc=b.a.t.m.a.n@lists.open-mesh.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).