diff mbox series

[net,v2] net: neigh: don't call kfree_skb() under spin_lock_irqsave()

Message ID 20220819044724.961356-1-yangyingliang@huawei.com (mailing list archive)
State Superseded
Delegated to: Netdev Maintainers
Headers show
Series [net,v2] net: neigh: don't call kfree_skb() under spin_lock_irqsave() | expand

Checks

Context Check Description
netdev/tree_selection success Clearly marked for net
netdev/fixes_present success Fixes tag present in non-next series
netdev/subject_prefix success Link
netdev/cover_letter success Single patches do not need cover letters
netdev/patch_count success Link
netdev/header_inline success No static functions without inline keyword in header files
netdev/build_32bit success Errors and warnings before: 344 this patch: 344
netdev/cc_maintainers warning 2 maintainers not CCed: daniel@iogearbox.net pabeni@redhat.com
netdev/build_clang success Errors and warnings before: 5 this patch: 5
netdev/module_param success Was 0 now: 0
netdev/verify_signedoff success Signed-off-by tag matches author and committer
netdev/check_selftest success No net selftest shell script
netdev/verify_fixes success Fixes tag looks correct
netdev/build_allmodconfig_warn success Errors and warnings before: 344 this patch: 344
netdev/checkpatch success total: 0 errors, 0 warnings, 0 checks, 34 lines checked
netdev/kdoc success Errors and warnings before: 0 this patch: 0
netdev/source_inline success Was 0 now: 0

Commit Message

Yang Yingliang Aug. 19, 2022, 4:47 a.m. UTC
It is not allowed to call kfree_skb() from hardware interrupt
context or with interrupts disabled. So add all skbs to a
temporary list, then free them all at once after
spin_unlock_irqrestore().

Fixes: 66ba215cb513 ("neigh: fix possible DoS due to net iface start/stop loop")
Signed-off-by: Yang Yingliang <yangyingliang@huawei.com>
---
 net/core/neighbour.c | 10 +++++++++-
 1 file changed, 9 insertions(+), 1 deletion(-)

Comments

Denis V. Lunev Aug. 19, 2022, 7:56 a.m. UTC | #1
On 19.08.2022 06:47, 'Yang Yingliang' via den wrote:
> It is not allowed to call kfree_skb() from hardware interrupt
> context or with interrupts being disabled. So add all skb to
> a tmp list, then free them after spin_unlock_irqrestore() at
> once.
>
> Fixes: 66ba215cb513 ("neigh: fix possible DoS due to net iface start/stop loop")
> Signed-off-by: Yang Yingliang <yangyingliang@huawei.com>
> ---
>   net/core/neighbour.c | 10 +++++++++-
>   1 file changed, 9 insertions(+), 1 deletion(-)
>
> diff --git a/net/core/neighbour.c b/net/core/neighbour.c
> index 5b669eb80270..d21c7de1ff1a 100644
> --- a/net/core/neighbour.c
> +++ b/net/core/neighbour.c
> @@ -309,14 +309,17 @@ static int neigh_del_timer(struct neighbour *n)
>   
>   static void pneigh_queue_purge(struct sk_buff_head *list, struct net *net)
>   {
> +	struct sk_buff_head tmp;
>   	unsigned long flags;
>   	struct sk_buff *skb;
>   
> +	skb_queue_head_init(&tmp);
>   	spin_lock_irqsave(&list->lock, flags);
>   	skb = skb_peek(list);
>   	while (skb != NULL) {
>   		struct sk_buff *skb_next = skb_peek_next(skb, list);
>   		struct net_device *dev = skb->dev;
> +
>   		if (net == NULL || net_eq(dev_net(dev), net)) {
>   			struct in_device *in_dev;
>   
> @@ -328,11 +331,16 @@ static void pneigh_queue_purge(struct sk_buff_head *list, struct net *net)
>   			__skb_unlink(skb, list);
>   
>   			dev_put(dev);
> -			kfree_skb(skb);
> +			dev_kfree_skb_irq(skb);
>   		}
>   		skb = skb_next;
>   	}
>   	spin_unlock_irqrestore(&list->lock, flags);
> +
> +	while ((skb = __skb_dequeue(&tmp))) {
> +		dev_put(skb->dev);
> +		kfree_skb(skb);
> +	}
>   }
>   
>   static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev,
Reviewed-by: Denis V. Lunev <den@openvz.org>
Nikolay Aleksandrov Aug. 19, 2022, 12:15 p.m. UTC | #2
On 19/08/2022 07:47, Yang Yingliang wrote:
> It is not allowed to call kfree_skb() from hardware interrupt
> context or with interrupts being disabled. So add all skb to
> a tmp list, then free them after spin_unlock_irqrestore() at
> once.
> 
> Fixes: 66ba215cb513 ("neigh: fix possible DoS due to net iface start/stop loop")
> Signed-off-by: Yang Yingliang <yangyingliang@huawei.com>
> ---
>  net/core/neighbour.c | 10 +++++++++-
>  1 file changed, 9 insertions(+), 1 deletion(-)
> 
> diff --git a/net/core/neighbour.c b/net/core/neighbour.c
> index 5b669eb80270..d21c7de1ff1a 100644
> --- a/net/core/neighbour.c
> +++ b/net/core/neighbour.c
> @@ -309,14 +309,17 @@ static int neigh_del_timer(struct neighbour *n)
>  
>  static void pneigh_queue_purge(struct sk_buff_head *list, struct net *net)
>  {
> +	struct sk_buff_head tmp;
>  	unsigned long flags;
>  	struct sk_buff *skb;
>  
> +	skb_queue_head_init(&tmp);
>  	spin_lock_irqsave(&list->lock, flags);
>  	skb = skb_peek(list);
>  	while (skb != NULL) {
>  		struct sk_buff *skb_next = skb_peek_next(skb, list);
>  		struct net_device *dev = skb->dev;
> +
>  		if (net == NULL || net_eq(dev_net(dev), net)) {
>  			struct in_device *in_dev;
>  
> @@ -328,11 +331,16 @@ static void pneigh_queue_purge(struct sk_buff_head *list, struct net *net)
>  			__skb_unlink(skb, list);
>  
>  			dev_put(dev);
> -			kfree_skb(skb);
> +			dev_kfree_skb_irq(skb);

This is still calling dev_kfree_skb_irq() instead of attaching the skb to tmp; in fact,
tmp seems to be unused, so the loop below does nothing.

>  		}
>  		skb = skb_next;
>  	}
>  	spin_unlock_irqrestore(&list->lock, flags);
> +
> +	while ((skb = __skb_dequeue(&tmp))) {
> +		dev_put(skb->dev);

Also note that there's already a dev_put() above

> +		kfree_skb(skb);
> +	}
>  }
>  
>  static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev,
Yang Yingliang Aug. 22, 2022, 1:39 a.m. UTC | #3
Hi,

On 2022/8/19 20:15, Nikolay Aleksandrov wrote:
> On 19/08/2022 07:47, Yang Yingliang wrote:
>> It is not allowed to call kfree_skb() from hardware interrupt
>> context or with interrupts being disabled. So add all skb to
>> a tmp list, then free them after spin_unlock_irqrestore() at
>> once.
>>
>> Fixes: 66ba215cb513 ("neigh: fix possible DoS due to net iface start/stop loop")
>> Signed-off-by: Yang Yingliang <yangyingliang@huawei.com>
>> ---
>>   net/core/neighbour.c | 10 +++++++++-
>>   1 file changed, 9 insertions(+), 1 deletion(-)
>>
>> diff --git a/net/core/neighbour.c b/net/core/neighbour.c
>> index 5b669eb80270..d21c7de1ff1a 100644
>> --- a/net/core/neighbour.c
>> +++ b/net/core/neighbour.c
>> @@ -309,14 +309,17 @@ static int neigh_del_timer(struct neighbour *n)
>>   
>>   static void pneigh_queue_purge(struct sk_buff_head *list, struct net *net)
>>   {
>> +	struct sk_buff_head tmp;
>>   	unsigned long flags;
>>   	struct sk_buff *skb;
>>   
>> +	skb_queue_head_init(&tmp);
>>   	spin_lock_irqsave(&list->lock, flags);
>>   	skb = skb_peek(list);
>>   	while (skb != NULL) {
>>   		struct sk_buff *skb_next = skb_peek_next(skb, list);
>>   		struct net_device *dev = skb->dev;
>> +
>>   		if (net == NULL || net_eq(dev_net(dev), net)) {
>>   			struct in_device *in_dev;
>>   
>> @@ -328,11 +331,16 @@ static void pneigh_queue_purge(struct sk_buff_head *list, struct net *net)
>>   			__skb_unlink(skb, list);
>>   
>>   			dev_put(dev);
>> -			kfree_skb(skb);
>> +			dev_kfree_skb_irq(skb);
> this is still doing dev_kfree_skb_irq() instead of attaching the skb to tmp, in fact
> tmp seems unused so the loop below does nothing
>
>>   		}
>>   		skb = skb_next;
>>   	}
>>   	spin_unlock_irqrestore(&list->lock, flags);
>> +
>> +	while ((skb = __skb_dequeue(&tmp))) {
>> +		dev_put(skb->dev);
> Also note that there's already a dev_put() above
I made a mistake and sent the wrong patch; please ignore this patch.

Thanks,
Yang
>
>> +		kfree_skb(skb);
>> +	}
>>   }
>>   
>>   static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev,
>
> .
diff mbox series

Patch

diff --git a/net/core/neighbour.c b/net/core/neighbour.c
index 5b669eb80270..d21c7de1ff1a 100644
--- a/net/core/neighbour.c
+++ b/net/core/neighbour.c
@@ -309,14 +309,17 @@  static int neigh_del_timer(struct neighbour *n)
 
 static void pneigh_queue_purge(struct sk_buff_head *list, struct net *net)
 {
+	struct sk_buff_head tmp;
 	unsigned long flags;
 	struct sk_buff *skb;
 
+	skb_queue_head_init(&tmp);
 	spin_lock_irqsave(&list->lock, flags);
 	skb = skb_peek(list);
 	while (skb != NULL) {
 		struct sk_buff *skb_next = skb_peek_next(skb, list);
 		struct net_device *dev = skb->dev;
+
 		if (net == NULL || net_eq(dev_net(dev), net)) {
 			struct in_device *in_dev;
 
@@ -328,11 +331,16 @@  static void pneigh_queue_purge(struct sk_buff_head *list, struct net *net)
 			__skb_unlink(skb, list);
 
 			dev_put(dev);
-			kfree_skb(skb);
+			dev_kfree_skb_irq(skb);
 		}
 		skb = skb_next;
 	}
 	spin_unlock_irqrestore(&list->lock, flags);
+
+	while ((skb = __skb_dequeue(&tmp))) {
+		dev_put(skb->dev);
+		kfree_skb(skb);
+	}
 }
 
 static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev,