Skip to content

Commit a6126d1

Browse files
author
Maxim Levitsky
committed
hv_netvsc: Fix panic during namespace deletion with VF
JIRA: https://issues.redhat.com/browse/RHEL-109583 commit 33caa20 Author: Haiyang Zhang <haiyangz@microsoft.com> Date: Wed Aug 6 13:21:51 2025 -0700 hv_netvsc: Fix panic during namespace deletion with VF The existing code moves the VF NIC to the new namespace when NETDEV_REGISTER is received on the netvsc NIC. During deletion of the namespace, default_device_exit_batch() >> default_device_exit_net() is called. When the netvsc NIC is moved back and registered in the default namespace, it automatically brings the VF NIC back to the default namespace. This causes the default_device_exit_net() >> for_each_netdev_safe loop to be unable to detect the list end, and to hit a NULL pointer: [ 231.449420] mana 7870:00:00.0 enP30832s1: Moved VF to namespace with: eth0 [ 231.449656] BUG: kernel NULL pointer dereference, address: 0000000000000010 [ 231.450246] #PF: supervisor read access in kernel mode [ 231.450579] #PF: error_code(0x0000) - not-present page [ 231.450916] PGD 17b8a8067 P4D 0 [ 231.451163] Oops: Oops: 0000 [#1] SMP NOPTI [ 231.451450] CPU: 82 UID: 0 PID: 1394 Comm: kworker/u768:1 Not tainted 6.16.0-rc4+ #3 VOLUNTARY [ 231.452042] Hardware name: Microsoft Corporation Virtual Machine/Virtual Machine, BIOS Hyper-V UEFI Release v4.1 11/21/2024 [ 231.452692] Workqueue: netns cleanup_net [ 231.452947] RIP: 0010:default_device_exit_batch+0x16c/0x3f0 [ 231.453326] Code: c0 0c f5 b3 e8 d5 db fe ff 48 85 c0 74 15 48 c7 c2 f8 fd ca b2 be 10 00 00 00 48 8d 7d c0 e8 7b 77 25 00 49 8b 86 28 01 00 00 <48> 8b 50 10 4c 8b 2a 4c 8d 62 f0 49 83 ed 10 4c 39 e0 0f 84 d6 00 [ 231.454294] RSP: 0018:ff75fc7c9bf9fd00 EFLAGS: 00010246 [ 231.454610] RAX: 0000000000000000 RBX: 0000000000000002 RCX: 61c8864680b583eb [ 231.455094] RDX: ff1fa9f71462d800 RSI: ff75fc7c9bf9fd38 RDI: 0000000030766564 [ 231.455686] RBP: ff75fc7c9bf9fd78 R08: 0000000000000000 R09: 0000000000000000 [ 231.456126] R10: 0000000000000001 R11: 0000000000000004 R12: ff1fa9f70088e340 [ 231.456621] R13: ff1fa9f70088e340 R14: ffffffffb3f50c20 R15: 
ff1fa9f7103e6340 [ 231.457161] FS: 0000000000000000(0000) GS:ff1faa6783a08000(0000) knlGS:0000000000000000 [ 231.457707] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 [ 231.458031] CR2: 0000000000000010 CR3: 0000000179ab2006 CR4: 0000000000b73ef0 [ 231.458434] Call Trace: [ 231.458600] <TASK> [ 231.458777] ops_undo_list+0x100/0x220 [ 231.459015] cleanup_net+0x1b8/0x300 [ 231.459285] process_one_work+0x184/0x340 To fix it, move the ns change to a workqueue, and take rtnl_lock to avoid changing the netdev list when default_device_exit_net() is using it. Cc: stable@vger.kernel.org Fixes: 4c26280 ("hv_netvsc: Fix VF namespace also in synthetic NIC NETDEV_REGISTER event") Signed-off-by: Haiyang Zhang <haiyangz@microsoft.com> Link: https://patch.msgid.link/1754511711-11188-1-git-send-email-haiyangz@linux.microsoft.com Signed-off-by: Jakub Kicinski <kuba@kernel.org> Signed-off-by: Maxim Levitsky <mlevitsk@redhat.com>
1 parent 9167dbd commit a6126d1

File tree

2 files changed

+31
-1
lines changed

2 files changed

+31
-1
lines changed

drivers/net/hyperv/hyperv_net.h

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1060,6 +1060,7 @@ struct net_device_context {
10601060
struct net_device __rcu *vf_netdev;
10611061
struct netvsc_vf_pcpu_stats __percpu *vf_stats;
10621062
struct delayed_work vf_takeover;
1063+
struct delayed_work vfns_work;
10631064

10641065
/* 1: allocated, serial number is valid. 0: not allocated */
10651066
u32 vf_alloc;
@@ -1074,6 +1075,8 @@ struct net_device_context {
10741075
struct netvsc_device_info *saved_netvsc_dev_info;
10751076
};
10761077

1078+
void netvsc_vfns_work(struct work_struct *w);
1079+
10771080
/* Azure hosts don't support non-TCP port numbers in hashing for fragmented
10781081
* packets. We can use ethtool to change UDP hash level when necessary.
10791082
*/

drivers/net/hyperv/netvsc_drv.c

Lines changed: 28 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2531,6 +2531,7 @@ static int netvsc_probe(struct hv_device *dev,
25312531
spin_lock_init(&net_device_ctx->lock);
25322532
INIT_LIST_HEAD(&net_device_ctx->reconfig_events);
25332533
INIT_DELAYED_WORK(&net_device_ctx->vf_takeover, netvsc_vf_setup);
2534+
INIT_DELAYED_WORK(&net_device_ctx->vfns_work, netvsc_vfns_work);
25342535

25352536
net_device_ctx->vf_stats
25362537
= netdev_alloc_pcpu_stats(struct netvsc_vf_pcpu_stats);
@@ -2673,6 +2674,8 @@ static void netvsc_remove(struct hv_device *dev)
26732674
cancel_delayed_work_sync(&ndev_ctx->dwork);
26742675

26752676
rtnl_lock();
2677+
cancel_delayed_work_sync(&ndev_ctx->vfns_work);
2678+
26762679
nvdev = rtnl_dereference(ndev_ctx->nvdev);
26772680
if (nvdev) {
26782681
cancel_work_sync(&nvdev->subchan_work);
@@ -2714,6 +2717,7 @@ static int netvsc_suspend(struct hv_device *dev)
27142717
cancel_delayed_work_sync(&ndev_ctx->dwork);
27152718

27162719
rtnl_lock();
2720+
cancel_delayed_work_sync(&ndev_ctx->vfns_work);
27172721

27182722
nvdev = rtnl_dereference(ndev_ctx->nvdev);
27192723
if (nvdev == NULL) {
@@ -2807,6 +2811,27 @@ static void netvsc_event_set_vf_ns(struct net_device *ndev)
28072811
}
28082812
}
28092813

2814+
/*
 * Work handler for net_device_context::vfns_work.
 *
 * Runs netvsc_event_set_vf_ns() for the owning device from workqueue
 * context, with RTNL held, instead of directly from the NETDEV_REGISTER
 * notifier. Per the commit message, RTNL is taken so the netdev list is not
 * changed while default_device_exit_net() is walking it.
 *
 * @w: the work_struct embedded in the delayed work (vfns_work.work).
 */
void netvsc_vfns_work(struct work_struct *w)
2815+
{
2816+
struct net_device_context *ndev_ctx =
2817+
container_of(w, struct net_device_context, vfns_work.work);
2818+
struct net_device *ndev;
2819+
2820+
/* Do not block on RTNL here: if it is busy, re-queue this work with a
 * delay of 1 and try again later.
 */
if (!rtnl_trylock()) {
2821+
schedule_delayed_work(&ndev_ctx->vfns_work, 1);
2822+
return;
2823+
}
2824+
2825+
ndev = hv_get_drvdata(ndev_ctx->device_ctx);
2826+
/* No net_device stored as driver data: nothing to do, just unlock. */
if (!ndev)
2827+
goto out;
2828+
2829+
netvsc_event_set_vf_ns(ndev);
2830+
2831+
out:
2832+
rtnl_unlock();
2833+
}
2834+
28102835
/*
28112836
* On Hyper-V, every VF interface is matched with a corresponding
28122837
* synthetic interface. The synthetic interface is presented first
@@ -2817,10 +2842,12 @@ static int netvsc_netdev_event(struct notifier_block *this,
28172842
unsigned long event, void *ptr)
28182843
{
28192844
struct net_device *event_dev = netdev_notifier_info_to_dev(ptr);
2845+
struct net_device_context *ndev_ctx;
28202846
int ret = 0;
28212847

28222848
if (event_dev->netdev_ops == &device_ops && event == NETDEV_REGISTER) {
2823-
netvsc_event_set_vf_ns(event_dev);
2849+
ndev_ctx = netdev_priv(event_dev);
2850+
schedule_delayed_work(&ndev_ctx->vfns_work, 0);
28242851
return NOTIFY_DONE;
28252852
}
28262853

0 commit comments

Comments
 (0)