Skip to content

Commit

Permalink
xen-netfront: Fix race between device setup and open
Browse files Browse the repository at this point in the history
[ Upstream commit f599c64fdf7d9c108e8717fb04bc41c680120da4 ]

When a netfront device is set up it registers a netdev fairly early on,
before it has set up the queues and is actually usable. A userspace tool
like NetworkManager will immediately try to open it and access its state
as soon as it appears. The bug can be reproduced by hotplugging VIFs
until the VM runs out of grant refs. The driver then registers the netdev but
fails to set up any queues (since there are no more grant refs). In the
meantime, NetworkManager opens the device and the kernel crashes trying
to access the queues (of which there are none).

Fix this in two ways:
* For initial setup, register the netdev much later, after the queues
are set up. This avoids the race entirely.
* During a suspend/resume cycle, the frontend reconnects to the backend
and the queues are recreated. It is possible (though highly unlikely) to
race with something opening the device and accessing the queues after
they have been destroyed but before they have been recreated. Extend the
region covered by the rtnl semaphore to protect against this race. There
is a possibility that we fail to recreate the queues so check for this
in the open function.

Signed-off-by: Ross Lagerwall <ross.lagerwall@citrix.com>
Reviewed-by: Boris Ostrovsky <boris.ostrovsky@oracle.com>
Signed-off-by: Juergen Gross <jgross@suse.com>
Signed-off-by: Sasha Levin <alexander.levin@microsoft.com>
Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Signed-off-by: Lee Jones <lee.jones@linaro.org>
Change-Id: I0a08e90ed47bbe56b46ffa21144e50934adc557d
  • Loading branch information
rosslagerwall authored and Lee Jones committed Feb 9, 2021
1 parent 98be39c commit 85766bf
Showing 1 changed file with 23 additions and 23 deletions.
46 changes: 23 additions & 23 deletions drivers/net/xen-netfront.c
Original file line number Diff line number Diff line change
Expand Up @@ -376,6 +376,9 @@ static int xennet_open(struct net_device *dev)
unsigned int i = 0;
struct netfront_queue *queue = NULL;

if (!np->queues)
return -ENODEV;

for (i = 0; i < num_queues; ++i) {
queue = &np->queues[i];
napi_enable(&queue->napi);
Expand Down Expand Up @@ -1393,25 +1396,14 @@ static int netfront_probe(struct xenbus_device *dev,
info = netdev_priv(netdev);
dev_set_drvdata(&dev->dev, info);

err = register_netdev(info->netdev);
if (err) {
pr_warn("%s: register_netdev err=%d\n", __func__, err);
goto fail;
}

err = xennet_sysfs_addif(info->netdev);
if (err) {
unregister_netdev(info->netdev);
pr_warn("%s: add sysfs failed err=%d\n", __func__, err);
goto fail;
return err;
}

return 0;

fail:
free_netdev(netdev);
dev_set_drvdata(&dev->dev, NULL);
return err;
}

static void xennet_end_access(int ref, void *page)
Expand Down Expand Up @@ -1785,8 +1777,6 @@ static void xennet_destroy_queues(struct netfront_info *info)
{
unsigned int i;

rtnl_lock();

for (i = 0; i < info->netdev->real_num_tx_queues; i++) {
struct netfront_queue *queue = &info->queues[i];

Expand All @@ -1795,8 +1785,6 @@ static void xennet_destroy_queues(struct netfront_info *info)
netif_napi_del(&queue->napi);
}

rtnl_unlock();

kfree(info->queues);
info->queues = NULL;
}
Expand All @@ -1812,8 +1800,6 @@ static int xennet_create_queues(struct netfront_info *info,
if (!info->queues)
return -ENOMEM;

rtnl_lock();

for (i = 0; i < *num_queues; i++) {
struct netfront_queue *queue = &info->queues[i];

Expand All @@ -1822,7 +1808,7 @@ static int xennet_create_queues(struct netfront_info *info,

ret = xennet_init_queue(queue);
if (ret < 0) {
dev_warn(&info->netdev->dev,
dev_warn(&info->xbdev->dev,
"only created %d queues\n", i);
*num_queues = i;
break;
Expand All @@ -1836,10 +1822,8 @@ static int xennet_create_queues(struct netfront_info *info,

netif_set_real_num_tx_queues(info->netdev, *num_queues);

rtnl_unlock();

if (*num_queues == 0) {
dev_err(&info->netdev->dev, "no queues\n");
dev_err(&info->xbdev->dev, "no queues\n");
return -EINVAL;
}
return 0;
Expand Down Expand Up @@ -1881,6 +1865,7 @@ static int talk_to_netback(struct xenbus_device *dev,
goto out;
}

rtnl_lock();
if (info->queues)
xennet_destroy_queues(info);

Expand All @@ -1891,6 +1876,7 @@ static int talk_to_netback(struct xenbus_device *dev,
info->queues = NULL;
goto out;
}
rtnl_unlock();

/* Create shared ring, alloc event channel -- for each queue */
for (i = 0; i < num_queues; ++i) {
Expand Down Expand Up @@ -1984,11 +1970,13 @@ static int talk_to_netback(struct xenbus_device *dev,
xenbus_transaction_end(xbt, 1);
destroy_ring:
xennet_disconnect_backend(info);
rtnl_lock();
xennet_destroy_queues(info);
rtnl_lock();
netif_set_real_num_tx_queues(info->netdev, 0);
rtnl_unlock();
out:
rtnl_unlock();
device_unregister(&dev->dev);
return err;
}
Expand Down Expand Up @@ -2024,6 +2012,15 @@ static int xennet_connect(struct net_device *dev)
netdev_update_features(dev);
rtnl_unlock();

if (dev->reg_state == NETREG_UNINITIALIZED) {
err = register_netdev(dev);
if (err) {
pr_warn("%s: register_netdev err=%d\n", __func__, err);
device_unregister(&np->xbdev->dev);
return err;
}
}

/*
* All public and private state should now be sane. Get
* ready to start sending and receiving packets and give the driver
Expand Down Expand Up @@ -2329,16 +2326,19 @@ static int xennet_remove(struct xenbus_device *dev)

xennet_sysfs_delif(info->netdev);

unregister_netdev(info->netdev);
if (info->netdev->reg_state == NETREG_REGISTERED)
unregister_netdev(info->netdev);

for (i = 0; i < num_queues; ++i) {
queue = &info->queues[i];
del_timer_sync(&queue->rx_refill_timer);
}

if (num_queues) {
rtnl_lock();
kfree(info->queues);
info->queues = NULL;
rtnl_unlock();
}

free_percpu(info->stats);
Expand Down

0 comments on commit 85766bf

Please sign in to comment.