vfio: Split migration ops from main device ops
authorYishai Hadas <yishaih@nvidia.com>
Tue, 28 Jun 2022 15:59:10 +0000 (18:59 +0300)
committerAlex Williamson <alex.williamson@redhat.com>
Thu, 30 Jun 2022 16:47:22 +0000 (10:47 -0600)
vfio core checks whether the driver sets some migration op (e.g.
set_state/get_state) and accordingly calls its op.

However, currently mlx5 driver sets the above ops without regards to its
migration caps.

This might lead to unexpected usage/Oops if user space may call to the
above ops even if the driver doesn't support migration. As for example,
the migration state_mutex is not initialized in that case.

The cleanest way to manage that seems to split the migration ops from
the main device ops, this will let the driver setting them separately
from the main ops when it's applicable.

As part of that, validate ops construction on registration and include a
check for VFIO_MIGRATION_STOP_COPY since the uAPI claims it must be set
in migration_flags.

HISI driver was changed as well to match this scheme.

This scheme may enable down the road to come with some extra group of
ops (e.g. DMA log) that can be set without regards to the other options
based on driver caps.

Fixes: 6fadb021266d ("vfio/mlx5: Implement vfio_pci driver for mlx5 devices")
Reviewed-by: Kevin Tian <kevin.tian@intel.com>
Signed-off-by: Yishai Hadas <yishaih@nvidia.com>
Link: https://lore.kernel.org/r/20220628155910.171454-3-yishaih@nvidia.com
Signed-off-by: Alex Williamson <alex.williamson@redhat.com>
drivers/vfio/pci/hisilicon/hisi_acc_vfio_pci.c
drivers/vfio/pci/mlx5/cmd.c
drivers/vfio/pci/mlx5/cmd.h
drivers/vfio/pci/mlx5/main.c
drivers/vfio/pci/vfio_pci_core.c
drivers/vfio/vfio.c
include/linux/vfio.h

index 4def43f5f7b619d9b5dbd8d0a3495b95782ca10c..ea762e28c1cc6ece32f624740d6cf8b74013651e 100644 (file)
@@ -1185,7 +1185,7 @@ static int hisi_acc_vfio_pci_open_device(struct vfio_device *core_vdev)
        if (ret)
                return ret;
 
-       if (core_vdev->ops->migration_set_state) {
+       if (core_vdev->mig_ops) {
                ret = hisi_acc_vf_qm_init(hisi_acc_vdev);
                if (ret) {
                        vfio_pci_core_disable(vdev);
@@ -1208,6 +1208,11 @@ static void hisi_acc_vfio_pci_close_device(struct vfio_device *core_vdev)
        vfio_pci_core_close_device(core_vdev);
 }
 
+static const struct vfio_migration_ops hisi_acc_vfio_pci_migrn_state_ops = {
+       .migration_set_state = hisi_acc_vfio_pci_set_device_state,
+       .migration_get_state = hisi_acc_vfio_pci_get_device_state,
+};
+
 static const struct vfio_device_ops hisi_acc_vfio_pci_migrn_ops = {
        .name = "hisi-acc-vfio-pci-migration",
        .open_device = hisi_acc_vfio_pci_open_device,
@@ -1219,8 +1224,6 @@ static const struct vfio_device_ops hisi_acc_vfio_pci_migrn_ops = {
        .mmap = hisi_acc_vfio_pci_mmap,
        .request = vfio_pci_core_request,
        .match = vfio_pci_core_match,
-       .migration_set_state = hisi_acc_vfio_pci_set_device_state,
-       .migration_get_state = hisi_acc_vfio_pci_get_device_state,
 };
 
 static const struct vfio_device_ops hisi_acc_vfio_pci_ops = {
@@ -1272,6 +1275,8 @@ static int hisi_acc_vfio_pci_probe(struct pci_dev *pdev, const struct pci_device
                if (!ret) {
                        vfio_pci_core_init_device(&hisi_acc_vdev->core_device, pdev,
                                                  &hisi_acc_vfio_pci_migrn_ops);
+                       hisi_acc_vdev->core_device.vdev.mig_ops =
+                                       &hisi_acc_vfio_pci_migrn_state_ops;
                } else {
                        pci_warn(pdev, "migration support failed, continue with generic interface\n");
                        vfio_pci_core_init_device(&hisi_acc_vdev->core_device, pdev,
index cdd0c667dc7746401a5d84f39295b4d3df33721f..dd5d7bfe0a498422ccb9098d8b18f3ccfc370f1b 100644 (file)
@@ -108,7 +108,8 @@ void mlx5vf_cmd_remove_migratable(struct mlx5vf_pci_core_device *mvdev)
        destroy_workqueue(mvdev->cb_wq);
 }
 
-void mlx5vf_cmd_set_migratable(struct mlx5vf_pci_core_device *mvdev)
+void mlx5vf_cmd_set_migratable(struct mlx5vf_pci_core_device *mvdev,
+                              const struct vfio_migration_ops *mig_ops)
 {
        struct pci_dev *pdev = mvdev->core_device.pdev;
        int ret;
@@ -149,6 +150,7 @@ void mlx5vf_cmd_set_migratable(struct mlx5vf_pci_core_device *mvdev)
        mvdev->core_device.vdev.migration_flags =
                VFIO_MIGRATION_STOP_COPY |
                VFIO_MIGRATION_P2P;
+       mvdev->core_device.vdev.mig_ops = mig_ops;
 
 end:
        mlx5_vf_put_core_dev(mvdev->mdev);
index aa692d9ce65697dc87f2a5ae7780e2575b41f890..8208f4701a90800f33c45c7e468a2ea4d652f54c 100644 (file)
@@ -62,7 +62,8 @@ int mlx5vf_cmd_suspend_vhca(struct mlx5vf_pci_core_device *mvdev, u16 op_mod);
 int mlx5vf_cmd_resume_vhca(struct mlx5vf_pci_core_device *mvdev, u16 op_mod);
 int mlx5vf_cmd_query_vhca_migration_state(struct mlx5vf_pci_core_device *mvdev,
                                          size_t *state_size);
-void mlx5vf_cmd_set_migratable(struct mlx5vf_pci_core_device *mvdev);
+void mlx5vf_cmd_set_migratable(struct mlx5vf_pci_core_device *mvdev,
+                              const struct vfio_migration_ops *mig_ops);
 void mlx5vf_cmd_remove_migratable(struct mlx5vf_pci_core_device *mvdev);
 void mlx5vf_cmd_close_migratable(struct mlx5vf_pci_core_device *mvdev);
 int mlx5vf_cmd_save_vhca_state(struct mlx5vf_pci_core_device *mvdev,
index d754990f0662a566b6d0aa409b4c8470ca69e954..a9b63d15c5d3490353653490ade5f8c97092fc96 100644 (file)
@@ -574,6 +574,11 @@ static void mlx5vf_pci_close_device(struct vfio_device *core_vdev)
        vfio_pci_core_close_device(core_vdev);
 }
 
+static const struct vfio_migration_ops mlx5vf_pci_mig_ops = {
+       .migration_set_state = mlx5vf_pci_set_device_state,
+       .migration_get_state = mlx5vf_pci_get_device_state,
+};
+
 static const struct vfio_device_ops mlx5vf_pci_ops = {
        .name = "mlx5-vfio-pci",
        .open_device = mlx5vf_pci_open_device,
@@ -585,8 +590,6 @@ static const struct vfio_device_ops mlx5vf_pci_ops = {
        .mmap = vfio_pci_core_mmap,
        .request = vfio_pci_core_request,
        .match = vfio_pci_core_match,
-       .migration_set_state = mlx5vf_pci_set_device_state,
-       .migration_get_state = mlx5vf_pci_get_device_state,
 };
 
 static int mlx5vf_pci_probe(struct pci_dev *pdev,
@@ -599,7 +602,7 @@ static int mlx5vf_pci_probe(struct pci_dev *pdev,
        if (!mvdev)
                return -ENOMEM;
        vfio_pci_core_init_device(&mvdev->core_device, pdev, &mlx5vf_pci_ops);
-       mlx5vf_cmd_set_migratable(mvdev);
+       mlx5vf_cmd_set_migratable(mvdev, &mlx5vf_pci_mig_ops);
        dev_set_drvdata(&pdev->dev, &mvdev->core_device);
        ret = vfio_pci_core_register_device(&mvdev->core_device);
        if (ret)
index a0d69ddaf90d80a0e373e5f38a8a54a619d58ea6..2efa06b1fafaa6fbdb8cdac100adf38add6fa98b 100644 (file)
@@ -1855,6 +1855,13 @@ int vfio_pci_core_register_device(struct vfio_pci_core_device *vdev)
        if (pdev->hdr_type != PCI_HEADER_TYPE_NORMAL)
                return -EINVAL;
 
+       if (vdev->vdev.mig_ops) {
+               if (!(vdev->vdev.mig_ops->migration_get_state &&
+                     vdev->vdev.mig_ops->migration_set_state) ||
+                   !(vdev->vdev.migration_flags & VFIO_MIGRATION_STOP_COPY))
+                       return -EINVAL;
+       }
+
        /*
         * Prevent binding to PFs with VFs enabled, the VFs might be in use
         * by the host or other users.  We cannot capture the VFs if they
index 61e71c1154be673e9c40989958ff0c6a86600161..aac9213a783d1d569906808e41f4f427d97b3db2 100644 (file)
@@ -1541,8 +1541,7 @@ vfio_ioctl_device_feature_mig_device_state(struct vfio_device *device,
        struct file *filp = NULL;
        int ret;
 
-       if (!device->ops->migration_set_state ||
-           !device->ops->migration_get_state)
+       if (!device->mig_ops)
                return -ENOTTY;
 
        ret = vfio_check_feature(flags, argsz,
@@ -1558,7 +1557,8 @@ vfio_ioctl_device_feature_mig_device_state(struct vfio_device *device,
        if (flags & VFIO_DEVICE_FEATURE_GET) {
                enum vfio_device_mig_state curr_state;
 
-               ret = device->ops->migration_get_state(device, &curr_state);
+               ret = device->mig_ops->migration_get_state(device,
+                                                          &curr_state);
                if (ret)
                        return ret;
                mig.device_state = curr_state;
@@ -1566,7 +1566,7 @@ vfio_ioctl_device_feature_mig_device_state(struct vfio_device *device,
        }
 
        /* Handle the VFIO_DEVICE_FEATURE_SET */
-       filp = device->ops->migration_set_state(device, mig.device_state);
+       filp = device->mig_ops->migration_set_state(device, mig.device_state);
        if (IS_ERR(filp) || !filp)
                goto out_copy;
 
@@ -1589,8 +1589,7 @@ static int vfio_ioctl_device_feature_migration(struct vfio_device *device,
        };
        int ret;
 
-       if (!device->ops->migration_set_state ||
-           !device->ops->migration_get_state)
+       if (!device->mig_ops)
                return -ENOTTY;
 
        ret = vfio_check_feature(flags, argsz, VFIO_DEVICE_FEATURE_GET,
index 49580fa2073a8d7bab792fa7716f6ac8340bddc4..4d26e149db81826943c31e1473e669124e052986 100644 (file)
@@ -32,6 +32,11 @@ struct vfio_device_set {
 struct vfio_device {
        struct device *dev;
        const struct vfio_device_ops *ops;
+       /*
+        * mig_ops is a static property of the vfio_device which must be set
+        * prior to registering the vfio_device.
+        */
+       const struct vfio_migration_ops *mig_ops;
        struct vfio_group *group;
        struct vfio_device_set *dev_set;
        struct list_head dev_set_list;
@@ -61,16 +66,6 @@ struct vfio_device {
  *         match, -errno for abort (ex. match with insufficient or incorrect
  *         additional args)
  * @device_feature: Optional, fill in the VFIO_DEVICE_FEATURE ioctl
- * @migration_set_state: Optional callback to change the migration state for
- *         devices that support migration. It's mandatory for
- *         VFIO_DEVICE_FEATURE_MIGRATION migration support.
- *         The returned FD is used for data transfer according to the FSM
- *         definition. The driver is responsible to ensure that FD reaches end
- *         of stream or error whenever the migration FSM leaves a data transfer
- *         state or before close_device() returns.
- * @migration_get_state: Optional callback to get the migration state for
- *         devices that support migration. It's mandatory for
- *         VFIO_DEVICE_FEATURE_MIGRATION migration support.
  */
 struct vfio_device_ops {
        char    *name;
@@ -87,6 +82,21 @@ struct vfio_device_ops {
        int     (*match)(struct vfio_device *vdev, char *buf);
        int     (*device_feature)(struct vfio_device *device, u32 flags,
                                  void __user *arg, size_t argsz);
+};
+
+/**
+ * @migration_set_state: Optional callback to change the migration state for
+ *         devices that support migration. It's mandatory for
+ *         VFIO_DEVICE_FEATURE_MIGRATION migration support.
+ *         The returned FD is used for data transfer according to the FSM
+ *         definition. The driver is responsible to ensure that FD reaches end
+ *         of stream or error whenever the migration FSM leaves a data transfer
+ *         state or before close_device() returns.
+ * @migration_get_state: Optional callback to get the migration state for
+ *         devices that support migration. It's mandatory for
+ *         VFIO_DEVICE_FEATURE_MIGRATION migration support.
+ */
+struct vfio_migration_ops {
        struct file *(*migration_set_state)(
                struct vfio_device *device,
                enum vfio_device_mig_state new_state);