Hi Zhenzhong,

On 10/9/23 03:25, Duan, Zhenzhong wrote:
>
>> -----Original Message-----
>> From: Eric Auger <eric.au...@redhat.com>
>> Sent: Monday, October 9, 2023 1:46 AM
>> Subject: Re: [PATCH v4 10/15] vfio/ccw: Use vfio_[attach/detach]_device
>>
>> Hi Zhenzhong,
>> On 10/8/23 12:21, Duan, Zhenzhong wrote:
>>> Hi Eric,
>>>
>>>> -----Original Message-----
>>>> From: Eric Auger <eric.au...@redhat.com>
>>>> Sent: Wednesday, October 4, 2023 11:44 PM
>>>> Subject: [PATCH v4 10/15] vfio/ccw: Use vfio_[attach/detach]_device
>>>>
>>>> Let the vfio-ccw device use vfio_attach_device() and
>>>> vfio_detach_device(), hence hiding the details of the used
>>>> IOMMU backend.
>>>>
>>>> Note that the migration reduces the following trace
>>>> "vfio: subchannel %s has already been attached" (featuring
>>>> cssid.ssid.devid) into "device is already attached"
>>>>
>>>> Also now all the devices have been migrated to use the new
>>>> vfio_attach_device/vfio_detach_device API, let's turn the
>>>> legacy functions into static functions, local to container.c.
>>>>
>>>> Signed-off-by: Eric Auger <eric.au...@redhat.com>
>>>> Signed-off-by: Yi Liu <yi.l....@intel.com>
>>>> Signed-off-by: Zhenzhong Duan <zhenzhong.d...@intel.com>
>>>> Reviewed-by: Matthew Rosato <mjros...@linux.ibm.com>
>>>>
>>>> ---
>>>>
>>>> v3:
>>>> - simplified vbasedev->dev setting
>>>>
>>>> v2 -> v3:
>>>> - Hopefully fix confusion beteen vbasedev->name, mdevid and sysfsdev
>>>>  while keeping into account Matthew's comment
>>>>  https://lore.kernel.org/qemu-devel/6e04ab8f-dc84-e9c2-deea-
>>>> 2b6b31678...@linux.ibm.com/
>>>> ---
>>>> include/hw/vfio/vfio-common.h |   5 --
>>>> hw/vfio/ccw.c                 | 122 +++++++++-------------------------
>>>> hw/vfio/common.c              |  10 +--
>>>> 3 files changed, 37 insertions(+), 100 deletions(-)
>>>>
>>>> diff --git a/include/hw/vfio/vfio-common.h b/include/hw/vfio/vfio-common.h
>>>> index 12fbfbc37d..c486bdef2a 100644
>>>> --- a/include/hw/vfio/vfio-common.h
>>>> +++ b/include/hw/vfio/vfio-common.h
>>>> @@ -202,7 +202,6 @@ typedef struct {
>>>>     hwaddr pages;
>>>> } VFIOBitmap;
>>>>
>>>> -void vfio_put_base_device(VFIODevice *vbasedev);
>>>> void vfio_disable_irqindex(VFIODevice *vbasedev, int index);
>>>> void vfio_unmask_single_irqindex(VFIODevice *vbasedev, int index);
>>>> void vfio_mask_single_irqindex(VFIODevice *vbasedev, int index);
>>>> @@ -220,11 +219,7 @@ void vfio_region_unmap(VFIORegion *region);
>>>> void vfio_region_exit(VFIORegion *region);
>>>> void vfio_region_finalize(VFIORegion *region);
>>>> void vfio_reset_handler(void *opaque);
>>>> -VFIOGroup *vfio_get_group(int groupid, AddressSpace *as, Error **errp);
>>>> -void vfio_put_group(VFIOGroup *group);
>>>> struct vfio_device_info *vfio_get_device_info(int fd);
>>>> -int vfio_get_device(VFIOGroup *group, const char *name,
>>>> -                    VFIODevice *vbasedev, Error **errp);
>>>> int vfio_attach_device(char *name, VFIODevice *vbasedev,
>>>>                        AddressSpace *as, Error **errp);
>>>> void vfio_detach_device(VFIODevice *vbasedev);
>>>> diff --git a/hw/vfio/ccw.c b/hw/vfio/ccw.c
>>>> index 1e2fce83b0..6ec35fedc9 100644
>>>> --- a/hw/vfio/ccw.c
>>>> +++ b/hw/vfio/ccw.c
>>>> @@ -572,88 +572,15 @@ static void vfio_ccw_put_region(VFIOCCWDevice
>>>> *vcdev)
>>>>     g_free(vcdev->io_region);
>>>> }
>>>>
>>>> -static void vfio_ccw_put_device(VFIOCCWDevice *vcdev)
>>>> -{
>>>> -    g_free(vcdev->vdev.name);
>>>> -    vfio_put_base_device(&vcdev->vdev);
>>>> -}
>>>> -
>>>> -static void vfio_ccw_get_device(VFIOGroup *group, VFIOCCWDevice *vcdev,
>>>> -                                Error **errp)
>>>> -{
>>>> -    S390CCWDevice *cdev = S390_CCW_DEVICE(vcdev);
>>>> -    char *name = g_strdup_printf("%x.%x.%04x", cdev->hostid.cssid,
>>>> -                                 cdev->hostid.ssid,
>>>> -                                 cdev->hostid.devid);
>>>> -    VFIODevice *vbasedev;
>>>> -
>>>> -    QLIST_FOREACH(vbasedev, &group->device_list, next) {
>>>> -        if (strcmp(vbasedev->name, name) == 0) {
>>>> -            error_setg(errp, "vfio: subchannel %s has already been 
>>>> attached",
>>>> -                       name);
>>>> -            goto out_err;
>>>> -        }
>>>> -    }
>>>> -
>>>> -    /*
>>>> -     * All vfio-ccw devices are believed to operate in a way compatible 
>>>> with
>>>> -     * discarding of memory in RAM blocks, ie. pages pinned in the host 
>>>> are
>>>> -     * in the current working set of the guest driver and therefore never
>>>> -     * overlap e.g., with pages available to the guest balloon driver.  
>>>> This
>>>> -     * needs to be set before vfio_get_device() for vfio common to handle
>>>> -     * ram_block_discard_disable().
>>>> -     */
>>>> -    vcdev->vdev.ram_block_discard_allowed = true;
>>>> -
>>>> -    if (vfio_get_device(group, cdev->mdevid, &vcdev->vdev, errp)) {
>>>> -        goto out_err;
>>>> -    }
>>>> -
>>>> -    vcdev->vdev.ops = &vfio_ccw_ops;
>>>> -    vcdev->vdev.type = VFIO_DEVICE_TYPE_CCW;
>>>> -    vcdev->vdev.name = name;
>>>> -    vcdev->vdev.dev = DEVICE(vcdev);
>>>> -
>>>> -    return;
>>>> -
>>>> -out_err:
>>>> -    g_free(name);
>>>> -}
>>>> -
>>>> -static VFIOGroup *vfio_ccw_get_group(S390CCWDevice *cdev, Error **errp)
>>>> -{
>>>> -    char *tmp, group_path[PATH_MAX];
>>>> -    ssize_t len;
>>>> -    int groupid;
>>>> -
>>>> -    tmp =
>> g_strdup_printf("/sys/bus/css/devices/%x.%x.%04x/%s/iommu_group",
>>>> -                          cdev->hostid.cssid, cdev->hostid.ssid,
>>>> -                          cdev->hostid.devid, cdev->mdevid);
>>>> -    len = readlink(tmp, group_path, sizeof(group_path));
>>>> -    g_free(tmp);
>>>> -
>>>> -    if (len <= 0 || len >= sizeof(group_path)) {
>>>> -        error_setg(errp, "vfio: no iommu_group found");
>>>> -        return NULL;
>>>> -    }
>>>> -
>>>> -    group_path[len] = 0;
>>>> -
>>>> -    if (sscanf(basename(group_path), "%d", &groupid) != 1) {
>>>> -        error_setg(errp, "vfio: failed to read %s", group_path);
>>>> -        return NULL;
>>>> -    }
>>>> -
>>>> -    return vfio_get_group(groupid, &address_space_memory, errp);
>>>> -}
>>>> -
>>>> static void vfio_ccw_realize(DeviceState *dev, Error **errp)
>>>> {
>>>> -    VFIOGroup *group;
>>>>     S390CCWDevice *cdev = S390_CCW_DEVICE(dev);
>>>>     VFIOCCWDevice *vcdev = VFIO_CCW(cdev);
>>>>     S390CCWDeviceClass *cdc = S390_CCW_DEVICE_GET_CLASS(cdev);
>>>> +    VFIODevice *vbasedev = &vcdev->vdev;
>>>>     Error *err = NULL;
>>>> +    char *name;
>>>> +    int ret;
>>>>
>>>>     /* Call the class init function for subchannel. */
>>>>     if (cdc->realize) {
>>>> @@ -663,14 +590,31 @@ static void vfio_ccw_realize(DeviceState *dev, Error
>>>> **errp)
>>>>         }
>>>>     }
>>>>
>>>> -    group = vfio_ccw_get_group(cdev, &err);
>>>> -    if (!group) {
>>>> -        goto out_group_err;
>>>> -    }
>>>> +    name = g_strdup_printf("%x.%x.%04x", vcdev->cdev.hostid.cssid,
>>>> +                           vcdev->cdev.hostid.ssid,
>>>> +                           vcdev->cdev.hostid.devid);
>>>> +    vbasedev->sysfsdev = g_strdup_printf("/sys/bus/css/devices/%s/%s",
>>>> +                                         name,
>>>> +                                         cdev->mdevid);
>>> Hoping not late for you to include this in v5.
>>> I think no need to re-assign sysfsdev as it's a user property, we'd better 
>>> to
>>> keep the original user value. Also looks a memory leak here.
>> OK I removed it.
>>>> +    vbasedev->ops = &vfio_ccw_ops;
>>>> +    vbasedev->type = VFIO_DEVICE_TYPE_CCW;
>>>> +    vbasedev->name = name;
>>> There will be a potential failure when a second mdev device under
>>> same cssid.ssid.devid attached. We can use cdev->mdevid as name.
>> But this mathes vfio_ccw_get_device() existing code where
>> vcdev->vdev.name = name; and
>> name = g_strdup_printf("%x.%x.%04x", cdev->hostid.cssid,
>>                                  cdev->hostid.ssid,
>>                                  cdev->hostid.devid);
> I suspect this is a bug of the existing code.
Then I would prefer we fix it separately. This patch migrates the
existing code without functional change intended.

>
>> cdev->mdevid is passed as first arg of vfio_attach_device() instead .
> vfio_attach_device() uses cdev->mdevid to get device FD, nothing more.
>
> If we use cssid.ssid.devid as name, then different mdev under same 
> cssid.ssid.devid will have same name, and the second mdev attachment will 
> fail to attach in vfio_attach_device():
>
>     QLIST_FOREACH(vbasedev_iter, &group->device_list, next) {
>         if (strcmp(vbasedev_iter->name, vbasedev->name) == 0) {
>             error_setg(errp, "device is already attached");
>             vfio_put_group(group);
>             return -EBUSY;
>         }
>     }
I get your point but this conversion matches the existing
vfio_ccw_get_device() code:
    char *name = g_strdup_printf("%x.%x.%04x", cdev->hostid.cssid,
                                 cdev->hostid.ssid,
                                 cdev->hostid.devid);
    VFIODevice *vbasedev;

    QLIST_FOREACH(vbasedev, &group->device_list, next) {
        if (strcmp(vbasedev->name, name) == 0) {
            error_setg(errp, "vfio: subchannel %s has already been
attached",
                       name);
            goto out_err;
        }
    }

>
>> i think this also matches
>> https://lore.kernel.org/all/PH7PR11MB67222DD282F98E03095FBA8A92C1A@PH
>> 7PR11MB6722.namprd11.prod.outlook.com/
>> no?
> It doesn't match what Mattew suggested: 
> https://lore.kernel.org/qemu-devel/6e04ab8f-dc84-e9c2-deea-2b6b31678...@linux.ibm.com/
this was RFC v3. At that time we did not pass any "name" arg to

vfio_attach_device(VFIODevice *vbasedev, AddressSpace *as, Error **errp)
and vbasedev->name was used when calling vfio_get_device() while we now
use cdev->mdevid. Besides Mattew ran some basic tests on PATCH v3:
https://lore.kernel.org/all/33b7803c-f231-d4fb-d9d9-26a097a89...@redhat.com/
So I would be tempted to leave it as is (without the sysfsdev overwrite
which came from Mattew's suggestion in
https://lore.kernel.org/qemu-devel/6e04ab8f-dc84-e9c2-deea-2b6b31678...@linux.ibm.com/
). Thanks Eric

>
> Thanks
> Zhenzhong
>


Reply via email to