From: Sam Li <faithilikerun@gmail.com>
Use get_sysfs_str_val() to get the string value of device
zoned model. Then get_sysfs_zoned_model() can convert it to
BlockZoneModel type of QEMU.
Use get_sysfs_long_val() to get the long value of zoned device
information.
Signed-off-by: Sam Li <faithilikerun@gmail.com>
Reviewed-by: Hannes Reinecke <hare@suse.de>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Reviewed-by: Damien Le Moal <damien.lemoal@opensource.wdc.com>
Reviewed-by: Dmitry Fomichev <dmitry.fomichev@wdc.com>
Acked-by: Kevin Wolf <kwolf@redhat.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
Message-id: 20230508045533.175575-3-faithilikerun@gmail.com
Message-id: 20230324090605.28361-3-faithilikerun@gmail.com
[Adjust commit message prefix as suggested by Philippe Mathieu-Daudé
<philmd@linaro.org>.
--Stefan]
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
include/block/block_int-common.h | 3 +
block/file-posix.c | 135 ++++++++++++++++++++++---------
2 files changed, 100 insertions(+), 38 deletions(-)
diff --git a/include/block/block_int-common.h b/include/block/block_int-common.h
index 4909876756..c7ca5a83e9 100644
--- a/include/block/block_int-common.h
+++ b/include/block/block_int-common.h
@@ -862,6 +862,9 @@ typedef struct BlockLimits {
* an explicit monitor command to load the disk inside the guest).
*/
bool has_variable_length;
+
+ /* device zone model */
+ BlockZoneModel zoned;
} BlockLimits;
typedef struct BdrvOpBlocker BdrvOpBlocker;
diff --git a/block/file-posix.c b/block/file-posix.c
index c7b723368e..97c597a2a0 100644
--- a/block/file-posix.c
+++ b/block/file-posix.c
@@ -1202,15 +1202,89 @@ static int hdev_get_max_hw_transfer(int fd, struct stat *st)
#endif
}
-static int hdev_get_max_segments(int fd, struct stat *st)
+/*
+ * Get a sysfs attribute value as character string.
+ */
+#ifdef CONFIG_LINUX
+static int get_sysfs_str_val(struct stat *st, const char *attribute,
+ char **val) {
+ g_autofree char *sysfspath = NULL;
+ int ret;
+ size_t len;
+
+ if (!S_ISBLK(st->st_mode)) {
+ return -ENOTSUP;
+ }
+
+ sysfspath = g_strdup_printf("/sys/dev/block/%u:%u/queue/%s",
+ major(st->st_rdev), minor(st->st_rdev),
+ attribute);
+ ret = g_file_get_contents(sysfspath, val, &len, NULL);
+ if (ret == -1) {
+ return -ENOENT;
+ }
+
+ /* The file is ended with '\n' */
+ char *p;
+ p = *val;
+ if (*(p + len - 1) == '\n') {
+ *(p + len - 1) = '\0';
+ }
+ return ret;
+}
+#endif
+
+static int get_sysfs_zoned_model(struct stat *st, BlockZoneModel *zoned)
{
+ g_autofree char *val = NULL;
+ int ret;
+
+ ret = get_sysfs_str_val(st, "zoned", &val);
+ if (ret < 0) {
+ return ret;
+ }
+
+ if (strcmp(val, "host-managed") == 0) {
+ *zoned = BLK_Z_HM;
+ } else if (strcmp(val, "host-aware") == 0) {
+ *zoned = BLK_Z_HA;
+ } else if (strcmp(val, "none") == 0) {
+ *zoned = BLK_Z_NONE;
+ } else {
+ return -ENOTSUP;
+ }
+ return 0;
+}
+
+/*
+ * Get a sysfs attribute value as a long integer.
+ */
#ifdef CONFIG_LINUX
- char buf[32];
+static long get_sysfs_long_val(struct stat *st, const char *attribute)
+{
+ g_autofree char *str = NULL;
const char *end;
- char *sysfspath = NULL;
+ long val;
+ int ret;
+
+ ret = get_sysfs_str_val(st, attribute, &str);
+ if (ret < 0) {
+ return ret;
+ }
+
+ /* The file is ended with '\n', pass 'end' to accept that. */
+ ret = qemu_strtol(str, &end, 10, &val);
+ if (ret == 0 && end && *end == '\0') {
+ ret = val;
+ }
+ return ret;
+}
+#endif
+
+static int hdev_get_max_segments(int fd, struct stat *st)
+{
+#ifdef CONFIG_LINUX
int ret;
- int sysfd = -1;
- long max_segments;
if (S_ISCHR(st->st_mode)) {
if (ioctl(fd, SG_GET_SG_TABLESIZE, &ret) == 0) {
@@ -1218,44 +1292,27 @@ static int hdev_get_max_segments(int fd, struct stat *st)
}
return -ENOTSUP;
}
-
- if (!S_ISBLK(st->st_mode)) {
- return -ENOTSUP;
- }
-
- sysfspath = g_strdup_printf("/sys/dev/block/%u:%u/queue/max_segments",
- major(st->st_rdev), minor(st->st_rdev));
- sysfd = open(sysfspath, O_RDONLY);
- if (sysfd == -1) {
- ret = -errno;
- goto out;
- }
- ret = RETRY_ON_EINTR(read(sysfd, buf, sizeof(buf) - 1));
- if (ret < 0) {
- ret = -errno;
- goto out;
- } else if (ret == 0) {
- ret = -EIO;
- goto out;
- }
- buf[ret] = 0;
- /* The file is ended with '\n', pass 'end' to accept that. */
- ret = qemu_strtol(buf, &end, 10, &max_segments);
- if (ret == 0 && end && *end == '\n') {
- ret = max_segments;
- }
-
-out:
- if (sysfd != -1) {
- close(sysfd);
- }
- g_free(sysfspath);
- return ret;
+ return get_sysfs_long_val(st, "max_segments");
#else
return -ENOTSUP;
#endif
}
+static void raw_refresh_zoned_limits(BlockDriverState *bs, struct stat *st,
+ Error **errp)
+{
+ BlockZoneModel zoned;
+ int ret;
+
+ bs->bl.zoned = BLK_Z_NONE;
+
+ ret = get_sysfs_zoned_model(st, &zoned);
+ if (ret < 0 || zoned == BLK_Z_NONE) {
+ return;
+ }
+ bs->bl.zoned = zoned;
+}
+
static void raw_refresh_limits(BlockDriverState *bs, Error **errp)
{
BDRVRawState *s = bs->opaque;
@@ -1297,6 +1354,8 @@ static void raw_refresh_limits(BlockDriverState *bs, Error **errp)
bs->bl.max_hw_iov = ret;
}
}
+
+ raw_refresh_zoned_limits(bs, &st, errp);
}
static int check_for_dasd(int fd)
--
2.40.1
On 5/15/23 12:04 PM, Stefan Hajnoczi wrote: > From: Sam Li <faithilikerun@gmail.com> > > Use get_sysfs_str_val() to get the string value of device > zoned model. Then get_sysfs_zoned_model() can convert it to > BlockZoneModel type of QEMU. > > Use get_sysfs_long_val() to get the long value of zoned device > information. Hi Stefan, Sam, I am having an issue on s390x using virtio-blk-{pci,ccw} backed by an NVMe partition, and I've bisected the root cause to this commit. I noticed that tests which use the partition e.g. /dev/nvme0n1p1 as a backing device would fail, but those that use the namespace e.g. /dev/nvme0n1 would still succeed. The root issue appears to be that the block device associated with the partition does not have a "max_segments" attribute, and prior to this patch hdev_get_max_segment() would return -ENOENT in this case. After this patch, however, QEMU is instead crashing. It looks like g_file_get_contents is returning 0 with a len == 0 if the specified sysfs path does not exist. The following diff on top seems to resolve the issue for me: diff --git a/block/file-posix.c b/block/file-posix.c index 0ab158efba2..eeb0247c74e 100644 --- a/block/file-posix.c +++ b/block/file-posix.c @@ -1243,7 +1243,7 @@ static int get_sysfs_str_val(struct stat *st, const char *attribute, major(st->st_rdev), minor(st->st_rdev), attribute); ret = g_file_get_contents(sysfspath, val, &len, NULL); - if (ret == -1) { + if (ret == -1 || len == 0) { return -ENOENT; } > > Signed-off-by: Sam Li <faithilikerun@gmail.com> > Reviewed-by: Hannes Reinecke <hare@suse.de> > Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com> > Reviewed-by: Damien Le Moal <damien.lemoal@opensource.wdc.com> > Reviewed-by: Dmitry Fomichev <dmitry.fomichev@wdc.com> > Acked-by: Kevin Wolf <kwolf@redhat.com> > Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com> > Message-id: 20230508045533.175575-3-faithilikerun@gmail.com > Message-id: 20230324090605.28361-3-faithilikerun@gmail.com > [Adjust commit message prefix as suggested by Philippe Mathieu-Daudé > <philmd@linaro.org>. > --Stefan] > Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com> > --- > include/block/block_int-common.h | 3 + > block/file-posix.c | 135 ++++++++++++++++++++++--------- > 2 files changed, 100 insertions(+), 38 deletions(-) > > diff --git a/include/block/block_int-common.h b/include/block/block_int-common.h > index 4909876756..c7ca5a83e9 100644 > --- a/include/block/block_int-common.h > +++ b/include/block/block_int-common.h > @@ -862,6 +862,9 @@ typedef struct BlockLimits { > * an explicit monitor command to load the disk inside the guest). > */ > bool has_variable_length; > + > + /* device zone model */ > + BlockZoneModel zoned; > } BlockLimits; > > typedef struct BdrvOpBlocker BdrvOpBlocker; > diff --git a/block/file-posix.c b/block/file-posix.c > index c7b723368e..97c597a2a0 100644 > --- a/block/file-posix.c > +++ b/block/file-posix.c > @@ -1202,15 +1202,89 @@ static int hdev_get_max_hw_transfer(int fd, struct stat *st) > #endif > } > > -static int hdev_get_max_segments(int fd, struct stat *st) > +/* > + * Get a sysfs attribute value as character string. > + */ > +#ifdef CONFIG_LINUX > +static int get_sysfs_str_val(struct stat *st, const char *attribute, > + char **val) { > + g_autofree char *sysfspath = NULL; > + int ret; > + size_t len; > + > + if (!S_ISBLK(st->st_mode)) { > + return -ENOTSUP; > + } > + > + sysfspath = g_strdup_printf("/sys/dev/block/%u:%u/queue/%s", > + major(st->st_rdev), minor(st->st_rdev), > + attribute); > + ret = g_file_get_contents(sysfspath, val, &len, NULL); > + if (ret == -1) { > + return -ENOENT; > + } > + > + /* The file is ended with '\n' */ > + char *p; > + p = *val; > + if (*(p + len - 1) == '\n') { > + *(p + len - 1) = '\0'; > + } > + return ret; > +} > +#endif > + > +static int get_sysfs_zoned_model(struct stat *st, BlockZoneModel *zoned) > { > + g_autofree char *val = NULL; > + int ret; > + > + ret = get_sysfs_str_val(st, "zoned", &val); > + if (ret < 0) { > + return ret; > + } > + > + if (strcmp(val, "host-managed") == 0) { > + *zoned = BLK_Z_HM; > + } else if (strcmp(val, "host-aware") == 0) { > + *zoned = BLK_Z_HA; > + } else if (strcmp(val, "none") == 0) { > + *zoned = BLK_Z_NONE; > + } else { > + return -ENOTSUP; > + } > + return 0; > +} > + > +/* > + * Get a sysfs attribute value as a long integer. > + */ > #ifdef CONFIG_LINUX > - char buf[32]; > +static long get_sysfs_long_val(struct stat *st, const char *attribute) > +{ > + g_autofree char *str = NULL; > const char *end; > - char *sysfspath = NULL; > + long val; > + int ret; > + > + ret = get_sysfs_str_val(st, attribute, &str); > + if (ret < 0) { > + return ret; > + } > + > + /* The file is ended with '\n', pass 'end' to accept that. */ > + ret = qemu_strtol(str, &end, 10, &val); > + if (ret == 0 && end && *end == '\0') { > + ret = val; > + } > + return ret; > +} > +#endif > + > +static int hdev_get_max_segments(int fd, struct stat *st) > +{ > +#ifdef CONFIG_LINUX > int ret; > - int sysfd = -1; > - long max_segments; > > if (S_ISCHR(st->st_mode)) { > if (ioctl(fd, SG_GET_SG_TABLESIZE, &ret) == 0) { > @@ -1218,44 +1292,27 @@ static int hdev_get_max_segments(int fd, struct stat *st) > } > return -ENOTSUP; > } > - > - if (!S_ISBLK(st->st_mode)) { > - return -ENOTSUP; > - } > - > - sysfspath = g_strdup_printf("/sys/dev/block/%u:%u/queue/max_segments", > - major(st->st_rdev), minor(st->st_rdev)); > - sysfd = open(sysfspath, O_RDONLY); > - if (sysfd == -1) { > - ret = -errno; > - goto out; > - } > - ret = RETRY_ON_EINTR(read(sysfd, buf, sizeof(buf) - 1)); > - if (ret < 0) { > - ret = -errno; > - goto out; > - } else if (ret == 0) { > - ret = -EIO; > - goto out; > - } > - buf[ret] = 0; > - /* The file is ended with '\n', pass 'end' to accept that. */ > - ret = qemu_strtol(buf, &end, 10, &max_segments); > - if (ret == 0 && end && *end == '\n') { > - ret = max_segments; > - } > - > -out: > - if (sysfd != -1) { > - close(sysfd); > - } > - g_free(sysfspath); > - return ret; > + return get_sysfs_long_val(st, "max_segments"); > #else > return -ENOTSUP; > #endif > } > > +static void raw_refresh_zoned_limits(BlockDriverState *bs, struct stat *st, > + Error **errp) > +{ > + BlockZoneModel zoned; > + int ret; > + > + bs->bl.zoned = BLK_Z_NONE; > + > + ret = get_sysfs_zoned_model(st, &zoned); > + if (ret < 0 || zoned == BLK_Z_NONE) { > + return; > + } > + bs->bl.zoned = zoned; > +} > + > static void raw_refresh_limits(BlockDriverState *bs, Error **errp) > { > BDRVRawState *s = bs->opaque; > @@ -1297,6 +1354,8 @@ static void raw_refresh_limits(BlockDriverState *bs, Error **errp) > bs->bl.max_hw_iov = ret; > } > } > + > + raw_refresh_zoned_limits(bs, &st, errp); > } > > static int check_for_dasd(int fd)
Matthew Rosato <mjrosato@linux.ibm.com> 于2023年6月1日周四 02:21写道: > > On 5/15/23 12:04 PM, Stefan Hajnoczi wrote: > > From: Sam Li <faithilikerun@gmail.com> > > > > Use get_sysfs_str_val() to get the string value of device > > zoned model. Then get_sysfs_zoned_model() can convert it to > > BlockZoneModel type of QEMU. > > > > Use get_sysfs_long_val() to get the long value of zoned device > > information. > > Hi Stefan, Sam, > > I am having an issue on s390x using virtio-blk-{pci,ccw} backed by an NVMe partition, and I've bisected the root cause to this commit. > > I noticed that tests which use the partition e.g. /dev/nvme0n1p1 as a backing device would fail, but those that use the namespace e.g. /dev/nvme0n1 would still succeed. The root issue appears to be that the block device associated with the partition does not have a "max_segments" attribute, and prior to this patch hdev_get_max_segment() would return -ENOENT in this case. After this patch, however, QEMU is instead crashing. It looks like g_file_get_contents is returning 0 with a len == 0 if the specified sysfs path does not exist. The following diff on top seems to resolve the issue for me: > > > diff --git a/block/file-posix.c b/block/file-posix.c > index 0ab158efba2..eeb0247c74e 100644 > --- a/block/file-posix.c > +++ b/block/file-posix.c > @@ -1243,7 +1243,7 @@ static int get_sysfs_str_val(struct stat *st, const char *attribute, > major(st->st_rdev), minor(st->st_rdev), > attribute); > ret = g_file_get_contents(sysfspath, val, &len, NULL); > - if (ret == -1) { > + if (ret == -1 || len == 0) { > return -ENOENT; > } > Hi Matthew, Thanks for the information. After some checking, I think the bug here is that g_file_get_contens returns g_boolean value and the error case will return 0 instead of -1 in my previous code. Can the following line fix your issue on the s390x device? + if (ret == FALSE) { https://docs.gtk.org/glib/func.file_get_contents.html Thanks, Sam > > > > > > > Signed-off-by: Sam Li <faithilikerun@gmail.com> > > Reviewed-by: Hannes Reinecke <hare@suse.de> > > Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com> > > Reviewed-by: Damien Le Moal <damien.lemoal@opensource.wdc.com> > > Reviewed-by: Dmitry Fomichev <dmitry.fomichev@wdc.com> > > Acked-by: Kevin Wolf <kwolf@redhat.com> > > Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com> > > Message-id: 20230508045533.175575-3-faithilikerun@gmail.com > > Message-id: 20230324090605.28361-3-faithilikerun@gmail.com > > [Adjust commit message prefix as suggested by Philippe Mathieu-Daudé > > <philmd@linaro.org>. > > --Stefan] > > Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com> > > --- > > include/block/block_int-common.h | 3 + > > block/file-posix.c | 135 ++++++++++++++++++++++--------- > > 2 files changed, 100 insertions(+), 38 deletions(-) > > > > diff --git a/include/block/block_int-common.h b/include/block/block_int-common.h > > index 4909876756..c7ca5a83e9 100644 > > --- a/include/block/block_int-common.h > > +++ b/include/block/block_int-common.h > > @@ -862,6 +862,9 @@ typedef struct BlockLimits { > > * an explicit monitor command to load the disk inside the guest). > > */ > > bool has_variable_length; > > + > > + /* device zone model */ > > + BlockZoneModel zoned; > > } BlockLimits; > > > > typedef struct BdrvOpBlocker BdrvOpBlocker; > > diff --git a/block/file-posix.c b/block/file-posix.c > > index c7b723368e..97c597a2a0 100644 > > --- a/block/file-posix.c > > +++ b/block/file-posix.c > > @@ -1202,15 +1202,89 @@ static int hdev_get_max_hw_transfer(int fd, struct stat *st) > > #endif > > } > > > > -static int hdev_get_max_segments(int fd, struct stat *st) > > +/* > > + * Get a sysfs attribute value as character string. > > + */ > > +#ifdef CONFIG_LINUX > > +static int get_sysfs_str_val(struct stat *st, const char *attribute, > > + char **val) { > > + g_autofree char *sysfspath = NULL; > > + int ret; > > + size_t len; > > + > > + if (!S_ISBLK(st->st_mode)) { > > + return -ENOTSUP; > > + } > > + > > + sysfspath = g_strdup_printf("/sys/dev/block/%u:%u/queue/%s", > > + major(st->st_rdev), minor(st->st_rdev), > > + attribute); > > + ret = g_file_get_contents(sysfspath, val, &len, NULL); > > + if (ret == -1) { > > + return -ENOENT; > > + } > > + > > + /* The file is ended with '\n' */ > > + char *p; > > + p = *val; > > + if (*(p + len - 1) == '\n') { > > + *(p + len - 1) = '\0'; > > + } > > + return ret; > > +} > > +#endif > > + > > +static int get_sysfs_zoned_model(struct stat *st, BlockZoneModel *zoned) > > { > > + g_autofree char *val = NULL; > > + int ret; > > + > > + ret = get_sysfs_str_val(st, "zoned", &val); > > + if (ret < 0) { > > + return ret; > > + } > > + > > + if (strcmp(val, "host-managed") == 0) { > > + *zoned = BLK_Z_HM; > > + } else if (strcmp(val, "host-aware") == 0) { > > + *zoned = BLK_Z_HA; > > + } else if (strcmp(val, "none") == 0) { > > + *zoned = BLK_Z_NONE; > > + } else { > > + return -ENOTSUP; > > + } > > + return 0; > > +} > > + > > +/* > > + * Get a sysfs attribute value as a long integer. > > + */ > > #ifdef CONFIG_LINUX > > - char buf[32]; > > +static long get_sysfs_long_val(struct stat *st, const char *attribute) > > +{ > > + g_autofree char *str = NULL; > > const char *end; > > - char *sysfspath = NULL; > > + long val; > > + int ret; > > + > > + ret = get_sysfs_str_val(st, attribute, &str); > > + if (ret < 0) { > > + return ret; > > + } > > + > > + /* The file is ended with '\n', pass 'end' to accept that. */ > > + ret = qemu_strtol(str, &end, 10, &val); > > + if (ret == 0 && end && *end == '\0') { > > + ret = val; > > + } > > + return ret; > > +} > > +#endif > > + > > +static int hdev_get_max_segments(int fd, struct stat *st) > > +{ > > +#ifdef CONFIG_LINUX > > int ret; > > - int sysfd = -1; > > - long max_segments; > > > > if (S_ISCHR(st->st_mode)) { > > if (ioctl(fd, SG_GET_SG_TABLESIZE, &ret) == 0) { > > @@ -1218,44 +1292,27 @@ static int hdev_get_max_segments(int fd, struct stat *st) > > } > > return -ENOTSUP; > > } > > - > > - if (!S_ISBLK(st->st_mode)) { > > - return -ENOTSUP; > > - } > > - > > - sysfspath = g_strdup_printf("/sys/dev/block/%u:%u/queue/max_segments", > > - major(st->st_rdev), minor(st->st_rdev)); > > - sysfd = open(sysfspath, O_RDONLY); > > - if (sysfd == -1) { > > - ret = -errno; > > - goto out; > > - } > > - ret = RETRY_ON_EINTR(read(sysfd, buf, sizeof(buf) - 1)); > > - if (ret < 0) { > > - ret = -errno; > > - goto out; > > - } else if (ret == 0) { > > - ret = -EIO; > > - goto out; > > - } > > - buf[ret] = 0; > > - /* The file is ended with '\n', pass 'end' to accept that. */ > > - ret = qemu_strtol(buf, &end, 10, &max_segments); > > - if (ret == 0 && end && *end == '\n') { > > - ret = max_segments; > > - } > > - > > -out: > > - if (sysfd != -1) { > > - close(sysfd); > > - } > > - g_free(sysfspath); > > - return ret; > > + return get_sysfs_long_val(st, "max_segments"); > > #else > > return -ENOTSUP; > > #endif > > } > > > > +static void raw_refresh_zoned_limits(BlockDriverState *bs, struct stat *st, > > + Error **errp) > > +{ > > + BlockZoneModel zoned; > > + int ret; > > + > > + bs->bl.zoned = BLK_Z_NONE; > > + > > + ret = get_sysfs_zoned_model(st, &zoned); > > + if (ret < 0 || zoned == BLK_Z_NONE) { > > + return; > > + } > > + bs->bl.zoned = zoned; > > +} > > + > > static void raw_refresh_limits(BlockDriverState *bs, Error **errp) > > { > > BDRVRawState *s = bs->opaque; > > @@ -1297,6 +1354,8 @@ static void raw_refresh_limits(BlockDriverState *bs, Error **errp) > > bs->bl.max_hw_iov = ret; > > } > > } > > + > > + raw_refresh_zoned_limits(bs, &st, errp); > > } > > > > static int check_for_dasd(int fd) >
On 6/2/23 2:18 PM, Sam Li wrote: > Matthew Rosato <mjrosato@linux.ibm.com> 于2023年6月1日周四 02:21写道: >> >> On 5/15/23 12:04 PM, Stefan Hajnoczi wrote: >>> From: Sam Li <faithilikerun@gmail.com> >>> >>> Use get_sysfs_str_val() to get the string value of device >>> zoned model. Then get_sysfs_zoned_model() can convert it to >>> BlockZoneModel type of QEMU. >>> >>> Use get_sysfs_long_val() to get the long value of zoned device >>> information. >> >> Hi Stefan, Sam, >> >> I am having an issue on s390x using virtio-blk-{pci,ccw} backed by an NVMe partition, and I've bisected the root cause to this commit. >> >> I noticed that tests which use the partition e.g. /dev/nvme0n1p1 as a backing device would fail, but those that use the namespace e.g. /dev/nvme0n1 would still succeed. The root issue appears to be that the block device associated with the partition does not have a "max_segments" attribute, and prior to this patch hdev_get_max_segment() would return -ENOENT in this case. After this patch, however, QEMU is instead crashing. It looks like g_file_get_contents is returning 0 with a len == 0 if the specified sysfs path does not exist. The following diff on top seems to resolve the issue for me: >> >> >> diff --git a/block/file-posix.c b/block/file-posix.c >> index 0ab158efba2..eeb0247c74e 100644 >> --- a/block/file-posix.c >> +++ b/block/file-posix.c >> @@ -1243,7 +1243,7 @@ static int get_sysfs_str_val(struct stat *st, const char *attribute, >> major(st->st_rdev), minor(st->st_rdev), >> attribute); >> ret = g_file_get_contents(sysfspath, val, &len, NULL); >> - if (ret == -1) { >> + if (ret == -1 || len == 0) { >> return -ENOENT; >> } >> > > Hi Matthew, > > Thanks for the information. After some checking, I think the bug here > is that g_file_get_contens returns g_boolean value and the error case > will return 0 instead of -1 in my previous code. Can the following > line fix your issue on the s390x device? > > + if (ret == FALSE) { > > https://docs.gtk.org/glib/func.file_get_contents.html Hi Sam, Ah, good point, I didn't notice file_get_contents was meant to be a bool return and wondered why I was getting a return of 0 in the failing case, hence the check for len == 0. Anyway, yes, I verified that checking for ret == FALSE fixes the issue. FWIW, along the same line I also checked that this works: if (!g_file_get_contents(sysfspath, val, &len, NULL)) { return -ENOENT; } which I personally think looks cleaner and matches the other uses of g_file_get_contents in QEMU. Could also get rid of ret and just return 0 at the bottom of the function. Thanks, Matt
Matthew Rosato <mjrosato@linux.ibm.com> 于2023年6月3日周六 02:41写道: > > On 6/2/23 2:18 PM, Sam Li wrote: > > Matthew Rosato <mjrosato@linux.ibm.com> 于2023年6月1日周四 02:21写道: > >> > >> On 5/15/23 12:04 PM, Stefan Hajnoczi wrote: > >>> From: Sam Li <faithilikerun@gmail.com> > >>> > >>> Use get_sysfs_str_val() to get the string value of device > >>> zoned model. Then get_sysfs_zoned_model() can convert it to > >>> BlockZoneModel type of QEMU. > >>> > >>> Use get_sysfs_long_val() to get the long value of zoned device > >>> information. > >> > >> Hi Stefan, Sam, > >> > >> I am having an issue on s390x using virtio-blk-{pci,ccw} backed by an NVMe partition, and I've bisected the root cause to this commit. > >> > >> I noticed that tests which use the partition e.g. /dev/nvme0n1p1 as a backing device would fail, but those that use the namespace e.g. /dev/nvme0n1 would still succeed. The root issue appears to be that the block device associated with the partition does not have a "max_segments" attribute, and prior to this patch hdev_get_max_segment() would return -ENOENT in this case. After this patch, however, QEMU is instead crashing. It looks like g_file_get_contents is returning 0 with a len == 0 if the specified sysfs path does not exist. The following diff on top seems to resolve the issue for me: > >> > >> > >> diff --git a/block/file-posix.c b/block/file-posix.c > >> index 0ab158efba2..eeb0247c74e 100644 > >> --- a/block/file-posix.c > >> +++ b/block/file-posix.c > >> @@ -1243,7 +1243,7 @@ static int get_sysfs_str_val(struct stat *st, const char *attribute, > >> major(st->st_rdev), minor(st->st_rdev), > >> attribute); > >> ret = g_file_get_contents(sysfspath, val, &len, NULL); > >> - if (ret == -1) { > >> + if (ret == -1 || len == 0) { > >> return -ENOENT; > >> } > >> > > > > Hi Matthew, > > > > Thanks for the information. After some checking, I think the bug here > > is that g_file_get_contens returns g_boolean value and the error case > > will return 0 instead of -1 in my previous code. Can the following > > line fix your issue on the s390x device? > > > > + if (ret == FALSE) { > > > > https://docs.gtk.org/glib/func.file_get_contents.html > > Hi Sam, > > Ah, good point, I didn't notice file_get_contents was meant to be a bool return and wondered why I was getting a return of 0 in the failing case, hence the check for len == 0. > > Anyway, yes, I verified that checking for ret == FALSE fixes the issue. FWIW, along the same line I also checked that this works: > > if (!g_file_get_contents(sysfspath, val, &len, NULL)) { > return -ENOENT; > } > > which I personally think looks cleaner and matches the other uses of g_file_get_contents in QEMU. Could also get rid of ret and just return 0 at the bottom of the function. Indeed. I will fix this. Thanks! Sam
© 2016 - 2025 Red Hat, Inc.