Uses UADK wd_do_comp_sync() API to (de)compress a normal page using
hardware accelerator.
Signed-off-by: Shameer Kolothum <shameerali.kolothum.thodi@huawei.com>
---
migration/multifd-uadk.c | 132 ++++++++++++++++++++++++++++++++++++++-
1 file changed, 130 insertions(+), 2 deletions(-)
diff --git a/migration/multifd-uadk.c b/migration/multifd-uadk.c
index 3172e4d5ca..3329819bd4 100644
--- a/migration/multifd-uadk.c
+++ b/migration/multifd-uadk.c
@@ -13,6 +13,7 @@
#include "qemu/osdep.h"
#include "qemu/module.h"
#include "qapi/error.h"
+#include "exec/ramblock.h"
#include "migration.h"
#include "multifd.h"
#include "options.h"
@@ -140,6 +141,15 @@ static void multifd_uadk_send_cleanup(MultiFDSendParams *p, Error **errp)
p->compress_data = NULL;
}
+static inline void prepare_next_iov(MultiFDSendParams *p, void *base,
+ uint32_t len)
+{
+ p->iov[p->iovs_num].iov_base = (uint8_t *)base;
+ p->iov[p->iovs_num].iov_len = len;
+ p->next_packet_size += len;
+ p->iovs_num++;
+}
+
/**
* multifd_uadk_send_prepare: prepare data to be able to send
*
@@ -153,7 +163,56 @@ static void multifd_uadk_send_cleanup(MultiFDSendParams *p, Error **errp)
*/
static int multifd_uadk_send_prepare(MultiFDSendParams *p, Error **errp)
{
- return -1;
+ struct wd_data *uadk_data = p->compress_data;
+ uint32_t hdr_size;
+ uint8_t *buf = uadk_data->buf;
+ int ret = 0;
+
+ if (!multifd_send_prepare_common(p)) {
+ goto out;
+ }
+
+ hdr_size = p->pages->normal_num * sizeof(uint32_t);
+ /* prepare the header that stores the lengths of all compressed data */
+ prepare_next_iov(p, uadk_data->buf_hdr, hdr_size);
+
+ for (int i = 0; i < p->pages->normal_num; i++) {
+ struct wd_comp_req creq = {
+ .op_type = WD_DIR_COMPRESS,
+ .src = p->pages->block->host + p->pages->offset[i],
+ .src_len = p->page_size,
+ .dst = buf,
+ /* Set dst_len to double the src to take care of -ve compression */
+ .dst_len = p->page_size * 2,
+ };
+
+ ret = wd_do_comp_sync(uadk_data->handle, &creq);
+ if (ret || creq.status) {
+ error_setg(errp, "multifd %u: failed wd_do_comp_sync, ret %d status %d",
+ p->id, ret, creq.status);
+ return -1;
+ }
+ if (creq.dst_len < p->page_size) {
+ uadk_data->buf_hdr[i] = cpu_to_be32(creq.dst_len);
+ prepare_next_iov(p, buf, creq.dst_len);
+ buf += creq.dst_len;
+ } else {
+ /*
+ * Send raw data if compressed out >= page_size. We might be better
+ * off sending raw data if output is slightly less than page_size
+ * as well because at the receive end we can skip the decompression.
+ * But it is tricky to find the right number here.
+ */
+ uadk_data->buf_hdr[i] = cpu_to_be32(p->page_size);
+ prepare_next_iov(p, p->pages->block->host + p->pages->offset[i],
+ p->page_size);
+ buf += p->page_size;
+ }
+ }
+out:
+ p->flags |= MULTIFD_FLAG_UADK;
+ multifd_send_fill_packet(p);
+ return 0;
}
/**
@@ -206,7 +265,76 @@ static void multifd_uadk_recv_cleanup(MultiFDRecvParams *p)
*/
static int multifd_uadk_recv(MultiFDRecvParams *p, Error **errp)
{
- return -1;
+ struct wd_data *uadk_data = p->compress_data;
+ uint32_t in_size = p->next_packet_size;
+ uint32_t flags = p->flags & MULTIFD_FLAG_COMPRESSION_MASK;
+ uint32_t hdr_len = p->normal_num * sizeof(uint32_t);
+ uint32_t data_len = 0;
+ uint8_t *buf = uadk_data->buf;
+ int ret = 0;
+
+ if (flags != MULTIFD_FLAG_UADK) {
+ error_setg(errp, "multifd %u: flags received %x flags expected %x",
+ p->id, flags, MULTIFD_FLAG_ZLIB);
+ return -1;
+ }
+
+ multifd_recv_zero_page_process(p);
+ if (!p->normal_num) {
+ assert(in_size == 0);
+ return 0;
+ }
+
+ /* read compressed data lengths */
+ assert(hdr_len < in_size);
+ ret = qio_channel_read_all(p->c, (void *) uadk_data->buf_hdr,
+ hdr_len, errp);
+ if (ret != 0) {
+ return ret;
+ }
+
+ for (int i = 0; i < p->normal_num; i++) {
+ uadk_data->buf_hdr[i] = be32_to_cpu(uadk_data->buf_hdr[i]);
+ data_len += uadk_data->buf_hdr[i];
+ assert(uadk_data->buf_hdr[i] <= p->page_size);
+ }
+
+ /* read compressed data */
+ assert(in_size == hdr_len + data_len);
+ ret = qio_channel_read_all(p->c, (void *)buf, data_len, errp);
+ if (ret != 0) {
+ return ret;
+ }
+
+ for (int i = 0; i < p->normal_num; i++) {
+ struct wd_comp_req creq = {
+ .op_type = WD_DIR_DECOMPRESS,
+ .src = buf,
+ .src_len = uadk_data->buf_hdr[i],
+ .dst = p->host + p->normal[i],
+ .dst_len = p->page_size,
+ };
+
+ if (uadk_data->buf_hdr[i] == p->page_size) {
+ memcpy(p->host + p->normal[i], buf, p->page_size);
+ buf += p->page_size;
+ continue;
+ }
+
+ ret = wd_do_comp_sync(uadk_data->handle, &creq);
+ if (ret || creq.status) {
+ error_setg(errp, "multifd %u: failed wd_do_comp_sync, ret %d status %d",
+ p->id, ret, creq.status);
+ return -1;
+ }
+ if (creq.dst_len != p->page_size) {
+ error_setg(errp, "multifd %u: decompressed length error", p->id);
+ return -1;
+ }
+ buf += uadk_data->buf_hdr[i];
+ }
+
+ return 0;
}
static MultiFDMethods multifd_uadk_ops = {
--
2.17.1
Shameer Kolothum via <qemu-devel@nongnu.org> writes:
> Uses UADK wd_do_comp_sync() API to (de)compress a normal page using
> hardware accelerator.
>
> Signed-off-by: Shameer Kolothum <shameerali.kolothum.thodi@huawei.com>
A couple of comments below.
Reviewed-by: Fabiano Rosas <farosas@suse.de>
> ---
> migration/multifd-uadk.c | 132 ++++++++++++++++++++++++++++++++++++++-
> 1 file changed, 130 insertions(+), 2 deletions(-)
>
> diff --git a/migration/multifd-uadk.c b/migration/multifd-uadk.c
> index 3172e4d5ca..3329819bd4 100644
> --- a/migration/multifd-uadk.c
> +++ b/migration/multifd-uadk.c
> @@ -13,6 +13,7 @@
> #include "qemu/osdep.h"
> #include "qemu/module.h"
> #include "qapi/error.h"
> +#include "exec/ramblock.h"
> #include "migration.h"
> #include "multifd.h"
> #include "options.h"
> @@ -140,6 +141,15 @@ static void multifd_uadk_send_cleanup(MultiFDSendParams *p, Error **errp)
> p->compress_data = NULL;
> }
>
> +static inline void prepare_next_iov(MultiFDSendParams *p, void *base,
> + uint32_t len)
> +{
> + p->iov[p->iovs_num].iov_base = (uint8_t *)base;
> + p->iov[p->iovs_num].iov_len = len;
> + p->next_packet_size += len;
> + p->iovs_num++;
> +}
> +
> /**
> * multifd_uadk_send_prepare: prepare data to be able to send
> *
> @@ -153,7 +163,56 @@ static void multifd_uadk_send_cleanup(MultiFDSendParams *p, Error **errp)
> */
> static int multifd_uadk_send_prepare(MultiFDSendParams *p, Error **errp)
> {
> - return -1;
> + struct wd_data *uadk_data = p->compress_data;
> + uint32_t hdr_size;
> + uint8_t *buf = uadk_data->buf;
> + int ret = 0;
> +
> + if (!multifd_send_prepare_common(p)) {
> + goto out;
> + }
> +
> + hdr_size = p->pages->normal_num * sizeof(uint32_t);
> + /* prepare the header that stores the lengths of all compressed data */
> + prepare_next_iov(p, uadk_data->buf_hdr, hdr_size);
> +
> + for (int i = 0; i < p->pages->normal_num; i++) {
> + struct wd_comp_req creq = {
> + .op_type = WD_DIR_COMPRESS,
> + .src = p->pages->block->host + p->pages->offset[i],
> + .src_len = p->page_size,
> + .dst = buf,
> + /* Set dst_len to double the src to take care of -ve compression */
What's -ve compression?
> + .dst_len = p->page_size * 2,
> + };
> +
> + ret = wd_do_comp_sync(uadk_data->handle, &creq);
> + if (ret || creq.status) {
> + error_setg(errp, "multifd %u: failed wd_do_comp_sync, ret %d status %d",
> + p->id, ret, creq.status);
> + return -1;
> + }
> + if (creq.dst_len < p->page_size) {
> + uadk_data->buf_hdr[i] = cpu_to_be32(creq.dst_len);
> + prepare_next_iov(p, buf, creq.dst_len);
> + buf += creq.dst_len;
> + } else {
> + /*
> + * Send raw data if compressed out >= page_size. We might be better
> + * off sending raw data if output is slightly less than page_size
> + * as well because at the receive end we can skip the decompression.
> + * But it is tricky to find the right number here.
> + */
> + uadk_data->buf_hdr[i] = cpu_to_be32(p->page_size);
> + prepare_next_iov(p, p->pages->block->host + p->pages->offset[i],
> + p->page_size);
> + buf += p->page_size;
> + }
> + }
> +out:
> + p->flags |= MULTIFD_FLAG_UADK;
> + multifd_send_fill_packet(p);
> + return 0;
> }
>
> /**
> @@ -206,7 +265,76 @@ static void multifd_uadk_recv_cleanup(MultiFDRecvParams *p)
> */
> static int multifd_uadk_recv(MultiFDRecvParams *p, Error **errp)
> {
> - return -1;
> + struct wd_data *uadk_data = p->compress_data;
> + uint32_t in_size = p->next_packet_size;
> + uint32_t flags = p->flags & MULTIFD_FLAG_COMPRESSION_MASK;
> + uint32_t hdr_len = p->normal_num * sizeof(uint32_t);
> + uint32_t data_len = 0;
> + uint8_t *buf = uadk_data->buf;
> + int ret = 0;
> +
> + if (flags != MULTIFD_FLAG_UADK) {
> + error_setg(errp, "multifd %u: flags received %x flags expected %x",
> + p->id, flags, MULTIFD_FLAG_ZLIB);
> + return -1;
> + }
> +
> + multifd_recv_zero_page_process(p);
> + if (!p->normal_num) {
> + assert(in_size == 0);
> + return 0;
> + }
> +
> + /* read compressed data lengths */
> + assert(hdr_len < in_size);
> + ret = qio_channel_read_all(p->c, (void *) uadk_data->buf_hdr,
> + hdr_len, errp);
> + if (ret != 0) {
> + return ret;
> + }
> +
> + for (int i = 0; i < p->normal_num; i++) {
> + uadk_data->buf_hdr[i] = be32_to_cpu(uadk_data->buf_hdr[i]);
> + data_len += uadk_data->buf_hdr[i];
> + assert(uadk_data->buf_hdr[i] <= p->page_size);
> + }
> +
> + /* read compressed data */
> + assert(in_size == hdr_len + data_len);
> + ret = qio_channel_read_all(p->c, (void *)buf, data_len, errp);
> + if (ret != 0) {
> + return ret;
> + }
> +
> + for (int i = 0; i < p->normal_num; i++) {
> + struct wd_comp_req creq = {
> + .op_type = WD_DIR_DECOMPRESS,
> + .src = buf,
> + .src_len = uadk_data->buf_hdr[i],
> + .dst = p->host + p->normal[i],
> + .dst_len = p->page_size,
> + };
> +
> + if (uadk_data->buf_hdr[i] == p->page_size) {
> + memcpy(p->host + p->normal[i], buf, p->page_size);
> + buf += p->page_size;
> + continue;
> + }
> +
> + ret = wd_do_comp_sync(uadk_data->handle, &creq);
> + if (ret || creq.status) {
> + error_setg(errp, "multifd %u: failed wd_do_comp_sync, ret %d status %d",
> + p->id, ret, creq.status);
It would be nice to be able to tell compression from decompression in
these error messages.
> + return -1;
> + }
> + if (creq.dst_len != p->page_size) {
> + error_setg(errp, "multifd %u: decompressed length error", p->id);
> + return -1;
> + }
> + buf += uadk_data->buf_hdr[i];
> + }
> +
> + return 0;
> }
>
> static MultiFDMethods multifd_uadk_ops = {
> -----Original Message-----
> From: Fabiano Rosas <farosas@suse.de>
> Sent: Wednesday, June 5, 2024 7:57 PM
> To: Shameerali Kolothum Thodi <shameerali.kolothum.thodi@huawei.com>;
> peterx@redhat.com; yuan1.liu@intel.com
> Cc: qemu-devel@nongnu.org; Linuxarm <linuxarm@huawei.com>; linwenkai
> (C) <linwenkai6@hisilicon.com>; zhangfei.gao@linaro.org; huangchenghai
> <huangchenghai2@huawei.com>
> Subject: Re: [PATCH 5/7] migration/multifd: Add UADK based compression
> and decompression
>
> Shameer Kolothum via <qemu-devel@nongnu.org> writes:
>
> > Uses UADK wd_do_comp_sync() API to (de)compress a normal page using
> > hardware accelerator.
> >
> > Signed-off-by: Shameer Kolothum
> <shameerali.kolothum.thodi@huawei.com>
>
> A couple of comments below.
>
> Reviewed-by: Fabiano Rosas <farosas@suse.de>
> > ---
> > migration/multifd-uadk.c | 132
> ++++++++++++++++++++++++++++++++++++++-
> > 1 file changed, 130 insertions(+), 2 deletions(-)
> >
> > diff --git a/migration/multifd-uadk.c b/migration/multifd-uadk.c
> > index 3172e4d5ca..3329819bd4 100644
> > --- a/migration/multifd-uadk.c
> > +++ b/migration/multifd-uadk.c
> > @@ -13,6 +13,7 @@
> > #include "qemu/osdep.h"
> > #include "qemu/module.h"
> > #include "qapi/error.h"
> > +#include "exec/ramblock.h"
> > #include "migration.h"
> > #include "multifd.h"
> > #include "options.h"
> > @@ -140,6 +141,15 @@ static void
> multifd_uadk_send_cleanup(MultiFDSendParams *p, Error **errp)
> > p->compress_data = NULL;
> > }
> >
> > +static inline void prepare_next_iov(MultiFDSendParams *p, void *base,
> > + uint32_t len)
> > +{
> > + p->iov[p->iovs_num].iov_base = (uint8_t *)base;
> > + p->iov[p->iovs_num].iov_len = len;
> > + p->next_packet_size += len;
> > + p->iovs_num++;
> > +}
> > +
> > /**
> > * multifd_uadk_send_prepare: prepare data to be able to send
> > *
> > @@ -153,7 +163,56 @@ static void
> multifd_uadk_send_cleanup(MultiFDSendParams *p, Error **errp)
> > */
> > static int multifd_uadk_send_prepare(MultiFDSendParams *p, Error
> **errp)
> > {
> > - return -1;
> > + struct wd_data *uadk_data = p->compress_data;
> > + uint32_t hdr_size;
> > + uint8_t *buf = uadk_data->buf;
> > + int ret = 0;
> > +
> > + if (!multifd_send_prepare_common(p)) {
> > + goto out;
> > + }
> > +
> > + hdr_size = p->pages->normal_num * sizeof(uint32_t);
> > + /* prepare the header that stores the lengths of all compressed data */
> > + prepare_next_iov(p, uadk_data->buf_hdr, hdr_size);
> > +
> > + for (int i = 0; i < p->pages->normal_num; i++) {
> > + struct wd_comp_req creq = {
> > + .op_type = WD_DIR_COMPRESS,
> > + .src = p->pages->block->host + p->pages->offset[i],
> > + .src_len = p->page_size,
> > + .dst = buf,
> > + /* Set dst_len to double the src to take care of -ve compression */
>
> What's -ve compression?
Just meant the case where output is > input. I can reword this.
>
> > + .dst_len = p->page_size * 2,
> > + };
> > +
> > + ret = wd_do_comp_sync(uadk_data->handle, &creq);
> > + if (ret || creq.status) {
> > + error_setg(errp, "multifd %u: failed wd_do_comp_sync, ret %d
> status %d",
> > + p->id, ret, creq.status);
> > + return -1;
> > + }
> > + if (creq.dst_len < p->page_size) {
> > + uadk_data->buf_hdr[i] = cpu_to_be32(creq.dst_len);
> > + prepare_next_iov(p, buf, creq.dst_len);
> > + buf += creq.dst_len;
> > + } else {
> > + /*
> > + * Send raw data if compressed out >= page_size. We might be
> better
> > + * off sending raw data if output is slightly less than page_size
> > + * as well because at the receive end we can skip the
> decompression.
> > + * But it is tricky to find the right number here.
> > + */
> > + uadk_data->buf_hdr[i] = cpu_to_be32(p->page_size);
> > + prepare_next_iov(p, p->pages->block->host + p->pages->offset[i],
> > + p->page_size);
> > + buf += p->page_size;
> > + }
> > + }
> > +out:
> > + p->flags |= MULTIFD_FLAG_UADK;
> > + multifd_send_fill_packet(p);
> > + return 0;
> > }
> >
> > /**
> > @@ -206,7 +265,76 @@ static void
> multifd_uadk_recv_cleanup(MultiFDRecvParams *p)
> > */
> > static int multifd_uadk_recv(MultiFDRecvParams *p, Error **errp)
> > {
> > - return -1;
> > + struct wd_data *uadk_data = p->compress_data;
> > + uint32_t in_size = p->next_packet_size;
> > + uint32_t flags = p->flags & MULTIFD_FLAG_COMPRESSION_MASK;
> > + uint32_t hdr_len = p->normal_num * sizeof(uint32_t);
> > + uint32_t data_len = 0;
> > + uint8_t *buf = uadk_data->buf;
> > + int ret = 0;
> > +
> > + if (flags != MULTIFD_FLAG_UADK) {
> > + error_setg(errp, "multifd %u: flags received %x flags expected %x",
> > + p->id, flags, MULTIFD_FLAG_ZLIB);
> > + return -1;
> > + }
> > +
> > + multifd_recv_zero_page_process(p);
> > + if (!p->normal_num) {
> > + assert(in_size == 0);
> > + return 0;
> > + }
> > +
> > + /* read compressed data lengths */
> > + assert(hdr_len < in_size);
> > + ret = qio_channel_read_all(p->c, (void *) uadk_data->buf_hdr,
> > + hdr_len, errp);
> > + if (ret != 0) {
> > + return ret;
> > + }
> > +
> > + for (int i = 0; i < p->normal_num; i++) {
> > + uadk_data->buf_hdr[i] = be32_to_cpu(uadk_data->buf_hdr[i]);
> > + data_len += uadk_data->buf_hdr[i];
> > + assert(uadk_data->buf_hdr[i] <= p->page_size);
> > + }
> > +
> > + /* read compressed data */
> > + assert(in_size == hdr_len + data_len);
> > + ret = qio_channel_read_all(p->c, (void *)buf, data_len, errp);
> > + if (ret != 0) {
> > + return ret;
> > + }
> > +
> > + for (int i = 0; i < p->normal_num; i++) {
> > + struct wd_comp_req creq = {
> > + .op_type = WD_DIR_DECOMPRESS,
> > + .src = buf,
> > + .src_len = uadk_data->buf_hdr[i],
> > + .dst = p->host + p->normal[i],
> > + .dst_len = p->page_size,
> > + };
> > +
> > + if (uadk_data->buf_hdr[i] == p->page_size) {
> > + memcpy(p->host + p->normal[i], buf, p->page_size);
> > + buf += p->page_size;
> > + continue;
> > + }
> > +
> > + ret = wd_do_comp_sync(uadk_data->handle, &creq);
> > + if (ret || creq.status) {
> > + error_setg(errp, "multifd %u: failed wd_do_comp_sync, ret %d
> status %d",
> > + p->id, ret, creq.status);
>
> It would be nice to be able to tell compression from decompression in
> these error messages.
Ok. Will change.
Thanks,
Shameer
© 2016 - 2026 Red Hat, Inc.