1
The following changes since commit 673205379fb499d2b72f2985b47ec7114282f5fe:
1
The following changes since commit aa90f1161bb17a4863e16ec2f75104cff0752d4e:
2
2
3
Merge remote-tracking branch 'remotes/philmd-gitlab/tags/python-next-20200714' into staging (2020-07-15 13:04:27 +0100)
3
Merge tag 'migration-20250314-pull-request' of https://gitlab.com/farosas/qemu into staging (2025-03-16 02:45:22 -0400)
4
4
5
are available in the git repository at:
5
are available in the Git repository at:
6
6
7
https://github.com/jasowang/qemu.git tags/net-pull-request
7
https://github.com/jasowang/qemu.git tags/net-pull-request
8
8
9
for you to fetch changes up to a134321ef676723768973537bb9b49365ae2062e:
9
for you to fetch changes up to b027f55a994af885a7a498a40373a2dcc2d8b15e:
10
10
11
ftgmac100: fix dblac write test (2020-07-15 21:00:13 +0800)
11
vdpa: Allow vDPA to work on big-endian machine (2025-03-17 13:46:28 +0800)
12
12
13
----------------------------------------------------------------
13
----------------------------------------------------------------
14
-----BEGIN PGP SIGNATURE-----
15
16
iQEzBAABCAAdFiEEIV1G9IJGaJ7HfzVi7wSWWzmNYhEFAmfX5/cACgkQ7wSWWzmN
17
YhFRHQgArp4daHmnfc4r8TNel7fBjeSTpfDGwQcUJbcljKK2ABtylcESAEg6tsAw
18
aBzaZ2PwoTQfDV2s//g/d2uzd3BWH0Iu3qimsyBtx7Um7D4h7NsGB+gTB/7IhcK8
19
1LjMHqDnaeS6fzJ93/umTXuyQLzA3tIFkJBzvxVseLrmv6uBPmAy+PDNe/uZ2jeF
20
2H20jNt/HMc1Yf7sE7NKTBkX+OxuIFkpOGcBtVxiPK1//Wmhw+v+zlQOFjUC+6CD
21
LxiBB0Q0tD7ekfbuF6x2SOnuzLDHgpMzgoGqLIYzeQhBX9TdHLM0LtEHHaMyW1pj
22
7mGPSY4avVSM1sePgtmNJ5Y5r/xTRA==
23
=e7Sc
24
-----END PGP SIGNATURE-----
14
25
15
----------------------------------------------------------------
26
----------------------------------------------------------------
16
Andrew (1):
27
Konstantin Shkolnyy (1):
17
hw/net: Added CSO for IPv6
28
vdpa: Allow vDPA to work on big-endian machine
18
29
19
Daniel P. Berrangé (1):
30
net/vhost-vdpa.c | 13 +++++++++++++
20
net: detect errors from probing vnet hdr flag for TAP devices
31
1 file changed, 13 insertions(+)
21
22
Juan Quintela (1):
23
virtio-net: fix removal of failover device
24
25
Laurent Vivier (1):
26
net: check if the file descriptor is valid before using it
27
28
Zhang Chen (2):
29
net/colo-compare.c: Expose compare "max_queue_size" to users
30
qemu-options.hx: Clean up and fix typo for colo-compare
31
32
erik-smit (1):
33
ftgmac100: fix dblac write test
34
35
hw/net/ftgmac100.c | 14 +++++++------
36
hw/net/net_tx_pkt.c | 15 ++++++++++---
37
hw/net/virtio-net.c | 1 +
38
include/qemu/sockets.h | 1 +
39
net/colo-compare.c | 43 ++++++++++++++++++++++++++++++++++++-
40
net/socket.c | 9 ++++++--
41
net/tap-bsd.c | 2 +-
42
net/tap-linux.c | 8 ++++---
43
net/tap-solaris.c | 2 +-
44
net/tap-stub.c | 2 +-
45
net/tap.c | 50 +++++++++++++++++++++++++++++++++++--------
46
net/tap_int.h | 2 +-
47
qemu-options.hx | 33 +++++++++++++++--------------
48
util/oslib-posix.c | 26 ++++++++++++++++-------
49
util/oslib-win32.c | 57 ++++++++++++++++++++++++++++----------------------
50
15 files changed, 188 insertions(+), 77 deletions(-)
51
52
diff view generated by jsdifflib
Deleted patch
1
From: Juan Quintela <quintela@redhat.com>
2
1
3
If you have a networking device and its virtio failover device, and
4
you remove them in this order:
5
- virtio device
6
- the real device
7
8
You get qemu crash.
9
See bugzilla: https://bugzilla.redhat.com/show_bug.cgi?id=1820120
10
11
Bug exist on qemu 4.2 and 5.0.
12
But in 5.0 don't shows because commit
13
77b06bba62034a87cc61a9c8de1309ae3e527d97
14
15
somehow papers over it.
16
17
CC: Jason Wang <jasowang@redhat.com>
18
CC: Michael S. Tsirkin <mst@redhat.com>
19
Reviewed-by: Michael S. Tsirkin <mst@redhat.com>
20
Acked-by: Laurent Vivier <lvivier@redhat.com>
21
Signed-off-by: Juan Quintela <quintela@redhat.com>
22
Signed-off-by: Jason Wang <jasowang@redhat.com>
23
---
24
hw/net/virtio-net.c | 1 +
25
1 file changed, 1 insertion(+)
26
27
diff --git a/hw/net/virtio-net.c b/hw/net/virtio-net.c
28
index XXXXXXX..XXXXXXX 100644
29
--- a/hw/net/virtio-net.c
30
+++ b/hw/net/virtio-net.c
31
@@ -XXX,XX +XXX,XX @@ static void virtio_net_device_unrealize(DeviceState *dev)
32
g_free(n->vlans);
33
34
if (n->failover) {
35
+ device_listener_unregister(&n->primary_listener);
36
g_free(n->primary_device_id);
37
g_free(n->standby_id);
38
qobject_unref(n->primary_device_dict);
39
--
40
2.5.0
41
42
diff view generated by jsdifflib
Deleted patch
1
From: Andrew <andrew@daynix.com>
2
1
3
Added fix for checksum offload for IPv6 if a backend doesn't
4
have a virtual header.
5
This patch is a part of IPv6 fragmentation.
6
7
Signed-off-by: Andrew Melnychenko <andrew@daynix.com>
8
Signed-off-by: Jason Wang <jasowang@redhat.com>
9
---
10
hw/net/net_tx_pkt.c | 15 ++++++++++++---
11
1 file changed, 12 insertions(+), 3 deletions(-)
12
13
diff --git a/hw/net/net_tx_pkt.c b/hw/net/net_tx_pkt.c
14
index XXXXXXX..XXXXXXX 100644
15
--- a/hw/net/net_tx_pkt.c
16
+++ b/hw/net/net_tx_pkt.c
17
@@ -XXX,XX +XXX,XX @@ static void net_tx_pkt_do_sw_csum(struct NetTxPkt *pkt)
18
/* num of iovec without vhdr */
19
uint32_t iov_len = pkt->payload_frags + NET_TX_PKT_PL_START_FRAG - 1;
20
uint16_t csl;
21
- struct ip_header *iphdr;
22
size_t csum_offset = pkt->virt_hdr.csum_start + pkt->virt_hdr.csum_offset;
23
+ uint16_t l3_proto = eth_get_l3_proto(iov, 1, iov->iov_len);
24
25
/* Put zero to checksum field */
26
iov_from_buf(iov, iov_len, csum_offset, &csum, sizeof csum);
27
@@ -XXX,XX +XXX,XX @@ static void net_tx_pkt_do_sw_csum(struct NetTxPkt *pkt)
28
/* Calculate L4 TCP/UDP checksum */
29
csl = pkt->payload_len;
30
31
+ csum_cntr = 0;
32
+ cso = 0;
33
/* add pseudo header to csum */
34
- iphdr = pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_base;
35
- csum_cntr = eth_calc_ip4_pseudo_hdr_csum(iphdr, csl, &cso);
36
+ if (l3_proto == ETH_P_IP) {
37
+ csum_cntr = eth_calc_ip4_pseudo_hdr_csum(
38
+ pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_base,
39
+ csl, &cso);
40
+ } else if (l3_proto == ETH_P_IPV6) {
41
+ csum_cntr = eth_calc_ip6_pseudo_hdr_csum(
42
+ pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_base,
43
+ csl, pkt->l4proto, &cso);
44
+ }
45
46
/* data checksum */
47
csum_cntr +=
48
--
49
2.5.0
50
51
diff view generated by jsdifflib
Deleted patch
1
From: Zhang Chen <chen.zhang@intel.com>
2
1
3
This patch allow users to set the "max_queue_size" according
4
to their environment.
5
6
Signed-off-by: Zhang Chen <chen.zhang@intel.com>
7
Signed-off-by: Jason Wang <jasowang@redhat.com>
8
---
9
net/colo-compare.c | 43 ++++++++++++++++++++++++++++++++++++++++++-
10
qemu-options.hx | 5 +++--
11
2 files changed, 45 insertions(+), 3 deletions(-)
12
13
diff --git a/net/colo-compare.c b/net/colo-compare.c
14
index XXXXXXX..XXXXXXX 100644
15
--- a/net/colo-compare.c
16
+++ b/net/colo-compare.c
17
@@ -XXX,XX +XXX,XX @@ static bool colo_compare_active;
18
static QemuMutex event_mtx;
19
static QemuCond event_complete_cond;
20
static int event_unhandled_count;
21
+static uint32_t max_queue_size;
22
23
/*
24
* + CompareState ++
25
@@ -XXX,XX +XXX,XX @@ static void fill_pkt_tcp_info(void *data, uint32_t *max_ack)
26
*/
27
static int colo_insert_packet(GQueue *queue, Packet *pkt, uint32_t *max_ack)
28
{
29
- if (g_queue_get_length(queue) <= MAX_QUEUE_SIZE) {
30
+ if (g_queue_get_length(queue) <= max_queue_size) {
31
if (pkt->ip->ip_p == IPPROTO_TCP) {
32
fill_pkt_tcp_info(pkt, max_ack);
33
g_queue_insert_sorted(queue,
34
@@ -XXX,XX +XXX,XX @@ static void compare_set_expired_scan_cycle(Object *obj, Visitor *v,
35
s->expired_scan_cycle = value;
36
}
37
38
+static void get_max_queue_size(Object *obj, Visitor *v,
39
+ const char *name, void *opaque,
40
+ Error **errp)
41
+{
42
+ uint32_t value = max_queue_size;
43
+
44
+ visit_type_uint32(v, name, &value, errp);
45
+}
46
+
47
+static void set_max_queue_size(Object *obj, Visitor *v,
48
+ const char *name, void *opaque,
49
+ Error **errp)
50
+{
51
+ Error *local_err = NULL;
52
+ uint32_t value;
53
+
54
+ visit_type_uint32(v, name, &value, &local_err);
55
+ if (local_err) {
56
+ goto out;
57
+ }
58
+ if (!value) {
59
+ error_setg(&local_err, "Property '%s.%s' requires a positive value",
60
+ object_get_typename(obj), name);
61
+ goto out;
62
+ }
63
+ max_queue_size = value;
64
+
65
+out:
66
+ error_propagate(errp, local_err);
67
+}
68
+
69
static void compare_pri_rs_finalize(SocketReadState *pri_rs)
70
{
71
CompareState *s = container_of(pri_rs, CompareState, pri_rs);
72
@@ -XXX,XX +XXX,XX @@ static void colo_compare_complete(UserCreatable *uc, Error **errp)
73
s->expired_scan_cycle = REGULAR_PACKET_CHECK_MS;
74
}
75
76
+ if (!max_queue_size) {
77
+ /* Set default queue size to 1024 */
78
+ max_queue_size = MAX_QUEUE_SIZE;
79
+ }
80
+
81
if (find_and_check_chardev(&chr, s->pri_indev, errp) ||
82
!qemu_chr_fe_init(&s->chr_pri_in, chr, errp)) {
83
return;
84
@@ -XXX,XX +XXX,XX @@ static void colo_compare_init(Object *obj)
85
compare_get_expired_scan_cycle,
86
compare_set_expired_scan_cycle, NULL, NULL);
87
88
+ object_property_add(obj, "max_queue_size", "uint32",
89
+ get_max_queue_size,
90
+ set_max_queue_size, NULL, NULL);
91
+
92
s->vnet_hdr = false;
93
object_property_add_bool(obj, "vnet_hdr_support", compare_get_vnet_hdr,
94
compare_set_vnet_hdr);
95
diff --git a/qemu-options.hx b/qemu-options.hx
96
index XXXXXXX..XXXXXXX 100644
97
--- a/qemu-options.hx
98
+++ b/qemu-options.hx
99
@@ -XXX,XX +XXX,XX @@ SRST
100
stored. The file format is libpcap, so it can be analyzed with
101
tools such as tcpdump or Wireshark.
102
103
- ``-object colo-compare,id=id,primary_in=chardevid,secondary_in=chardevid,outdev=chardevid,iothread=id[,vnet_hdr_support][,notify_dev=id][,compare_timeout=@var{ms}][,expired_scan_cycle=@var{ms}``
104
+ ``-object colo-compare,id=id,primary_in=chardevid,secondary_in=chardevid,outdev=chardevid,iothread=id[,vnet_hdr_support][,notify_dev=id][,compare_timeout=@var{ms}][,expired_scan_cycle=@var{ms}][,max_queue_size=@var{size}]``
105
Colo-compare gets packet from primary\_inchardevid and
106
secondary\_inchardevid, than compare primary packet with
107
secondary packet. If the packets are same, we will output
108
@@ -XXX,XX +XXX,XX @@ SRST
109
vnet\_hdr\_len. Then compare\_timeout=@var{ms} determines the
110
maximum delay colo-compare wait for the packet.
111
The expired\_scan\_cycle=@var{ms} to set the period of scanning
112
- expired primary node network packets.
113
+ expired primary node network packets. The max\_queue\_size=@var{size}
114
+ is to set the max compare queue size depend on user environment.
115
If you want to use Xen COLO, will need the notify\_dev to
116
notify Xen colo-frame to do checkpoint.
117
118
--
119
2.5.0
120
121
diff view generated by jsdifflib
Deleted patch
1
From: Zhang Chen <chen.zhang@intel.com>
2
1
3
Fix some typo and optimized some descriptions.
4
5
Signed-off-by: Zhang Chen <chen.zhang@intel.com>
6
Signed-off-by: Jason Wang <jasowang@redhat.com>
7
---
8
qemu-options.hx | 32 ++++++++++++++++----------------
9
1 file changed, 16 insertions(+), 16 deletions(-)
10
11
diff --git a/qemu-options.hx b/qemu-options.hx
12
index XXXXXXX..XXXXXXX 100644
13
--- a/qemu-options.hx
14
+++ b/qemu-options.hx
15
@@ -XXX,XX +XXX,XX @@ SRST
16
tools such as tcpdump or Wireshark.
17
18
``-object colo-compare,id=id,primary_in=chardevid,secondary_in=chardevid,outdev=chardevid,iothread=id[,vnet_hdr_support][,notify_dev=id][,compare_timeout=@var{ms}][,expired_scan_cycle=@var{ms}][,max_queue_size=@var{size}]``
19
- Colo-compare gets packet from primary\_inchardevid and
20
- secondary\_inchardevid, than compare primary packet with
21
- secondary packet. If the packets are same, we will output
22
- primary packet to outdevchardevid, else we will notify
23
- colo-frame do checkpoint and send primary packet to
24
- outdevchardevid. In order to improve efficiency, we need to put
25
- the task of comparison in another thread. If it has the
26
- vnet\_hdr\_support flag, colo compare will send/recv packet with
27
- vnet\_hdr\_len. Then compare\_timeout=@var{ms} determines the
28
- maximum delay colo-compare wait for the packet.
29
- The expired\_scan\_cycle=@var{ms} to set the period of scanning
30
- expired primary node network packets. The max\_queue\_size=@var{size}
31
- is to set the max compare queue size depend on user environment.
32
- If you want to use Xen COLO, will need the notify\_dev to
33
+ Colo-compare gets packet from primary\_in chardevid and
34
+ secondary\_in, then compare whether the payload of primary packet
35
+ and secondary packet are the same. If same, it will output
36
+ primary packet to out\_dev, else it will notify COLO-framework to do
37
+ checkpoint and send primary packet to out\_dev. In order to
38
+ improve efficiency, we need to put the task of comparison in
39
+ another iothread. If it has the vnet\_hdr\_support flag,
40
+ colo compare will send/recv packet with vnet\_hdr\_len.
41
+ The compare\_timeout=@var{ms} determines the maximum time of the
42
+ colo-compare hold the packet. The expired\_scan\_cycle=@var{ms}
43
+ is to set the period of scanning expired primary node network packets.
44
+ The max\_queue\_size=@var{size} is to set the max compare queue
45
+ size depend on user environment.
46
+ If user want to use Xen COLO, need to add the notify\_dev to
47
notify Xen colo-frame to do checkpoint.
48
49
- we must use it with the help of filter-mirror and
50
- filter-redirector.
51
+ COLO-compare must be used with the help of filter-mirror,
52
+ filter-redirector and filter-rewriter.
53
54
::
55
56
--
57
2.5.0
58
59
diff view generated by jsdifflib
1
From: Laurent Vivier <lvivier@redhat.com>
1
From: Konstantin Shkolnyy <kshk@linux.ibm.com>
2
2
3
qemu_set_nonblock() checks that the file descriptor can be used and, if
3
Add .set_vnet_le() function that always returns success, assuming that
4
not, crashes QEMU. An assert() is used for that. The use of assert() is
4
vDPA h/w always implements LE data format. Otherwise, QEMU disables vDPA and
5
used to detect programming error and the coredump will allow to debug
5
outputs the message:
6
the problem.
6
"backend does not support LE vnet headers; falling back on userspace virtio"
7
7
8
But in the case of the tap device, this assert() can be triggered by
8
Reviewed-by: Michael S. Tsirkin <mst@redhat.com>
9
a misconfiguration by the user. At startup, it's not a real problem, but it
9
Acked-by: Eugenio Pérez <eperezma@redhat.com>
10
can also happen during the hot-plug of a new device, and here it's a
10
Signed-off-by: Konstantin Shkolnyy <kshk@linux.ibm.com>
11
problem because we can crash a perfectly healthy system.
12
13
For instance:
14
# ip link add link virbr0 name macvtap0 type macvtap mode bridge
15
# ip link set macvtap0 up
16
# TAP=/dev/tap$(ip -o link show macvtap0 | cut -d: -f1)
17
# qemu-system-x86_64 -machine q35 -device pcie-root-port,id=pcie-root-port-0 -monitor stdio 9<> $TAP
18
(qemu) netdev_add type=tap,id=hostnet0,vhost=on,fd=9
19
(qemu) device_add driver=virtio-net-pci,netdev=hostnet0,id=net0,bus=pcie-root-port-0
20
(qemu) device_del net0
21
(qemu) netdev_del hostnet0
22
(qemu) netdev_add type=tap,id=hostnet1,vhost=on,fd=9
23
qemu-system-x86_64: .../util/oslib-posix.c:247: qemu_set_nonblock: Assertion `f != -1' failed.
24
Aborted (core dumped)
25
26
To avoid that, add a function, qemu_try_set_nonblock(), that allows to report the
27
problem without crashing.
28
29
In the same way, we also update the function for vhostfd in net_init_tap_one() and
30
for fd in net_init_socket() (both descriptors are provided by the user and can
31
be wrong).
32
33
Signed-off-by: Laurent Vivier <lvivier@redhat.com>
34
Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com>
35
Signed-off-by: Jason Wang <jasowang@redhat.com>
11
Signed-off-by: Jason Wang <jasowang@redhat.com>
36
---
12
---
37
include/qemu/sockets.h | 1 +
13
net/vhost-vdpa.c | 13 +++++++++++++
38
net/socket.c | 9 ++++++--
14
1 file changed, 13 insertions(+)
39
net/tap.c | 25 ++++++++++++++++++----
40
util/oslib-posix.c | 26 ++++++++++++++++-------
41
util/oslib-win32.c | 57 ++++++++++++++++++++++++++++----------------------
42
5 files changed, 79 insertions(+), 39 deletions(-)
43
15
44
diff --git a/include/qemu/sockets.h b/include/qemu/sockets.h
16
diff --git a/net/vhost-vdpa.c b/net/vhost-vdpa.c
45
index XXXXXXX..XXXXXXX 100644
17
index XXXXXXX..XXXXXXX 100644
46
--- a/include/qemu/sockets.h
18
--- a/net/vhost-vdpa.c
47
+++ b/include/qemu/sockets.h
19
+++ b/net/vhost-vdpa.c
48
@@ -XXX,XX +XXX,XX @@ int qemu_accept(int s, struct sockaddr *addr, socklen_t *addrlen);
20
@@ -XXX,XX +XXX,XX @@ static bool vhost_vdpa_has_ufo(NetClientState *nc)
49
int socket_set_cork(int fd, int v);
21
50
int socket_set_nodelay(int fd);
51
void qemu_set_block(int fd);
52
+int qemu_try_set_nonblock(int fd);
53
void qemu_set_nonblock(int fd);
54
int socket_set_fast_reuse(int fd);
55
56
diff --git a/net/socket.c b/net/socket.c
57
index XXXXXXX..XXXXXXX 100644
58
--- a/net/socket.c
59
+++ b/net/socket.c
60
@@ -XXX,XX +XXX,XX @@ int net_init_socket(const Netdev *netdev, const char *name,
61
}
62
63
if (sock->has_fd) {
64
- int fd;
65
+ int fd, ret;
66
67
fd = monitor_fd_param(cur_mon, sock->fd, errp);
68
if (fd == -1) {
69
return -1;
70
}
71
- qemu_set_nonblock(fd);
72
+ ret = qemu_try_set_nonblock(fd);
73
+ if (ret < 0) {
74
+ error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
75
+ name, fd);
76
+ return -1;
77
+ }
78
if (!net_socket_fd_init(peer, "socket", name, fd, 1, sock->mcast,
79
errp)) {
80
return -1;
81
diff --git a/net/tap.c b/net/tap.c
82
index XXXXXXX..XXXXXXX 100644
83
--- a/net/tap.c
84
+++ b/net/tap.c
85
@@ -XXX,XX +XXX,XX @@ static void net_init_tap_one(const NetdevTapOptions *tap, NetClientState *peer,
86
}
87
88
if (vhostfdname) {
89
+ int ret;
90
+
91
vhostfd = monitor_fd_param(cur_mon, vhostfdname, &err);
92
if (vhostfd == -1) {
93
if (tap->has_vhostforce && tap->vhostforce) {
94
@@ -XXX,XX +XXX,XX @@ static void net_init_tap_one(const NetdevTapOptions *tap, NetClientState *peer,
95
}
96
return;
97
}
98
- qemu_set_nonblock(vhostfd);
99
+ ret = qemu_try_set_nonblock(vhostfd);
100
+ if (ret < 0) {
101
+ error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
102
+ name, fd);
103
+ return;
104
+ }
105
} else {
106
vhostfd = open("/dev/vhost-net", O_RDWR);
107
if (vhostfd < 0) {
108
@@ -XXX,XX +XXX,XX @@ int net_init_tap(const Netdev *netdev, const char *name,
109
Error *err = NULL;
110
const char *vhostfdname;
111
char ifname[128];
112
+ int ret = 0;
113
114
assert(netdev->type == NET_CLIENT_DRIVER_TAP);
115
tap = &netdev->u.tap;
116
@@ -XXX,XX +XXX,XX @@ int net_init_tap(const Netdev *netdev, const char *name,
117
return -1;
118
}
119
120
- qemu_set_nonblock(fd);
121
+ ret = qemu_try_set_nonblock(fd);
122
+ if (ret < 0) {
123
+ error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
124
+ name, fd);
125
+ return -1;
126
+ }
127
128
vnet_hdr = tap_probe_vnet_hdr(fd);
129
130
@@ -XXX,XX +XXX,XX @@ int net_init_tap(const Netdev *netdev, const char *name,
131
char **fds;
132
char **vhost_fds;
133
int nfds = 0, nvhosts = 0;
134
- int ret = 0;
135
136
if (tap->has_ifname || tap->has_script || tap->has_downscript ||
137
tap->has_vnet_hdr || tap->has_helper || tap->has_queues ||
138
@@ -XXX,XX +XXX,XX @@ int net_init_tap(const Netdev *netdev, const char *name,
139
goto free_fail;
140
}
141
142
- qemu_set_nonblock(fd);
143
+ ret = qemu_try_set_nonblock(fd);
144
+ if (ret < 0) {
145
+ error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
146
+ name, fd);
147
+ goto free_fail;
148
+ }
149
150
if (i == 0) {
151
vnet_hdr = tap_probe_vnet_hdr(fd);
152
diff --git a/util/oslib-posix.c b/util/oslib-posix.c
153
index XXXXXXX..XXXXXXX 100644
154
--- a/util/oslib-posix.c
155
+++ b/util/oslib-posix.c
156
@@ -XXX,XX +XXX,XX @@ void qemu_set_block(int fd)
157
assert(f != -1);
158
}
22
}
159
23
160
-void qemu_set_nonblock(int fd)
24
+/*
161
+int qemu_try_set_nonblock(int fd)
25
+ * FIXME: vhost_vdpa doesn't have an API to "set h/w endianness". But it's
162
{
26
+ * reasonable to assume that h/w is LE by default, because LE is what
163
int f;
27
+ * virtio 1.0 and later ask for. So, this function just says "yes, the h/w is
164
f = fcntl(fd, F_GETFL);
28
+ * LE". Otherwise, on a BE machine, higher-level code would mistakely think
165
- assert(f != -1);
29
+ * the h/w is BE and can't support VDPA for a virtio 1.0 client.
166
- f = fcntl(fd, F_SETFL, f | O_NONBLOCK);
30
+ */
167
-#ifdef __OpenBSD__
31
+static int vhost_vdpa_set_vnet_le(NetClientState *nc, bool enable)
168
if (f == -1) {
32
+{
169
+ return -errno;
170
+ }
171
+ if (fcntl(fd, F_SETFL, f | O_NONBLOCK) == -1) {
172
+#ifdef __OpenBSD__
173
/*
174
* Previous to OpenBSD 6.3, fcntl(F_SETFL) is not permitted on
175
* memory devices and sets errno to ENODEV.
176
* It's OK if we fail to set O_NONBLOCK on devices like /dev/null,
177
* because they will never block anyway.
178
*/
179
- assert(errno == ENODEV);
180
- }
181
-#else
182
- assert(f != -1);
183
+ if (errno == ENODEV) {
184
+ return 0;
185
+ }
186
#endif
187
+ return -errno;
188
+ }
189
+ return 0;
33
+ return 0;
190
+}
34
+}
191
+
35
+
192
+void qemu_set_nonblock(int fd)
36
static bool vhost_vdpa_check_peer_type(NetClientState *nc, ObjectClass *oc,
193
+{
37
Error **errp)
194
+ int f;
195
+ f = qemu_try_set_nonblock(fd);
196
+ assert(f == 0);
197
}
198
199
int socket_set_fast_reuse(int fd)
200
diff --git a/util/oslib-win32.c b/util/oslib-win32.c
201
index XXXXXXX..XXXXXXX 100644
202
--- a/util/oslib-win32.c
203
+++ b/util/oslib-win32.c
204
@@ -XXX,XX +XXX,XX @@ struct tm *localtime_r(const time_t *timep, struct tm *result)
205
}
206
#endif /* CONFIG_LOCALTIME_R */
207
208
-void qemu_set_block(int fd)
209
-{
210
- unsigned long opt = 0;
211
- WSAEventSelect(fd, NULL, 0);
212
- ioctlsocket(fd, FIONBIO, &opt);
213
-}
214
-
215
-void qemu_set_nonblock(int fd)
216
-{
217
- unsigned long opt = 1;
218
- ioctlsocket(fd, FIONBIO, &opt);
219
- qemu_fd_register(fd);
220
-}
221
-
222
-int socket_set_fast_reuse(int fd)
223
-{
224
- /* Enabling the reuse of an endpoint that was used by a socket still in
225
- * TIME_WAIT state is usually performed by setting SO_REUSEADDR. On Windows
226
- * fast reuse is the default and SO_REUSEADDR does strange things. So we
227
- * don't have to do anything here. More info can be found at:
228
- * http://msdn.microsoft.com/en-us/library/windows/desktop/ms740621.aspx */
229
- return 0;
230
-}
231
-
232
-
233
static int socket_error(void)
234
{
38
{
235
switch (WSAGetLastError()) {
39
@@ -XXX,XX +XXX,XX @@ static NetClientInfo net_vhost_vdpa_info = {
236
@@ -XXX,XX +XXX,XX @@ static int socket_error(void)
40
.cleanup = vhost_vdpa_cleanup,
237
}
41
.has_vnet_hdr = vhost_vdpa_has_vnet_hdr,
238
}
42
.has_ufo = vhost_vdpa_has_ufo,
239
43
+ .set_vnet_le = vhost_vdpa_set_vnet_le,
240
+void qemu_set_block(int fd)
44
.check_peer_type = vhost_vdpa_check_peer_type,
241
+{
45
.set_steering_ebpf = vhost_vdpa_set_steering_ebpf,
242
+ unsigned long opt = 0;
46
};
243
+ WSAEventSelect(fd, NULL, 0);
244
+ ioctlsocket(fd, FIONBIO, &opt);
245
+}
246
+
247
+int qemu_try_set_nonblock(int fd)
248
+{
249
+ unsigned long opt = 1;
250
+ if (ioctlsocket(fd, FIONBIO, &opt) != NO_ERROR) {
251
+ return -socket_error();
252
+ }
253
+ qemu_fd_register(fd);
254
+ return 0;
255
+}
256
+
257
+void qemu_set_nonblock(int fd)
258
+{
259
+ (void)qemu_try_set_nonblock(fd);
260
+}
261
+
262
+int socket_set_fast_reuse(int fd)
263
+{
264
+ /* Enabling the reuse of an endpoint that was used by a socket still in
265
+ * TIME_WAIT state is usually performed by setting SO_REUSEADDR. On Windows
266
+ * fast reuse is the default and SO_REUSEADDR does strange things. So we
267
+ * don't have to do anything here. More info can be found at:
268
+ * http://msdn.microsoft.com/en-us/library/windows/desktop/ms740621.aspx */
269
+ return 0;
270
+}
271
+
272
int inet_aton(const char *cp, struct in_addr *ia)
273
{
274
uint32_t addr = inet_addr(cp);
275
--
47
--
276
2.5.0
48
2.42.0
277
49
278
50
diff view generated by jsdifflib
Deleted patch
1
From: "Daniel P. Berrange" <berrange@redhat.com>
2
1
3
When QEMU sets up a tap based network device backend, it mostly ignores errors
4
reported from various ioctl() calls it makes, assuming the TAP file descriptor
5
is valid. This assumption can easily be violated when the user is passing in a
6
pre-opened file descriptor. At best, the ioctls may fail with a -EBADF, but if
7
the user passes in a bogus FD number that happens to clash with a FD number that
8
QEMU has opened internally for another reason, a wide variety of errnos may
9
result, as the TUNGETIFF ioctl number may map to a completely different command
10
on a different type of file.
11
12
By ignoring all these errors, QEMU sets up a zombie network backend that will
13
never pass any data. Even worse, when QEMU shuts down, or that network backend
14
is hot-removed, it will close this bogus file descriptor, which could belong to
15
another QEMU device backend.
16
17
There's no obvious guaranteed reliable way to detect that a FD genuinely is a
18
TAP device, as opposed to a UNIX socket, or pipe, or something else. Checking
19
the errno from probing vnet hdr flag though, does catch the big common cases.
20
ie calling TUNGETIFF will return EBADF for an invalid FD, and ENOTTY when FD is
21
a UNIX socket, or pipe which catches accidental collisions with FDs used for
22
stdio, or monitor socket.
23
24
Previously the example below where bogus fd 9 collides with the FD used for the
25
chardev saw:
26
27
$ ./x86_64-softmmu/qemu-system-x86_64 -netdev tap,id=hostnet0,fd=9 \
28
-chardev socket,id=charchannel0,path=/tmp/qga,server,nowait \
29
-monitor stdio -vnc :0
30
qemu-system-x86_64: -netdev tap,id=hostnet0,fd=9: TUNGETIFF ioctl() failed: Inappropriate ioctl for device
31
TUNSETOFFLOAD ioctl() failed: Bad address
32
QEMU 2.9.1 monitor - type 'help' for more information
33
(qemu) Warning: netdev hostnet0 has no peer
34
35
which gives a running QEMU with a zombie network backend.
36
37
With this change applied we get an error message and QEMU immediately exits
38
before carrying on and making a bigger disaster:
39
40
$ ./x86_64-softmmu/qemu-system-x86_64 -netdev tap,id=hostnet0,fd=9 \
41
-chardev socket,id=charchannel0,path=/tmp/qga,server,nowait \
42
-monitor stdio -vnc :0
43
qemu-system-x86_64: -netdev tap,id=hostnet0,vhost=on,fd=9: Unable to query TUNGETIFF on FD 9: Inappropriate ioctl for device
44
45
Reported-by: Dr. David Alan Gilbert <dgilbert@redhat.com>
46
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
47
Tested-by: Dr. David Alan Gilbert <dgilbert@redhat.com>
48
Message-id: 20171027085548.3472-1-berrange@redhat.com
49
[lv: to simplify, don't check on EINVAL with TUNGETIFF as it exists since v2.6.27]
50
Signed-off-by: Laurent Vivier <lvivier@redhat.com>
51
Signed-off-by: Jason Wang <jasowang@redhat.com>
52
---
53
net/tap-bsd.c | 2 +-
54
net/tap-linux.c | 8 +++++---
55
net/tap-solaris.c | 2 +-
56
net/tap-stub.c | 2 +-
57
net/tap.c | 25 ++++++++++++++++++++-----
58
net/tap_int.h | 2 +-
59
6 files changed, 29 insertions(+), 12 deletions(-)
60
61
diff --git a/net/tap-bsd.c b/net/tap-bsd.c
62
index XXXXXXX..XXXXXXX 100644
63
--- a/net/tap-bsd.c
64
+++ b/net/tap-bsd.c
65
@@ -XXX,XX +XXX,XX @@ void tap_set_sndbuf(int fd, const NetdevTapOptions *tap, Error **errp)
66
{
67
}
68
69
-int tap_probe_vnet_hdr(int fd)
70
+int tap_probe_vnet_hdr(int fd, Error **errp)
71
{
72
return 0;
73
}
74
diff --git a/net/tap-linux.c b/net/tap-linux.c
75
index XXXXXXX..XXXXXXX 100644
76
--- a/net/tap-linux.c
77
+++ b/net/tap-linux.c
78
@@ -XXX,XX +XXX,XX @@ void tap_set_sndbuf(int fd, const NetdevTapOptions *tap, Error **errp)
79
}
80
}
81
82
-int tap_probe_vnet_hdr(int fd)
83
+int tap_probe_vnet_hdr(int fd, Error **errp)
84
{
85
struct ifreq ifr;
86
87
if (ioctl(fd, TUNGETIFF, &ifr) != 0) {
88
- error_report("TUNGETIFF ioctl() failed: %s", strerror(errno));
89
- return 0;
90
+ /* TUNGETIFF is available since kernel v2.6.27 */
91
+ error_setg_errno(errp, errno,
92
+ "Unable to query TUNGETIFF on FD %d", fd);
93
+ return -1;
94
}
95
96
return ifr.ifr_flags & IFF_VNET_HDR;
97
diff --git a/net/tap-solaris.c b/net/tap-solaris.c
98
index XXXXXXX..XXXXXXX 100644
99
--- a/net/tap-solaris.c
100
+++ b/net/tap-solaris.c
101
@@ -XXX,XX +XXX,XX @@ void tap_set_sndbuf(int fd, const NetdevTapOptions *tap, Error **errp)
102
{
103
}
104
105
-int tap_probe_vnet_hdr(int fd)
106
+int tap_probe_vnet_hdr(int fd, Error **errp)
107
{
108
return 0;
109
}
110
diff --git a/net/tap-stub.c b/net/tap-stub.c
111
index XXXXXXX..XXXXXXX 100644
112
--- a/net/tap-stub.c
113
+++ b/net/tap-stub.c
114
@@ -XXX,XX +XXX,XX @@ void tap_set_sndbuf(int fd, const NetdevTapOptions *tap, Error **errp)
115
{
116
}
117
118
-int tap_probe_vnet_hdr(int fd)
119
+int tap_probe_vnet_hdr(int fd, Error **errp)
120
{
121
return 0;
122
}
123
diff --git a/net/tap.c b/net/tap.c
124
index XXXXXXX..XXXXXXX 100644
125
--- a/net/tap.c
126
+++ b/net/tap.c
127
@@ -XXX,XX +XXX,XX @@ int net_init_bridge(const Netdev *netdev, const char *name,
128
}
129
130
qemu_set_nonblock(fd);
131
- vnet_hdr = tap_probe_vnet_hdr(fd);
132
+ vnet_hdr = tap_probe_vnet_hdr(fd, errp);
133
+ if (vnet_hdr < 0) {
134
+ close(fd);
135
+ return -1;
136
+ }
137
s = net_tap_fd_init(peer, "bridge", name, fd, vnet_hdr);
138
139
snprintf(s->nc.info_str, sizeof(s->nc.info_str), "helper=%s,br=%s", helper,
140
@@ -XXX,XX +XXX,XX @@ int net_init_tap(const Netdev *netdev, const char *name,
141
return -1;
142
}
143
144
- vnet_hdr = tap_probe_vnet_hdr(fd);
145
+ vnet_hdr = tap_probe_vnet_hdr(fd, errp);
146
+ if (vnet_hdr < 0) {
147
+ close(fd);
148
+ return -1;
149
+ }
150
151
net_init_tap_one(tap, peer, "tap", name, NULL,
152
script, downscript,
153
@@ -XXX,XX +XXX,XX @@ int net_init_tap(const Netdev *netdev, const char *name,
154
}
155
156
if (i == 0) {
157
- vnet_hdr = tap_probe_vnet_hdr(fd);
158
- } else if (vnet_hdr != tap_probe_vnet_hdr(fd)) {
159
+ vnet_hdr = tap_probe_vnet_hdr(fd, errp);
160
+ if (vnet_hdr < 0) {
161
+ goto free_fail;
162
+ }
163
+ } else if (vnet_hdr != tap_probe_vnet_hdr(fd, NULL)) {
164
error_setg(errp,
165
"vnet_hdr not consistent across given tap fds");
166
ret = -1;
167
@@ -XXX,XX +XXX,XX @@ free_fail:
168
}
169
170
qemu_set_nonblock(fd);
171
- vnet_hdr = tap_probe_vnet_hdr(fd);
172
+ vnet_hdr = tap_probe_vnet_hdr(fd, errp);
173
+ if (vnet_hdr < 0) {
174
+ close(fd);
175
+ return -1;
176
+ }
177
178
net_init_tap_one(tap, peer, "bridge", name, ifname,
179
script, downscript, vhostfdname,
180
diff --git a/net/tap_int.h b/net/tap_int.h
181
index XXXXXXX..XXXXXXX 100644
182
--- a/net/tap_int.h
183
+++ b/net/tap_int.h
184
@@ -XXX,XX +XXX,XX @@ int tap_open(char *ifname, int ifname_size, int *vnet_hdr,
185
ssize_t tap_read_packet(int tapfd, uint8_t *buf, int maxlen);
186
187
void tap_set_sndbuf(int fd, const NetdevTapOptions *tap, Error **errp);
188
-int tap_probe_vnet_hdr(int fd);
189
+int tap_probe_vnet_hdr(int fd, Error **errp);
190
int tap_probe_vnet_hdr_len(int fd, int len);
191
int tap_probe_has_ufo(int fd);
192
void tap_fd_set_offload(int fd, int csum, int tso4, int tso6, int ecn, int ufo);
193
--
194
2.5.0
195
196
diff view generated by jsdifflib
Deleted patch
1
From: erik-smit <erik.lucas.smit@gmail.com>
2
1
3
The test of the write of the dblac register was testing the old value
4
instead of the new value. This would accept the write of an invalid value
5
but subsequently refuse any following valid writes.
6
7
Signed-off-by: erik-smit <erik.lucas.smit@gmail.com>
8
Reviewed-by: Cédric Le Goater <clg@kaod.org>
9
Signed-off-by: Jason Wang <jasowang@redhat.com>
10
---
11
hw/net/ftgmac100.c | 14 ++++++++------
12
1 file changed, 8 insertions(+), 6 deletions(-)
13
14
diff --git a/hw/net/ftgmac100.c b/hw/net/ftgmac100.c
15
index XXXXXXX..XXXXXXX 100644
16
--- a/hw/net/ftgmac100.c
17
+++ b/hw/net/ftgmac100.c
18
@@ -XXX,XX +XXX,XX @@ static void ftgmac100_write(void *opaque, hwaddr addr,
19
s->phydata = value & 0xffff;
20
break;
21
case FTGMAC100_DBLAC: /* DMA Burst Length and Arbitration Control */
22
- if (FTGMAC100_DBLAC_TXDES_SIZE(s->dblac) < sizeof(FTGMAC100Desc)) {
23
+ if (FTGMAC100_DBLAC_TXDES_SIZE(value) < sizeof(FTGMAC100Desc)) {
24
qemu_log_mask(LOG_GUEST_ERROR,
25
- "%s: transmit descriptor too small : %d bytes\n",
26
- __func__, FTGMAC100_DBLAC_TXDES_SIZE(s->dblac));
27
+ "%s: transmit descriptor too small: %" PRIx64
28
+ " bytes\n", __func__,
29
+ FTGMAC100_DBLAC_TXDES_SIZE(value));
30
break;
31
}
32
- if (FTGMAC100_DBLAC_RXDES_SIZE(s->dblac) < sizeof(FTGMAC100Desc)) {
33
+ if (FTGMAC100_DBLAC_RXDES_SIZE(value) < sizeof(FTGMAC100Desc)) {
34
qemu_log_mask(LOG_GUEST_ERROR,
35
- "%s: receive descriptor too small : %d bytes\n",
36
- __func__, FTGMAC100_DBLAC_RXDES_SIZE(s->dblac));
37
+ "%s: receive descriptor too small : %" PRIx64
38
+ " bytes\n", __func__,
39
+ FTGMAC100_DBLAC_RXDES_SIZE(value));
40
break;
41
}
42
s->dblac = value;
43
--
44
2.5.0
45
46
diff view generated by jsdifflib