TCG patch queue, plus one target/sh4 patch that
Yoshinori Sato asked me to process.

r~

The following changes since commit efbf38d73e5dcc4d5f8b98c6e7a12be1f3b91745:

  Merge tag 'for-upstream' of git://repo.or.cz/qemu/kevin into staging (2022-10-03 15:06:07 -0400)

are available in the Git repository at:

  https://gitlab.com/rth7680/qemu.git tags/pull-tcg-20221004

for you to fetch changes up to ab419fd8a035a65942de4e63effcd55ccbf1a9fe:

  target/sh4: Fix TB_FLAG_UNALIGN (2022-10-04 12:33:05 -0700)

----------------------------------------------------------------
Cache CPUClass for use in hot code paths.
Add CPUTLBEntryFull, probe_access_full, tlb_set_page_full.
Add generic support for TARGET_TB_PCREL.
tcg/ppc: Optimize 26-bit jumps using STQ for POWER 2.07
target/sh4: Fix TB_FLAG_UNALIGN

----------------------------------------------------------------
Alex Bennée (3):
      cpu: cache CPUClass in CPUState for hot code paths
      hw/core/cpu-sysemu: used cached class in cpu_asidx_from_attrs
      cputlb: used cached CPUClass in our hot-paths

Leandro Lupori (1):
      tcg/ppc: Optimize 26-bit jumps

Richard Henderson (16):
      accel/tcg: Rename CPUIOTLBEntry to CPUTLBEntryFull
      accel/tcg: Drop addr member from SavedIOTLB
      accel/tcg: Suppress auto-invalidate in probe_access_internal
      accel/tcg: Introduce probe_access_full
      accel/tcg: Introduce tlb_set_page_full
      include/exec: Introduce TARGET_PAGE_ENTRY_EXTRA
      accel/tcg: Remove PageDesc code_bitmap
      accel/tcg: Use bool for page_find_alloc
      accel/tcg: Use DisasContextBase in plugin_gen_tb_start
      accel/tcg: Do not align tb->page_addr[0]
      accel/tcg: Inline tb_flush_jmp_cache
      include/hw/core: Create struct CPUJumpCache
      hw/core: Add CPUClass.get_pc
      accel/tcg: Introduce tb_pc and log_pc
      accel/tcg: Introduce TARGET_TB_PCREL
      target/sh4: Fix TB_FLAG_UNALIGN

 accel/tcg/internal.h                    |  10 ++
 accel/tcg/tb-hash.h                     |   1 +
 accel/tcg/tb-jmp-cache.h                |  65 ++++++++
 include/exec/cpu-common.h               |   1 +
 include/exec/cpu-defs.h                 |  48 ++++--
 include/exec/exec-all.h                 |  75 ++++++++-
 include/exec/plugin-gen.h               |   7 +-
 include/hw/core/cpu.h                   |  28 ++--
 include/qemu/typedefs.h                 |   2 +
 include/tcg/tcg.h                       |   2 +-
 target/sh4/cpu.h                        |  56 ++++---
 accel/stubs/tcg-stub.c                  |   4 +
 accel/tcg/cpu-exec.c                    |  80 +++++-----
 accel/tcg/cputlb.c                      | 259 ++++++++++++++++++--------------
 accel/tcg/plugin-gen.c                  |  22 +--
 accel/tcg/translate-all.c               | 214 ++++++++++++--------------
 accel/tcg/translator.c                  |   2 +-
 cpu.c                                   |   9 +-
 hw/core/cpu-common.c                    |   3 +-
 hw/core/cpu-sysemu.c                    |   5 +-
 linux-user/sh4/signal.c                 |   6 +-
 plugins/core.c                          |   2 +-
 target/alpha/cpu.c                      |   9 ++
 target/arm/cpu.c                        |  17 ++-
 target/arm/mte_helper.c                 |  14 +-
 target/arm/sve_helper.c                 |   4 +-
 target/arm/translate-a64.c              |   2 +-
 target/avr/cpu.c                        |  10 +-
 target/cris/cpu.c                       |   8 +
 target/hexagon/cpu.c                    |  10 +-
 target/hppa/cpu.c                       |  12 +-
 target/i386/cpu.c                       |   9 ++
 target/i386/tcg/tcg-cpu.c               |   2 +-
 target/loongarch/cpu.c                  |  11 +-
 target/m68k/cpu.c                       |   8 +
 target/microblaze/cpu.c                 |  10 +-
 target/mips/cpu.c                       |   8 +
 target/mips/tcg/exception.c             |   2 +-
 target/mips/tcg/sysemu/special_helper.c |   2 +-
 target/nios2/cpu.c                      |   9 ++
 target/openrisc/cpu.c                   |  10 +-
 target/ppc/cpu_init.c                   |   8 +
 target/riscv/cpu.c                      |  17 ++-
 target/rx/cpu.c                         |  10 +-
 target/s390x/cpu.c                      |   8 +
 target/s390x/tcg/mem_helper.c           |   4 -
 target/sh4/cpu.c                        |  18 ++-
 target/sh4/helper.c                     |   6 +-
 target/sh4/translate.c                  |  90 +++++------
 target/sparc/cpu.c                      |  10 +-
 target/tricore/cpu.c                    |  11 +-
 target/xtensa/cpu.c                     |   8 +
 tcg/tcg.c                               |   8 +-
 trace/control-target.c                  |   2 +-
 tcg/ppc/tcg-target.c.inc                | 119 +++++++++++----
 55 files changed, 915 insertions(+), 462 deletions(-)
 create mode 100644 accel/tcg/tb-jmp-cache.h
From: Alex Bennée <alex.bennee@linaro.org>

The class cast checkers are quite expensive and always on (unlike the
dynamic case whose checks are gated by CONFIG_QOM_CAST_DEBUG). To
avoid the overhead of repeatedly checking something which should never
change, we cache the CPUClass reference for use in the hot code paths.

Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Message-Id: <20220811151413.3350684-3-alex.bennee@linaro.org>
Signed-off-by: Cédric Le Goater <clg@kaod.org>
Message-Id: <20220923084803.498337-3-clg@kaod.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
 include/hw/core/cpu.h | 9 +++++++++
 cpu.c                 | 9 ++++-----
 2 files changed, 13 insertions(+), 5 deletions(-)

diff --git a/include/hw/core/cpu.h b/include/hw/core/cpu.h
index XXXXXXX..XXXXXXX 100644
--- a/include/hw/core/cpu.h
+++ b/include/hw/core/cpu.h
@@ -XXX,XX +XXX,XX @@ typedef int (*WriteCoreDumpFunction)(const void *buf, size_t size,
  */
 #define CPU(obj) ((CPUState *)(obj))

+/*
+ * The class checkers bring in CPU_GET_CLASS() which is potentially
+ * expensive given the eventual call to
+ * object_class_dynamic_cast_assert(). Because of this the CPUState
+ * has a cached value for the class in cs->cc which is set up in
+ * cpu_exec_realizefn() for use in hot code paths.
+ */
 typedef struct CPUClass CPUClass;
 DECLARE_CLASS_CHECKERS(CPUClass, CPU,
                        TYPE_CPU)
@@ -XXX,XX +XXX,XX @@ struct qemu_work_item;
 struct CPUState {
     /*< private >*/
     DeviceState parent_obj;
+    /* cache to avoid expensive CPU_GET_CLASS */
+    CPUClass *cc;
     /*< public >*/

     int nr_cores;
diff --git a/cpu.c b/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/cpu.c
+++ b/cpu.c
@@ -XXX,XX +XXX,XX @@ const VMStateDescription vmstate_cpu_common = {

 void cpu_exec_realizefn(CPUState *cpu, Error **errp)
 {
-#ifndef CONFIG_USER_ONLY
-    CPUClass *cc = CPU_GET_CLASS(cpu);
-#endif
+    /* cache the cpu class for the hotpath */
+    cpu->cc = CPU_GET_CLASS(cpu);

     cpu_list_add(cpu);
     if (!accel_cpu_realizefn(cpu, errp)) {
@@ -XXX,XX +XXX,XX @@ void cpu_exec_realizefn(CPUState *cpu, Error **errp)
     if (qdev_get_vmsd(DEVICE(cpu)) == NULL) {
         vmstate_register(NULL, cpu->cpu_index, &vmstate_cpu_common, cpu);
     }
-    if (cc->sysemu_ops->legacy_vmsd != NULL) {
-        vmstate_register(NULL, cpu->cpu_index, cc->sysemu_ops->legacy_vmsd, cpu);
+    if (cpu->cc->sysemu_ops->legacy_vmsd != NULL) {
+        vmstate_register(NULL, cpu->cpu_index, cpu->cc->sysemu_ops->legacy_vmsd, cpu);
     }
 #endif /* CONFIG_USER_ONLY */
 }
--
2.34.1
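
For readers outside QEMU, the pattern above is easy to reproduce: resolve
the (potentially expensive) class lookup once at realize time and reuse the
cached pointer on the hot path. A minimal, self-contained C sketch of the
idea follows; the Obj/ObjClass names and expensive_class_lookup() are
illustrative stand-ins, not QEMU APIs.

    #include <assert.h>
    #include <stdio.h>

    /* Stand-ins for QOM's CPUClass/CPUState; names are illustrative only. */
    typedef struct ObjClass {
        int (*hot_op)(int x);    /* method dispatched on the hot path */
    } ObjClass;

    typedef struct Obj {
        ObjClass *cc;            /* cached class, set once at realize */
    } Obj;

    static int hot_op_impl(int x) { return x + 1; }
    static ObjClass the_class = { .hot_op = hot_op_impl };

    /* Imagine this doing a checked dynamic cast (the expensive part). */
    static ObjClass *expensive_class_lookup(Obj *o)
    {
        (void)o;
        return &the_class;
    }

    /* Done once, mirroring cpu_exec_realizefn() caching cpu->cc. */
    static void obj_realize(Obj *o)
    {
        o->cc = expensive_class_lookup(o);
    }

    /* Hot path: no lookup, just one pointer chase and an indirect call. */
    static int obj_hot_path(Obj *o, int x)
    {
        return o->cc->hot_op(x);
    }

    int main(void)
    {
        Obj o;
        obj_realize(&o);
        assert(obj_hot_path(&o, 41) == 42);
        printf("%d\n", obj_hot_path(&o, 41));
        return 0;
    }

The trade-off is the usual one for caching: the pointer must be valid before
any hot-path user runs, which is why the patch installs it at the top of
cpu_exec_realizefn().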
From: Alex Bennée <alex.bennee@linaro.org>

This is a heavily used function, so let's avoid the cost of
CPU_GET_CLASS. On the romulus-bmc run it has a modest effect:

  Before: 36.812 s ± 0.506 s
  After:  35.912 s ± 0.168 s

Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Message-Id: <20220811151413.3350684-4-alex.bennee@linaro.org>
Signed-off-by: Cédric Le Goater <clg@kaod.org>
Message-Id: <20220923084803.498337-4-clg@kaod.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
 hw/core/cpu-sysemu.c | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/hw/core/cpu-sysemu.c b/hw/core/cpu-sysemu.c
index XXXXXXX..XXXXXXX 100644
--- a/hw/core/cpu-sysemu.c
+++ b/hw/core/cpu-sysemu.c
@@ -XXX,XX +XXX,XX @@ hwaddr cpu_get_phys_page_debug(CPUState *cpu, vaddr addr)

 int cpu_asidx_from_attrs(CPUState *cpu, MemTxAttrs attrs)
 {
-    CPUClass *cc = CPU_GET_CLASS(cpu);
     int ret = 0;

-    if (cc->sysemu_ops->asidx_from_attrs) {
-        ret = cc->sysemu_ops->asidx_from_attrs(cpu, attrs);
+    if (cpu->cc->sysemu_ops->asidx_from_attrs) {
+        ret = cpu->cc->sysemu_ops->asidx_from_attrs(cpu, attrs);
         assert(ret < cpu->num_ases && ret >= 0);
     }
     return ret;
--
2.34.1
From: Alex Bennée <alex.bennee@linaro.org>

  Before: 35.912 s ± 0.168 s
  After:  35.565 s ± 0.087 s

Signed-off-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Message-Id: <20220811151413.3350684-5-alex.bennee@linaro.org>
Signed-off-by: Cédric Le Goater <clg@kaod.org>
Message-Id: <20220923084803.498337-5-clg@kaod.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
 accel/tcg/cputlb.c | 15 ++++++---------
 1 file changed, 6 insertions(+), 9 deletions(-)

diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ void tlb_set_page(CPUState *cpu, target_ulong vaddr,
 static void tlb_fill(CPUState *cpu, target_ulong addr, int size,
                      MMUAccessType access_type, int mmu_idx, uintptr_t retaddr)
 {
-    CPUClass *cc = CPU_GET_CLASS(cpu);
     bool ok;

     /*
      * This is not a probe, so only valid return is success; failure
      * should result in exception + longjmp to the cpu loop.
      */
-    ok = cc->tcg_ops->tlb_fill(cpu, addr, size,
-                               access_type, mmu_idx, false, retaddr);
+    ok = cpu->cc->tcg_ops->tlb_fill(cpu, addr, size,
+                                    access_type, mmu_idx, false, retaddr);
     assert(ok);
 }

@@ -XXX,XX +XXX,XX @@ static inline void cpu_unaligned_access(CPUState *cpu, vaddr addr,
                                         MMUAccessType access_type,
                                         int mmu_idx, uintptr_t retaddr)
 {
-    CPUClass *cc = CPU_GET_CLASS(cpu);
-
-    cc->tcg_ops->do_unaligned_access(cpu, addr, access_type, mmu_idx, retaddr);
+    cpu->cc->tcg_ops->do_unaligned_access(cpu, addr, access_type,
+                                          mmu_idx, retaddr);
 }

 static inline void cpu_transaction_failed(CPUState *cpu, hwaddr physaddr,
@@ -XXX,XX +XXX,XX @@ static int probe_access_internal(CPUArchState *env, target_ulong addr,
     if (!tlb_hit_page(tlb_addr, page_addr)) {
         if (!victim_tlb_hit(env, mmu_idx, index, elt_ofs, page_addr)) {
             CPUState *cs = env_cpu(env);
-            CPUClass *cc = CPU_GET_CLASS(cs);

-            if (!cc->tcg_ops->tlb_fill(cs, addr, fault_size, access_type,
-                                       mmu_idx, nonfault, retaddr)) {
+            if (!cs->cc->tcg_ops->tlb_fill(cs, addr, fault_size, access_type,
+                                           mmu_idx, nonfault, retaddr)) {
                 /* Non-faulting page table read failed. */
                 *phost = NULL;
                 return TLB_INVALID_MASK;
--
2.34.1
This structure will shortly contain more than just
data for accessing MMIO.  Rename the 'addr' member
to 'xlat_section' to more clearly indicate its purpose.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
 include/exec/cpu-defs.h    |  22 ++++----
 accel/tcg/cputlb.c         | 102 +++++++++++++++++++------------
 target/arm/mte_helper.c    |  14 ++---
 target/arm/sve_helper.c    |   4 +-
 target/arm/translate-a64.c |   2 +-
 5 files changed, 73 insertions(+), 71 deletions(-)

diff --git a/include/exec/cpu-defs.h b/include/exec/cpu-defs.h
index XXXXXXX..XXXXXXX 100644
--- a/include/exec/cpu-defs.h
+++ b/include/exec/cpu-defs.h
@@ -XXX,XX +XXX,XX @@ typedef uint64_t target_ulong;
 # endif
 # endif

+/* Minimalized TLB entry for use by TCG fast path. */
 typedef struct CPUTLBEntry {
     /* bit TARGET_LONG_BITS to TARGET_PAGE_BITS : virtual address
        bit TARGET_PAGE_BITS-1..4  : Nonzero for accesses that should not
@@ -XXX,XX +XXX,XX @@ typedef struct CPUTLBEntry {

 QEMU_BUILD_BUG_ON(sizeof(CPUTLBEntry) != (1 << CPU_TLB_ENTRY_BITS));

-/* The IOTLB is not accessed directly inline by generated TCG code,
- * so the CPUIOTLBEntry layout is not as critical as that of the
- * CPUTLBEntry. (This is also why we don't want to combine the two
- * structs into one.)
+/*
+ * The full TLB entry, which is not accessed by generated TCG code,
+ * so the layout is not as critical as that of CPUTLBEntry. This is
+ * also why we don't want to combine the two structs.
  */
-typedef struct CPUIOTLBEntry {
+typedef struct CPUTLBEntryFull {
     /*
-     * @addr contains:
+     * @xlat_section contains:
      *  - in the lower TARGET_PAGE_BITS, a physical section number
      *  - with the lower TARGET_PAGE_BITS masked off, an offset which
      *    must be added to the virtual address to obtain:
@@ -XXX,XX +XXX,XX @@ typedef struct CPUIOTLBEntry {
      *       number is PHYS_SECTION_NOTDIRTY or PHYS_SECTION_ROM)
      *     + the offset within the target MemoryRegion (otherwise)
      */
-    hwaddr addr;
+    hwaddr xlat_section;
     MemTxAttrs attrs;
-} CPUIOTLBEntry;
+} CPUTLBEntryFull;

 /*
  * Data elements that are per MMU mode, minus the bits accessed by
@@ -XXX,XX +XXX,XX @@ typedef struct CPUTLBDesc {
     size_t vindex;
     /* The tlb victim table, in two parts. */
     CPUTLBEntry vtable[CPU_VTLB_SIZE];
-    CPUIOTLBEntry viotlb[CPU_VTLB_SIZE];
-    /* The iotlb. */
-    CPUIOTLBEntry *iotlb;
+    CPUTLBEntryFull vfulltlb[CPU_VTLB_SIZE];
+    CPUTLBEntryFull *fulltlb;
 } CPUTLBDesc;

 /*
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ static void tlb_mmu_resize_locked(CPUTLBDesc *desc, CPUTLBDescFast *fast,
     }

     g_free(fast->table);
-    g_free(desc->iotlb);
+    g_free(desc->fulltlb);

     tlb_window_reset(desc, now, 0);
     /* desc->n_used_entries is cleared by the caller */
     fast->mask = (new_size - 1) << CPU_TLB_ENTRY_BITS;
     fast->table = g_try_new(CPUTLBEntry, new_size);
-    desc->iotlb = g_try_new(CPUIOTLBEntry, new_size);
+    desc->fulltlb = g_try_new(CPUTLBEntryFull, new_size);

     /*
      * If the allocations fail, try smaller sizes. We just freed some
@@ -XXX,XX +XXX,XX @@ static void tlb_mmu_resize_locked(CPUTLBDesc *desc, CPUTLBDescFast *fast,
      * allocations to fail though, so we progressively reduce the allocation
      * size, aborting if we cannot even allocate the smallest TLB we support.
      */
-    while (fast->table == NULL || desc->iotlb == NULL) {
+    while (fast->table == NULL || desc->fulltlb == NULL) {
         if (new_size == (1 << CPU_TLB_DYN_MIN_BITS)) {
             error_report("%s: %s", __func__, strerror(errno));
             abort();
@@ -XXX,XX +XXX,XX @@ static void tlb_mmu_resize_locked(CPUTLBDesc *desc, CPUTLBDescFast *fast,
         fast->mask = (new_size - 1) << CPU_TLB_ENTRY_BITS;

         g_free(fast->table);
-        g_free(desc->iotlb);
+        g_free(desc->fulltlb);
         fast->table = g_try_new(CPUTLBEntry, new_size);
-        desc->iotlb = g_try_new(CPUIOTLBEntry, new_size);
+        desc->fulltlb = g_try_new(CPUTLBEntryFull, new_size);
     }
 }

@@ -XXX,XX +XXX,XX @@ static void tlb_mmu_init(CPUTLBDesc *desc, CPUTLBDescFast *fast, int64_t now)
     desc->n_used_entries = 0;
     fast->mask = (n_entries - 1) << CPU_TLB_ENTRY_BITS;
     fast->table = g_new(CPUTLBEntry, n_entries);
-    desc->iotlb = g_new(CPUIOTLBEntry, n_entries);
+    desc->fulltlb = g_new(CPUTLBEntryFull, n_entries);
     tlb_mmu_flush_locked(desc, fast);
 }

@@ -XXX,XX +XXX,XX @@ void tlb_destroy(CPUState *cpu)
         CPUTLBDescFast *fast = &env_tlb(env)->f[i];

         g_free(fast->table);
-        g_free(desc->iotlb);
+        g_free(desc->fulltlb);
     }
 }

@@ -XXX,XX +XXX,XX @@ void tlb_set_page_with_attrs(CPUState *cpu, target_ulong vaddr,

         /* Evict the old entry into the victim tlb.  */
         copy_tlb_helper_locked(tv, te);
-        desc->viotlb[vidx] = desc->iotlb[index];
+        desc->vfulltlb[vidx] = desc->fulltlb[index];
         tlb_n_used_entries_dec(env, mmu_idx);
     }

@@ -XXX,XX +XXX,XX @@ void tlb_set_page_with_attrs(CPUState *cpu, target_ulong vaddr,
      * subtract here is that of the page base, and not the same as the
      * vaddr we add back in io_readx()/io_writex()/get_page_addr_code().
      */
-    desc->iotlb[index].addr = iotlb - vaddr_page;
-    desc->iotlb[index].attrs = attrs;
+    desc->fulltlb[index].xlat_section = iotlb - vaddr_page;
+    desc->fulltlb[index].attrs = attrs;

     /* Now calculate the new entry */
     tn.addend = addend - vaddr_page;
@@ -XXX,XX +XXX,XX @@ static inline void cpu_transaction_failed(CPUState *cpu, hwaddr physaddr,
     }
 }

-static uint64_t io_readx(CPUArchState *env, CPUIOTLBEntry *iotlbentry,
+static uint64_t io_readx(CPUArchState *env, CPUTLBEntryFull *full,
                          int mmu_idx, target_ulong addr, uintptr_t retaddr,
                          MMUAccessType access_type, MemOp op)
 {
@@ -XXX,XX +XXX,XX @@ static uint64_t io_readx(CPUArchState *env, CPUIOTLBEntry *iotlbentry,
     bool locked = false;
     MemTxResult r;

-    section = iotlb_to_section(cpu, iotlbentry->addr, iotlbentry->attrs);
+    section = iotlb_to_section(cpu, full->xlat_section, full->attrs);
     mr = section->mr;
-    mr_offset = (iotlbentry->addr & TARGET_PAGE_MASK) + addr;
+    mr_offset = (full->xlat_section & TARGET_PAGE_MASK) + addr;
     cpu->mem_io_pc = retaddr;
     if (!cpu->can_do_io) {
         cpu_io_recompile(cpu, retaddr);
@@ -XXX,XX +XXX,XX @@ static uint64_t io_readx(CPUArchState *env, CPUIOTLBEntry *iotlbentry,
         qemu_mutex_lock_iothread();
         locked = true;
     }
-    r = memory_region_dispatch_read(mr, mr_offset, &val, op, iotlbentry->attrs);
+    r = memory_region_dispatch_read(mr, mr_offset, &val, op, full->attrs);
     if (r != MEMTX_OK) {
         hwaddr physaddr = mr_offset +
             section->offset_within_address_space -
             section->offset_within_region;

         cpu_transaction_failed(cpu, physaddr, addr, memop_size(op), access_type,
-                               mmu_idx, iotlbentry->attrs, r, retaddr);
+                               mmu_idx, full->attrs, r, retaddr);
     }
     if (locked) {
         qemu_mutex_unlock_iothread();
@@ -XXX,XX +XXX,XX @@ static uint64_t io_readx(CPUArchState *env, CPUIOTLBEntry *iotlbentry,
 }

 /*
- * Save a potentially trashed IOTLB entry for later lookup by plugin.
- * This is read by tlb_plugin_lookup if the iotlb entry doesn't match
+ * Save a potentially trashed CPUTLBEntryFull for later lookup by plugin.
+ * This is read by tlb_plugin_lookup if the fulltlb entry doesn't match
  * because of the side effect of io_writex changing memory layout.
  */
 static void save_iotlb_data(CPUState *cs, hwaddr addr,
@@ -XXX,XX +XXX,XX @@ static void save_iotlb_data(CPUState *cs, hwaddr addr,
 #endif
 }

-static void io_writex(CPUArchState *env, CPUIOTLBEntry *iotlbentry,
+static void io_writex(CPUArchState *env, CPUTLBEntryFull *full,
                       int mmu_idx, uint64_t val, target_ulong addr,
                       uintptr_t retaddr, MemOp op)
 {
@@ -XXX,XX +XXX,XX @@ static void io_writex(CPUArchState *env, CPUIOTLBEntry *iotlbentry,
     bool locked = false;
     MemTxResult r;

-    section = iotlb_to_section(cpu, iotlbentry->addr, iotlbentry->attrs);
+    section = iotlb_to_section(cpu, full->xlat_section, full->attrs);
     mr = section->mr;
-    mr_offset = (iotlbentry->addr & TARGET_PAGE_MASK) + addr;
+    mr_offset = (full->xlat_section & TARGET_PAGE_MASK) + addr;
     if (!cpu->can_do_io) {
         cpu_io_recompile(cpu, retaddr);
     }
@@ -XXX,XX +XXX,XX @@ static void io_writex(CPUArchState *env, CPUIOTLBEntry *iotlbentry,
      * The memory_region_dispatch may trigger a flush/resize
      * so for plugins we save the iotlb_data just in case.
      */
-    save_iotlb_data(cpu, iotlbentry->addr, section, mr_offset);
+    save_iotlb_data(cpu, full->xlat_section, section, mr_offset);

     if (!qemu_mutex_iothread_locked()) {
         qemu_mutex_lock_iothread();
         locked = true;
     }
-    r = memory_region_dispatch_write(mr, mr_offset, val, op, iotlbentry->attrs);
+    r = memory_region_dispatch_write(mr, mr_offset, val, op, full->attrs);
     if (r != MEMTX_OK) {
         hwaddr physaddr = mr_offset +
             section->offset_within_address_space -
             section->offset_within_region;

         cpu_transaction_failed(cpu, physaddr, addr, memop_size(op),
-                               MMU_DATA_STORE, mmu_idx, iotlbentry->attrs, r,
+                               MMU_DATA_STORE, mmu_idx, full->attrs, r,
                                retaddr);
     }
     if (locked) {
@@ -XXX,XX +XXX,XX @@ static bool victim_tlb_hit(CPUArchState *env, size_t mmu_idx, size_t index,
             copy_tlb_helper_locked(vtlb, &tmptlb);
             qemu_spin_unlock(&env_tlb(env)->c.lock);

-            CPUIOTLBEntry tmpio, *io = &env_tlb(env)->d[mmu_idx].iotlb[index];
-            CPUIOTLBEntry *vio = &env_tlb(env)->d[mmu_idx].viotlb[vidx];
-            tmpio = *io; *io = *vio; *vio = tmpio;
+            CPUTLBEntryFull *f1 = &env_tlb(env)->d[mmu_idx].fulltlb[index];
+            CPUTLBEntryFull *f2 = &env_tlb(env)->d[mmu_idx].vfulltlb[vidx];
+            CPUTLBEntryFull tmpf;
+            tmpf = *f1; *f1 = *f2; *f2 = tmpf;
             return true;
         }
     }
@@ -XXX,XX +XXX,XX @@ static bool victim_tlb_hit(CPUArchState *env, size_t mmu_idx, size_t index,
                  (ADDR) & TARGET_PAGE_MASK)

 static void notdirty_write(CPUState *cpu, vaddr mem_vaddr, unsigned size,
-                           CPUIOTLBEntry *iotlbentry, uintptr_t retaddr)
+                           CPUTLBEntryFull *full, uintptr_t retaddr)
 {
-    ram_addr_t ram_addr = mem_vaddr + iotlbentry->addr;
+    ram_addr_t ram_addr = mem_vaddr + full->xlat_section;

     trace_memory_notdirty_write_access(mem_vaddr, ram_addr, size);

@@ -XXX,XX +XXX,XX @@ int probe_access_flags(CPUArchState *env, target_ulong addr,
     /* Handle clean RAM pages. */
     if (unlikely(flags & TLB_NOTDIRTY)) {
         uintptr_t index = tlb_index(env, mmu_idx, addr);
-        CPUIOTLBEntry *iotlbentry = &env_tlb(env)->d[mmu_idx].iotlb[index];
+        CPUTLBEntryFull *full = &env_tlb(env)->d[mmu_idx].fulltlb[index];

-        notdirty_write(env_cpu(env), addr, 1, iotlbentry, retaddr);
+        notdirty_write(env_cpu(env), addr, 1, full, retaddr);
         flags &= ~TLB_NOTDIRTY;
     }

@@ -XXX,XX +XXX,XX @@ void *probe_access(CPUArchState *env, target_ulong addr, int size,

     if (unlikely(flags & (TLB_NOTDIRTY | TLB_WATCHPOINT))) {
         uintptr_t index = tlb_index(env, mmu_idx, addr);
-        CPUIOTLBEntry *iotlbentry = &env_tlb(env)->d[mmu_idx].iotlb[index];
+        CPUTLBEntryFull *full = &env_tlb(env)->d[mmu_idx].fulltlb[index];

         /* Handle watchpoints.  */
         if (flags & TLB_WATCHPOINT) {
             int wp_access = (access_type == MMU_DATA_STORE
                              ? BP_MEM_WRITE : BP_MEM_READ);
             cpu_check_watchpoint(env_cpu(env), addr, size,
-                                 iotlbentry->attrs, wp_access, retaddr);
+                                 full->attrs, wp_access, retaddr);
         }

         /* Handle clean RAM pages.  */
         if (flags & TLB_NOTDIRTY) {
-            notdirty_write(env_cpu(env), addr, 1, iotlbentry, retaddr);
+            notdirty_write(env_cpu(env), addr, 1, full, retaddr);
         }
     }

@@ -XXX,XX +XXX,XX @@ tb_page_addr_t get_page_addr_code_hostp(CPUArchState *env, target_ulong addr,
  * should have just filled the TLB. The one corner case is io_writex
  * which can cause TLB flushes and potential resizing of the TLBs
  * losing the information we need. In those cases we need to recover
- * data from a copy of the iotlbentry. As long as this always occurs
+ * data from a copy of the CPUTLBEntryFull. As long as this always occurs
  * from the same thread (which a mem callback will be) this is safe.
  */

@@ -XXX,XX +XXX,XX @@ bool tlb_plugin_lookup(CPUState *cpu, target_ulong addr, int mmu_idx,
     if (likely(tlb_hit(tlb_addr, addr))) {
         /* We must have an iotlb entry for MMIO */
         if (tlb_addr & TLB_MMIO) {
-            CPUIOTLBEntry *iotlbentry;
-            iotlbentry = &env_tlb(env)->d[mmu_idx].iotlb[index];
+            CPUTLBEntryFull *full;
+            full = &env_tlb(env)->d[mmu_idx].fulltlb[index];
             data->is_io = true;
-            data->v.io.section = iotlb_to_section(cpu, iotlbentry->addr, iotlbentry->attrs);
-            data->v.io.offset = (iotlbentry->addr & TARGET_PAGE_MASK) + addr;
+            data->v.io.section =
+                iotlb_to_section(cpu, full->xlat_section, full->attrs);
+            data->v.io.offset = (full->xlat_section & TARGET_PAGE_MASK) + addr;
         } else {
             data->is_io = false;
             data->v.ram.hostaddr = (void *)((uintptr_t)addr + tlbe->addend);
@@ -XXX,XX +XXX,XX @@ static void *atomic_mmu_lookup(CPUArchState *env, target_ulong addr,

     if (unlikely(tlb_addr & TLB_NOTDIRTY)) {
         notdirty_write(env_cpu(env), addr, size,
-                       &env_tlb(env)->d[mmu_idx].iotlb[index], retaddr);
+                       &env_tlb(env)->d[mmu_idx].fulltlb[index], retaddr);
     }

     return hostaddr;
@@ -XXX,XX +XXX,XX @@ load_helper(CPUArchState *env, target_ulong addr, MemOpIdx oi,

     /* Handle anything that isn't just a straight memory access.  */
     if (unlikely(tlb_addr & ~TARGET_PAGE_MASK)) {
-        CPUIOTLBEntry *iotlbentry;
+        CPUTLBEntryFull *full;
         bool need_swap;

         /* For anything that is unaligned, recurse through full_load.  */
@@ -XXX,XX +XXX,XX @@ load_helper(CPUArchState *env, target_ulong addr, MemOpIdx oi,
             goto do_unaligned_access;
         }

-        iotlbentry = &env_tlb(env)->d[mmu_idx].iotlb[index];
+        full = &env_tlb(env)->d[mmu_idx].fulltlb[index];

         /* Handle watchpoints.  */
         if (unlikely(tlb_addr & TLB_WATCHPOINT)) {
             /* On watchpoint hit, this will longjmp out.  */
             cpu_check_watchpoint(env_cpu(env), addr, size,
-                                 iotlbentry->attrs, BP_MEM_READ, retaddr);
+                                 full->attrs, BP_MEM_READ, retaddr);
         }

         need_swap = size > 1 && (tlb_addr & TLB_BSWAP);

         /* Handle I/O access.  */
         if (likely(tlb_addr & TLB_MMIO)) {
-            return io_readx(env, iotlbentry, mmu_idx, addr, retaddr,
+            return io_readx(env, full, mmu_idx, addr, retaddr,
                             access_type, op ^ (need_swap * MO_BSWAP));
         }

@@ -XXX,XX +XXX,XX @@ store_helper_unaligned(CPUArchState *env, target_ulong addr, uint64_t val,
      */
     if (unlikely(tlb_addr & TLB_WATCHPOINT)) {
         cpu_check_watchpoint(env_cpu(env), addr, size - size2,
-                             env_tlb(env)->d[mmu_idx].iotlb[index].attrs,
+                             env_tlb(env)->d[mmu_idx].fulltlb[index].attrs,
                              BP_MEM_WRITE, retaddr);
     }
     if (unlikely(tlb_addr2 & TLB_WATCHPOINT)) {
         cpu_check_watchpoint(env_cpu(env), page2, size2,
-                             env_tlb(env)->d[mmu_idx].iotlb[index2].attrs,
+                             env_tlb(env)->d[mmu_idx].fulltlb[index2].attrs,
                              BP_MEM_WRITE, retaddr);
     }

@@ -XXX,XX +XXX,XX @@ store_helper(CPUArchState *env, target_ulong addr, uint64_t val,

     /* Handle anything that isn't just a straight memory access.  */
     if (unlikely(tlb_addr & ~TARGET_PAGE_MASK)) {
-        CPUIOTLBEntry *iotlbentry;
+        CPUTLBEntryFull *full;
         bool need_swap;

         /* For anything that is unaligned, recurse through byte stores.  */
@@ -XXX,XX +XXX,XX @@ store_helper(CPUArchState *env, target_ulong addr, uint64_t val,
             goto do_unaligned_access;
         }

-        iotlbentry = &env_tlb(env)->d[mmu_idx].iotlb[index];
+        full = &env_tlb(env)->d[mmu_idx].fulltlb[index];

         /* Handle watchpoints.  */
         if (unlikely(tlb_addr & TLB_WATCHPOINT)) {
             /* On watchpoint hit, this will longjmp out.  */
             cpu_check_watchpoint(env_cpu(env), addr, size,
-                                 iotlbentry->attrs, BP_MEM_WRITE, retaddr);
+                                 full->attrs, BP_MEM_WRITE, retaddr);
         }

         need_swap = size > 1 && (tlb_addr & TLB_BSWAP);

         /* Handle I/O access.  */
         if (tlb_addr & TLB_MMIO) {
-            io_writex(env, iotlbentry, mmu_idx, val, addr, retaddr,
+            io_writex(env, full, mmu_idx, val, addr, retaddr,
                       op ^ (need_swap * MO_BSWAP));
             return;
         }
@@ -XXX,XX +XXX,XX @@ store_helper(CPUArchState *env, target_ulong addr, uint64_t val,

         /* Handle clean RAM pages.  */
         if (tlb_addr & TLB_NOTDIRTY) {
-            notdirty_write(env_cpu(env), addr, size, iotlbentry, retaddr);
+            notdirty_write(env_cpu(env), addr, size, full, retaddr);
         }

         haddr = (void *)((uintptr_t)addr + entry->addend);
diff --git a/target/arm/mte_helper.c b/target/arm/mte_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/mte_helper.c
+++ b/target/arm/mte_helper.c
@@ -XXX,XX +XXX,XX @@ static uint8_t *allocation_tag_mem(CPUARMState *env, int ptr_mmu_idx,
     return tags + index;
 #else
     uintptr_t index;
-    CPUIOTLBEntry *iotlbentry;
+    CPUTLBEntryFull *full;
     int in_page, flags;
     ram_addr_t ptr_ra;
     hwaddr ptr_paddr, tag_paddr, xlat;
@@ -XXX,XX +XXX,XX @@ static uint8_t *allocation_tag_mem(CPUARMState *env, int ptr_mmu_idx,
     assert(!(flags & TLB_INVALID_MASK));

     /*
-     * Find the iotlbentry for ptr.  This *must* be present in the TLB
+     * Find the CPUTLBEntryFull for ptr.  This *must* be present in the TLB
      * because we just found the mapping.
      * TODO: Perhaps there should be a cputlb helper that returns a
      * matching tlb entry + iotlb entry.
@@ -XXX,XX +XXX,XX @@ static uint8_t *allocation_tag_mem(CPUARMState *env, int ptr_mmu_idx,
         g_assert(tlb_hit(comparator, ptr));
     }
 # endif
-    iotlbentry = &env_tlb(env)->d[ptr_mmu_idx].iotlb[index];
+    full = &env_tlb(env)->d[ptr_mmu_idx].fulltlb[index];

     /* If the virtual page MemAttr != Tagged, access unchecked. */
-    if (!arm_tlb_mte_tagged(&iotlbentry->attrs)) {
+    if (!arm_tlb_mte_tagged(&full->attrs)) {
         return NULL;
     }

@@ -XXX,XX +XXX,XX @@ static uint8_t *allocation_tag_mem(CPUARMState *env, int ptr_mmu_idx,
         int wp = ptr_access == MMU_DATA_LOAD ? BP_MEM_READ : BP_MEM_WRITE;
         assert(ra != 0);
         cpu_check_watchpoint(env_cpu(env), ptr, ptr_size,
-                             iotlbentry->attrs, wp, ra);
+                             full->attrs, wp, ra);
     }

     /*
@@ -XXX,XX +XXX,XX @@ static uint8_t *allocation_tag_mem(CPUARMState *env, int ptr_mmu_idx,
     tag_paddr = ptr_paddr >> (LOG2_TAG_GRANULE + 1);

     /* Look up the address in tag space. */
-    tag_asi = iotlbentry->attrs.secure ? ARMASIdx_TagS : ARMASIdx_TagNS;
+    tag_asi = full->attrs.secure ? ARMASIdx_TagS : ARMASIdx_TagNS;
     tag_as = cpu_get_address_space(env_cpu(env), tag_asi);
     mr = address_space_translate(tag_as, tag_paddr, &xlat, NULL,
                                  tag_access == MMU_DATA_STORE,
-                                 iotlbentry->attrs);
+                                 full->attrs);

     /*
      * Note that @mr will never be NULL.  If there is nothing in the address
diff --git a/target/arm/sve_helper.c b/target/arm/sve_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/sve_helper.c
+++ b/target/arm/sve_helper.c
@@ -XXX,XX +XXX,XX @@ bool sve_probe_page(SVEHostPage *info, bool nofault, CPUARMState *env,
     g_assert(tlb_hit(comparator, addr));
 # endif

-    CPUIOTLBEntry *iotlbentry = &env_tlb(env)->d[mmu_idx].iotlb[index];
-    info->attrs = iotlbentry->attrs;
+    CPUTLBEntryFull *full = &env_tlb(env)->d[mmu_idx].fulltlb[index];
+    info->attrs = full->attrs;
 }
 #endif

diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/translate-a64.c
+++ b/target/arm/translate-a64.c
@@ -XXX,XX +XXX,XX @@ static bool is_guarded_page(CPUARMState *env, DisasContext *s)
      * table entry even for that case.
      */
     return (tlb_hit(entry->addr_code, addr) &&
-            arm_tlb_bti_gp(&env_tlb(env)->d[mmu_idx].iotlb[index].attrs));
+            arm_tlb_bti_gp(&env_tlb(env)->d[mmu_idx].fulltlb[index].attrs));
 #endif
 }
--
2.34.1
[MO_LEUL] = helper_le_stl_mmu,
295
diff --git a/tcg/sparc/tcg-target.c.inc b/tcg/sparc/tcg-target.c.inc
296
index XXXXXXX..XXXXXXX 100644
297
--- a/tcg/sparc/tcg-target.c.inc
298
+++ b/tcg/sparc/tcg-target.c.inc
299
@@ -XXX,XX +XXX,XX @@ static void tcg_out_mb(TCGContext *s, TCGArg a0)
300
}
301
302
#ifdef CONFIG_SOFTMMU
303
-static const tcg_insn_unit *qemu_ld_trampoline[16];
304
-static const tcg_insn_unit *qemu_st_trampoline[16];
305
+static const tcg_insn_unit *qemu_ld_trampoline[(MO_SSIZE | MO_BSWAP) + 1];
306
+static const tcg_insn_unit *qemu_st_trampoline[(MO_SIZE | MO_BSWAP) + 1];
307
308
static void emit_extend(TCGContext *s, TCGReg r, int op)
309
{
310
@@ -XXX,XX +XXX,XX @@ static void emit_extend(TCGContext *s, TCGReg r, int op)
311
312
static void build_trampolines(TCGContext *s)
313
{
314
- static void * const qemu_ld_helpers[16] = {
315
+ static void * const qemu_ld_helpers[] = {
316
[MO_UB] = helper_ret_ldub_mmu,
317
[MO_SB] = helper_ret_ldsb_mmu,
318
[MO_LEUW] = helper_le_lduw_mmu,
319
@@ -XXX,XX +XXX,XX @@ static void build_trampolines(TCGContext *s)
320
[MO_BEUL] = helper_be_ldul_mmu,
321
[MO_BEQ] = helper_be_ldq_mmu,
322
};
323
- static void * const qemu_st_helpers[16] = {
324
+ static void * const qemu_st_helpers[] = {
325
[MO_UB] = helper_ret_stb_mmu,
326
[MO_LEUW] = helper_le_stw_mmu,
327
[MO_LEUL] = helper_le_stl_mmu,
328
@@ -XXX,XX +XXX,XX @@ static void build_trampolines(TCGContext *s)
329
int i;
330
TCGReg ra;
331
332
- for (i = 0; i < 16; ++i) {
333
+ for (i = 0; i < ARRAY_SIZE(qemu_ld_helpers); ++i) {
334
if (qemu_ld_helpers[i] == NULL) {
335
continue;
336
}
337
@@ -XXX,XX +XXX,XX @@ static void build_trampolines(TCGContext *s)
338
tcg_out_mov(s, TCG_TYPE_PTR, TCG_REG_O7, ra);
339
}
340
341
- for (i = 0; i < 16; ++i) {
342
+ for (i = 0; i < ARRAY_SIZE(qemu_st_helpers); ++i) {
343
if (qemu_st_helpers[i] == NULL) {
344
continue;
345
}
346
@@ -XXX,XX +XXX,XX @@ static TCGReg tcg_out_tlb_load(TCGContext *s, TCGReg addr, int mem_index,
347
}
348
#endif /* CONFIG_SOFTMMU */
349
350
-static const int qemu_ld_opc[16] = {
351
+static const int qemu_ld_opc[(MO_SSIZE | MO_BSWAP) + 1] = {
352
[MO_UB] = LDUB,
353
[MO_SB] = LDSB,
354
355
@@ -XXX,XX +XXX,XX @@ static const int qemu_ld_opc[16] = {
356
[MO_LEQ] = LDX_LE,
357
};
358
359
-static const int qemu_st_opc[16] = {
360
+static const int qemu_st_opc[(MO_SIZE | MO_BSWAP) + 1] = {
361
[MO_UB] = STB,
362
363
[MO_BEUW] = STH,
364
--
519
--
365
2.25.1
520
2.34.1
366
521
367
522
diff view generated by jsdifflib
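
Every hunk above applies the same sizing idiom: a helper table indexed by some
subset of MemOp bits gets exactly (mask) + 1 entries, so the array grows
automatically with the new 3-bit MO_SIZE instead of relying on a magic 8 or 16.
A standalone C sketch of the pattern follows; the MO_* values restate the
layout this series creates as assumptions rather than quoting the header:

    /* Sketch only: size lookup tables from MemOp bit masks. */
    #include <assert.h>
    #include <stddef.h>

    enum {
        MO_SIZE  = 0x07,              /* 3 size bits after this series */
        MO_SIGN  = 0x08,
        MO_SSIZE = MO_SIZE | MO_SIGN,
        MO_BSWAP = 0x10,
    };

    /* One slot per reachable index; unused combinations stay NULL. */
    static void *ld_helpers[(MO_SSIZE | MO_BSWAP) + 1];

    static void *lookup_ld_helper(unsigned memop)
    {
        size_t idx = memop & (MO_SSIZE | MO_BSWAP);

        assert(idx < sizeof(ld_helpers) / sizeof(ld_helpers[0]));
        return ld_helpers[idx];
    }

The sparc change takes the other route: it drops the explicit bound entirely
and iterates with ARRAY_SIZE(), which stays correct for the same reason.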
This field is only written, not read; remove it.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
include/hw/core/cpu.h | 1 -
accel/tcg/cputlb.c | 7 +++----
2 files changed, 3 insertions(+), 5 deletions(-)

diff --git a/include/hw/core/cpu.h b/include/hw/core/cpu.h
index XXXXXXX..XXXXXXX 100644
--- a/include/hw/core/cpu.h
+++ b/include/hw/core/cpu.h
@@ -XXX,XX +XXX,XX @@ struct CPUWatchpoint {
* the memory regions get moved around by io_writex.
*/
typedef struct SavedIOTLB {
- hwaddr addr;
MemoryRegionSection *section;
hwaddr mr_offset;
} SavedIOTLB;
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ static uint64_t io_readx(CPUArchState *env, CPUTLBEntryFull *full,
* This is read by tlb_plugin_lookup if the fulltlb entry doesn't match
* because of the side effect of io_writex changing memory layout.
*/
-static void save_iotlb_data(CPUState *cs, hwaddr addr,
- MemoryRegionSection *section, hwaddr mr_offset)
+static void save_iotlb_data(CPUState *cs, MemoryRegionSection *section,
+ hwaddr mr_offset)
{
#ifdef CONFIG_PLUGIN
SavedIOTLB *saved = &cs->saved_iotlb;
- saved->addr = addr;
saved->section = section;
saved->mr_offset = mr_offset;
#endif
@@ -XXX,XX +XXX,XX @@ static void io_writex(CPUArchState *env, CPUTLBEntryFull *full,
* The memory_region_dispatch may trigger a flush/resize
* so for plugins we save the iotlb_data just in case.
*/
- save_iotlb_data(cpu, full->xlat_section, section, mr_offset);
+ save_iotlb_data(cpu, section, mr_offset);

if (!qemu_mutex_iothread_locked()) {
qemu_mutex_lock_iothread();
--
2.34.1

There is no point in encoding load/store within a bit of
the memory trace info operand. Represent atomic operations
as a single read-modify-write tracepoint. Use MemOpIdx
instead of inventing a form specifically for traces.

Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
accel/tcg/atomic_template.h | 1 -
trace/mem.h | 51 -----------------------------
accel/tcg/cputlb.c | 7 ++---
accel/tcg/user-exec.c | 44 +++++++++-------------------
tcg/tcg-op.c | 17 +++---------
accel/tcg/atomic_common.c.inc | 12 +++------
trace-events | 18 +++----------
7 files changed, 28 insertions(+), 122 deletions(-)
delete mode 100644 trace/mem.h

diff --git a/accel/tcg/atomic_template.h b/accel/tcg/atomic_template.h
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/atomic_template.h
+++ b/accel/tcg/atomic_template.h
@@ -XXX,XX +XXX,XX @@
*/

#include "qemu/plugin.h"
-#include "trace/mem.h"

#if DATA_SIZE == 16
# define SUFFIX o
diff --git a/trace/mem.h b/trace/mem.h
deleted file mode 100644
index XXXXXXX..XXXXXXX
--- a/trace/mem.h
+++ /dev/null
@@ -XXX,XX +XXX,XX @@
-/*
- * Helper functions for guest memory tracing
- *
- * Copyright (C) 2016 Lluís Vilanova <vilanova@ac.upc.edu>
- *
- * This work is licensed under the terms of the GNU GPL, version 2 or later.
- * See the COPYING file in the top-level directory.
- */
-
-#ifndef TRACE__MEM_H
-#define TRACE__MEM_H
-
-#include "exec/memopidx.h"
-
-#define TRACE_MEM_SZ_SHIFT_MASK 0xf /* size shift mask */
-#define TRACE_MEM_SE (1ULL << 4) /* sign extended (y/n) */
-#define TRACE_MEM_BE (1ULL << 5) /* big endian (y/n) */
-#define TRACE_MEM_ST (1ULL << 6) /* store (y/n) */
-#define TRACE_MEM_MMU_SHIFT 8 /* mmu idx */
-
-/**
- * trace_mem_get_info:
- *
- * Return a value for the 'info' argument in guest memory access traces.
- */
-static inline uint16_t trace_mem_get_info(MemOpIdx oi, bool store)
-{
- MemOp op = get_memop(oi);
- uint32_t size_shift = op & MO_SIZE;
- bool sign_extend = op & MO_SIGN;
- bool big_endian = (op & MO_BSWAP) == MO_BE;
- uint16_t res;
-
- res = size_shift & TRACE_MEM_SZ_SHIFT_MASK;
- if (sign_extend) {
- res |= TRACE_MEM_SE;
- }
- if (big_endian) {
- res |= TRACE_MEM_BE;
- }
- if (store) {
- res |= TRACE_MEM_ST;
- }
-#ifdef CONFIG_SOFTMMU
- res |= get_mmuidx(oi) << TRACE_MEM_MMU_SHIFT;
-#endif
-
- return res;
-}
-
-#endif /* TRACE__MEM_H */
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@
#include "qemu/atomic128.h"
#include "exec/translate-all.h"
#include "trace/trace-root.h"
-#include "trace/mem.h"
#include "tb-hash.h"
#include "internal.h"
#ifdef CONFIG_PLUGIN
@@ -XXX,XX +XXX,XX @@ static inline uint64_t cpu_load_helper(CPUArchState *env, abi_ptr addr,
MemOp op, FullLoadHelper *full_load)
{
MemOpIdx oi = make_memop_idx(op, mmu_idx);
- uint16_t meminfo = trace_mem_get_info(oi, false);
uint64_t ret;

- trace_guest_mem_before_exec(env_cpu(env), addr, meminfo);
+ trace_guest_ld_before_exec(env_cpu(env), addr, oi);

ret = full_load(env, addr, oi, retaddr);

@@ -XXX,XX +XXX,XX @@ cpu_store_helper(CPUArchState *env, target_ulong addr, uint64_t val,
int mmu_idx, uintptr_t retaddr, MemOp op)
{
MemOpIdx oi = make_memop_idx(op, mmu_idx);
- uint16_t meminfo = trace_mem_get_info(oi, true);

- trace_guest_mem_before_exec(env_cpu(env), addr, meminfo);
+ trace_guest_st_before_exec(env_cpu(env), addr, oi);

store_helper(env, addr, val, oi, retaddr, op);

diff --git a/accel/tcg/user-exec.c b/accel/tcg/user-exec.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/user-exec.c
+++ b/accel/tcg/user-exec.c
@@ -XXX,XX +XXX,XX @@
#include "exec/helper-proto.h"
#include "qemu/atomic128.h"
#include "trace/trace-root.h"
-#include "trace/mem.h"
+#include "internal.h"

#undef EAX
#undef ECX
@@ -XXX,XX +XXX,XX @@ int cpu_signal_handler(int host_signum, void *pinfo,
uint32_t cpu_ldub_data(CPUArchState *env, abi_ptr ptr)
{
MemOpIdx oi = make_memop_idx(MO_UB, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, false);
uint32_t ret;

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_ld_before_exec(env_cpu(env), ptr, oi);
ret = ldub_p(g2h(env_cpu(env), ptr));
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
@@ -XXX,XX +XXX,XX @@ int cpu_ldsb_data(CPUArchState *env, abi_ptr ptr)
uint32_t cpu_lduw_be_data(CPUArchState *env, abi_ptr ptr)
{
MemOpIdx oi = make_memop_idx(MO_BEUW, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, false);
uint32_t ret;

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_ld_before_exec(env_cpu(env), ptr, oi);
ret = lduw_be_p(g2h(env_cpu(env), ptr));
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
@@ -XXX,XX +XXX,XX @@ int cpu_ldsw_be_data(CPUArchState *env, abi_ptr ptr)
uint32_t cpu_ldl_be_data(CPUArchState *env, abi_ptr ptr)
{
MemOpIdx oi = make_memop_idx(MO_BEUL, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, false);
uint32_t ret;

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_ld_before_exec(env_cpu(env), ptr, oi);
ret = ldl_be_p(g2h(env_cpu(env), ptr));
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
@@ -XXX,XX +XXX,XX @@ uint32_t cpu_ldl_be_data(CPUArchState *env, abi_ptr ptr)
uint64_t cpu_ldq_be_data(CPUArchState *env, abi_ptr ptr)
{
MemOpIdx oi = make_memop_idx(MO_BEQ, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, false);
uint64_t ret;

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_ld_before_exec(env_cpu(env), ptr, oi);
ret = ldq_be_p(g2h(env_cpu(env), ptr));
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
@@ -XXX,XX +XXX,XX @@ uint64_t cpu_ldq_be_data(CPUArchState *env, abi_ptr ptr)
uint32_t cpu_lduw_le_data(CPUArchState *env, abi_ptr ptr)
{
MemOpIdx oi = make_memop_idx(MO_LEUW, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, false);
uint32_t ret;

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_ld_before_exec(env_cpu(env), ptr, oi);
ret = lduw_le_p(g2h(env_cpu(env), ptr));
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
@@ -XXX,XX +XXX,XX @@ int cpu_ldsw_le_data(CPUArchState *env, abi_ptr ptr)
uint32_t cpu_ldl_le_data(CPUArchState *env, abi_ptr ptr)
{
MemOpIdx oi = make_memop_idx(MO_LEUL, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, false);
uint32_t ret;

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_ld_before_exec(env_cpu(env), ptr, oi);
ret = ldl_le_p(g2h(env_cpu(env), ptr));
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
@@ -XXX,XX +XXX,XX @@ uint32_t cpu_ldl_le_data(CPUArchState *env, abi_ptr ptr)
uint64_t cpu_ldq_le_data(CPUArchState *env, abi_ptr ptr)
{
MemOpIdx oi = make_memop_idx(MO_LEQ, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, false);
uint64_t ret;

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_ld_before_exec(env_cpu(env), ptr, oi);
ret = ldq_le_p(g2h(env_cpu(env), ptr));
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
@@ -XXX,XX +XXX,XX @@ uint64_t cpu_ldq_le_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t retaddr)
void cpu_stb_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
{
MemOpIdx oi = make_memop_idx(MO_UB, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, true);

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_st_before_exec(env_cpu(env), ptr, oi);
stb_p(g2h(env_cpu(env), ptr), val);
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}
@@ -XXX,XX +XXX,XX @@ void cpu_stb_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
void cpu_stw_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
{
MemOpIdx oi = make_memop_idx(MO_BEUW, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, true);

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_st_before_exec(env_cpu(env), ptr, oi);
stw_be_p(g2h(env_cpu(env), ptr), val);
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}
@@ -XXX,XX +XXX,XX @@ void cpu_stw_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
void cpu_stl_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
{
MemOpIdx oi = make_memop_idx(MO_BEUL, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, true);

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_st_before_exec(env_cpu(env), ptr, oi);
stl_be_p(g2h(env_cpu(env), ptr), val);
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}
@@ -XXX,XX +XXX,XX @@ void cpu_stl_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
void cpu_stq_be_data(CPUArchState *env, abi_ptr ptr, uint64_t val)
{
MemOpIdx oi = make_memop_idx(MO_BEQ, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, true);

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_st_before_exec(env_cpu(env), ptr, oi);
stq_be_p(g2h(env_cpu(env), ptr), val);
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}
@@ -XXX,XX +XXX,XX @@ void cpu_stq_be_data(CPUArchState *env, abi_ptr ptr, uint64_t val)
void cpu_stw_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
{
MemOpIdx oi = make_memop_idx(MO_LEUW, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, true);

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_st_before_exec(env_cpu(env), ptr, oi);
stw_le_p(g2h(env_cpu(env), ptr), val);
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}
@@ -XXX,XX +XXX,XX @@ void cpu_stw_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
void cpu_stl_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
{
MemOpIdx oi = make_memop_idx(MO_LEUL, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, true);

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_st_before_exec(env_cpu(env), ptr, oi);
stl_le_p(g2h(env_cpu(env), ptr), val);
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}
@@ -XXX,XX +XXX,XX @@ void cpu_stl_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
void cpu_stq_le_data(CPUArchState *env, abi_ptr ptr, uint64_t val)
{
MemOpIdx oi = make_memop_idx(MO_LEQ, MMU_USER_IDX);
- uint16_t meminfo = trace_mem_get_info(oi, true);

- trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
+ trace_guest_st_before_exec(env_cpu(env), ptr, oi);
stq_le_p(g2h(env_cpu(env), ptr), val);
qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}
diff --git a/tcg/tcg-op.c b/tcg/tcg-op.c
index XXXXXXX..XXXXXXX 100644
--- a/tcg/tcg-op.c
+++ b/tcg/tcg-op.c
@@ -XXX,XX +XXX,XX @@
#include "tcg/tcg-op.h"
#include "tcg/tcg-mo.h"
#include "trace-tcg.h"
-#include "trace/mem.h"
#include "exec/plugin-gen.h"

/* Reduce the number of ifdefs below. This assumes that all uses of
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
{
MemOp orig_memop;
MemOpIdx oi;
- uint16_t info;

tcg_gen_req_mo(TCG_MO_LD_LD | TCG_MO_ST_LD);
memop = tcg_canonicalize_memop(memop, 0, 0);
oi = make_memop_idx(memop, idx);
- info = trace_mem_get_info(oi, 0);
- trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);
+ trace_guest_ld_before_tcg(tcg_ctx->cpu, cpu_env, addr, oi);

orig_memop = memop;
if (!TCG_TARGET_HAS_MEMORY_BSWAP && (memop & MO_BSWAP)) {
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_st_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
{
TCGv_i32 swap = NULL;
MemOpIdx oi;
- uint16_t info;

tcg_gen_req_mo(TCG_MO_LD_ST | TCG_MO_ST_ST);
memop = tcg_canonicalize_memop(memop, 0, 1);
oi = make_memop_idx(memop, idx);
- info = trace_mem_get_info(oi, 1);
- trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);
+ trace_guest_st_before_tcg(tcg_ctx->cpu, cpu_env, addr, oi);

if (!TCG_TARGET_HAS_MEMORY_BSWAP && (memop & MO_BSWAP)) {
swap = tcg_temp_new_i32();
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)
{
MemOp orig_memop;
MemOpIdx oi;
- uint16_t info;

if (TCG_TARGET_REG_BITS == 32 && (memop & MO_SIZE) < MO_64) {
tcg_gen_qemu_ld_i32(TCGV_LOW(val), addr, idx, memop);
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)
tcg_gen_req_mo(TCG_MO_LD_LD | TCG_MO_ST_LD);
memop = tcg_canonicalize_memop(memop, 1, 0);
oi = make_memop_idx(memop, idx);
- info = trace_mem_get_info(oi, 0);
- trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);
+ trace_guest_ld_before_tcg(tcg_ctx->cpu, cpu_env, addr, oi);

orig_memop = memop;
if (!TCG_TARGET_HAS_MEMORY_BSWAP && (memop & MO_BSWAP)) {
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_st_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)
{
TCGv_i64 swap = NULL;
MemOpIdx oi;
- uint16_t info;

if (TCG_TARGET_REG_BITS == 32 && (memop & MO_SIZE) < MO_64) {
tcg_gen_qemu_st_i32(TCGV_LOW(val), addr, idx, memop);
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_st_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)
tcg_gen_req_mo(TCG_MO_LD_ST | TCG_MO_ST_ST);
memop = tcg_canonicalize_memop(memop, 1, 1);
oi = make_memop_idx(memop, idx);
- info = trace_mem_get_info(oi, 1);
- trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);
+ trace_guest_st_before_tcg(tcg_ctx->cpu, cpu_env, addr, oi);

if (!TCG_TARGET_HAS_MEMORY_BSWAP && (memop & MO_BSWAP)) {
swap = tcg_temp_new_i64();
diff --git a/accel/tcg/atomic_common.c.inc b/accel/tcg/atomic_common.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/atomic_common.c.inc
+++ b/accel/tcg/atomic_common.c.inc
@@ -XXX,XX +XXX,XX @@ static void atomic_trace_rmw_pre(CPUArchState *env, target_ulong addr,
MemOpIdx oi)
{
CPUState *cpu = env_cpu(env);
- uint16_t info = trace_mem_get_info(oi, false);

- trace_guest_mem_before_exec(cpu, addr, info);
- trace_guest_mem_before_exec(cpu, addr, info | TRACE_MEM_ST);
+ trace_guest_rmw_before_exec(cpu, addr, oi);
}

static void atomic_trace_rmw_post(CPUArchState *env, target_ulong addr,
@@ -XXX,XX +XXX,XX @@ static void atomic_trace_rmw_post(CPUArchState *env, target_ulong addr,
static void atomic_trace_ld_pre(CPUArchState *env, target_ulong addr,
MemOpIdx oi)
{
- uint16_t info = trace_mem_get_info(oi, false);
-
- trace_guest_mem_before_exec(env_cpu(env), addr, info);
+ trace_guest_ld_before_exec(env_cpu(env), addr, oi);
}

static void atomic_trace_ld_post(CPUArchState *env, target_ulong addr,
@@ -XXX,XX +XXX,XX @@ static void atomic_trace_ld_post(CPUArchState *env, target_ulong addr,
static void atomic_trace_st_pre(CPUArchState *env, target_ulong addr,
MemOpIdx oi)
{
- uint16_t info = trace_mem_get_info(oi, true);
-
- trace_guest_mem_before_exec(env_cpu(env), addr, info);
+ trace_guest_st_before_exec(env_cpu(env), addr, oi);
}

static void atomic_trace_st_post(CPUArchState *env, target_ulong addr,
diff --git a/trace-events b/trace-events
index XXXXXXX..XXXXXXX 100644
--- a/trace-events
+++ b/trace-events
@@ -XXX,XX +XXX,XX @@ vcpu guest_cpu_reset(void)
# tcg/tcg-op.c

# @vaddr: Access' virtual address.
-# @info : Access' information (see below).
+# @memopidx: Access' information (see below).
#
# Start virtual memory access (before any potential access violation).
-#
# Does not include memory accesses performed by devices.
#
-# Access information can be parsed as:
-#
-# struct mem_info {
-# uint8_t size_shift : 4; /* interpreted as "1 << size_shift" bytes */
-# bool sign_extend: 1; /* sign-extended */
-# uint8_t endianness : 1; /* 0: little, 1: big */
-# bool store : 1; /* whether it is a store operation */
-# pad : 1;
-# uint8_t mmuidx : 4; /* mmuidx (softmmu only) */
-# };
-#
# Mode: user, softmmu
# Targets: TCG(all)
-vcpu tcg guest_mem_before(TCGv vaddr, uint16_t info) "info=%d", "vaddr=0x%016"PRIx64" info=%d"
+vcpu tcg guest_ld_before(TCGv vaddr, uint32_t memopidx) "info=%d", "vaddr=0x%016"PRIx64" memopidx=0x%x"
+vcpu tcg guest_st_before(TCGv vaddr, uint32_t memopidx) "info=%d", "vaddr=0x%016"PRIx64" memopidx=0x%x"
+vcpu tcg guest_rmw_before(TCGv vaddr, uint32_t memopidx) "info=%d", "vaddr=0x%016"PRIx64" memopidx=0x%x"

# include/user/syscall-trace.h
--
2.25.1
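
The memopidx value carried by the new guest_ld/st/rmw_before events decodes
with the same arithmetic as make_memop_idx()/get_memop()/get_mmuidx(): the low
four bits are the mmu index and the remaining bits are the MemOp. A standalone
C sketch of a consumer-side decoder follows; the MO_* values restate the
assumed layout rather than quoting exec/memop.h:

    /* Sketch only: unpack a guest_ld/st/rmw_before memopidx payload. */
    #include <stdbool.h>
    #include <stdint.h>
    #include <stdio.h>

    #define MO_SIZE  0x07   /* assumed, mirrors exec/memop.h */
    #define MO_SIGN  0x08
    #define MO_BSWAP 0x10

    static void decode_memopidx(uint32_t oi)
    {
        unsigned mmu_idx = oi & 15;            /* get_mmuidx() */
        unsigned op = oi >> 4;                 /* get_memop() */
        unsigned bytes = 1u << (op & MO_SIZE); /* access size in bytes */
        bool sign_extend = op & MO_SIGN;
        bool byte_swap = op & MO_BSWAP;

        printf("bytes=%u sign=%d bswap=%d mmu_idx=%u\n",
               bytes, sign_extend, byte_swap, mmu_idx);
    }

Note that whether the access was a load, store or read-modify-write is no
longer a bit in the payload; it is implied by which of the three events fired.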
We're about to move this out of tcg.h, so rename it
as we did when moving MemOp.

Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
accel/tcg/atomic_template.h | 24 +++++------
include/tcg/tcg.h | 74 ++++++++++++++++-----------------
accel/tcg/cputlb.c | 78 +++++++++++++++++------------------
accel/tcg/user-exec.c | 2 +-
target/arm/helper-a64.c | 16 +++----
target/arm/m_helper.c | 2 +-
target/i386/tcg/mem_helper.c | 4 +-
target/m68k/op_helper.c | 2 +-
target/mips/tcg/msa_helper.c | 6 +--
target/s390x/tcg/mem_helper.c | 20 ++++-----
target/sparc/ldst_helper.c | 2 +-
tcg/optimize.c | 2 +-
tcg/tcg-op.c | 12 +++---
tcg/tcg.c | 2 +-
tcg/tci.c | 14 +++----
accel/tcg/atomic_common.c.inc | 6 +--
tcg/aarch64/tcg-target.c.inc | 14 +++----
tcg/arm/tcg-target.c.inc | 10 ++---
tcg/i386/tcg-target.c.inc | 10 ++---
tcg/mips/tcg-target.c.inc | 12 +++---
tcg/ppc/tcg-target.c.inc | 10 ++---
tcg/riscv/tcg-target.c.inc | 16 +++----
tcg/s390/tcg-target.c.inc | 10 ++---
tcg/sparc/tcg-target.c.inc | 4 +-
tcg/tcg-ldst.c.inc | 2 +-
25 files changed, 177 insertions(+), 177 deletions(-)

diff --git a/accel/tcg/atomic_template.h b/accel/tcg/atomic_template.h
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/atomic_template.h
+++ b/accel/tcg/atomic_template.h
@@ -XXX,XX +XXX,XX @@
ABI_TYPE ATOMIC_NAME(cmpxchg)(CPUArchState *env, target_ulong addr,
ABI_TYPE cmpv, ABI_TYPE newv,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ | PAGE_WRITE, retaddr);
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(cmpxchg)(CPUArchState *env, target_ulong addr,
#if DATA_SIZE >= 16
#if HAVE_ATOMIC128
ABI_TYPE ATOMIC_NAME(ld)(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ, retaddr);
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(ld)(CPUArchState *env, target_ulong addr,
}

void ATOMIC_NAME(st)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_WRITE, retaddr);
@@ -XXX,XX +XXX,XX @@ void ATOMIC_NAME(st)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
#endif
#else
ABI_TYPE ATOMIC_NAME(xchg)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ | PAGE_WRITE, retaddr);
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(xchg)(CPUArchState *env, target_ulong addr, ABI_TYPE val,

#define GEN_ATOMIC_HELPER(X) \
ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
- ABI_TYPE val, TCGMemOpIdx oi, uintptr_t retaddr) \
+ ABI_TYPE val, MemOpIdx oi, uintptr_t retaddr) \
{ \
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE, \
PAGE_READ | PAGE_WRITE, retaddr); \
@@ -XXX,XX +XXX,XX @@ GEN_ATOMIC_HELPER(xor_fetch)
*/
#define GEN_ATOMIC_HELPER_FN(X, FN, XDATA_TYPE, RET) \
ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
- ABI_TYPE xval, TCGMemOpIdx oi, uintptr_t retaddr) \
+ ABI_TYPE xval, MemOpIdx oi, uintptr_t retaddr) \
{ \
XDATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE, \
PAGE_READ | PAGE_WRITE, retaddr); \
@@ -XXX,XX +XXX,XX @@ GEN_ATOMIC_HELPER_FN(umax_fetch, MAX, DATA_TYPE, new)

ABI_TYPE ATOMIC_NAME(cmpxchg)(CPUArchState *env, target_ulong addr,
ABI_TYPE cmpv, ABI_TYPE newv,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ | PAGE_WRITE, retaddr);
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(cmpxchg)(CPUArchState *env, target_ulong addr,
#if DATA_SIZE >= 16
#if HAVE_ATOMIC128
ABI_TYPE ATOMIC_NAME(ld)(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ, retaddr);
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(ld)(CPUArchState *env, target_ulong addr,
}

void ATOMIC_NAME(st)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_WRITE, retaddr);
@@ -XXX,XX +XXX,XX @@ void ATOMIC_NAME(st)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
#endif
#else
ABI_TYPE ATOMIC_NAME(xchg)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ | PAGE_WRITE, retaddr);
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(xchg)(CPUArchState *env, target_ulong addr, ABI_TYPE val,

#define GEN_ATOMIC_HELPER(X) \
ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
- ABI_TYPE val, TCGMemOpIdx oi, uintptr_t retaddr) \
+ ABI_TYPE val, MemOpIdx oi, uintptr_t retaddr) \
{ \
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE, \
PAGE_READ | PAGE_WRITE, retaddr); \
@@ -XXX,XX +XXX,XX @@ GEN_ATOMIC_HELPER(xor_fetch)
*/
#define GEN_ATOMIC_HELPER_FN(X, FN, XDATA_TYPE, RET) \
ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
- ABI_TYPE xval, TCGMemOpIdx oi, uintptr_t retaddr) \
+ ABI_TYPE xval, MemOpIdx oi, uintptr_t retaddr) \
{ \
XDATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE, \
PAGE_READ | PAGE_WRITE, retaddr); \
diff --git a/include/tcg/tcg.h b/include/tcg/tcg.h
index XXXXXXX..XXXXXXX 100644
--- a/include/tcg/tcg.h
+++ b/include/tcg/tcg.h
@@ -XXX,XX +XXX,XX @@ static inline size_t tcg_current_code_size(TCGContext *s)
}

/* Combine the MemOp and mmu_idx parameters into a single value. */
-typedef uint32_t TCGMemOpIdx;
+typedef uint32_t MemOpIdx;

/**
* make_memop_idx
@@ -XXX,XX +XXX,XX @@ typedef uint32_t TCGMemOpIdx;
*
* Encode these values into a single parameter.
*/
-static inline TCGMemOpIdx make_memop_idx(MemOp op, unsigned idx)
+static inline MemOpIdx make_memop_idx(MemOp op, unsigned idx)
{
tcg_debug_assert(idx <= 15);
return (op << 4) | idx;
@@ -XXX,XX +XXX,XX @@ static inline TCGMemOpIdx make_memop_idx(MemOp op, unsigned idx)
*
* Extract the memory operation from the combined value.
*/
-static inline MemOp get_memop(TCGMemOpIdx oi)
+static inline MemOp get_memop(MemOpIdx oi)
{
return oi >> 4;
}
@@ -XXX,XX +XXX,XX @@ static inline MemOp get_memop(TCGMemOpIdx oi)
*
* Extract the mmu index from the combined value.
*/
-static inline unsigned get_mmuidx(TCGMemOpIdx oi)
+static inline unsigned get_mmuidx(MemOpIdx oi)
{
return oi & 15;
}
@@ -XXX,XX +XXX,XX @@ uint64_t dup_const(unsigned vece, uint64_t c);
#ifdef CONFIG_SOFTMMU
/* Value zero-extended to tcg register size. */
tcg_target_ulong helper_ret_ldub_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
tcg_target_ulong helper_le_lduw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
tcg_target_ulong helper_le_ldul_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
uint64_t helper_le_ldq_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
tcg_target_ulong helper_be_lduw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
tcg_target_ulong helper_be_ldul_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
uint64_t helper_be_ldq_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);

/* Value sign-extended to tcg register size. */
tcg_target_ulong helper_ret_ldsb_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
tcg_target_ulong helper_le_ldsw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
tcg_target_ulong helper_le_ldsl_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
tcg_target_ulong helper_be_ldsw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
tcg_target_ulong helper_be_ldsl_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);

void helper_ret_stb_mmu(CPUArchState *env, target_ulong addr, uint8_t val,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
void helper_le_stw_mmu(CPUArchState *env, target_ulong addr, uint16_t val,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
void helper_le_stl_mmu(CPUArchState *env, target_ulong addr, uint32_t val,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
void helper_le_stq_mmu(CPUArchState *env, target_ulong addr, uint64_t val,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
void helper_be_stw_mmu(CPUArchState *env, target_ulong addr, uint16_t val,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
void helper_be_stl_mmu(CPUArchState *env, target_ulong addr, uint32_t val,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
void helper_be_stq_mmu(CPUArchState *env, target_ulong addr, uint64_t val,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);

/* Temporary aliases until backends are converted. */
#ifdef TARGET_WORDS_BIGENDIAN
@@ -XXX,XX +XXX,XX @@ void helper_be_stq_mmu(CPUArchState *env, target_ulong addr, uint64_t val,

uint32_t cpu_atomic_cmpxchgb_mmu(CPUArchState *env, target_ulong addr,
uint32_t cmpv, uint32_t newv,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
uint32_t cpu_atomic_cmpxchgw_le_mmu(CPUArchState *env, target_ulong addr,
uint32_t cmpv, uint32_t newv,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
uint32_t cpu_atomic_cmpxchgl_le_mmu(CPUArchState *env, target_ulong addr,
uint32_t cmpv, uint32_t newv,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
uint64_t cpu_atomic_cmpxchgq_le_mmu(CPUArchState *env, target_ulong addr,
uint64_t cmpv, uint64_t newv,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
uint32_t cpu_atomic_cmpxchgw_be_mmu(CPUArchState *env, target_ulong addr,
uint32_t cmpv, uint32_t newv,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
uint32_t cpu_atomic_cmpxchgl_be_mmu(CPUArchState *env, target_ulong addr,
uint32_t cmpv, uint32_t newv,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
uint64_t cpu_atomic_cmpxchgq_be_mmu(CPUArchState *env, target_ulong addr,
uint64_t cmpv, uint64_t newv,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);

#define GEN_ATOMIC_HELPER(NAME, TYPE, SUFFIX) \
TYPE cpu_atomic_ ## NAME ## SUFFIX ## _mmu \
(CPUArchState *env, target_ulong addr, TYPE val, \
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);

#ifdef CONFIG_ATOMIC64
#define GEN_ATOMIC_HELPER_ALL(NAME) \
@@ -XXX,XX +XXX,XX @@ GEN_ATOMIC_HELPER_ALL(xchg)

Int128 cpu_atomic_cmpxchgo_le_mmu(CPUArchState *env, target_ulong addr,
Int128 cmpv, Int128 newv,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
Int128 cpu_atomic_cmpxchgo_be_mmu(CPUArchState *env, target_ulong addr,
Int128 cmpv, Int128 newv,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);

Int128 cpu_atomic_ldo_le_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
Int128 cpu_atomic_ldo_be_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
void cpu_atomic_sto_le_mmu(CPUArchState *env, target_ulong addr, Int128 val,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);
void cpu_atomic_sto_be_mmu(CPUArchState *env, target_ulong addr, Int128 val,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);

#ifdef CONFIG_DEBUG_TCG
void tcg_assert_listed_vecop(TCGOpcode);
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ bool tlb_plugin_lookup(CPUState *cpu, target_ulong addr, int mmu_idx,
* @prot may be PAGE_READ, PAGE_WRITE, or PAGE_READ|PAGE_WRITE.
*/
static void *atomic_mmu_lookup(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, int size, int prot,
+ MemOpIdx oi, int size, int prot,
uintptr_t retaddr)
{
size_t mmu_idx = get_mmuidx(oi);
@@ -XXX,XX +XXX,XX @@ static void *atomic_mmu_lookup(CPUArchState *env, target_ulong addr,
*/

typedef uint64_t FullLoadHelper(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr);
+ MemOpIdx oi, uintptr_t retaddr);

static inline uint64_t QEMU_ALWAYS_INLINE
load_memop(const void *haddr, MemOp op)
@@ -XXX,XX +XXX,XX @@ load_memop(const void *haddr, MemOp op)
}

static inline uint64_t QEMU_ALWAYS_INLINE
-load_helper(CPUArchState *env, target_ulong addr, TCGMemOpIdx oi,
+load_helper(CPUArchState *env, target_ulong addr, MemOpIdx oi,
uintptr_t retaddr, MemOp op, bool code_read,
FullLoadHelper *full_load)
{
@@ -XXX,XX +XXX,XX @@ load_helper(CPUArchState *env, target_ulong addr, TCGMemOpIdx oi,
*/

static uint64_t full_ldub_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_UB, false, full_ldub_mmu);
}

tcg_target_ulong helper_ret_ldub_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return full_ldub_mmu(env, addr, oi, retaddr);
}

static uint64_t full_le_lduw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_LEUW, false,
full_le_lduw_mmu);
}

tcg_target_ulong helper_le_lduw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return full_le_lduw_mmu(env, addr, oi, retaddr);
}

static uint64_t full_be_lduw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_BEUW, false,
full_be_lduw_mmu);
}

tcg_target_ulong helper_be_lduw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return full_be_lduw_mmu(env, addr, oi, retaddr);
}

static uint64_t full_le_ldul_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_LEUL, false,
full_le_ldul_mmu);
}

tcg_target_ulong helper_le_ldul_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return full_le_ldul_mmu(env, addr, oi, retaddr);
}

static uint64_t full_be_ldul_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_BEUL, false,
full_be_ldul_mmu);
}

tcg_target_ulong helper_be_ldul_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return full_be_ldul_mmu(env, addr, oi, retaddr);
}

uint64_t helper_le_ldq_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_LEQ, false,
helper_le_ldq_mmu);
}

uint64_t helper_be_ldq_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_BEQ, false,
helper_be_ldq_mmu);
@@ -XXX,XX +XXX,XX @@ uint64_t helper_be_ldq_mmu(CPUArchState *env, target_ulong addr,


tcg_target_ulong helper_ret_ldsb_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return (int8_t)helper_ret_ldub_mmu(env, addr, oi, retaddr);
}

tcg_target_ulong helper_le_ldsw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return (int16_t)helper_le_lduw_mmu(env, addr, oi, retaddr);
}

tcg_target_ulong helper_be_ldsw_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return (int16_t)helper_be_lduw_mmu(env, addr, oi, retaddr);
}

tcg_target_ulong helper_le_ldsl_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return (int32_t)helper_le_ldul_mmu(env, addr, oi, retaddr);
}

tcg_target_ulong helper_be_ldsl_mmu(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return (int32_t)helper_be_ldul_mmu(env, addr, oi, retaddr);
}
@@ -XXX,XX +XXX,XX @@ static inline uint64_t cpu_load_helper(CPUArchState *env, abi_ptr addr,
MemOp op, FullLoadHelper *full_load)
{
uint16_t meminfo;
- TCGMemOpIdx oi;
+ MemOpIdx oi;
uint64_t ret;

meminfo = trace_mem_get_info(op, mmu_idx, false);
@@ -XXX,XX +XXX,XX @@ store_helper_unaligned(CPUArchState *env, target_ulong addr, uint64_t val,
uintptr_t index, index2;
CPUTLBEntry *entry, *entry2;
target_ulong page2, tlb_addr, tlb_addr2;
- TCGMemOpIdx oi;
+ MemOpIdx oi;
size_t size2;
int i;

@@ -XXX,XX +XXX,XX @@ store_helper_unaligned(CPUArchState *env, target_ulong addr, uint64_t val,

static inline void QEMU_ALWAYS_INLINE
store_helper(CPUArchState *env, target_ulong addr, uint64_t val,
- TCGMemOpIdx oi, uintptr_t retaddr, MemOp op)
+ MemOpIdx oi, uintptr_t retaddr, MemOp op)
{
uintptr_t mmu_idx = get_mmuidx(oi);
uintptr_t index = tlb_index(env, mmu_idx, addr);
@@ -XXX,XX +XXX,XX @@ store_helper(CPUArchState *env, target_ulong addr, uint64_t val,

void __attribute__((noinline))
helper_ret_stb_mmu(CPUArchState *env, target_ulong addr, uint8_t val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
store_helper(env, addr, val, oi, retaddr, MO_UB);
}

void helper_le_stw_mmu(CPUArchState *env, target_ulong addr, uint16_t val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
store_helper(env, addr, val, oi, retaddr, MO_LEUW);
}

void helper_be_stw_mmu(CPUArchState *env, target_ulong addr, uint16_t val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
store_helper(env, addr, val, oi, retaddr, MO_BEUW);
}

void helper_le_stl_mmu(CPUArchState *env, target_ulong addr, uint32_t val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
store_helper(env, addr, val, oi, retaddr, MO_LEUL);
}

void helper_be_stl_mmu(CPUArchState *env, target_ulong addr, uint32_t val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
store_helper(env, addr, val, oi, retaddr, MO_BEUL);
}

void helper_le_stq_mmu(CPUArchState *env, target_ulong addr, uint64_t val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
store_helper(env, addr, val, oi, retaddr, MO_LEQ);
}

void helper_be_stq_mmu(CPUArchState *env, target_ulong addr, uint64_t val,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
store_helper(env, addr, val, oi, retaddr, MO_BEQ);
}
@@ -XXX,XX +XXX,XX @@ static inline void QEMU_ALWAYS_INLINE
cpu_store_helper(CPUArchState *env, target_ulong addr, uint64_t val,
int mmu_idx, uintptr_t retaddr, MemOp op)
{
- TCGMemOpIdx oi;
+ MemOpIdx oi;
uint16_t meminfo;

meminfo = trace_mem_get_info(op, mmu_idx, true);
@@ -XXX,XX +XXX,XX @@ void cpu_stq_le_data(CPUArchState *env, target_ulong ptr, uint64_t val)
/* Code access functions. */

static uint64_t full_ldub_code(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_8, true, full_ldub_code);
}

uint32_t cpu_ldub_code(CPUArchState *env, abi_ptr addr)
{
- TCGMemOpIdx oi = make_memop_idx(MO_UB, cpu_mmu_index(env, true));
+ MemOpIdx oi = make_memop_idx(MO_UB, cpu_mmu_index(env, true));
return full_ldub_code(env, addr, oi, 0);
}

static uint64_t full_lduw_code(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_TEUW, true, full_lduw_code);
}

uint32_t cpu_lduw_code(CPUArchState *env, abi_ptr addr)
{
- TCGMemOpIdx oi = make_memop_idx(MO_TEUW, cpu_mmu_index(env, true));
+ MemOpIdx oi = make_memop_idx(MO_TEUW, cpu_mmu_index(env, true));
return full_lduw_code(env, addr, oi, 0);
}

static uint64_t full_ldl_code(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_TEUL, true, full_ldl_code);
}

uint32_t cpu_ldl_code(CPUArchState *env, abi_ptr addr)
{
- TCGMemOpIdx oi = make_memop_idx(MO_TEUL, cpu_mmu_index(env, true));
+ MemOpIdx oi = make_memop_idx(MO_TEUL, cpu_mmu_index(env, true));
return full_ldl_code(env, addr, oi, 0);
}

static uint64_t full_ldq_code(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, uintptr_t retaddr)
+ MemOpIdx oi, uintptr_t retaddr)
{
return load_helper(env, addr, oi, retaddr, MO_TEQ, true, full_ldq_code);
}

uint64_t cpu_ldq_code(CPUArchState *env, abi_ptr addr)
{
- TCGMemOpIdx oi = make_memop_idx(MO_TEQ, cpu_mmu_index(env, true));
+ MemOpIdx oi = make_memop_idx(MO_TEQ, cpu_mmu_index(env, true));
return full_ldq_code(env, addr, oi, 0);
}
diff --git a/accel/tcg/user-exec.c b/accel/tcg/user-exec.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/user-exec.c
+++ b/accel/tcg/user-exec.c
@@ -XXX,XX +XXX,XX @@ uint64_t cpu_ldq_code(CPUArchState *env, abi_ptr ptr)
* @prot may be PAGE_READ, PAGE_WRITE, or PAGE_READ|PAGE_WRITE.
*/
static void *atomic_mmu_lookup(CPUArchState *env, target_ulong addr,
- TCGMemOpIdx oi, int size, int prot,
+ MemOpIdx oi, int size, int prot,
uintptr_t retaddr)
{
/* Enforce qemu required alignment. */
diff --git a/target/arm/helper-a64.c b/target/arm/helper-a64.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/helper-a64.c
+++ b/target/arm/helper-a64.c
@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(paired_cmpxchg64_le)(CPUARMState *env, uint64_t addr,
clear_helper_retaddr();
#else
int mem_idx = cpu_mmu_index(env, false);
- TCGMemOpIdx oi0 = make_memop_idx(MO_LEQ | MO_ALIGN_16, mem_idx);
- TCGMemOpIdx oi1 = make_memop_idx(MO_LEQ, mem_idx);
+ MemOpIdx oi0 = make_memop_idx(MO_LEQ | MO_ALIGN_16, mem_idx);
+ MemOpIdx oi1 = make_memop_idx(MO_LEQ, mem_idx);

o0 = helper_le_ldq_mmu(env, addr + 0, oi0, ra);
o1 = helper_le_ldq_mmu(env, addr + 8, oi1, ra);
@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(paired_cmpxchg64_le_parallel)(CPUARMState *env, uint64_t addr,
uintptr_t ra = GETPC();
bool success;
int mem_idx;
- TCGMemOpIdx oi;
+ MemOpIdx oi;

assert(HAVE_CMPXCHG128);

@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(paired_cmpxchg64_be)(CPUARMState *env, uint64_t addr,
clear_helper_retaddr();
#else
int mem_idx = cpu_mmu_index(env, false);
- TCGMemOpIdx oi0 = make_memop_idx(MO_BEQ | MO_ALIGN_16, mem_idx);
- TCGMemOpIdx oi1 = make_memop_idx(MO_BEQ, mem_idx);
+ MemOpIdx oi0 = make_memop_idx(MO_BEQ | MO_ALIGN_16, mem_idx);
+ MemOpIdx oi1 = make_memop_idx(MO_BEQ, mem_idx);

o1 = helper_be_ldq_mmu(env, addr + 0, oi0, ra);
o0 = helper_be_ldq_mmu(env, addr + 8, oi1, ra);
@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(paired_cmpxchg64_be_parallel)(CPUARMState *env, uint64_t addr,
uintptr_t ra = GETPC();
bool success;
int mem_idx;
- TCGMemOpIdx oi;
+ MemOpIdx oi;

assert(HAVE_CMPXCHG128);

@@ -XXX,XX +XXX,XX @@ void HELPER(casp_le_parallel)(CPUARMState *env, uint32_t rs, uint64_t addr,
Int128 oldv, cmpv, newv;
uintptr_t ra = GETPC();
int mem_idx;
- TCGMemOpIdx oi;
+ MemOpIdx oi;

assert(HAVE_CMPXCHG128);

@@ -XXX,XX +XXX,XX @@ void HELPER(casp_be_parallel)(CPUARMState *env, uint32_t rs, uint64_t addr,
Int128 oldv, cmpv, newv;
uintptr_t ra = GETPC();
int mem_idx;
- TCGMemOpIdx oi;
+ MemOpIdx oi;

assert(HAVE_CMPXCHG128);

diff --git a/target/arm/m_helper.c b/target/arm/m_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/m_helper.c
+++ b/target/arm/m_helper.c
@@ -XXX,XX +XXX,XX @@ static bool do_v7m_function_return(ARMCPU *cpu)

{
bool threadmode, spsel;
- TCGMemOpIdx oi;
+ MemOpIdx oi;
ARMMMUIdx mmu_idx;
uint32_t *frame_sp_p;
uint32_t frameptr;
diff --git a/target/i386/tcg/mem_helper.c b/target/i386/tcg/mem_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/i386/tcg/mem_helper.c
+++ b/target/i386/tcg/mem_helper.c
@@ -XXX,XX +XXX,XX @@ void helper_cmpxchg8b(CPUX86State *env, target_ulong a0)
{
uintptr_t ra = GETPC();
int mem_idx = cpu_mmu_index(env, false);
- TCGMemOpIdx oi = make_memop_idx(MO_TEQ, mem_idx);
+ MemOpIdx oi = make_memop_idx(MO_TEQ, mem_idx);
oldv = cpu_atomic_cmpxchgq_le_mmu(env, a0, cmpv, newv, oi, ra);
}
@@ -XXX,XX +XXX,XX @@ void helper_cmpxchg16b(CPUX86State *env, target_ulong a0)
Int128 newv = int128_make128(env->regs[R_EBX], env->regs[R_ECX]);

int mem_idx = cpu_mmu_index(env, false);
- TCGMemOpIdx oi = make_memop_idx(MO_TEQ | MO_ALIGN_16, mem_idx);
+ MemOpIdx oi = make_memop_idx(MO_TEQ | MO_ALIGN_16, mem_idx);
Int128 oldv = cpu_atomic_cmpxchgo_le_mmu(env, a0, cmpv, newv, oi, ra);

if (int128_eq(oldv, cmpv)) {
diff --git a/target/m68k/op_helper.c b/target/m68k/op_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/m68k/op_helper.c
+++ b/target/m68k/op_helper.c
@@ -XXX,XX +XXX,XX @@ static void do_cas2l(CPUM68KState *env, uint32_t regs, uint32_t a1, uint32_t a2,
uintptr_t ra = GETPC();
#if defined(CONFIG_ATOMIC64)
int mmu_idx = cpu_mmu_index(env, 0);
- TCGMemOpIdx oi = make_memop_idx(MO_BEQ, mmu_idx);
+ MemOpIdx oi = make_memop_idx(MO_BEQ, mmu_idx);
#endif

if (parallel) {
diff --git a/target/mips/tcg/msa_helper.c b/target/mips/tcg/msa_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/mips/tcg/msa_helper.c
+++ b/target/mips/tcg/msa_helper.c
@@ -XXX,XX +XXX,XX @@ void helper_msa_ffint_u_df(CPUMIPSState *env, uint32_t df, uint32_t wd,
#define DF_ELEMENTS(df) (MSA_WRLEN / DF_BITS(df))

#if !defined(CONFIG_USER_ONLY)
-#define MEMOP_IDX(DF) \
- TCGMemOpIdx oi = make_memop_idx(MO_TE | DF | MO_UNALN, \
- cpu_mmu_index(env, false));
+#define MEMOP_IDX(DF) \
+ MemOpIdx oi = make_memop_idx(MO_TE | DF | MO_UNALN, \
+ cpu_mmu_index(env, false));
#else
#define MEMOP_IDX(DF)
#endif
diff --git a/target/s390x/tcg/mem_helper.c b/target/s390x/tcg/mem_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/s390x/tcg/mem_helper.c
+++ b/target/s390x/tcg/mem_helper.c
@@ -XXX,XX +XXX,XX @@ static void do_access_memset(CPUS390XState *env, vaddr vaddr, char *haddr,
g_assert(haddr);
memset(haddr, byte, size);
#else
- TCGMemOpIdx oi = make_memop_idx(MO_UB, mmu_idx);
+ MemOpIdx oi = make_memop_idx(MO_UB, mmu_idx);
int i;

if (likely(haddr)) {
@@ -XXX,XX +XXX,XX @@ static uint8_t do_access_get_byte(CPUS390XState *env, vaddr vaddr, char **haddr,
#ifdef CONFIG_USER_ONLY
return ldub_p(*haddr + offset);
#else
- TCGMemOpIdx oi = make_memop_idx(MO_UB, mmu_idx);
+ MemOpIdx oi = make_memop_idx(MO_UB, mmu_idx);
uint8_t byte;

if (likely(*haddr)) {
@@ -XXX,XX +XXX,XX @@ static void do_access_set_byte(CPUS390XState *env, vaddr vaddr, char **haddr,
#ifdef CONFIG_USER_ONLY
stb_p(*haddr + offset, byte);
#else
- TCGMemOpIdx oi = make_memop_idx(MO_UB, mmu_idx);
+ MemOpIdx oi = make_memop_idx(MO_UB, mmu_idx);

if (likely(*haddr)) {
stb_p(*haddr + offset, byte);
@@ -XXX,XX +XXX,XX @@ void HELPER(cdsg_parallel)(CPUS390XState *env, uint64_t addr,
Int128 cmpv = int128_make128(env->regs[r1 + 1], env->regs[r1]);
Int128 newv = int128_make128(env->regs[r3 + 1], env->regs[r3]);
int mem_idx;
- TCGMemOpIdx oi;
+ MemOpIdx oi;
Int128 oldv;
bool fail;

@@ -XXX,XX +XXX,XX @@ static uint32_t do_csst(CPUS390XState *env, uint32_t r3, uint64_t a1,
uint32_t *haddr = g2h(env_cpu(env), a1);
ov = qatomic_cmpxchg__nocheck(haddr, cv, nv);
#else
- TCGMemOpIdx oi = make_memop_idx(MO_TEUL | MO_ALIGN, mem_idx);
+ MemOpIdx oi = make_memop_idx(MO_TEUL | MO_ALIGN, mem_idx);
ov = cpu_atomic_cmpxchgl_be_mmu(env, a1, cv, nv, oi, ra);
#endif
} else {
@@ -XXX,XX +XXX,XX @@ static uint32_t do_csst(CPUS390XState *env, uint32_t r3, uint64_t a1,

if (parallel) {
#ifdef CONFIG_ATOMIC64
- TCGMemOpIdx oi = make_memop_idx(MO_TEQ | MO_ALIGN, mem_idx);
+ MemOpIdx oi = make_memop_idx(MO_TEQ | MO_ALIGN, mem_idx);
ov = cpu_atomic_cmpxchgq_be_mmu(env, a1, cv, nv, oi, ra);
#else
/* Note that we asserted !parallel above. */

When PAGE_WRITE_INV is set when calling tlb_set_page,
we immediately set TLB_INVALID_MASK in order to force
tlb_fill to be called on the next lookup. Here in
probe_access_internal, we have just called tlb_fill
and eliminated true misses, thus the lookup must be valid.

This allows us to remove a warning comment from s390x.
There doesn't seem to be a reason to change the code though.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: David Hildenbrand <david@redhat.com>
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
accel/tcg/cputlb.c | 10 +++++++++-
target/s390x/tcg/mem_helper.c | 4 ----
2 files changed, 9 insertions(+), 5 deletions(-)

diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ static int probe_access_internal(CPUArchState *env, target_ulong addr,
}
tlb_addr = tlb_read_ofs(entry, elt_ofs);

+ flags = TLB_FLAGS_MASK;
page_addr = addr & TARGET_PAGE_MASK;
if (!tlb_hit_page(tlb_addr, page_addr)) {
if (!victim_tlb_hit(env, mmu_idx, index, elt_ofs, page_addr)) {
@@ -XXX,XX +XXX,XX @@ static int probe_access_internal(CPUArchState *env, target_ulong addr,

entry = tlb_entry(env, mmu_idx, addr);
+
+ /*
+ * With PAGE_WRITE_INV, we set TLB_INVALID_MASK immediately,
+ * to force the next access through tlb_fill. We've just
+ * called tlb_fill, so we know that this entry *is* valid.
+ */
+ flags &= ~TLB_INVALID_MASK;
}
tlb_addr = tlb_read_ofs(entry, elt_ofs);
}
- flags = tlb_addr & TLB_FLAGS_MASK;
+ flags &= tlb_addr;

/* Fold all "mmio-like" bits into TLB_MMIO. This is not RAM. */
if (unlikely(flags & ~(TLB_WATCHPOINT | TLB_NOTDIRTY))) {
diff --git a/target/s390x/tcg/mem_helper.c b/target/s390x/tcg/mem_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/s390x/tcg/mem_helper.c
+++ b/target/s390x/tcg/mem_helper.c
@@ -XXX,XX +XXX,XX @@ static int s390_probe_access(CPUArchState *env, target_ulong addr, int size,
#else
int flags;

- /*
- * For !CONFIG_USER_ONLY, we cannot rely on TLB_INVALID_MASK or haddr==NULL
- * to detect if there was an exception during tlb_fill().
- */
env->tlb_fill_exc = 0;
flags = probe_access_flags(env, addr, access_type, mmu_idx, nonfault, phost,
ra);
820
@@ -XXX,XX +XXX,XX @@ static uint32_t do_csst(CPUS390XState *env, uint32_t r3, uint64_t a1,
821
cpu_stq_data_ra(env, a1 + 0, int128_gethi(nv), ra);
822
cpu_stq_data_ra(env, a1 + 8, int128_getlo(nv), ra);
823
} else if (HAVE_CMPXCHG128) {
824
- TCGMemOpIdx oi = make_memop_idx(MO_TEQ | MO_ALIGN_16, mem_idx);
825
+ MemOpIdx oi = make_memop_idx(MO_TEQ | MO_ALIGN_16, mem_idx);
826
ov = cpu_atomic_cmpxchgo_be_mmu(env, a1, cv, nv, oi, ra);
827
cc = !int128_eq(ov, cv);
828
} else {
829
@@ -XXX,XX +XXX,XX @@ static uint32_t do_csst(CPUS390XState *env, uint32_t r3, uint64_t a1,
830
cpu_stq_data_ra(env, a2 + 0, svh, ra);
831
cpu_stq_data_ra(env, a2 + 8, svl, ra);
832
} else if (HAVE_ATOMIC128) {
833
- TCGMemOpIdx oi = make_memop_idx(MO_TEQ | MO_ALIGN_16, mem_idx);
834
+ MemOpIdx oi = make_memop_idx(MO_TEQ | MO_ALIGN_16, mem_idx);
835
Int128 sv = int128_make128(svl, svh);
836
cpu_atomic_sto_be_mmu(env, a2, sv, oi, ra);
837
} else {
838
@@ -XXX,XX +XXX,XX @@ uint64_t HELPER(lpq_parallel)(CPUS390XState *env, uint64_t addr)
839
uintptr_t ra = GETPC();
840
uint64_t hi, lo;
841
int mem_idx;
842
- TCGMemOpIdx oi;
843
+ MemOpIdx oi;
844
Int128 v;
845
846
assert(HAVE_ATOMIC128);
847
@@ -XXX,XX +XXX,XX @@ void HELPER(stpq_parallel)(CPUS390XState *env, uint64_t addr,
848
{
849
uintptr_t ra = GETPC();
850
int mem_idx;
851
- TCGMemOpIdx oi;
852
+ MemOpIdx oi;
853
Int128 v;
854
855
assert(HAVE_ATOMIC128);
856
diff --git a/target/sparc/ldst_helper.c b/target/sparc/ldst_helper.c
857
index XXXXXXX..XXXXXXX 100644
858
--- a/target/sparc/ldst_helper.c
859
+++ b/target/sparc/ldst_helper.c
860
@@ -XXX,XX +XXX,XX @@ uint64_t helper_ld_asi(CPUSPARCState *env, target_ulong addr,
861
case ASI_SNF:
862
case ASI_SNFL:
863
{
864
- TCGMemOpIdx oi;
865
+ MemOpIdx oi;
866
int idx = (env->pstate & PS_PRIV
867
? (asi & 1 ? MMU_KERNEL_SECONDARY_IDX : MMU_KERNEL_IDX)
868
: (asi & 1 ? MMU_USER_SECONDARY_IDX : MMU_USER_IDX));
869
diff --git a/tcg/optimize.c b/tcg/optimize.c
870
index XXXXXXX..XXXXXXX 100644
871
--- a/tcg/optimize.c
872
+++ b/tcg/optimize.c
873
@@ -XXX,XX +XXX,XX @@ void tcg_optimize(TCGContext *s)
874
875
CASE_OP_32_64(qemu_ld):
876
{
877
- TCGMemOpIdx oi = op->args[nb_oargs + nb_iargs];
878
+ MemOpIdx oi = op->args[nb_oargs + nb_iargs];
879
MemOp mop = get_memop(oi);
880
if (!(mop & MO_SIGN)) {
881
mask = (2ULL << ((8 << (mop & MO_SIZE)) - 1)) - 1;
882
diff --git a/tcg/tcg-op.c b/tcg/tcg-op.c
883
index XXXXXXX..XXXXXXX 100644
884
--- a/tcg/tcg-op.c
885
+++ b/tcg/tcg-op.c
886
@@ -XXX,XX +XXX,XX @@ static inline MemOp tcg_canonicalize_memop(MemOp op, bool is64, bool st)
887
static void gen_ldst_i32(TCGOpcode opc, TCGv_i32 val, TCGv addr,
888
MemOp memop, TCGArg idx)
889
{
890
- TCGMemOpIdx oi = make_memop_idx(memop, idx);
891
+ MemOpIdx oi = make_memop_idx(memop, idx);
892
#if TARGET_LONG_BITS == 32
893
tcg_gen_op3i_i32(opc, val, addr, oi);
894
#else
895
@@ -XXX,XX +XXX,XX @@ static void gen_ldst_i32(TCGOpcode opc, TCGv_i32 val, TCGv addr,
896
static void gen_ldst_i64(TCGOpcode opc, TCGv_i64 val, TCGv addr,
897
MemOp memop, TCGArg idx)
898
{
899
- TCGMemOpIdx oi = make_memop_idx(memop, idx);
900
+ MemOpIdx oi = make_memop_idx(memop, idx);
901
#if TARGET_LONG_BITS == 32
902
if (TCG_TARGET_REG_BITS == 32) {
903
tcg_gen_op4i_i32(opc, TCGV_LOW(val), TCGV_HIGH(val), addr, oi);
904
@@ -XXX,XX +XXX,XX @@ void tcg_gen_atomic_cmpxchg_i32(TCGv_i32 retv, TCGv addr, TCGv_i32 cmpv,
905
tcg_temp_free_i32(t1);
906
} else {
907
gen_atomic_cx_i32 gen;
908
- TCGMemOpIdx oi;
909
+ MemOpIdx oi;
910
911
gen = table_cmpxchg[memop & (MO_SIZE | MO_BSWAP)];
912
tcg_debug_assert(gen != NULL);
913
@@ -XXX,XX +XXX,XX @@ void tcg_gen_atomic_cmpxchg_i64(TCGv_i64 retv, TCGv addr, TCGv_i64 cmpv,
914
} else if ((memop & MO_SIZE) == MO_64) {
915
#ifdef CONFIG_ATOMIC64
916
gen_atomic_cx_i64 gen;
917
- TCGMemOpIdx oi;
918
+ MemOpIdx oi;
919
920
gen = table_cmpxchg[memop & (MO_SIZE | MO_BSWAP)];
921
tcg_debug_assert(gen != NULL);
922
@@ -XXX,XX +XXX,XX @@ static void do_atomic_op_i32(TCGv_i32 ret, TCGv addr, TCGv_i32 val,
923
TCGArg idx, MemOp memop, void * const table[])
924
{
925
gen_atomic_op_i32 gen;
926
- TCGMemOpIdx oi;
927
+ MemOpIdx oi;
928
929
memop = tcg_canonicalize_memop(memop, 0, 0);
930
931
@@ -XXX,XX +XXX,XX @@ static void do_atomic_op_i64(TCGv_i64 ret, TCGv addr, TCGv_i64 val,
932
if ((memop & MO_SIZE) == MO_64) {
933
#ifdef CONFIG_ATOMIC64
934
gen_atomic_op_i64 gen;
935
- TCGMemOpIdx oi;
936
+ MemOpIdx oi;
937
938
gen = table[memop & (MO_SIZE | MO_BSWAP)];
939
tcg_debug_assert(gen != NULL);
940
diff --git a/tcg/tcg.c b/tcg/tcg.c
941
index XXXXXXX..XXXXXXX 100644
942
--- a/tcg/tcg.c
943
+++ b/tcg/tcg.c
944
@@ -XXX,XX +XXX,XX @@ static void tcg_dump_ops(TCGContext *s, bool have_prefs)
945
case INDEX_op_qemu_ld_i64:
946
case INDEX_op_qemu_st_i64:
947
{
948
- TCGMemOpIdx oi = op->args[k++];
949
+ MemOpIdx oi = op->args[k++];
950
MemOp op = get_memop(oi);
951
unsigned ix = get_mmuidx(oi);
952
953
diff --git a/tcg/tci.c b/tcg/tci.c
954
index XXXXXXX..XXXXXXX 100644
955
--- a/tcg/tci.c
956
+++ b/tcg/tci.c
957
@@ -XXX,XX +XXX,XX @@ static uint64_t tci_uint64(uint32_t high, uint32_t low)
958
* i = immediate (uint32_t)
959
* I = immediate (tcg_target_ulong)
960
* l = label or pointer
961
- * m = immediate (TCGMemOpIdx)
962
+ * m = immediate (MemOpIdx)
963
* n = immediate (call return length)
964
* r = register
965
* s = signed ldst offset
966
@@ -XXX,XX +XXX,XX @@ static void tci_args_ri(uint32_t insn, TCGReg *r0, tcg_target_ulong *i1)
967
}
968
969
static void tci_args_rrm(uint32_t insn, TCGReg *r0,
970
- TCGReg *r1, TCGMemOpIdx *m2)
971
+ TCGReg *r1, MemOpIdx *m2)
972
{
973
*r0 = extract32(insn, 8, 4);
974
*r1 = extract32(insn, 12, 4);
975
@@ -XXX,XX +XXX,XX @@ static void tci_args_rrrc(uint32_t insn,
976
}
977
978
static void tci_args_rrrm(uint32_t insn,
979
- TCGReg *r0, TCGReg *r1, TCGReg *r2, TCGMemOpIdx *m3)
980
+ TCGReg *r0, TCGReg *r1, TCGReg *r2, MemOpIdx *m3)
981
{
982
*r0 = extract32(insn, 8, 4);
983
*r1 = extract32(insn, 12, 4);
984
@@ -XXX,XX +XXX,XX @@ static bool tci_compare64(uint64_t u0, uint64_t u1, TCGCond condition)
985
}
986
987
static uint64_t tci_qemu_ld(CPUArchState *env, target_ulong taddr,
988
- TCGMemOpIdx oi, const void *tb_ptr)
989
+ MemOpIdx oi, const void *tb_ptr)
990
{
991
MemOp mop = get_memop(oi) & (MO_BSWAP | MO_SSIZE);
992
uintptr_t ra = (uintptr_t)tb_ptr;
993
@@ -XXX,XX +XXX,XX @@ static uint64_t tci_qemu_ld(CPUArchState *env, target_ulong taddr,
994
}
995
996
static void tci_qemu_st(CPUArchState *env, target_ulong taddr, uint64_t val,
997
- TCGMemOpIdx oi, const void *tb_ptr)
998
+ MemOpIdx oi, const void *tb_ptr)
999
{
1000
MemOp mop = get_memop(oi) & (MO_BSWAP | MO_SSIZE);
1001
uintptr_t ra = (uintptr_t)tb_ptr;
1002
@@ -XXX,XX +XXX,XX @@ uintptr_t QEMU_DISABLE_CFI tcg_qemu_tb_exec(CPUArchState *env,
1003
uint32_t tmp32;
1004
uint64_t tmp64;
1005
uint64_t T1, T2;
1006
- TCGMemOpIdx oi;
1007
+ MemOpIdx oi;
1008
int32_t ofs;
1009
void *ptr;
1010
1011
@@ -XXX,XX +XXX,XX @@ int print_insn_tci(bfd_vma addr, disassemble_info *info)
1012
tcg_target_ulong i1;
1013
int32_t s2;
1014
TCGCond c;
1015
- TCGMemOpIdx oi;
1016
+ MemOpIdx oi;
1017
uint8_t pos, len;
1018
void *ptr;
1019
1020
diff --git a/accel/tcg/atomic_common.c.inc b/accel/tcg/atomic_common.c.inc
1021
index XXXXXXX..XXXXXXX 100644
1022
--- a/accel/tcg/atomic_common.c.inc
1023
+++ b/accel/tcg/atomic_common.c.inc
1024
@@ -XXX,XX +XXX,XX @@
1025
*/
1026
1027
static uint16_t atomic_trace_rmw_pre(CPUArchState *env, target_ulong addr,
1028
- TCGMemOpIdx oi)
1029
+ MemOpIdx oi)
1030
{
1031
CPUState *cpu = env_cpu(env);
1032
uint16_t info = trace_mem_get_info(get_memop(oi), get_mmuidx(oi), false);
1033
@@ -XXX,XX +XXX,XX @@ static void atomic_trace_rmw_post(CPUArchState *env, target_ulong addr,
1034
1035
#if HAVE_ATOMIC128
1036
static uint16_t atomic_trace_ld_pre(CPUArchState *env, target_ulong addr,
1037
- TCGMemOpIdx oi)
1038
+ MemOpIdx oi)
1039
{
1040
uint16_t info = trace_mem_get_info(get_memop(oi), get_mmuidx(oi), false);
1041
1042
@@ -XXX,XX +XXX,XX @@ static void atomic_trace_ld_post(CPUArchState *env, target_ulong addr,
1043
}
1044
1045
static uint16_t atomic_trace_st_pre(CPUArchState *env, target_ulong addr,
1046
- TCGMemOpIdx oi)
1047
+ MemOpIdx oi)
1048
{
1049
uint16_t info = trace_mem_get_info(get_memop(oi), get_mmuidx(oi), true);
1050
1051
diff --git a/tcg/aarch64/tcg-target.c.inc b/tcg/aarch64/tcg-target.c.inc
1052
index XXXXXXX..XXXXXXX 100644
1053
--- a/tcg/aarch64/tcg-target.c.inc
1054
+++ b/tcg/aarch64/tcg-target.c.inc
1055
@@ -XXX,XX +XXX,XX @@ static void tcg_out_cltz(TCGContext *s, TCGType ext, TCGReg d,
1056
#include "../tcg-ldst.c.inc"
1057
1058
/* helper signature: helper_ret_ld_mmu(CPUState *env, target_ulong addr,
1059
- * TCGMemOpIdx oi, uintptr_t ra)
1060
+ * MemOpIdx oi, uintptr_t ra)
1061
*/
1062
static void * const qemu_ld_helpers[MO_SIZE + 1] = {
1063
[MO_8] = helper_ret_ldub_mmu,
1064
@@ -XXX,XX +XXX,XX @@ static void * const qemu_ld_helpers[MO_SIZE + 1] = {
1065
};
1066
1067
/* helper signature: helper_ret_st_mmu(CPUState *env, target_ulong addr,
1068
- * uintxx_t val, TCGMemOpIdx oi,
1069
+ * uintxx_t val, MemOpIdx oi,
1070
* uintptr_t ra)
1071
*/
1072
static void * const qemu_st_helpers[MO_SIZE + 1] = {
1073
@@ -XXX,XX +XXX,XX @@ static inline void tcg_out_adr(TCGContext *s, TCGReg rd, const void *target)
1074
1075
static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1076
{
1077
- TCGMemOpIdx oi = lb->oi;
1078
+ MemOpIdx oi = lb->oi;
1079
MemOp opc = get_memop(oi);
1080
MemOp size = opc & MO_SIZE;
1081
1082
@@ -XXX,XX +XXX,XX @@ static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1083
1084
static bool tcg_out_qemu_st_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1085
{
1086
- TCGMemOpIdx oi = lb->oi;
1087
+ MemOpIdx oi = lb->oi;
1088
MemOp opc = get_memop(oi);
1089
MemOp size = opc & MO_SIZE;
1090
1091
@@ -XXX,XX +XXX,XX @@ static bool tcg_out_qemu_st_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1092
return true;
1093
}
1094
1095
-static void add_qemu_ldst_label(TCGContext *s, bool is_ld, TCGMemOpIdx oi,
1096
+static void add_qemu_ldst_label(TCGContext *s, bool is_ld, MemOpIdx oi,
1097
TCGType ext, TCGReg data_reg, TCGReg addr_reg,
1098
tcg_insn_unit *raddr, tcg_insn_unit *label_ptr)
1099
{
1100
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_st_direct(TCGContext *s, MemOp memop,
1101
}
1102
1103
static void tcg_out_qemu_ld(TCGContext *s, TCGReg data_reg, TCGReg addr_reg,
1104
- TCGMemOpIdx oi, TCGType ext)
1105
+ MemOpIdx oi, TCGType ext)
1106
{
1107
MemOp memop = get_memop(oi);
1108
const TCGType otype = TARGET_LONG_BITS == 64 ? TCG_TYPE_I64 : TCG_TYPE_I32;
1109
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_ld(TCGContext *s, TCGReg data_reg, TCGReg addr_reg,
1110
}
1111
1112
static void tcg_out_qemu_st(TCGContext *s, TCGReg data_reg, TCGReg addr_reg,
1113
- TCGMemOpIdx oi)
1114
+ MemOpIdx oi)
1115
{
1116
MemOp memop = get_memop(oi);
1117
const TCGType otype = TARGET_LONG_BITS == 64 ? TCG_TYPE_I64 : TCG_TYPE_I32;
1118
diff --git a/tcg/arm/tcg-target.c.inc b/tcg/arm/tcg-target.c.inc
1119
index XXXXXXX..XXXXXXX 100644
1120
--- a/tcg/arm/tcg-target.c.inc
1121
+++ b/tcg/arm/tcg-target.c.inc
1122
@@ -XXX,XX +XXX,XX @@ static TCGReg tcg_out_tlb_read(TCGContext *s, TCGReg addrlo, TCGReg addrhi,
1123
/* Record the context of a call to the out of line helper code for the slow
1124
path for a load or store, so that we can later generate the correct
1125
helper code. */
1126
-static void add_qemu_ldst_label(TCGContext *s, bool is_ld, TCGMemOpIdx oi,
1127
+static void add_qemu_ldst_label(TCGContext *s, bool is_ld, MemOpIdx oi,
1128
TCGReg datalo, TCGReg datahi, TCGReg addrlo,
1129
TCGReg addrhi, tcg_insn_unit *raddr,
1130
tcg_insn_unit *label_ptr)
1131
@@ -XXX,XX +XXX,XX @@ static void add_qemu_ldst_label(TCGContext *s, bool is_ld, TCGMemOpIdx oi,
1132
static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1133
{
1134
TCGReg argreg, datalo, datahi;
1135
- TCGMemOpIdx oi = lb->oi;
1136
+ MemOpIdx oi = lb->oi;
1137
MemOp opc = get_memop(oi);
1138
void *func;
1139
1140
@@ -XXX,XX +XXX,XX @@ static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1141
static bool tcg_out_qemu_st_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1142
{
1143
TCGReg argreg, datalo, datahi;
1144
- TCGMemOpIdx oi = lb->oi;
1145
+ MemOpIdx oi = lb->oi;
1146
MemOp opc = get_memop(oi);
1147
1148
if (!reloc_pc24(lb->label_ptr[0], tcg_splitwx_to_rx(s->code_ptr))) {
1149
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_ld_direct(TCGContext *s, MemOp opc, TCGReg datalo,
1150
static void tcg_out_qemu_ld(TCGContext *s, const TCGArg *args, bool is64)
1151
{
1152
TCGReg addrlo, datalo, datahi, addrhi __attribute__((unused));
1153
- TCGMemOpIdx oi;
1154
+ MemOpIdx oi;
1155
MemOp opc;
1156
#ifdef CONFIG_SOFTMMU
1157
int mem_index;
1158
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_st_direct(TCGContext *s, MemOp opc, TCGReg datalo,
1159
static void tcg_out_qemu_st(TCGContext *s, const TCGArg *args, bool is64)
1160
{
1161
TCGReg addrlo, datalo, datahi, addrhi __attribute__((unused));
1162
- TCGMemOpIdx oi;
1163
+ MemOpIdx oi;
1164
MemOp opc;
1165
#ifdef CONFIG_SOFTMMU
1166
int mem_index;
1167
diff --git a/tcg/i386/tcg-target.c.inc b/tcg/i386/tcg-target.c.inc
1168
index XXXXXXX..XXXXXXX 100644
1169
--- a/tcg/i386/tcg-target.c.inc
1170
+++ b/tcg/i386/tcg-target.c.inc
1171
@@ -XXX,XX +XXX,XX @@ static inline void tcg_out_tlb_load(TCGContext *s, TCGReg addrlo, TCGReg addrhi,
1172
* for a load or store, so that we can later generate the correct helper code
1173
*/
1174
static void add_qemu_ldst_label(TCGContext *s, bool is_ld, bool is_64,
1175
- TCGMemOpIdx oi,
1176
+ MemOpIdx oi,
1177
TCGReg datalo, TCGReg datahi,
1178
TCGReg addrlo, TCGReg addrhi,
1179
tcg_insn_unit *raddr,
1180
@@ -XXX,XX +XXX,XX @@ static void add_qemu_ldst_label(TCGContext *s, bool is_ld, bool is_64,
1181
*/
1182
static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
1183
{
1184
- TCGMemOpIdx oi = l->oi;
1185
+ MemOpIdx oi = l->oi;
1186
MemOp opc = get_memop(oi);
1187
TCGReg data_reg;
1188
tcg_insn_unit **label_ptr = &l->label_ptr[0];
1189
@@ -XXX,XX +XXX,XX @@ static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
1190
*/
1191
static bool tcg_out_qemu_st_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
1192
{
1193
- TCGMemOpIdx oi = l->oi;
1194
+ MemOpIdx oi = l->oi;
1195
MemOp opc = get_memop(oi);
1196
MemOp s_bits = opc & MO_SIZE;
1197
tcg_insn_unit **label_ptr = &l->label_ptr[0];
1198
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_ld(TCGContext *s, const TCGArg *args, bool is64)
1199
{
1200
TCGReg datalo, datahi, addrlo;
1201
TCGReg addrhi __attribute__((unused));
1202
- TCGMemOpIdx oi;
1203
+ MemOpIdx oi;
1204
MemOp opc;
1205
#if defined(CONFIG_SOFTMMU)
1206
int mem_index;
1207
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_st(TCGContext *s, const TCGArg *args, bool is64)
1208
{
1209
TCGReg datalo, datahi, addrlo;
1210
TCGReg addrhi __attribute__((unused));
1211
- TCGMemOpIdx oi;
1212
+ MemOpIdx oi;
1213
MemOp opc;
1214
#if defined(CONFIG_SOFTMMU)
1215
int mem_index;
1216
diff --git a/tcg/mips/tcg-target.c.inc b/tcg/mips/tcg-target.c.inc
1217
index XXXXXXX..XXXXXXX 100644
1218
--- a/tcg/mips/tcg-target.c.inc
1219
+++ b/tcg/mips/tcg-target.c.inc
1220
@@ -XXX,XX +XXX,XX @@ QEMU_BUILD_BUG_ON(TLB_MASK_TABLE_OFS(0) < -32768);
1221
* Clobbers TMP0, TMP1, TMP2, TMP3.
1222
*/
1223
static void tcg_out_tlb_load(TCGContext *s, TCGReg base, TCGReg addrl,
1224
- TCGReg addrh, TCGMemOpIdx oi,
1225
+ TCGReg addrh, MemOpIdx oi,
1226
tcg_insn_unit *label_ptr[2], bool is_load)
1227
{
1228
MemOp opc = get_memop(oi);
1229
@@ -XXX,XX +XXX,XX @@ static void tcg_out_tlb_load(TCGContext *s, TCGReg base, TCGReg addrl,
1230
tcg_out_opc_reg(s, ALIAS_PADD, base, TCG_TMP2, addrl);
1231
}
1232
1233
-static void add_qemu_ldst_label(TCGContext *s, int is_ld, TCGMemOpIdx oi,
1234
+static void add_qemu_ldst_label(TCGContext *s, int is_ld, MemOpIdx oi,
1235
TCGType ext,
1236
TCGReg datalo, TCGReg datahi,
1237
TCGReg addrlo, TCGReg addrhi,
1238
@@ -XXX,XX +XXX,XX @@ static void add_qemu_ldst_label(TCGContext *s, int is_ld, TCGMemOpIdx oi,
1239
static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
1240
{
1241
const tcg_insn_unit *tgt_rx = tcg_splitwx_to_rx(s->code_ptr);
1242
- TCGMemOpIdx oi = l->oi;
1243
+ MemOpIdx oi = l->oi;
1244
MemOp opc = get_memop(oi);
1245
TCGReg v0;
1246
int i;
1247
@@ -XXX,XX +XXX,XX @@ static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
1248
static bool tcg_out_qemu_st_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
1249
{
1250
const tcg_insn_unit *tgt_rx = tcg_splitwx_to_rx(s->code_ptr);
1251
- TCGMemOpIdx oi = l->oi;
1252
+ MemOpIdx oi = l->oi;
1253
MemOp opc = get_memop(oi);
1254
MemOp s_bits = opc & MO_SIZE;
1255
int i;
1256
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_ld(TCGContext *s, const TCGArg *args, bool is_64)
1257
{
1258
TCGReg addr_regl, addr_regh __attribute__((unused));
1259
TCGReg data_regl, data_regh;
1260
- TCGMemOpIdx oi;
1261
+ MemOpIdx oi;
1262
MemOp opc;
1263
#if defined(CONFIG_SOFTMMU)
1264
tcg_insn_unit *label_ptr[2];
1265
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_st(TCGContext *s, const TCGArg *args, bool is_64)
1266
{
1267
TCGReg addr_regl, addr_regh __attribute__((unused));
1268
TCGReg data_regl, data_regh;
1269
- TCGMemOpIdx oi;
1270
+ MemOpIdx oi;
1271
MemOp opc;
1272
#if defined(CONFIG_SOFTMMU)
1273
tcg_insn_unit *label_ptr[2];
1274
diff --git a/tcg/ppc/tcg-target.c.inc b/tcg/ppc/tcg-target.c.inc
1275
index XXXXXXX..XXXXXXX 100644
1276
--- a/tcg/ppc/tcg-target.c.inc
1277
+++ b/tcg/ppc/tcg-target.c.inc
1278
@@ -XXX,XX +XXX,XX @@ static TCGReg tcg_out_tlb_read(TCGContext *s, MemOp opc,
1279
/* Record the context of a call to the out of line helper code for the slow
1280
path for a load or store, so that we can later generate the correct
1281
helper code. */
1282
-static void add_qemu_ldst_label(TCGContext *s, bool is_ld, TCGMemOpIdx oi,
1283
+static void add_qemu_ldst_label(TCGContext *s, bool is_ld, MemOpIdx oi,
1284
TCGReg datalo_reg, TCGReg datahi_reg,
1285
TCGReg addrlo_reg, TCGReg addrhi_reg,
1286
tcg_insn_unit *raddr, tcg_insn_unit *lptr)
1287
@@ -XXX,XX +XXX,XX @@ static void add_qemu_ldst_label(TCGContext *s, bool is_ld, TCGMemOpIdx oi,
1288
1289
static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1290
{
1291
- TCGMemOpIdx oi = lb->oi;
1292
+ MemOpIdx oi = lb->oi;
1293
MemOp opc = get_memop(oi);
1294
TCGReg hi, lo, arg = TCG_REG_R3;
1295
1296
@@ -XXX,XX +XXX,XX @@ static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1297
1298
static bool tcg_out_qemu_st_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1299
{
1300
- TCGMemOpIdx oi = lb->oi;
1301
+ MemOpIdx oi = lb->oi;
1302
MemOp opc = get_memop(oi);
1303
MemOp s_bits = opc & MO_SIZE;
1304
TCGReg hi, lo, arg = TCG_REG_R3;
1305
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_ld(TCGContext *s, const TCGArg *args, bool is_64)
1306
{
1307
TCGReg datalo, datahi, addrlo, rbase;
1308
TCGReg addrhi __attribute__((unused));
1309
- TCGMemOpIdx oi;
1310
+ MemOpIdx oi;
1311
MemOp opc, s_bits;
1312
#ifdef CONFIG_SOFTMMU
1313
int mem_index;
1314
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_st(TCGContext *s, const TCGArg *args, bool is_64)
1315
{
1316
TCGReg datalo, datahi, addrlo, rbase;
1317
TCGReg addrhi __attribute__((unused));
1318
- TCGMemOpIdx oi;
1319
+ MemOpIdx oi;
1320
MemOp opc, s_bits;
1321
#ifdef CONFIG_SOFTMMU
1322
int mem_index;
1323
diff --git a/tcg/riscv/tcg-target.c.inc b/tcg/riscv/tcg-target.c.inc
1324
index XXXXXXX..XXXXXXX 100644
1325
--- a/tcg/riscv/tcg-target.c.inc
1326
+++ b/tcg/riscv/tcg-target.c.inc
1327
@@ -XXX,XX +XXX,XX @@ static void tcg_out_mb(TCGContext *s, TCGArg a0)
1328
#include "../tcg-ldst.c.inc"
1329
1330
/* helper signature: helper_ret_ld_mmu(CPUState *env, target_ulong addr,
1331
- * TCGMemOpIdx oi, uintptr_t ra)
1332
+ * MemOpIdx oi, uintptr_t ra)
1333
*/
1334
static void * const qemu_ld_helpers[MO_SSIZE + 1] = {
1335
[MO_UB] = helper_ret_ldub_mmu,
1336
@@ -XXX,XX +XXX,XX @@ static void * const qemu_ld_helpers[MO_SSIZE + 1] = {
1337
};
1338
1339
/* helper signature: helper_ret_st_mmu(CPUState *env, target_ulong addr,
1340
- * uintxx_t val, TCGMemOpIdx oi,
1341
+ * uintxx_t val, MemOpIdx oi,
1342
* uintptr_t ra)
1343
*/
1344
static void * const qemu_st_helpers[MO_SIZE + 1] = {
1345
@@ -XXX,XX +XXX,XX @@ static void tcg_out_goto(TCGContext *s, const tcg_insn_unit *target)
1346
}
1347
1348
static void tcg_out_tlb_load(TCGContext *s, TCGReg addrl,
1349
- TCGReg addrh, TCGMemOpIdx oi,
1350
+ TCGReg addrh, MemOpIdx oi,
1351
tcg_insn_unit **label_ptr, bool is_load)
1352
{
1353
MemOp opc = get_memop(oi);
1354
@@ -XXX,XX +XXX,XX @@ static void tcg_out_tlb_load(TCGContext *s, TCGReg addrl,
1355
tcg_out_opc_reg(s, OPC_ADD, TCG_REG_TMP0, TCG_REG_TMP2, addrl);
1356
}
1357
1358
-static void add_qemu_ldst_label(TCGContext *s, int is_ld, TCGMemOpIdx oi,
1359
+static void add_qemu_ldst_label(TCGContext *s, int is_ld, MemOpIdx oi,
1360
TCGType ext,
1361
TCGReg datalo, TCGReg datahi,
1362
TCGReg addrlo, TCGReg addrhi,
1363
@@ -XXX,XX +XXX,XX @@ static void add_qemu_ldst_label(TCGContext *s, int is_ld, TCGMemOpIdx oi,
1364
1365
static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
1366
{
1367
- TCGMemOpIdx oi = l->oi;
1368
+ MemOpIdx oi = l->oi;
1369
MemOp opc = get_memop(oi);
1370
TCGReg a0 = tcg_target_call_iarg_regs[0];
1371
TCGReg a1 = tcg_target_call_iarg_regs[1];
1372
@@ -XXX,XX +XXX,XX @@ static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
1373
1374
static bool tcg_out_qemu_st_slow_path(TCGContext *s, TCGLabelQemuLdst *l)
1375
{
1376
- TCGMemOpIdx oi = l->oi;
1377
+ MemOpIdx oi = l->oi;
1378
MemOp opc = get_memop(oi);
1379
MemOp s_bits = opc & MO_SIZE;
1380
TCGReg a0 = tcg_target_call_iarg_regs[0];
1381
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_ld(TCGContext *s, const TCGArg *args, bool is_64)
1382
{
1383
TCGReg addr_regl, addr_regh __attribute__((unused));
1384
TCGReg data_regl, data_regh;
1385
- TCGMemOpIdx oi;
1386
+ MemOpIdx oi;
1387
MemOp opc;
1388
#if defined(CONFIG_SOFTMMU)
1389
tcg_insn_unit *label_ptr[1];
1390
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_st(TCGContext *s, const TCGArg *args, bool is_64)
1391
{
1392
TCGReg addr_regl, addr_regh __attribute__((unused));
1393
TCGReg data_regl, data_regh;
1394
- TCGMemOpIdx oi;
1395
+ MemOpIdx oi;
1396
MemOp opc;
1397
#if defined(CONFIG_SOFTMMU)
1398
tcg_insn_unit *label_ptr[1];
1399
diff --git a/tcg/s390/tcg-target.c.inc b/tcg/s390/tcg-target.c.inc
1400
index XXXXXXX..XXXXXXX 100644
1401
--- a/tcg/s390/tcg-target.c.inc
1402
+++ b/tcg/s390/tcg-target.c.inc
1403
@@ -XXX,XX +XXX,XX @@ static TCGReg tcg_out_tlb_read(TCGContext *s, TCGReg addr_reg, MemOp opc,
1404
return addr_reg;
1405
}
1406
1407
-static void add_qemu_ldst_label(TCGContext *s, bool is_ld, TCGMemOpIdx oi,
1408
+static void add_qemu_ldst_label(TCGContext *s, bool is_ld, MemOpIdx oi,
1409
TCGReg data, TCGReg addr,
1410
tcg_insn_unit *raddr, tcg_insn_unit *label_ptr)
1411
{
1412
@@ -XXX,XX +XXX,XX @@ static bool tcg_out_qemu_ld_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1413
{
1414
TCGReg addr_reg = lb->addrlo_reg;
1415
TCGReg data_reg = lb->datalo_reg;
1416
- TCGMemOpIdx oi = lb->oi;
1417
+ MemOpIdx oi = lb->oi;
1418
MemOp opc = get_memop(oi);
1419
1420
if (!patch_reloc(lb->label_ptr[0], R_390_PC16DBL,
1421
@@ -XXX,XX +XXX,XX @@ static bool tcg_out_qemu_st_slow_path(TCGContext *s, TCGLabelQemuLdst *lb)
1422
{
1423
TCGReg addr_reg = lb->addrlo_reg;
1424
TCGReg data_reg = lb->datalo_reg;
1425
- TCGMemOpIdx oi = lb->oi;
1426
+ MemOpIdx oi = lb->oi;
1427
MemOp opc = get_memop(oi);
1428
1429
if (!patch_reloc(lb->label_ptr[0], R_390_PC16DBL,
1430
@@ -XXX,XX +XXX,XX @@ static void tcg_prepare_user_ldst(TCGContext *s, TCGReg *addr_reg,
1431
#endif /* CONFIG_SOFTMMU */
1432
1433
static void tcg_out_qemu_ld(TCGContext* s, TCGReg data_reg, TCGReg addr_reg,
1434
- TCGMemOpIdx oi)
1435
+ MemOpIdx oi)
1436
{
1437
MemOp opc = get_memop(oi);
1438
#ifdef CONFIG_SOFTMMU
1439
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_ld(TCGContext* s, TCGReg data_reg, TCGReg addr_reg,
1440
}
1441
1442
static void tcg_out_qemu_st(TCGContext* s, TCGReg data_reg, TCGReg addr_reg,
1443
- TCGMemOpIdx oi)
1444
+ MemOpIdx oi)
1445
{
1446
MemOp opc = get_memop(oi);
1447
#ifdef CONFIG_SOFTMMU
1448
diff --git a/tcg/sparc/tcg-target.c.inc b/tcg/sparc/tcg-target.c.inc
1449
index XXXXXXX..XXXXXXX 100644
1450
--- a/tcg/sparc/tcg-target.c.inc
1451
+++ b/tcg/sparc/tcg-target.c.inc
1452
@@ -XXX,XX +XXX,XX @@ static const int qemu_st_opc[(MO_SIZE | MO_BSWAP) + 1] = {
1453
};
1454
1455
static void tcg_out_qemu_ld(TCGContext *s, TCGReg data, TCGReg addr,
1456
- TCGMemOpIdx oi, bool is_64)
1457
+ MemOpIdx oi, bool is_64)
1458
{
1459
MemOp memop = get_memop(oi);
1460
#ifdef CONFIG_SOFTMMU
1461
@@ -XXX,XX +XXX,XX @@ static void tcg_out_qemu_ld(TCGContext *s, TCGReg data, TCGReg addr,
1462
}
1463
1464
static void tcg_out_qemu_st(TCGContext *s, TCGReg data, TCGReg addr,
1465
- TCGMemOpIdx oi)
1466
+ MemOpIdx oi)
1467
{
1468
MemOp memop = get_memop(oi);
1469
#ifdef CONFIG_SOFTMMU
1470
diff --git a/tcg/tcg-ldst.c.inc b/tcg/tcg-ldst.c.inc
1471
index XXXXXXX..XXXXXXX 100644
1472
--- a/tcg/tcg-ldst.c.inc
1473
+++ b/tcg/tcg-ldst.c.inc
1474
@@ -XXX,XX +XXX,XX @@
1475
1476
typedef struct TCGLabelQemuLdst {
1477
bool is_ld; /* qemu_ld: true, qemu_st: false */
1478
- TCGMemOpIdx oi;
1479
+ MemOpIdx oi;
1480
TCGType type; /* result type of a load */
1481
TCGReg addrlo_reg; /* reg index for low word of guest virtual addr */
1482
TCGReg addrhi_reg; /* reg index for high word of guest virtual addr */
1483
--
65
--
1484
2.25.1
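
Since every hunk above is the same mechanical substitution, it may help to recall what the type actually is: a MemOpIdx packs a MemOp together with an mmu index in one integer. Below is a self-contained sketch of that round trip; the stand-in type definitions and the placeholder MemOp value are assumptions for illustration, only the 4-bit mmu-index packing used by make_memop_idx/get_memop/get_mmuidx is the point.

    /* Illustrative stand-ins; the real definitions live in exec/memop.h
     * and exec/memopidx.h. Only the packing scheme matters here. */
    #include <assert.h>

    typedef unsigned MemOp;
    typedef unsigned MemOpIdx;

    static inline MemOpIdx make_memop_idx(MemOp op, unsigned idx)
    {
        assert(idx <= 15);
        return (op << 4) | idx;    /* low 4 bits carry the mmu index */
    }

    static inline MemOp get_memop(MemOpIdx oi) { return oi >> 4; }
    static inline unsigned get_mmuidx(MemOpIdx oi) { return oi & 15; }

    int main(void)
    {
        MemOp mo = 0x2c;                     /* placeholder MemOp value */
        MemOpIdx oi = make_memop_idx(mo, 1);
        assert(get_memop(oi) == mo && get_mmuidx(oi) == 1);
        return 0;
    }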

}
tlb_addr = tlb_read_ofs(entry, elt_ofs);

+ flags = TLB_FLAGS_MASK;
page_addr = addr & TARGET_PAGE_MASK;
if (!tlb_hit_page(tlb_addr, page_addr)) {
if (!victim_tlb_hit(env, mmu_idx, index, elt_ofs, page_addr)) {
@@ -XXX,XX +XXX,XX @@ static int probe_access_internal(CPUArchState *env, target_ulong addr,

/* TLB resize via tlb_fill may have moved the entry. */
entry = tlb_entry(env, mmu_idx, addr);
+
+ /*
+ * With PAGE_WRITE_INV, we set TLB_INVALID_MASK immediately,
+ * to force the next access through tlb_fill. We've just
+ * called tlb_fill, so we know that this entry *is* valid.
+ */
+ flags &= ~TLB_INVALID_MASK;
}
tlb_addr = tlb_read_ofs(entry, elt_ofs);
}
- flags = tlb_addr & TLB_FLAGS_MASK;
+ flags &= tlb_addr;

/* Fold all "mmio-like" bits into TLB_MMIO. This is not RAM. */
if (unlikely(flags & ~(TLB_WATCHPOINT | TLB_NOTDIRTY))) {
diff --git a/target/s390x/tcg/mem_helper.c b/target/s390x/tcg/mem_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/s390x/tcg/mem_helper.c
+++ b/target/s390x/tcg/mem_helper.c
@@ -XXX,XX +XXX,XX @@ static int s390_probe_access(CPUArchState *env, target_ulong addr, int size,
#else
int flags;

- /*
- * For !CONFIG_USER_ONLY, we cannot rely on TLB_INVALID_MASK or haddr==NULL
- * to detect if there was an exception during tlb_fill().
- */
env->tlb_fill_exc = 0;
flags = probe_access_flags(env, addr, access_type, mmu_idx, nonfault, phost,
ra);
--
2.34.1
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/s390x/tcg-target-con-set.h | 1 +
tcg/s390x/tcg-target.h | 2 +-
tcg/s390x/tcg-target.c.inc | 20 ++++++++++++++++++++
3 files changed, 22 insertions(+), 1 deletion(-)

diff --git a/tcg/s390x/tcg-target-con-set.h b/tcg/s390x/tcg-target-con-set.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target-con-set.h
+++ b/tcg/s390x/tcg-target-con-set.h
@@ -XXX,XX +XXX,XX @@ C_O1_I2(r, r, ri)
C_O1_I2(r, rZ, r)
C_O1_I2(v, v, r)
C_O1_I2(v, v, v)
+C_O1_I3(v, v, v, v)
C_O1_I4(r, r, ri, r, 0)
C_O1_I4(r, r, ri, rI, 0)
C_O2_I2(b, a, 0, r)
diff --git a/tcg/s390x/tcg-target.h b/tcg/s390x/tcg-target.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.h
+++ b/tcg/s390x/tcg-target.h
@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities[3];
#define TCG_TARGET_HAS_mul_vec 1
#define TCG_TARGET_HAS_sat_vec 0
#define TCG_TARGET_HAS_minmax_vec 1
-#define TCG_TARGET_HAS_bitsel_vec 0
+#define TCG_TARGET_HAS_bitsel_vec 1
#define TCG_TARGET_HAS_cmpsel_vec 0

/* used for function call generation */
diff --git a/tcg/s390x/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.c.inc
+++ b/tcg/s390x/tcg-target.c.inc
@@ -XXX,XX +XXX,XX @@ typedef enum S390Opcode {
VRRa_VUPH = 0xe7d7,
VRRa_VUPL = 0xe7d6,
VRRc_VX = 0xe76d,
+ VRRe_VSEL = 0xe78d,
VRRf_VLVGP = 0xe762,

VRSa_VERLL = 0xe733,
@@ -XXX,XX +XXX,XX @@ static void tcg_out_insn_VRRc(TCGContext *s, S390Opcode op,
tcg_out16(s, (op & 0x00ff) | RXB(v1, v2, v3, 0) | (m4 << 12));
}

+static void tcg_out_insn_VRRe(TCGContext *s, S390Opcode op,
+ TCGReg v1, TCGReg v2, TCGReg v3, TCGReg v4)
+{
+ tcg_debug_assert(is_vector_reg(v1));
+ tcg_debug_assert(is_vector_reg(v2));
+ tcg_debug_assert(is_vector_reg(v3));
+ tcg_debug_assert(is_vector_reg(v4));
+ tcg_out16(s, (op & 0xff00) | ((v1 & 0xf) << 4) | (v2 & 0xf));
+ tcg_out16(s, v3 << 12);
+ tcg_out16(s, (op & 0x00ff) | RXB(v1, v2, v3, v4) | (v4 << 12));
+}
+
static void tcg_out_insn_VRRf(TCGContext *s, S390Opcode op,
TCGReg v1, TCGReg r2, TCGReg r3)
{
@@ -XXX,XX +XXX,XX @@ static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc,
tcg_out_insn(s, VRRc, VMXL, a0, a1, a2, vece);
break;

+ case INDEX_op_bitsel_vec:
+ tcg_out_insn(s, VRRe, VSEL, a0, a1, a2, args[3]);
+ break;
+
case INDEX_op_cmp_vec:
switch ((TCGCond)args[3]) {
case TCG_COND_EQ:
@@ -XXX,XX +XXX,XX @@ int tcg_can_emit_vec_op(TCGOpcode opc, TCGType type, unsigned vece)
case INDEX_op_add_vec:
case INDEX_op_and_vec:
case INDEX_op_andc_vec:
+ case INDEX_op_bitsel_vec:
case INDEX_op_neg_vec:
case INDEX_op_not_vec:
case INDEX_op_or_vec:
@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
case INDEX_op_shrs_vec:
case INDEX_op_sars_vec:
return C_O1_I2(v, v, r);
+ case INDEX_op_bitsel_vec:
+ return C_O1_I3(v, v, v, v);

default:
g_assert_not_reached();
--
2.25.1

Add an interface to return the CPUTLBEntryFull struct
that goes with the lookup. The result is not intended
to be valid across multiple lookups, so the user must
use the results immediately.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
include/exec/exec-all.h | 15 +++++++++++++
include/qemu/typedefs.h | 1 +
accel/tcg/cputlb.c | 47 +++++++++++++++++++++++++----------------
3 files changed, 45 insertions(+), 18 deletions(-)

diff --git a/include/exec/exec-all.h b/include/exec/exec-all.h
index XXXXXXX..XXXXXXX 100644
--- a/include/exec/exec-all.h
+++ b/include/exec/exec-all.h
@@ -XXX,XX +XXX,XX @@ int probe_access_flags(CPUArchState *env, target_ulong addr,
MMUAccessType access_type, int mmu_idx,
bool nonfault, void **phost, uintptr_t retaddr);

+#ifndef CONFIG_USER_ONLY
+/**
+ * probe_access_full:
+ * Like probe_access_flags, except also return into @pfull.
+ *
+ * The CPUTLBEntryFull structure returned via @pfull is transient
+ * and must be consumed or copied immediately, before any further
+ * access or changes to TLB @mmu_idx.
+ */
+int probe_access_full(CPUArchState *env, target_ulong addr,
+ MMUAccessType access_type, int mmu_idx,
+ bool nonfault, void **phost,
+ CPUTLBEntryFull **pfull, uintptr_t retaddr);
+#endif
+
#define CODE_GEN_ALIGN 16 /* must be >= of the size of a icache line */

/* Estimated block size for TB allocation. */
diff --git a/include/qemu/typedefs.h b/include/qemu/typedefs.h
index XXXXXXX..XXXXXXX 100644
--- a/include/qemu/typedefs.h
+++ b/include/qemu/typedefs.h
@@ -XXX,XX +XXX,XX @@ typedef struct ConfidentialGuestSupport ConfidentialGuestSupport;
typedef struct CPUAddressSpace CPUAddressSpace;
typedef struct CPUArchState CPUArchState;
typedef struct CPUState CPUState;
+typedef struct CPUTLBEntryFull CPUTLBEntryFull;
typedef struct DeviceListener DeviceListener;
typedef struct DeviceState DeviceState;
typedef struct DirtyBitmapSnapshot DirtyBitmapSnapshot;
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ static void notdirty_write(CPUState *cpu, vaddr mem_vaddr, unsigned size,
static int probe_access_internal(CPUArchState *env, target_ulong addr,
int fault_size, MMUAccessType access_type,
int mmu_idx, bool nonfault,
- void **phost, uintptr_t retaddr)
+ void **phost, CPUTLBEntryFull **pfull,
+ uintptr_t retaddr)
{
uintptr_t index = tlb_index(env, mmu_idx, addr);
CPUTLBEntry *entry = tlb_entry(env, mmu_idx, addr);
@@ -XXX,XX +XXX,XX @@ static int probe_access_internal(CPUArchState *env, target_ulong addr,
mmu_idx, nonfault, retaddr)) {
/* Non-faulting page table read failed. */
*phost = NULL;
+ *pfull = NULL;
return TLB_INVALID_MASK;
}

/* TLB resize via tlb_fill may have moved the entry. */
+ index = tlb_index(env, mmu_idx, addr);
entry = tlb_entry(env, mmu_idx, addr);

/*
@@ -XXX,XX +XXX,XX @@ static int probe_access_internal(CPUArchState *env, target_ulong addr,
}
flags &= tlb_addr;

+ *pfull = &env_tlb(env)->d[mmu_idx].fulltlb[index];
+
/* Fold all "mmio-like" bits into TLB_MMIO. This is not RAM. */
if (unlikely(flags & ~(TLB_WATCHPOINT | TLB_NOTDIRTY))) {
*phost = NULL;
@@ -XXX,XX +XXX,XX @@ static int probe_access_internal(CPUArchState *env, target_ulong addr,
return flags;
}

-int probe_access_flags(CPUArchState *env, target_ulong addr,
- MMUAccessType access_type, int mmu_idx,
- bool nonfault, void **phost, uintptr_t retaddr)
+int probe_access_full(CPUArchState *env, target_ulong addr,
+ MMUAccessType access_type, int mmu_idx,
+ bool nonfault, void **phost, CPUTLBEntryFull **pfull,
+ uintptr_t retaddr)
{
- int flags;
-
- flags = probe_access_internal(env, addr, 0, access_type, mmu_idx,
- nonfault, phost, retaddr);
+ int flags = probe_access_internal(env, addr, 0, access_type, mmu_idx,
+ nonfault, phost, pfull, retaddr);

/* Handle clean RAM pages. */
if (unlikely(flags & TLB_NOTDIRTY)) {
- uintptr_t index = tlb_index(env, mmu_idx, addr);
- CPUTLBEntryFull *full = &env_tlb(env)->d[mmu_idx].fulltlb[index];
-
- notdirty_write(env_cpu(env), addr, 1, full, retaddr);
+ notdirty_write(env_cpu(env), addr, 1, *pfull, retaddr);
flags &= ~TLB_NOTDIRTY;
}

return flags;
}

+int probe_access_flags(CPUArchState *env, target_ulong addr,
+ MMUAccessType access_type, int mmu_idx,
+ bool nonfault, void **phost, uintptr_t retaddr)
+{
+ CPUTLBEntryFull *full;
+
+ return probe_access_full(env, addr, access_type, mmu_idx,
+ nonfault, phost, &full, retaddr);
+}
+
void *probe_access(CPUArchState *env, target_ulong addr, int size,
MMUAccessType access_type, int mmu_idx, uintptr_t retaddr)
{
+ CPUTLBEntryFull *full;
void *host;
int flags;

g_assert(-(addr | TARGET_PAGE_MASK) >= size);

flags = probe_access_internal(env, addr, size, access_type, mmu_idx,
- false, &host, retaddr);
+ false, &host, &full, retaddr);

/* Per the interface, size == 0 merely faults the access. */
if (size == 0) {
@@ -XXX,XX +XXX,XX @@ void *probe_access(CPUArchState *env, target_ulong addr, int size,
}

if (unlikely(flags & (TLB_NOTDIRTY | TLB_WATCHPOINT))) {
- uintptr_t index = tlb_index(env, mmu_idx, addr);
- CPUTLBEntryFull *full = &env_tlb(env)->d[mmu_idx].fulltlb[index];
-
/* Handle watchpoints. */
if (flags & TLB_WATCHPOINT) {
int wp_access = (access_type == MMU_DATA_STORE
@@ -XXX,XX +XXX,XX @@ void *probe_access(CPUArchState *env, target_ulong addr, int size,
void *tlb_vaddr_to_host(CPUArchState *env, abi_ptr addr,
MMUAccessType access_type, int mmu_idx)
{
+ CPUTLBEntryFull *full;
void *host;
int flags;

flags = probe_access_internal(env, addr, 0, access_type,
- mmu_idx, true, &host, 0);
+ mmu_idx, true, &host, &full, 0);

/* No combination of flags are expected by the caller. */
return flags ? NULL : host;
@@ -XXX,XX +XXX,XX @@ void *tlb_vaddr_to_host(CPUArchState *env, abi_ptr addr,
tb_page_addr_t get_page_addr_code_hostp(CPUArchState *env, target_ulong addr,
void **hostp)
{
+ CPUTLBEntryFull *full;
void *p;

(void)probe_access_internal(env, addr, 1, MMU_INST_FETCH,
- cpu_mmu_index(env, true), false, &p, 0);
+ cpu_mmu_index(env, true), false, &p, &full, 0);
if (p == NULL) {
return -1;
}
--
2.34.1
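
To make the transience contract concrete, here is a usage sketch (not part of the patch): a hypothetical helper probes an address and copies what it needs out of the CPUTLBEntryFull before doing anything else with the TLB. The helper name is invented, and it leans on the @phys_addr field that a later patch in this series adds to the structure.

    /* Hypothetical caller of probe_access_full(); only the call pattern
     * is the point. Assumes the @phys_addr field added later on. */
    static bool query_phys_addr(CPUArchState *env, target_ulong addr,
                                int mmu_idx, uintptr_t ra, hwaddr *phys)
    {
        CPUTLBEntryFull *full;
        void *host;
        int flags = probe_access_full(env, addr, MMU_DATA_LOAD, mmu_idx,
                                      true, &host, &full, ra);

        if (flags & TLB_INVALID_MASK) {
            return false;              /* non-faulting lookup failed */
        }
        /* Consume @full immediately: the next lookup may invalidate it. */
        *phys = full->phys_addr | (addr & ~TARGET_PAGE_MASK);
        return true;
    }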
We will shortly use the MemOpIdx directly, but in the meantime
re-compute the trace meminfo.

Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
accel/tcg/atomic_template.h | 48 +++++++++++++++++------------------
accel/tcg/atomic_common.c.inc | 30 +++++++++++-----------
2 files changed, 39 insertions(+), 39 deletions(-)

diff --git a/accel/tcg/atomic_template.h b/accel/tcg/atomic_template.h
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/atomic_template.h
+++ b/accel/tcg/atomic_template.h
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(cmpxchg)(CPUArchState *env, target_ulong addr,
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ | PAGE_WRITE, retaddr);
DATA_TYPE ret;
- uint16_t info = atomic_trace_rmw_pre(env, addr, oi);

+ atomic_trace_rmw_pre(env, addr, oi);
#if DATA_SIZE == 16
ret = atomic16_cmpxchg(haddr, cmpv, newv);
#else
ret = qatomic_cmpxchg__nocheck(haddr, cmpv, newv);
#endif
ATOMIC_MMU_CLEANUP;
- atomic_trace_rmw_post(env, addr, info);
+ atomic_trace_rmw_post(env, addr, oi);
return ret;
}

@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(ld)(CPUArchState *env, target_ulong addr,
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ, retaddr);
DATA_TYPE val;
- uint16_t info = atomic_trace_ld_pre(env, addr, oi);

+ atomic_trace_ld_pre(env, addr, oi);
val = atomic16_read(haddr);
ATOMIC_MMU_CLEANUP;
- atomic_trace_ld_post(env, addr, info);
+ atomic_trace_ld_post(env, addr, oi);
return val;
}

@@ -XXX,XX +XXX,XX @@ void ATOMIC_NAME(st)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_WRITE, retaddr);
- uint16_t info = atomic_trace_st_pre(env, addr, oi);

+ atomic_trace_st_pre(env, addr, oi);
atomic16_set(haddr, val);
ATOMIC_MMU_CLEANUP;
- atomic_trace_st_post(env, addr, info);
+ atomic_trace_st_post(env, addr, oi);
}
#endif
#else
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(xchg)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ | PAGE_WRITE, retaddr);
DATA_TYPE ret;
- uint16_t info = atomic_trace_rmw_pre(env, addr, oi);

+ atomic_trace_rmw_pre(env, addr, oi);
ret = qatomic_xchg__nocheck(haddr, val);
ATOMIC_MMU_CLEANUP;
- atomic_trace_rmw_post(env, addr, info);
+ atomic_trace_rmw_post(env, addr, oi);
return ret;
}

@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE, \
PAGE_READ | PAGE_WRITE, retaddr); \
DATA_TYPE ret; \
- uint16_t info = atomic_trace_rmw_pre(env, addr, oi); \
+ atomic_trace_rmw_pre(env, addr, oi); \
ret = qatomic_##X(haddr, val); \
ATOMIC_MMU_CLEANUP; \
- atomic_trace_rmw_post(env, addr, info); \
+ atomic_trace_rmw_post(env, addr, oi); \
return ret; \
}

@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
XDATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE, \
PAGE_READ | PAGE_WRITE, retaddr); \
XDATA_TYPE cmp, old, new, val = xval; \
- uint16_t info = atomic_trace_rmw_pre(env, addr, oi); \
+ atomic_trace_rmw_pre(env, addr, oi); \
smp_mb(); \
cmp = qatomic_read__nocheck(haddr); \
do { \
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
cmp = qatomic_cmpxchg__nocheck(haddr, old, new); \
} while (cmp != old); \
ATOMIC_MMU_CLEANUP; \
- atomic_trace_rmw_post(env, addr, info); \
+ atomic_trace_rmw_post(env, addr, oi); \
return RET; \
}

@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(cmpxchg)(CPUArchState *env, target_ulong addr,
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ | PAGE_WRITE, retaddr);
DATA_TYPE ret;
- uint16_t info = atomic_trace_rmw_pre(env, addr, oi);

+ atomic_trace_rmw_pre(env, addr, oi);
#if DATA_SIZE == 16
ret = atomic16_cmpxchg(haddr, BSWAP(cmpv), BSWAP(newv));
#else
ret = qatomic_cmpxchg__nocheck(haddr, BSWAP(cmpv), BSWAP(newv));
#endif
ATOMIC_MMU_CLEANUP;
- atomic_trace_rmw_post(env, addr, info);
+ atomic_trace_rmw_post(env, addr, oi);
return BSWAP(ret);
}

@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(ld)(CPUArchState *env, target_ulong addr,
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ, retaddr);
DATA_TYPE val;
- uint16_t info = atomic_trace_ld_pre(env, addr, oi);

+ atomic_trace_ld_pre(env, addr, oi);
val = atomic16_read(haddr);
ATOMIC_MMU_CLEANUP;
- atomic_trace_ld_post(env, addr, info);
+ atomic_trace_ld_post(env, addr, oi);
return BSWAP(val);
}

@@ -XXX,XX +XXX,XX @@ void ATOMIC_NAME(st)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
{
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_WRITE, retaddr);
- uint16_t info = atomic_trace_st_pre(env, addr, oi);

+ atomic_trace_st_pre(env, addr, oi);
val = BSWAP(val);
atomic16_set(haddr, val);
ATOMIC_MMU_CLEANUP;
- atomic_trace_st_post(env, addr, info);
+ atomic_trace_st_post(env, addr, oi);
}
#endif
#else
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(xchg)(CPUArchState *env, target_ulong addr, ABI_TYPE val,
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE,
PAGE_READ | PAGE_WRITE, retaddr);
ABI_TYPE ret;
- uint16_t info = atomic_trace_rmw_pre(env, addr, oi);

+ atomic_trace_rmw_pre(env, addr, oi);
ret = qatomic_xchg__nocheck(haddr, BSWAP(val));
ATOMIC_MMU_CLEANUP;
- atomic_trace_rmw_post(env, addr, info);
+ atomic_trace_rmw_post(env, addr, oi);
return BSWAP(ret);
}

@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
DATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE, \
PAGE_READ | PAGE_WRITE, retaddr); \
DATA_TYPE ret; \
- uint16_t info = atomic_trace_rmw_pre(env, addr, oi); \
+ atomic_trace_rmw_pre(env, addr, oi); \
ret = qatomic_##X(haddr, BSWAP(val)); \
ATOMIC_MMU_CLEANUP; \
- atomic_trace_rmw_post(env, addr, info); \
+ atomic_trace_rmw_post(env, addr, oi); \
return BSWAP(ret); \
}

@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
XDATA_TYPE *haddr = atomic_mmu_lookup(env, addr, oi, DATA_SIZE, \
PAGE_READ | PAGE_WRITE, retaddr); \
XDATA_TYPE ldo, ldn, old, new, val = xval; \
- uint16_t info = atomic_trace_rmw_pre(env, addr, oi); \
+ atomic_trace_rmw_pre(env, addr, oi); \
smp_mb(); \
ldn = qatomic_read__nocheck(haddr); \
do { \
@@ -XXX,XX +XXX,XX @@ ABI_TYPE ATOMIC_NAME(X)(CPUArchState *env, target_ulong addr, \
ldn = qatomic_cmpxchg__nocheck(haddr, ldo, BSWAP(new)); \
} while (ldo != ldn); \
ATOMIC_MMU_CLEANUP; \
- atomic_trace_rmw_post(env, addr, info); \
+ atomic_trace_rmw_post(env, addr, oi); \
return RET; \
}

diff --git a/accel/tcg/atomic_common.c.inc b/accel/tcg/atomic_common.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/atomic_common.c.inc
+++ b/accel/tcg/atomic_common.c.inc
@@ -XXX,XX +XXX,XX @@
* See the COPYING file in the top-level directory.
*/

-static uint16_t atomic_trace_rmw_pre(CPUArchState *env, target_ulong addr,
- MemOpIdx oi)
+static void atomic_trace_rmw_pre(CPUArchState *env, target_ulong addr,
+ MemOpIdx oi)
{
CPUState *cpu = env_cpu(env);
uint16_t info = trace_mem_get_info(oi, false);

trace_guest_mem_before_exec(cpu, addr, info);
trace_guest_mem_before_exec(cpu, addr, info | TRACE_MEM_ST);
-
- return info;
}

static void atomic_trace_rmw_post(CPUArchState *env, target_ulong addr,
- uint16_t info)
+ MemOpIdx oi)
{
+ uint16_t info = trace_mem_get_info(oi, false);
+
qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, info);
qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, info | TRACE_MEM_ST);
}

#if HAVE_ATOMIC128
-static uint16_t atomic_trace_ld_pre(CPUArchState *env, target_ulong addr,
- MemOpIdx oi)
+static void atomic_trace_ld_pre(CPUArchState *env, target_ulong addr,
+ MemOpIdx oi)
{
uint16_t info = trace_mem_get_info(oi, false);

trace_guest_mem_before_exec(env_cpu(env), addr, info);
-
- return info;
}

static void atomic_trace_ld_post(CPUArchState *env, target_ulong addr,
- uint16_t info)
+ MemOpIdx oi)
{
+ uint16_t info = trace_mem_get_info(oi, false);
+
qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, info);
}

-static uint16_t atomic_trace_st_pre(CPUArchState *env, target_ulong addr,
- MemOpIdx oi)
+static void atomic_trace_st_pre(CPUArchState *env, target_ulong addr,
+ MemOpIdx oi)
{
uint16_t info = trace_mem_get_info(oi, true);

trace_guest_mem_before_exec(env_cpu(env), addr, info);
-
- return info;
}

static void atomic_trace_st_post(CPUArchState *env, target_ulong addr,
- uint16_t info)
+ MemOpIdx oi)
{
+ uint16_t info = trace_mem_get_info(oi, false);
+
qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, info);
}
#endif
--
2.25.1

Now that we have collected all of the page data into
CPUTLBEntryFull, provide an interface to record that
all in one go, instead of using 4 arguments. This interface
allows CPUTLBEntryFull to be extended without having to
change the number of arguments.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
include/exec/cpu-defs.h | 14 +++++++++++
include/exec/exec-all.h | 22 ++++++++++++++++++
accel/tcg/cputlb.c | 51 ++++++++++++++++++++++++++---------------
3 files changed, 69 insertions(+), 18 deletions(-)

diff --git a/include/exec/cpu-defs.h b/include/exec/cpu-defs.h
index XXXXXXX..XXXXXXX 100644
--- a/include/exec/cpu-defs.h
+++ b/include/exec/cpu-defs.h
@@ -XXX,XX +XXX,XX @@ typedef struct CPUTLBEntryFull {
* + the offset within the target MemoryRegion (otherwise)
*/
hwaddr xlat_section;
+
+ /*
+ * @phys_addr contains the physical address in the address space
+ * given by cpu_asidx_from_attrs(cpu, @attrs).
+ */
+ hwaddr phys_addr;
+
+ /* @attrs contains the memory transaction attributes for the page. */
MemTxAttrs attrs;
+
+ /* @prot contains the complete protections for the page. */
+ uint8_t prot;
+
+ /* @lg_page_size contains the log2 of the page size. */
+ uint8_t lg_page_size;
} CPUTLBEntryFull;

/*
diff --git a/include/exec/exec-all.h b/include/exec/exec-all.h
index XXXXXXX..XXXXXXX 100644
--- a/include/exec/exec-all.h
+++ b/include/exec/exec-all.h
@@ -XXX,XX +XXX,XX @@ void tlb_flush_range_by_mmuidx_all_cpus_synced(CPUState *cpu,
uint16_t idxmap,
unsigned bits);

+/**
+ * tlb_set_page_full:
+ * @cpu: CPU context
+ * @mmu_idx: mmu index of the tlb to modify
+ * @vaddr: virtual address of the entry to add
+ * @full: the details of the tlb entry
+ *
+ * Add an entry to @cpu tlb index @mmu_idx. All of the fields of
+ * @full must be filled, except for xlat_section, and constitute
+ * the complete description of the translated page.
+ *
+ * This is generally called by the target tlb_fill function after
+ * having performed a successful page table walk to find the physical
+ * address and attributes for the translation.
+ *
+ * At most one entry for a given virtual address is permitted. Only a
+ * single TARGET_PAGE_SIZE region is mapped; @full->lg_page_size is only
+ * used by tlb_flush_page.
+ */
+void tlb_set_page_full(CPUState *cpu, int mmu_idx, target_ulong vaddr,
+ CPUTLBEntryFull *full);
+
/**
* tlb_set_page_with_attrs:
* @cpu: CPU to add this TLB entry for
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ static void tlb_add_large_page(CPUArchState *env, int mmu_idx,
env_tlb(env)->d[mmu_idx].large_page_mask = lp_mask;
}

-/* Add a new TLB entry. At most one entry for a given virtual address
+/*
+ * Add a new TLB entry. At most one entry for a given virtual address
* is permitted. Only a single TARGET_PAGE_SIZE region is mapped, the
* supplied size is only used by tlb_flush_page.
*
* Called from TCG-generated code, which is under an RCU read-side
* critical section.
*/
-void tlb_set_page_with_attrs(CPUState *cpu, target_ulong vaddr,
- hwaddr paddr, MemTxAttrs attrs, int prot,
- int mmu_idx, target_ulong size)
+void tlb_set_page_full(CPUState *cpu, int mmu_idx,
+ target_ulong vaddr, CPUTLBEntryFull *full)
{
CPUArchState *env = cpu->env_ptr;
CPUTLB *tlb = env_tlb(env);
@@ -XXX,XX +XXX,XX @@ void tlb_set_page_with_attrs(CPUState *cpu, target_ulong vaddr,
CPUTLBEntry *te, tn;
hwaddr iotlb, xlat, sz, paddr_page;
target_ulong vaddr_page;
- int asidx = cpu_asidx_from_attrs(cpu, attrs);
- int wp_flags;
+ int asidx, wp_flags, prot;
bool is_ram, is_romd;

assert_cpu_is_self(cpu);

- if (size <= TARGET_PAGE_SIZE) {
+ if (full->lg_page_size <= TARGET_PAGE_BITS) {
sz = TARGET_PAGE_SIZE;
} else {
- tlb_add_large_page(env, mmu_idx, vaddr, size);
- sz = size;
+ sz = (hwaddr)1 << full->lg_page_size;
+ tlb_add_large_page(env, mmu_idx, vaddr, sz);
}
vaddr_page = vaddr & TARGET_PAGE_MASK;
- paddr_page = paddr & TARGET_PAGE_MASK;
+ paddr_page = full->phys_addr & TARGET_PAGE_MASK;

+ prot = full->prot;
+ asidx = cpu_asidx_from_attrs(cpu, full->attrs);
section = address_space_translate_for_iotlb(cpu, asidx, paddr_page,
- &xlat, &sz, attrs, &prot);
+ &xlat, &sz, full->attrs, &prot);
assert(sz >= TARGET_PAGE_SIZE);

tlb_debug("vaddr=" TARGET_FMT_lx " paddr=0x" TARGET_FMT_plx
" prot=%x idx=%d\n",
- vaddr, paddr, prot, mmu_idx);
+ vaddr, full->phys_addr, prot, mmu_idx);

address = vaddr_page;
- if (size < TARGET_PAGE_SIZE) {
+ if (full->lg_page_size < TARGET_PAGE_BITS) {
/* Repeat the MMU check and TLB fill on every access. */
address |= TLB_INVALID_MASK;
}
- if (attrs.byte_swap) {
+ if (full->attrs.byte_swap) {
address |= TLB_BSWAP;
}

@@ -XXX,XX +XXX,XX @@ void tlb_set_page_with_attrs(CPUState *cpu, target_ulong vaddr,
* subtract here is that of the page base, and not the same as the
* vaddr we add back in io_readx()/io_writex()/get_page_addr_code().
*/
+ desc->fulltlb[index] = *full;
desc->fulltlb[index].xlat_section = iotlb - vaddr_page;
- desc->fulltlb[index].attrs = attrs;
+ desc->fulltlb[index].phys_addr = paddr_page;
+ desc->fulltlb[index].prot = prot;

/* Now calculate the new entry */
tn.addend = addend - vaddr_page;
@@ -XXX,XX +XXX,XX @@ void tlb_set_page_with_attrs(CPUState *cpu, target_ulong vaddr,
qemu_spin_unlock(&tlb->c.lock);
}

-/* Add a new TLB entry, but without specifying the memory
- * transaction attributes to be used.
- */
+void tlb_set_page_with_attrs(CPUState *cpu, target_ulong vaddr,
+ hwaddr paddr, MemTxAttrs attrs, int prot,
+ int mmu_idx, target_ulong size)
+{
+ CPUTLBEntryFull full = {
+ .phys_addr = paddr,
+ .attrs = attrs,
+ .prot = prot,
+ .lg_page_size = ctz64(size)
+ };
+
+ assert(is_power_of_2(size));
+ tlb_set_page_full(cpu, mmu_idx, vaddr, &full);
+}
+
void tlb_set_page(CPUState *cpu, target_ulong vaddr,
hwaddr paddr, int prot,
int mmu_idx, target_ulong size)
--
2.34.1
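
As a sketch of the intended call pattern (placeholder page-table-walk results, not patch text), a target tlb_fill would now build the structure on the stack and record everything with a single call:

    /* Sketch: fill a CPUTLBEntryFull from a (placeholder) page table walk
     * and hand the whole thing to tlb_set_page_full() at once. */
    static void example_tlb_fill(CPUState *cs, target_ulong vaddr, int mmu_idx,
                                 hwaddr paddr, int prot, unsigned lg_page_size)
    {
        CPUTLBEntryFull full = {
            .phys_addr = paddr & TARGET_PAGE_MASK,
            .attrs = MEMTXATTRS_UNSPECIFIED,
            .prot = prot,
            .lg_page_size = lg_page_size,
        };

        /* xlat_section is the one field filled in by cputlb itself. */
        tlb_set_page_full(cs, mmu_idx, vaddr & TARGET_PAGE_MASK, &full);
    }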
Despite the comment, the members were not kept at the end.
1
Allow the target to cache items from the guest page tables.
2
2
3
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
4
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
3
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
5
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
4
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
6
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
5
---
7
---
6
include/hw/core/cpu.h | 11 +++++++----
8
include/exec/cpu-defs.h | 9 +++++++++
7
1 file changed, 7 insertions(+), 4 deletions(-)
9
1 file changed, 9 insertions(+)
8
10
9
diff --git a/include/hw/core/cpu.h b/include/hw/core/cpu.h
11
diff --git a/include/exec/cpu-defs.h b/include/exec/cpu-defs.h
10
index XXXXXXX..XXXXXXX 100644
12
index XXXXXXX..XXXXXXX 100644
11
--- a/include/hw/core/cpu.h
13
--- a/include/exec/cpu-defs.h
12
+++ b/include/hw/core/cpu.h
14
+++ b/include/exec/cpu-defs.h
13
@@ -XXX,XX +XXX,XX @@ struct CPUClass {
15
@@ -XXX,XX +XXX,XX @@ typedef struct CPUTLBEntryFull {
14
ObjectClass *(*class_by_name)(const char *cpu_model);
16
15
void (*parse_features)(const char *typename, char *str, Error **errp);
17
/* @lg_page_size contains the log2 of the page size. */
16
18
uint8_t lg_page_size;
17
- int reset_dump_flags;
18
bool (*has_work)(CPUState *cpu);
19
int (*memory_rw_debug)(CPUState *cpu, vaddr addr,
20
uint8_t *buf, int len, bool is_write);
21
@@ -XXX,XX +XXX,XX @@ struct CPUClass {
22
void (*disas_set_info)(CPUState *cpu, disassemble_info *info);
23
24
const char *deprecation_note;
25
- /* Keep non-pointer data at the end to minimize holes. */
26
- int gdb_num_core_regs;
27
- bool gdb_stop_before_watchpoint;
28
struct AccelCPUClass *accel_cpu;
29
30
/* when system emulation is not available, this pointer is NULL */
31
@@ -XXX,XX +XXX,XX @@ struct CPUClass {
32
* class data that depends on the accelerator, see accel/accel-common.c.
33
*/
34
void (*init_accel_cpu)(struct AccelCPUClass *accel_cpu, CPUClass *cc);
35
+
19
+
36
+ /*
20
+ /*
37
+ * Keep non-pointer data at the end to minimize holes.
21
+ * Allow target-specific additions to this structure.
22
+ * This may be used to cache items from the guest cpu
23
+ * page tables for later use by the implementation.
38
+ */
24
+ */
39
+ int reset_dump_flags;
25
+#ifdef TARGET_PAGE_ENTRY_EXTRA
40
+ int gdb_num_core_regs;
26
+ TARGET_PAGE_ENTRY_EXTRA
41
+ bool gdb_stop_before_watchpoint;
27
+#endif
42
};
28
} CPUTLBEntryFull;
43
29
44
/*
30
/*
45
--
31
--
46
2.25.1
32
2.34.1
47
33
48
34
diff view generated by jsdifflib
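The motivation for keeping non-pointer data at the end is alignment padding. A hypothetical illustration (not QEMU code) of the hole a mixed layout creates on an LP64 host:

    #include <stdbool.h>

    struct Bad {                /* sizeof == 32 */
        void (*fn)(void);       /* 8 bytes */
        bool flag;              /* 1 byte + 7 bytes padding */
        void (*fn2)(void);      /* 8 bytes */
        int n;                  /* 4 bytes + 4 bytes tail padding */
    };

    struct Good {               /* sizeof == 24 */
        void (*fn)(void);
        void (*fn2)(void);
        int n;                  /* 4 bytes */
        bool flag;              /* 1 byte + 3 bytes tail padding */
    };

Grouping the scalars after the pointers lets them share one padded tail instead of opening a hole per member.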
We will shortly need to be able to check facilities beyond the
first 64. Instead of explicitly masking against s390_facilities,
create a HAVE_FACILITY macro that indexes an array.

Reviewed-by: David Hildenbrand <david@redhat.com>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
v2: Change name to HAVE_FACILITY (david)
---
tcg/s390x/tcg-target.h | 29 ++++++++-------
tcg/s390x/tcg-target.c.inc | 74 +++++++++++++++++++-------------------
2 files changed, 52 insertions(+), 51 deletions(-)

diff --git a/tcg/s390x/tcg-target.h b/tcg/s390x/tcg-target.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.h
+++ b/tcg/s390x/tcg-target.h
@@ -XXX,XX +XXX,XX @@ typedef enum TCGReg {
/* A list of relevant facilities used by this translator. Some of these
are required for proper operation, and these are checked at startup. */

-#define FACILITY_ZARCH_ACTIVE (1ULL << (63 - 2))
-#define FACILITY_LONG_DISP (1ULL << (63 - 18))
-#define FACILITY_EXT_IMM (1ULL << (63 - 21))
-#define FACILITY_GEN_INST_EXT (1ULL << (63 - 34))
-#define FACILITY_LOAD_ON_COND (1ULL << (63 - 45))
+#define FACILITY_ZARCH_ACTIVE 2
+#define FACILITY_LONG_DISP 18
+#define FACILITY_EXT_IMM 21
+#define FACILITY_GEN_INST_EXT 34
+#define FACILITY_LOAD_ON_COND 45
#define FACILITY_FAST_BCR_SER FACILITY_LOAD_ON_COND
#define FACILITY_DISTINCT_OPS FACILITY_LOAD_ON_COND
-#define FACILITY_LOAD_ON_COND2 (1ULL << (63 - 53))
+#define FACILITY_LOAD_ON_COND2 53

-extern uint64_t s390_facilities;
+extern uint64_t s390_facilities[1];
+
+#define HAVE_FACILITY(X) \
+ ((s390_facilities[FACILITY_##X / 64] >> (63 - FACILITY_##X % 64)) & 1)

/* optional instructions */
#define TCG_TARGET_HAS_div2_i32 1
@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities;
#define TCG_TARGET_HAS_clz_i32 0
#define TCG_TARGET_HAS_ctz_i32 0
#define TCG_TARGET_HAS_ctpop_i32 0
-#define TCG_TARGET_HAS_deposit_i32 (s390_facilities & FACILITY_GEN_INST_EXT)
-#define TCG_TARGET_HAS_extract_i32 (s390_facilities & FACILITY_GEN_INST_EXT)
+#define TCG_TARGET_HAS_deposit_i32 HAVE_FACILITY(GEN_INST_EXT)
+#define TCG_TARGET_HAS_extract_i32 HAVE_FACILITY(GEN_INST_EXT)
#define TCG_TARGET_HAS_sextract_i32 0
#define TCG_TARGET_HAS_extract2_i32 0
#define TCG_TARGET_HAS_movcond_i32 1
@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities;
#define TCG_TARGET_HAS_mulsh_i32 0
#define TCG_TARGET_HAS_extrl_i64_i32 0
#define TCG_TARGET_HAS_extrh_i64_i32 0
-#define TCG_TARGET_HAS_direct_jump (s390_facilities & FACILITY_GEN_INST_EXT)
+#define TCG_TARGET_HAS_direct_jump HAVE_FACILITY(GEN_INST_EXT)
#define TCG_TARGET_HAS_qemu_st8_i32 0

#define TCG_TARGET_HAS_div2_i64 1
@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities;
#define TCG_TARGET_HAS_eqv_i64 0
#define TCG_TARGET_HAS_nand_i64 0
#define TCG_TARGET_HAS_nor_i64 0
-#define TCG_TARGET_HAS_clz_i64 (s390_facilities & FACILITY_EXT_IMM)
+#define TCG_TARGET_HAS_clz_i64 HAVE_FACILITY(EXT_IMM)
#define TCG_TARGET_HAS_ctz_i64 0
#define TCG_TARGET_HAS_ctpop_i64 0
-#define TCG_TARGET_HAS_deposit_i64 (s390_facilities & FACILITY_GEN_INST_EXT)
-#define TCG_TARGET_HAS_extract_i64 (s390_facilities & FACILITY_GEN_INST_EXT)
+#define TCG_TARGET_HAS_deposit_i64 HAVE_FACILITY(GEN_INST_EXT)
+#define TCG_TARGET_HAS_extract_i64 HAVE_FACILITY(GEN_INST_EXT)
#define TCG_TARGET_HAS_sextract_i64 0
#define TCG_TARGET_HAS_extract2_i64 0
#define TCG_TARGET_HAS_movcond_i64 1
diff --git a/tcg/s390x/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.c.inc
+++ b/tcg/s390x/tcg-target.c.inc
@@ -XXX,XX +XXX,XX @@
We don't need this when we have pc-relative loads with the general
instructions extension facility. */
#define TCG_REG_TB TCG_REG_R12
-#define USE_REG_TB (!(s390_facilities & FACILITY_GEN_INST_EXT))
+#define USE_REG_TB (!HAVE_FACILITY(GEN_INST_EXT))

#ifndef CONFIG_SOFTMMU
#define TCG_GUEST_BASE_REG TCG_REG_R13
@@ -XXX,XX +XXX,XX @@ static void * const qemu_st_helpers[(MO_SIZE | MO_BSWAP) + 1] = {
#endif

static const tcg_insn_unit *tb_ret_addr;
-uint64_t s390_facilities;
+uint64_t s390_facilities[1];

static bool patch_reloc(tcg_insn_unit *src_rw, int type,
intptr_t value, intptr_t addend)
@@ -XXX,XX +XXX,XX @@ static void tcg_out_movi_int(TCGContext *s, TCGType type, TCGReg ret,
}

/* Try all 48-bit insns that can load it in one go. */
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
if (sval == (int32_t)sval) {
tcg_out_insn(s, RIL, LGFI, ret, sval);
return;
@@ -XXX,XX +XXX,XX @@ static void tcg_out_movi_int(TCGContext *s, TCGType type, TCGReg ret,
}

/* Otherwise, stuff it in the constant pool. */
- if (s390_facilities & FACILITY_GEN_INST_EXT) {
+ if (HAVE_FACILITY(GEN_INST_EXT)) {
tcg_out_insn(s, RIL, LGRL, ret, 0);
new_pool_label(s, sval, R_390_PC32DBL, s->code_ptr - 2, 2);
} else if (USE_REG_TB && !in_prologue) {
@@ -XXX,XX +XXX,XX @@ static void tcg_out_ld_abs(TCGContext *s, TCGType type,
{
intptr_t addr = (intptr_t)abs;

- if ((s390_facilities & FACILITY_GEN_INST_EXT) && !(addr & 1)) {
+ if (HAVE_FACILITY(GEN_INST_EXT) && !(addr & 1)) {
ptrdiff_t disp = tcg_pcrel_diff(s, abs) >> 1;
if (disp == (int32_t)disp) {
if (type == TCG_TYPE_I32) {
@@ -XXX,XX +XXX,XX @@ static inline void tcg_out_risbg(TCGContext *s, TCGReg dest, TCGReg src,

static void tgen_ext8s(TCGContext *s, TCGType type, TCGReg dest, TCGReg src)
{
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
tcg_out_insn(s, RRE, LGBR, dest, src);
return;
}
@@ -XXX,XX +XXX,XX @@ static void tgen_ext8s(TCGContext *s, TCGType type, TCGReg dest, TCGReg src)

static void tgen_ext8u(TCGContext *s, TCGType type, TCGReg dest, TCGReg src)
{
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
tcg_out_insn(s, RRE, LLGCR, dest, src);
return;
}
@@ -XXX,XX +XXX,XX @@ static void tgen_ext8u(TCGContext *s, TCGType type, TCGReg dest, TCGReg src)

static void tgen_ext16s(TCGContext *s, TCGType type, TCGReg dest, TCGReg src)
{
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
tcg_out_insn(s, RRE, LGHR, dest, src);
return;
}
@@ -XXX,XX +XXX,XX @@ static void tgen_ext16s(TCGContext *s, TCGType type, TCGReg dest, TCGReg src)

static void tgen_ext16u(TCGContext *s, TCGType type, TCGReg dest, TCGReg src)
{
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
tcg_out_insn(s, RRE, LLGHR, dest, src);
return;
}
@@ -XXX,XX +XXX,XX @@ static void tgen_andi(TCGContext *s, TCGType type, TCGReg dest, uint64_t val)
tgen_ext32u(s, dest, dest);
return;
}
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
if ((val & valid) == 0xff) {
tgen_ext8u(s, TCG_TYPE_I64, dest, dest);
return;
@@ -XXX,XX +XXX,XX @@ static void tgen_andi(TCGContext *s, TCGType type, TCGReg dest, uint64_t val)
}

/* Try all 48-bit insns that can perform it in one go. */
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
for (i = 0; i < 2; i++) {
tcg_target_ulong mask = ~(0xffffffffull << i*32);
if (((val | ~valid) & mask) == mask) {
@@ -XXX,XX +XXX,XX @@ static void tgen_andi(TCGContext *s, TCGType type, TCGReg dest, uint64_t val)
}
}
}
- if ((s390_facilities & FACILITY_GEN_INST_EXT) && risbg_mask(val)) {
+ if (HAVE_FACILITY(GEN_INST_EXT) && risbg_mask(val)) {
tgen_andi_risbg(s, dest, dest, val);
return;
}
@@ -XXX,XX +XXX,XX @@ static void tgen_ori(TCGContext *s, TCGType type, TCGReg dest, uint64_t val)
}

/* Try all 48-bit insns that can perform it in one go. */
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
for (i = 0; i < 2; i++) {
tcg_target_ulong mask = (0xffffffffull << i*32);
if ((val & mask) != 0 && (val & ~mask) == 0) {
@@ -XXX,XX +XXX,XX @@ static void tgen_ori(TCGContext *s, TCGType type, TCGReg dest, uint64_t val)
/* Perform the OR via sequential modifications to the high and
low parts. Do this via recursion to handle 16-bit vs 32-bit
masks in each half. */
- tcg_debug_assert(s390_facilities & FACILITY_EXT_IMM);
+ tcg_debug_assert(HAVE_FACILITY(EXT_IMM));
tgen_ori(s, type, dest, val & 0x00000000ffffffffull);
tgen_ori(s, type, dest, val & 0xffffffff00000000ull);
}
@@ -XXX,XX +XXX,XX @@ static void tgen_ori(TCGContext *s, TCGType type, TCGReg dest, uint64_t val)
static void tgen_xori(TCGContext *s, TCGType type, TCGReg dest, uint64_t val)
{
/* Try all 48-bit insns that can perform it in one go. */
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
if ((val & 0xffffffff00000000ull) == 0) {
tcg_out_insn(s, RIL, XILF, dest, val);
return;
@@ -XXX,XX +XXX,XX @@ static void tgen_xori(TCGContext *s, TCGType type, TCGReg dest, uint64_t val)
tcg_tbrel_diff(s, NULL));
} else {
/* Perform the xor by parts. */
- tcg_debug_assert(s390_facilities & FACILITY_EXT_IMM);
+ tcg_debug_assert(HAVE_FACILITY(EXT_IMM));
if (val & 0xffffffff) {
tcg_out_insn(s, RIL, XILF, dest, val);
}
@@ -XXX,XX +XXX,XX @@ static int tgen_cmp(TCGContext *s, TCGType type, TCGCond c, TCGReg r1,
goto exit;
}

- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
if (type == TCG_TYPE_I32) {
op = (is_unsigned ? RIL_CLFI : RIL_CFI);
tcg_out_insn_RIL(s, op, r1, c2);
@@ -XXX,XX +XXX,XX @@ static void tgen_setcond(TCGContext *s, TCGType type, TCGCond cond,
bool have_loc;

/* With LOC2, we can always emit the minimum 3 insns. */
- if (s390_facilities & FACILITY_LOAD_ON_COND2) {
+ if (HAVE_FACILITY(LOAD_ON_COND2)) {
/* Emit: d = 0, d = (cc ? 1 : d). */
cc = tgen_cmp(s, type, cond, c1, c2, c2const, false);
tcg_out_movi(s, TCG_TYPE_I64, dest, 0);
@@ -XXX,XX +XXX,XX @@ static void tgen_setcond(TCGContext *s, TCGType type, TCGCond cond,
return;
}

- have_loc = (s390_facilities & FACILITY_LOAD_ON_COND) != 0;
+ have_loc = HAVE_FACILITY(LOAD_ON_COND);

/* For HAVE_LOC, only the paths through GTU/GT/LEU/LE are smaller. */
restart:
@@ -XXX,XX +XXX,XX @@ static void tgen_movcond(TCGContext *s, TCGType type, TCGCond c, TCGReg dest,
TCGArg v3, int v3const)
{
int cc;
- if (s390_facilities & FACILITY_LOAD_ON_COND) {
+ if (HAVE_FACILITY(LOAD_ON_COND)) {
cc = tgen_cmp(s, type, c, c1, c2, c2const, false);
if (v3const) {
tcg_out_insn(s, RIE, LOCGHI, dest, v3, cc);
@@ -XXX,XX +XXX,XX @@ static void tgen_clz(TCGContext *s, TCGReg dest, TCGReg a1,
} else {
tcg_out_mov(s, TCG_TYPE_I64, dest, a2);
}
- if (s390_facilities & FACILITY_LOAD_ON_COND) {
+ if (HAVE_FACILITY(LOAD_ON_COND)) {
/* Emit: if (one bit found) dest = r0. */
tcg_out_insn(s, RRF, LOCGR, dest, TCG_REG_R0, 2);
} else {
@@ -XXX,XX +XXX,XX @@ static void tgen_brcond(TCGContext *s, TCGType type, TCGCond c,
{
int cc;

- if (s390_facilities & FACILITY_GEN_INST_EXT) {
+ if (HAVE_FACILITY(GEN_INST_EXT)) {
bool is_unsigned = is_unsigned_cond(c);
bool in_range;
S390Opcode opc;
@@ -XXX,XX +XXX,XX @@ static TCGReg tcg_out_tlb_read(TCGContext *s, TCGReg addr_reg, MemOp opc,
cross pages using the address of the last byte of the access. */
a_off = (a_bits >= s_bits ? 0 : s_mask - a_mask);
tlb_mask = (uint64_t)TARGET_PAGE_MASK | a_mask;
- if ((s390_facilities & FACILITY_GEN_INST_EXT) && a_off == 0) {
+ if (HAVE_FACILITY(GEN_INST_EXT) && a_off == 0) {
tgen_andi_risbg(s, TCG_REG_R3, addr_reg, tlb_mask);
} else {
tcg_out_insn(s, RX, LA, TCG_REG_R3, addr_reg, TCG_REG_NONE, a_off);
@@ -XXX,XX +XXX,XX @@ static inline void tcg_out_op(TCGContext *s, TCGOpcode opc,
tcg_out_insn(s, RI, AHI, a0, a2);
break;
}
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
tcg_out_insn(s, RIL, AFI, a0, a2);
break;
}
@@ -XXX,XX +XXX,XX @@ static inline void tcg_out_op(TCGContext *s, TCGOpcode opc,
tcg_out_insn(s, RI, AGHI, a0, a2);
break;
}
- if (s390_facilities & FACILITY_EXT_IMM) {
+ if (HAVE_FACILITY(EXT_IMM)) {
if (a2 == (int32_t)a2) {
tcg_out_insn(s, RIL, AGFI, a0, a2);
break;
@@ -XXX,XX +XXX,XX @@ static inline void tcg_out_op(TCGContext *s, TCGOpcode opc,
/* The host memory model is quite strong, we simply need to
serialize the instruction stream. */
if (args[0] & TCG_MO_ST_LD) {
- tcg_out_insn(s, RR, BCR,
- s390_facilities & FACILITY_FAST_BCR_SER ? 14 : 15, 0);
+ tcg_out_insn(s, RR, BCR, HAVE_FACILITY(FAST_BCR_SER) ? 14 : 15, 0);
}
break;

@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
case INDEX_op_or_i64:
case INDEX_op_xor_i32:
case INDEX_op_xor_i64:
- return (s390_facilities & FACILITY_DISTINCT_OPS
+ return (HAVE_FACILITY(DISTINCT_OPS)
? C_O1_I2(r, r, ri)
: C_O1_I2(r, 0, ri));

@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
/* If we have the general-instruction-extensions, then we have
MULTIPLY SINGLE IMMEDIATE with a signed 32-bit, otherwise we
have only MULTIPLY HALFWORD IMMEDIATE, with a signed 16-bit. */
- return (s390_facilities & FACILITY_GEN_INST_EXT
+ return (HAVE_FACILITY(GEN_INST_EXT)
? C_O1_I2(r, 0, ri)
: C_O1_I2(r, 0, rI));

case INDEX_op_mul_i64:
- return (s390_facilities & FACILITY_GEN_INST_EXT
+ return (HAVE_FACILITY(GEN_INST_EXT)
? C_O1_I2(r, 0, rJ)
: C_O1_I2(r, 0, rI));

case INDEX_op_shl_i32:
case INDEX_op_shr_i32:
case INDEX_op_sar_i32:
- return (s390_facilities & FACILITY_DISTINCT_OPS
+ return (HAVE_FACILITY(DISTINCT_OPS)
? C_O1_I2(r, r, ri)
: C_O1_I2(r, 0, ri));

@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)

case INDEX_op_movcond_i32:
case INDEX_op_movcond_i64:
- return (s390_facilities & FACILITY_LOAD_ON_COND2
+ return (HAVE_FACILITY(LOAD_ON_COND2)
? C_O1_I4(r, r, ri, rI, 0)
: C_O1_I4(r, r, ri, r, 0));

@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)

case INDEX_op_add2_i32:
case INDEX_op_sub2_i32:
- return (s390_facilities & FACILITY_EXT_IMM
+ return (HAVE_FACILITY(EXT_IMM)
? C_O2_I4(r, r, 0, 1, ri, r)
: C_O2_I4(r, r, 0, 1, r, r));

case INDEX_op_add2_i64:
case INDEX_op_sub2_i64:
- return (s390_facilities & FACILITY_EXT_IMM
+ return (HAVE_FACILITY(EXT_IMM)
? C_O2_I4(r, r, 0, 1, rA, r)
: C_O2_I4(r, r, 0, 1, r, r));

@@ -XXX,XX +XXX,XX @@ static void query_s390_facilities(void)
/* Is STORE FACILITY LIST EXTENDED available? Honestly, I believe this
is present on all 64-bit systems, but let's check for it anyway. */
if (hwcap & HWCAP_S390_STFLE) {
- register int r0 __asm__("0");
- register void *r1 __asm__("1");
+ register int r0 __asm__("0") = ARRAY_SIZE(s390_facilities) - 1;
+ register void *r1 __asm__("1") = s390_facilities;

/* stfle 0(%r1) */
- r1 = &s390_facilities;
asm volatile(".word 0xb2b0,0x1000"
- : "=r"(r0) : "0"(0), "r"(r1) : "memory", "cc");
+ : "=r"(r0) : "r"(r0), "r"(r1) : "memory", "cc");
}
}
--
2.25.1

This bitmap is created and discarded immediately.
We gain nothing by its existence.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
Message-Id: <20220822232338.1727934-2-richard.henderson@linaro.org>
---
accel/tcg/translate-all.c | 78 ++-------------------------------------
1 file changed, 4 insertions(+), 74 deletions(-)

diff --git a/accel/tcg/translate-all.c b/accel/tcg/translate-all.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/translate-all.c
+++ b/accel/tcg/translate-all.c
@@ -XXX,XX +XXX,XX @@
#define assert_memory_lock() tcg_debug_assert(have_mmap_lock())
#endif

-#define SMC_BITMAP_USE_THRESHOLD 10
-
typedef struct PageDesc {
/* list of TBs intersecting this ram page */
uintptr_t first_tb;
-#ifdef CONFIG_SOFTMMU
- /* in order to optimize self modifying code, we count the number
- of lookups we do to a given page to use a bitmap */
- unsigned long *code_bitmap;
- unsigned int code_write_count;
-#else
+#ifdef CONFIG_USER_ONLY
unsigned long flags;
void *target_data;
#endif
-#ifndef CONFIG_USER_ONLY
+#ifdef CONFIG_SOFTMMU
QemuSpin lock;
#endif
} PageDesc;
@@ -XXX,XX +XXX,XX @@ void tb_htable_init(void)
qht_init(&tb_ctx.htable, tb_cmp, CODE_GEN_HTABLE_SIZE, mode);
}

-/* call with @p->lock held */
-static inline void invalidate_page_bitmap(PageDesc *p)
-{
- assert_page_locked(p);
-#ifdef CONFIG_SOFTMMU
- g_free(p->code_bitmap);
- p->code_bitmap = NULL;
- p->code_write_count = 0;
-#endif
-}
-
/* Set to NULL all the 'first_tb' fields in all PageDescs. */
static void page_flush_tb_1(int level, void **lp)
{
@@ -XXX,XX +XXX,XX @@ static void page_flush_tb_1(int level, void **lp)
for (i = 0; i < V_L2_SIZE; ++i) {
page_lock(&pd[i]);
pd[i].first_tb = (uintptr_t)NULL;
- invalidate_page_bitmap(pd + i);
page_unlock(&pd[i]);
}
} else {
@@ -XXX,XX +XXX,XX @@ static void do_tb_phys_invalidate(TranslationBlock *tb, bool rm_from_page_list)
if (rm_from_page_list) {
p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
tb_page_remove(p, tb);
- invalidate_page_bitmap(p);
if (tb->page_addr[1] != -1) {
p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
tb_page_remove(p, tb);
- invalidate_page_bitmap(p);
}
}

@@ -XXX,XX +XXX,XX @@ void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
}
}

-#ifdef CONFIG_SOFTMMU
-/* call with @p->lock held */
-static void build_page_bitmap(PageDesc *p)
-{
- int n, tb_start, tb_end;
- TranslationBlock *tb;
-
- assert_page_locked(p);
- p->code_bitmap = bitmap_new(TARGET_PAGE_SIZE);
-
- PAGE_FOR_EACH_TB(p, tb, n) {
- /* NOTE: this is subtle as a TB may span two physical pages */
- if (n == 0) {
- /* NOTE: tb_end may be after the end of the page, but
- it is not a problem */
- tb_start = tb->pc & ~TARGET_PAGE_MASK;
- tb_end = tb_start + tb->size;
- if (tb_end > TARGET_PAGE_SIZE) {
- tb_end = TARGET_PAGE_SIZE;
- }
- } else {
- tb_start = 0;
- tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
- }
- bitmap_set(p->code_bitmap, tb_start, tb_end - tb_start);
- }
-}
-#endif
-
/* add the tb in the target page and protect it if necessary
*
* Called with mmap_lock held for user-mode emulation.
@@ -XXX,XX +XXX,XX @@ static inline void tb_page_add(PageDesc *p, TranslationBlock *tb,
page_already_protected = p->first_tb != (uintptr_t)NULL;
#endif
p->first_tb = (uintptr_t)tb | n;
- invalidate_page_bitmap(p);

#if defined(CONFIG_USER_ONLY)
/* translator_loop() must have made all TB pages non-writable */
@@ -XXX,XX +XXX,XX @@ tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
/* remove TB from the page(s) if we couldn't insert it */
if (unlikely(existing_tb)) {
tb_page_remove(p, tb);
- invalidate_page_bitmap(p);
if (p2) {
tb_page_remove(p2, tb);
- invalidate_page_bitmap(p2);
}
tb = existing_tb;
}
@@ -XXX,XX +XXX,XX @@ tb_invalidate_phys_page_range__locked(struct page_collection *pages,
#if !defined(CONFIG_USER_ONLY)
/* if no code remaining, no need to continue to use slow writes */
if (!p->first_tb) {
- invalidate_page_bitmap(p);
tlb_unprotect_code(start);
}
#endif
@@ -XXX,XX +XXX,XX @@ void tb_invalidate_phys_page_fast(struct page_collection *pages,
}

assert_page_locked(p);
- if (!p->code_bitmap &&
- ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD) {
- build_page_bitmap(p);
- }
- if (p->code_bitmap) {
- unsigned int nr;
- unsigned long b;
-
- nr = start & ~TARGET_PAGE_MASK;
- b = p->code_bitmap[BIT_WORD(nr)] >> (nr & (BITS_PER_LONG - 1));
- if (b & ((1 << len) - 1)) {
- goto do_invalidate;
- }
- } else {
- do_invalidate:
- tb_invalidate_phys_page_range__locked(pages, p, start, start + len,
- retaddr);
- }
+ tb_invalidate_phys_page_range__locked(pages, p, start, start + len,
+ retaddr);
}
#else
/* Called with mmap_lock held. If pc is not 0 then it indicates the
--
2.34.1
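A note on the HAVE_FACILITY() scheme above: STFLE stores the facility list as big-endian doublewords, so facility number N lives at bit (63 - N % 64) of word N / 64. A standalone sketch of the same computation with a hypothetical two-word list:

    #include <stdint.h>

    static uint64_t facilities[2];  /* doublewords as stored by STFLE */

    static inline int have_facility(int nr)
    {
        return (facilities[nr / 64] >> (63 - nr % 64)) & 1;
    }

    /* e.g. the vector facility is number 129, i.e. bit 1 of the
       second doubleword, which only the array form can reach. */

This is why the representation changes from single-bit masks to plain facility numbers: numbers >= 64 cannot be expressed as a bit within one uint64_t.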
Implementing add, sub, and, or, xor as the minimal set.
This allows us to actually enable vectors in query_s390_facilities.

Reviewed-by: David Hildenbrand <david@redhat.com>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/s390x/tcg-target.c.inc | 154 ++++++++++++++++++++++++++++++++++++-
1 file changed, 150 insertions(+), 4 deletions(-)

diff --git a/tcg/s390x/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.c.inc
+++ b/tcg/s390x/tcg-target.c.inc
@@ -XXX,XX +XXX,XX @@ typedef enum S390Opcode {
VRIc_VREP = 0xe74d,

VRRa_VLR = 0xe756,
+ VRRc_VA = 0xe7f3,
+ VRRc_VCEQ = 0xe7f8, /* we leave the m5 cs field 0 */
+ VRRc_VCH = 0xe7fb, /* " */
+ VRRc_VCHL = 0xe7f9, /* " */
+ VRRc_VN = 0xe768,
+ VRRc_VO = 0xe76a,
+ VRRc_VS = 0xe7f7,
+ VRRc_VX = 0xe76d,
VRRf_VLVGP = 0xe762,

VRSb_VLVG = 0xe722,
@@ -XXX,XX +XXX,XX @@ static void tcg_out_insn_VRRa(TCGContext *s, S390Opcode op,
tcg_out32(s, (op & 0x00ff) | RXB(v1, v2, 0, 0) | (m3 << 12));
}

+static void tcg_out_insn_VRRc(TCGContext *s, S390Opcode op,
+ TCGReg v1, TCGReg v2, TCGReg v3, int m4)
+{
+ tcg_debug_assert(is_vector_reg(v1));
+ tcg_debug_assert(is_vector_reg(v2));
+ tcg_debug_assert(is_vector_reg(v3));
+ tcg_out16(s, (op & 0xff00) | ((v1 & 0xf) << 4) | (v2 & 0xf));
+ tcg_out16(s, v3 << 12);
+ tcg_out16(s, (op & 0x00ff) | RXB(v1, v2, v3, 0) | (m4 << 12));
+}
+
static void tcg_out_insn_VRRf(TCGContext *s, S390Opcode op,
TCGReg v1, TCGReg r2, TCGReg r3)
{
@@ -XXX,XX +XXX,XX @@ static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc,
unsigned vecl, unsigned vece,
const TCGArg *args, const int *const_args)
{
- g_assert_not_reached();
+ TCGType type = vecl + TCG_TYPE_V64;
+ TCGArg a0 = args[0], a1 = args[1], a2 = args[2];
+
+ switch (opc) {
+ case INDEX_op_ld_vec:
+ tcg_out_ld(s, type, a0, a1, a2);
+ break;
+ case INDEX_op_st_vec:
+ tcg_out_st(s, type, a0, a1, a2);
+ break;
+ case INDEX_op_dupm_vec:
+ tcg_out_dupm_vec(s, type, vece, a0, a1, a2);
+ break;
+
+ case INDEX_op_add_vec:
+ tcg_out_insn(s, VRRc, VA, a0, a1, a2, vece);
+ break;
+ case INDEX_op_sub_vec:
+ tcg_out_insn(s, VRRc, VS, a0, a1, a2, vece);
+ break;
+ case INDEX_op_and_vec:
+ tcg_out_insn(s, VRRc, VN, a0, a1, a2, 0);
+ break;
+ case INDEX_op_or_vec:
+ tcg_out_insn(s, VRRc, VO, a0, a1, a2, 0);
+ break;
+ case INDEX_op_xor_vec:
+ tcg_out_insn(s, VRRc, VX, a0, a1, a2, 0);
+ break;
+
+ case INDEX_op_cmp_vec:
+ switch ((TCGCond)args[3]) {
+ case TCG_COND_EQ:
+ tcg_out_insn(s, VRRc, VCEQ, a0, a1, a2, vece);
+ break;
+ case TCG_COND_GT:
+ tcg_out_insn(s, VRRc, VCH, a0, a1, a2, vece);
+ break;
+ case TCG_COND_GTU:
+ tcg_out_insn(s, VRRc, VCHL, a0, a1, a2, vece);
+ break;
+ default:
+ g_assert_not_reached();
+ }
+ break;
+
+ case INDEX_op_mov_vec: /* Always emitted via tcg_out_mov. */
+ case INDEX_op_dup_vec: /* Always emitted via tcg_out_dup_vec. */
+ default:
+ g_assert_not_reached();
+ }
}

int tcg_can_emit_vec_op(TCGOpcode opc, TCGType type, unsigned vece)
{
- return 0;
+ switch (opc) {
+ case INDEX_op_add_vec:
+ case INDEX_op_and_vec:
+ case INDEX_op_or_vec:
+ case INDEX_op_sub_vec:
+ case INDEX_op_xor_vec:
+ return 1;
+ case INDEX_op_cmp_vec:
+ return -1;
+ default:
+ return 0;
+ }
+}
+
+static bool expand_vec_cmp_noinv(TCGType type, unsigned vece, TCGv_vec v0,
+ TCGv_vec v1, TCGv_vec v2, TCGCond cond)
+{
+ bool need_swap = false, need_inv = false;
+
+ switch (cond) {
+ case TCG_COND_EQ:
+ case TCG_COND_GT:
+ case TCG_COND_GTU:
+ break;
+ case TCG_COND_NE:
+ case TCG_COND_LE:
+ case TCG_COND_LEU:
+ need_inv = true;
+ break;
+ case TCG_COND_LT:
+ case TCG_COND_LTU:
+ need_swap = true;
+ break;
+ case TCG_COND_GE:
+ case TCG_COND_GEU:
+ need_swap = need_inv = true;
+ break;
+ default:
+ g_assert_not_reached();
+ }
+
+ if (need_inv) {
+ cond = tcg_invert_cond(cond);
+ }
+ if (need_swap) {
+ TCGv_vec t1;
+ t1 = v1, v1 = v2, v2 = t1;
+ cond = tcg_swap_cond(cond);
+ }
+
+ vec_gen_4(INDEX_op_cmp_vec, type, vece, tcgv_vec_arg(v0),
+ tcgv_vec_arg(v1), tcgv_vec_arg(v2), cond);
+
+ return need_inv;
+}
+
+static void expand_vec_cmp(TCGType type, unsigned vece, TCGv_vec v0,
+ TCGv_vec v1, TCGv_vec v2, TCGCond cond)
+{
+ if (expand_vec_cmp_noinv(type, vece, v0, v1, v2, cond)) {
+ tcg_gen_not_vec(vece, v0, v0);
+ }
}

void tcg_expand_vec_op(TCGOpcode opc, TCGType type, unsigned vece,
TCGArg a0, ...)
{
- g_assert_not_reached();
+ va_list va;
+ TCGv_vec v0, v1, v2;
+
+ va_start(va, a0);
+ v0 = temp_tcgv_vec(arg_temp(a0));
+ v1 = temp_tcgv_vec(arg_temp(va_arg(va, TCGArg)));
+ v2 = temp_tcgv_vec(arg_temp(va_arg(va, TCGArg)));
+
+ switch (opc) {
+ case INDEX_op_cmp_vec:
+ expand_vec_cmp(type, vece, v0, v1, v2, va_arg(va, TCGArg));
+ break;
+
+ default:
+ g_assert_not_reached();
+ }
+ va_end(va);
}

static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
@@ -XXX,XX +XXX,XX @@ static void query_s390_facilities(void)
* There is nothing else we currently care about in the 3rd word, so
* disable VECTOR with one store.
*/
- if (1 || !(hwcap & HWCAP_S390_VXRS)) {
+ if (!(hwcap & HWCAP_S390_VXRS)) {
s390_facilities[2] = 0;
}
}
--
2.25.1

Bool is more appropriate type for the alloc parameter.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
accel/tcg/translate-all.c | 14 +++++++-------
1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/accel/tcg/translate-all.c b/accel/tcg/translate-all.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/translate-all.c
+++ b/accel/tcg/translate-all.c
@@ -XXX,XX +XXX,XX @@ void page_init(void)
#endif
}

-static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
+static PageDesc *page_find_alloc(tb_page_addr_t index, bool alloc)
{
PageDesc *pd;
void **lp;
@@ -XXX,XX +XXX,XX @@ static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)

static inline PageDesc *page_find(tb_page_addr_t index)
{
- return page_find_alloc(index, 0);
+ return page_find_alloc(index, false);
}

static void page_lock_pair(PageDesc **ret_p1, tb_page_addr_t phys1,
- PageDesc **ret_p2, tb_page_addr_t phys2, int alloc);
+ PageDesc **ret_p2, tb_page_addr_t phys2, bool alloc);

/* In user-mode page locks aren't used; mmap_lock is enough */
#ifdef CONFIG_USER_ONLY
@@ -XXX,XX +XXX,XX @@ static inline void page_unlock(PageDesc *pd)
/* lock the page(s) of a TB in the correct acquisition order */
static inline void page_lock_tb(const TranslationBlock *tb)
{
- page_lock_pair(NULL, tb->page_addr[0], NULL, tb->page_addr[1], 0);
+ page_lock_pair(NULL, tb->page_addr[0], NULL, tb->page_addr[1], false);
}

static inline void page_unlock_tb(const TranslationBlock *tb)
@@ -XXX,XX +XXX,XX @@ void page_collection_unlock(struct page_collection *set)
#endif /* !CONFIG_USER_ONLY */

static void page_lock_pair(PageDesc **ret_p1, tb_page_addr_t phys1,
- PageDesc **ret_p2, tb_page_addr_t phys2, int alloc)
+ PageDesc **ret_p2, tb_page_addr_t phys2, bool alloc)
{
PageDesc *p1, *p2;
tb_page_addr_t page1;
@@ -XXX,XX +XXX,XX @@ tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
* Note that inserting into the hash table first isn't an option, since
* we can only insert TBs that are fully initialized.
*/
- page_lock_pair(&p, phys_pc, &p2, phys_page2, 1);
+ page_lock_pair(&p, phys_pc, &p2, phys_page2, true);
tb_page_add(p, tb, 0, phys_pc & TARGET_PAGE_MASK);
if (p2) {
tb_page_add(p2, tb, 1, phys_page2);
@@ -XXX,XX +XXX,XX @@ void page_set_flags(target_ulong start, target_ulong end, int flags)
for (addr = start, len = end - start;
len != 0;
len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
- PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
+ PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, true);

/* If the write protection bit is set, then we invalidate
the code inside. */
--
2.34.1
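The three-way return of tcg_can_emit_vec_op() above is what ties the pieces together: a positive value means the backend emits the opcode directly, a negative value means generic code should call tcg_expand_vec_op() to rewrite it (as with cmp_vec here), and zero means unsupported. A sketch of that dispatch — illustrative only, not the actual middle-end code:

    static void gen_vec_op3(TCGOpcode opc, TCGType type, unsigned vece,
                            TCGArg a0, TCGArg a1, TCGArg a2)
    {
        int can = tcg_can_emit_vec_op(opc, type, vece);

        if (can > 0) {
            vec_gen_3(opc, type, vece, a0, a1, a2);         /* native */
        } else if (can < 0) {
            tcg_expand_vec_op(opc, type, vece, a0, a1, a2); /* expand */
        } else {
            /* unsupported: caller falls back to integer code */
        }
    }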
The unsigned saturations are handled via generic code
using min/max. The signed saturations are expanded using
double-sized arithmetic and a saturating pack.

Since all operations are done via expansion, do not
actually set TCG_TARGET_HAS_sat_vec.

Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/s390x/tcg-target.opc.h | 3 ++
tcg/s390x/tcg-target.c.inc | 63 ++++++++++++++++++++++++++++++++++++++
2 files changed, 66 insertions(+)

diff --git a/tcg/s390x/tcg-target.opc.h b/tcg/s390x/tcg-target.opc.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.opc.h
+++ b/tcg/s390x/tcg-target.opc.h
@@ -XXX,XX +XXX,XX @@
* emitted by tcg_expand_vec_op. For those familiar with GCC internals,
* consider these to be UNSPEC with names.
*/
+DEF(s390_vuph_vec, 1, 1, 0, IMPLVEC)
+DEF(s390_vupl_vec, 1, 1, 0, IMPLVEC)
+DEF(s390_vpks_vec, 1, 2, 0, IMPLVEC)
diff --git a/tcg/s390x/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.c.inc
+++ b/tcg/s390x/tcg-target.c.inc
@@ -XXX,XX +XXX,XX @@ typedef enum S390Opcode {
VRRc_VNO = 0xe76b,
VRRc_VO = 0xe76a,
VRRc_VOC = 0xe76f,
+ VRRc_VPKS = 0xe797, /* we leave the m5 cs field 0 */
VRRc_VS = 0xe7f7,
+ VRRa_VUPH = 0xe7d7,
+ VRRa_VUPL = 0xe7d6,
VRRc_VX = 0xe76d,
VRRf_VLVGP = 0xe762,

@@ -XXX,XX +XXX,XX @@ static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc,
}
break;

+ case INDEX_op_s390_vuph_vec:
+ tcg_out_insn(s, VRRa, VUPH, a0, a1, vece);
+ break;
+ case INDEX_op_s390_vupl_vec:
+ tcg_out_insn(s, VRRa, VUPL, a0, a1, vece);
+ break;
+ case INDEX_op_s390_vpks_vec:
+ tcg_out_insn(s, VRRc, VPKS, a0, a1, a2, vece);
+ break;
+
case INDEX_op_mov_vec: /* Always emitted via tcg_out_mov. */
case INDEX_op_dup_vec: /* Always emitted via tcg_out_dup_vec. */
default:
@@ -XXX,XX +XXX,XX @@ int tcg_can_emit_vec_op(TCGOpcode opc, TCGType type, unsigned vece)
return -1;
case INDEX_op_mul_vec:
return vece < MO_64;
+ case INDEX_op_ssadd_vec:
+ case INDEX_op_sssub_vec:
+ return vece < MO_64 ? -1 : 0;
default:
return 0;
}
@@ -XXX,XX +XXX,XX @@ static void expand_vec_cmp(TCGType type, unsigned vece, TCGv_vec v0,
}
}

+static void expand_vec_sat(TCGType type, unsigned vece, TCGv_vec v0,
+ TCGv_vec v1, TCGv_vec v2, TCGOpcode add_sub_opc)
+{
+ TCGv_vec h1 = tcg_temp_new_vec(type);
+ TCGv_vec h2 = tcg_temp_new_vec(type);
+ TCGv_vec l1 = tcg_temp_new_vec(type);
+ TCGv_vec l2 = tcg_temp_new_vec(type);
+
+ tcg_debug_assert (vece < MO_64);
+
+ /* Unpack with sign-extension. */
+ vec_gen_2(INDEX_op_s390_vuph_vec, type, vece,
+ tcgv_vec_arg(h1), tcgv_vec_arg(v1));
+ vec_gen_2(INDEX_op_s390_vuph_vec, type, vece,
+ tcgv_vec_arg(h2), tcgv_vec_arg(v2));
+
+ vec_gen_2(INDEX_op_s390_vupl_vec, type, vece,
+ tcgv_vec_arg(l1), tcgv_vec_arg(v1));
+ vec_gen_2(INDEX_op_s390_vupl_vec, type, vece,
+ tcgv_vec_arg(l2), tcgv_vec_arg(v2));
+
+ /* Arithmetic on a wider element size. */
+ vec_gen_3(add_sub_opc, type, vece + 1, tcgv_vec_arg(h1),
+ tcgv_vec_arg(h1), tcgv_vec_arg(h2));
+ vec_gen_3(add_sub_opc, type, vece + 1, tcgv_vec_arg(l1),
+ tcgv_vec_arg(l1), tcgv_vec_arg(l2));
+
+ /* Pack with saturation. */
+ vec_gen_3(INDEX_op_s390_vpks_vec, type, vece + 1,
+ tcgv_vec_arg(v0), tcgv_vec_arg(h1), tcgv_vec_arg(l1));
+
+ tcg_temp_free_vec(h1);
+ tcg_temp_free_vec(h2);
+ tcg_temp_free_vec(l1);
+ tcg_temp_free_vec(l2);
+}
+
void tcg_expand_vec_op(TCGOpcode opc, TCGType type, unsigned vece,
TCGArg a0, ...)
{
@@ -XXX,XX +XXX,XX @@ void tcg_expand_vec_op(TCGOpcode opc, TCGType type, unsigned vece,
tcg_temp_free_vec(t0);
break;

+ case INDEX_op_ssadd_vec:
+ expand_vec_sat(type, vece, v0, v1, v2, INDEX_op_add_vec);
+ break;
+ case INDEX_op_sssub_vec:
+ expand_vec_sat(type, vece, v0, v1, v2, INDEX_op_sub_vec);
+ break;
+
default:
g_assert_not_reached();
}
@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
case INDEX_op_sari_vec:
case INDEX_op_shli_vec:
case INDEX_op_shri_vec:
+ case INDEX_op_s390_vuph_vec:
+ case INDEX_op_s390_vupl_vec:
return C_O1_I1(v, v);
case INDEX_op_add_vec:
case INDEX_op_sub_vec:
@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
case INDEX_op_smin_vec:
case INDEX_op_umax_vec:
case INDEX_op_umin_vec:
+ case INDEX_op_s390_vpks_vec:
return C_O1_I2(v, v, v);
case INDEX_op_rotls_vec:
case INDEX_op_shls_vec:
--
2.25.1

Use the pc coming from db->pc_first rather than the TB.

Use the cached host_addr rather than re-computing for the
first page. We still need a separate lookup for the second
page because it won't be computed for DisasContextBase until
the translator actually performs a read from the page.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
include/exec/plugin-gen.h | 7 ++++---
accel/tcg/plugin-gen.c | 22 +++++++++++-----------
accel/tcg/translator.c | 2 +-
3 files changed, 16 insertions(+), 15 deletions(-)

diff --git a/include/exec/plugin-gen.h b/include/exec/plugin-gen.h
index XXXXXXX..XXXXXXX 100644
--- a/include/exec/plugin-gen.h
+++ b/include/exec/plugin-gen.h
@@ -XXX,XX +XXX,XX @@ struct DisasContextBase;

#ifdef CONFIG_PLUGIN

-bool plugin_gen_tb_start(CPUState *cpu, const TranslationBlock *tb, bool supress);
+bool plugin_gen_tb_start(CPUState *cpu, const struct DisasContextBase *db,
+ bool supress);
void plugin_gen_tb_end(CPUState *cpu);
void plugin_gen_insn_start(CPUState *cpu, const struct DisasContextBase *db);
void plugin_gen_insn_end(void);
@@ -XXX,XX +XXX,XX @@ static inline void plugin_insn_append(abi_ptr pc, const void *from, size_t size)

#else /* !CONFIG_PLUGIN */

-static inline
-bool plugin_gen_tb_start(CPUState *cpu, const TranslationBlock *tb, bool supress)
+static inline bool
+plugin_gen_tb_start(CPUState *cpu, const struct DisasContextBase *db, bool sup)
{
return false;
}
diff --git a/accel/tcg/plugin-gen.c b/accel/tcg/plugin-gen.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/plugin-gen.c
+++ b/accel/tcg/plugin-gen.c
@@ -XXX,XX +XXX,XX @@ static void plugin_gen_inject(const struct qemu_plugin_tb *plugin_tb)
pr_ops();
}

-bool plugin_gen_tb_start(CPUState *cpu, const TranslationBlock *tb, bool mem_only)
+bool plugin_gen_tb_start(CPUState *cpu, const DisasContextBase *db,
+ bool mem_only)
{
bool ret = false;

@@ -XXX,XX +XXX,XX @@ bool plugin_gen_tb_start(CPUState *cpu, const TranslationBlock *tb, bool mem_onl
}
ret = true;

- ptb->vaddr = tb->pc;
+ ptb->vaddr = db->pc_first;
ptb->vaddr2 = -1;
- get_page_addr_code_hostp(cpu->env_ptr, tb->pc, &ptb->haddr1);
+ ptb->haddr1 = db->host_addr[0];
ptb->haddr2 = NULL;
ptb->mem_only = mem_only;

@@ -XXX,XX +XXX,XX @@ void plugin_gen_insn_start(CPUState *cpu, const DisasContextBase *db)
* Note that we skip this when haddr1 == NULL, e.g. when we're
* fetching instructions from a region not backed by RAM.
*/
- if (likely(ptb->haddr1 != NULL && ptb->vaddr2 == -1) &&
- unlikely((db->pc_next & TARGET_PAGE_MASK) !=
- (db->pc_first & TARGET_PAGE_MASK))) {
- get_page_addr_code_hostp(cpu->env_ptr, db->pc_next,
- &ptb->haddr2);
- ptb->vaddr2 = db->pc_next;
- }
- if (likely(ptb->vaddr2 == -1)) {
+ if (ptb->haddr1 == NULL) {
+ pinsn->haddr = NULL;
+ } else if (is_same_page(db, db->pc_next)) {
pinsn->haddr = ptb->haddr1 + pinsn->vaddr - ptb->vaddr;
} else {
+ if (ptb->vaddr2 == -1) {
+ ptb->vaddr2 = TARGET_PAGE_ALIGN(db->pc_first);
+ get_page_addr_code_hostp(cpu->env_ptr, ptb->vaddr2, &ptb->haddr2);
+ }
pinsn->haddr = ptb->haddr2 + pinsn->vaddr - ptb->vaddr2;
}
}
diff --git a/accel/tcg/translator.c b/accel/tcg/translator.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/translator.c
+++ b/accel/tcg/translator.c
@@ -XXX,XX +XXX,XX @@ void translator_loop(CPUState *cpu, TranslationBlock *tb, int max_insns,
ops->tb_start(db, cpu);
tcg_debug_assert(db->is_jmp == DISAS_NEXT); /* no early exit */

- plugin_enabled = plugin_gen_tb_start(cpu, tb, cflags & CF_MEMI_ONLY);
+ plugin_enabled = plugin_gen_tb_start(cpu, db, cflags & CF_MEMI_ONLY);

while (true) {
db->num_insns++;
--
2.34.1
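The widen/operate/pack pattern above is easiest to see on one lane. A scalar model of signed saturating byte addition, assuming only double-width arithmetic and a saturating pack are available (which is what VUPH/VUPL and VPKS provide per element):

    #include <stdint.h>

    static int8_t pack_sat8(int16_t v)   /* the VPKS step */
    {
        if (v > INT8_MAX) return INT8_MAX;
        if (v < INT8_MIN) return INT8_MIN;
        return (int8_t)v;
    }

    static int8_t ssadd8(int8_t a, int8_t b)
    {
        /* unpack with sign extension, add at 16 bits, pack saturating */
        return pack_sat8((int16_t)a + (int16_t)b);
    }

The vector version does the same on the high and low halves of the register in parallel and repacks both with a single VPKS.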
1
We (will) often have the complete MemOpIdx handy, so use that.
1
Let tb->page_addr[0] contain the address of the first byte of the
2
translated block, rather than the address of the page containing the
3
start of the translated block. We need to recover this value anyway
4
at various points, and it is easier to discard a page offset when it
5
is not needed, which happens naturally via the existing find_page shift.
2
6
3
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
7
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
4
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
5
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
8
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
6
---
9
---
7
trace/mem.h | 32 +++++++++-----------------
10
accel/tcg/cpu-exec.c | 16 ++++++++--------
8
accel/tcg/cputlb.c | 12 ++++------
11
accel/tcg/cputlb.c | 3 ++-
9
accel/tcg/user-exec.c | 42 +++++++++++++++++++++++------------
12
accel/tcg/translate-all.c | 9 +++++----
10
tcg/tcg-op.c | 8 +++----
13
3 files changed, 15 insertions(+), 13 deletions(-)
11
accel/tcg/atomic_common.c.inc | 6 ++---
12
5 files changed, 49 insertions(+), 51 deletions(-)
13
14
14
diff --git a/trace/mem.h b/trace/mem.h
15
diff --git a/accel/tcg/cpu-exec.c b/accel/tcg/cpu-exec.c
15
index XXXXXXX..XXXXXXX 100644
16
index XXXXXXX..XXXXXXX 100644
16
--- a/trace/mem.h
17
--- a/accel/tcg/cpu-exec.c
17
+++ b/trace/mem.h
18
+++ b/accel/tcg/cpu-exec.c
18
@@ -XXX,XX +XXX,XX @@
19
@@ -XXX,XX +XXX,XX @@ struct tb_desc {
19
#ifndef TRACE__MEM_H
20
target_ulong pc;
20
#define TRACE__MEM_H
21
target_ulong cs_base;
21
22
CPUArchState *env;
22
-#include "tcg/tcg.h"
23
- tb_page_addr_t phys_page1;
23
+#include "exec/memopidx.h"
24
+ tb_page_addr_t page_addr0;
24
25
uint32_t flags;
25
#define TRACE_MEM_SZ_SHIFT_MASK 0xf /* size shift mask */
26
uint32_t cflags;
26
#define TRACE_MEM_SE (1ULL << 4) /* sign extended (y/n) */
27
uint32_t trace_vcpu_dstate;
27
@@ -XXX,XX +XXX,XX @@
28
@@ -XXX,XX +XXX,XX @@ static bool tb_lookup_cmp(const void *p, const void *d)
28
#define TRACE_MEM_MMU_SHIFT 8 /* mmu idx */
29
const struct tb_desc *desc = d;
29
30
30
/**
31
if (tb->pc == desc->pc &&
31
- * trace_mem_build_info:
32
- tb->page_addr[0] == desc->phys_page1 &&
32
+ * trace_mem_get_info:
33
+ tb->page_addr[0] == desc->page_addr0 &&
33
*
34
tb->cs_base == desc->cs_base &&
34
* Return a value for the 'info' argument in guest memory access traces.
35
tb->flags == desc->flags &&
35
*/
36
tb->trace_vcpu_dstate == desc->trace_vcpu_dstate &&
36
-static inline uint16_t trace_mem_build_info(int size_shift, bool sign_extend,
37
@@ -XXX,XX +XXX,XX @@ static bool tb_lookup_cmp(const void *p, const void *d)
37
- MemOp endianness, bool store,
38
if (tb->page_addr[1] == -1) {
38
- unsigned int mmu_idx)
39
return true;
39
+static inline uint16_t trace_mem_get_info(MemOpIdx oi, bool store)
40
} else {
40
{
41
- tb_page_addr_t phys_page2;
41
+ MemOp op = get_memop(oi);
42
- target_ulong virt_page2;
42
+ uint32_t size_shift = op & MO_SIZE;
43
+ tb_page_addr_t phys_page1;
43
+ bool sign_extend = op & MO_SIGN;
44
+ target_ulong virt_page1;
44
+ bool big_endian = (op & MO_BSWAP) == MO_BE;
45
45
uint16_t res;
46
/*
46
47
* We know that the first page matched, and an otherwise valid TB
47
res = size_shift & TRACE_MEM_SZ_SHIFT_MASK;
48
@@ -XXX,XX +XXX,XX @@ static bool tb_lookup_cmp(const void *p, const void *d)
48
if (sign_extend) {
49
* is different for the new TB. Therefore any exception raised
49
res |= TRACE_MEM_SE;
50
* here by the faulting lookup is not premature.
51
*/
52
- virt_page2 = TARGET_PAGE_ALIGN(desc->pc);
53
- phys_page2 = get_page_addr_code(desc->env, virt_page2);
54
- if (tb->page_addr[1] == phys_page2) {
55
+ virt_page1 = TARGET_PAGE_ALIGN(desc->pc);
56
+ phys_page1 = get_page_addr_code(desc->env, virt_page1);
57
+ if (tb->page_addr[1] == phys_page1) {
58
return true;
59
}
60
}
61
@@ -XXX,XX +XXX,XX @@ static TranslationBlock *tb_htable_lookup(CPUState *cpu, target_ulong pc,
62
if (phys_pc == -1) {
63
return NULL;
50
}
64
}
51
- if (endianness == MO_BE) {
65
- desc.phys_page1 = phys_pc & TARGET_PAGE_MASK;
52
+ if (big_endian) {
66
+ desc.page_addr0 = phys_pc;
53
res |= TRACE_MEM_BE;
67
h = tb_hash_func(phys_pc, pc, flags, cflags, *cpu->trace_dstate);
54
}
68
return qht_lookup_custom(&tb_ctx.htable, &desc, h, tb_lookup_cmp);
55
if (store) {
56
res |= TRACE_MEM_ST;
57
}
58
#ifdef CONFIG_SOFTMMU
59
- res |= mmu_idx << TRACE_MEM_MMU_SHIFT;
60
+ res |= get_mmuidx(oi) << TRACE_MEM_MMU_SHIFT;
61
#endif
62
+
63
return res;
64
}
69
}
65
66
-
67
-/**
68
- * trace_mem_get_info:
69
- *
70
- * Return a value for the 'info' argument in guest memory access traces.
71
- */
72
-static inline uint16_t trace_mem_get_info(MemOp op,
73
- unsigned int mmu_idx,
74
- bool store)
75
-{
76
- return trace_mem_build_info(op & MO_SIZE, !!(op & MO_SIGN),
77
- op & MO_BSWAP, store,
78
- mmu_idx);
79
-}
80
-
81
#endif /* TRACE__MEM_H */
82
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
70
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
83
index XXXXXXX..XXXXXXX 100644
71
index XXXXXXX..XXXXXXX 100644
84
--- a/accel/tcg/cputlb.c
72
--- a/accel/tcg/cputlb.c
85
+++ b/accel/tcg/cputlb.c
73
+++ b/accel/tcg/cputlb.c
86
@@ -XXX,XX +XXX,XX @@ static inline uint64_t cpu_load_helper(CPUArchState *env, abi_ptr addr,
74
@@ -XXX,XX +XXX,XX @@ void tlb_flush_page_bits_by_mmuidx_all_cpus_synced(CPUState *src_cpu,
87
int mmu_idx, uintptr_t retaddr,
75
can be detected */
88
MemOp op, FullLoadHelper *full_load)
76
void tlb_protect_code(ram_addr_t ram_addr)
89
{
77
{
90
- uint16_t meminfo;
78
- cpu_physical_memory_test_and_clear_dirty(ram_addr, TARGET_PAGE_SIZE,
91
- MemOpIdx oi;
79
+ cpu_physical_memory_test_and_clear_dirty(ram_addr & TARGET_PAGE_MASK,
92
+ MemOpIdx oi = make_memop_idx(op, mmu_idx);
80
+ TARGET_PAGE_SIZE,
93
+ uint16_t meminfo = trace_mem_get_info(oi, false);
81
DIRTY_MEMORY_CODE);
94
uint64_t ret;
82
}
95
83
96
- meminfo = trace_mem_get_info(op, mmu_idx, false);
84
diff --git a/accel/tcg/translate-all.c b/accel/tcg/translate-all.c
97
trace_guest_mem_before_exec(env_cpu(env), addr, meminfo);
98
99
- oi = make_memop_idx(op, mmu_idx);
100
ret = full_load(env, addr, oi, retaddr);
101
102
qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, meminfo);
103
@@ -XXX,XX +XXX,XX @@ static inline void QEMU_ALWAYS_INLINE
104
cpu_store_helper(CPUArchState *env, target_ulong addr, uint64_t val,
105
int mmu_idx, uintptr_t retaddr, MemOp op)
106
{
107
- MemOpIdx oi;
108
- uint16_t meminfo;
109
+ MemOpIdx oi = make_memop_idx(op, mmu_idx);
110
+ uint16_t meminfo = trace_mem_get_info(oi, true);
111
112
- meminfo = trace_mem_get_info(op, mmu_idx, true);
113
trace_guest_mem_before_exec(env_cpu(env), addr, meminfo);
114
115
- oi = make_memop_idx(op, mmu_idx);
116
store_helper(env, addr, val, oi, retaddr, op);
117
118
qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, meminfo);
119
diff --git a/accel/tcg/user-exec.c b/accel/tcg/user-exec.c
120
index XXXXXXX..XXXXXXX 100644
85
index XXXXXXX..XXXXXXX 100644
121
--- a/accel/tcg/user-exec.c
86
--- a/accel/tcg/translate-all.c
122
+++ b/accel/tcg/user-exec.c
87
+++ b/accel/tcg/translate-all.c
123
@@ -XXX,XX +XXX,XX @@ int cpu_signal_handler(int host_signum, void *pinfo,
88
@@ -XXX,XX +XXX,XX @@ static void do_tb_phys_invalidate(TranslationBlock *tb, bool rm_from_page_list)
124
89
qemu_spin_unlock(&tb->jmp_lock);
125
uint32_t cpu_ldub_data(CPUArchState *env, abi_ptr ptr)
90
126
{
91
/* remove the TB from the hash list */
127
+ MemOpIdx oi = make_memop_idx(MO_UB, MMU_USER_IDX);
92
- phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
128
+ uint16_t meminfo = trace_mem_get_info(oi, false);
93
+ phys_pc = tb->page_addr[0];
129
uint32_t ret;
94
h = tb_hash_func(phys_pc, tb->pc, tb->flags, orig_cflags,
130
- uint16_t meminfo = trace_mem_get_info(MO_UB, MMU_USER_IDX, false);
95
tb->trace_vcpu_dstate);
131
96
if (!qht_remove(&tb_ctx.htable, tb, h)) {
132
trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
97
@@ -XXX,XX +XXX,XX @@ tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
133
ret = ldub_p(g2h(env_cpu(env), ptr));
98
* we can only insert TBs that are fully initialized.
134
@@ -XXX,XX +XXX,XX @@ int cpu_ldsb_data(CPUArchState *env, abi_ptr ptr)
99
*/
135
100
page_lock_pair(&p, phys_pc, &p2, phys_page2, true);
136
uint32_t cpu_lduw_be_data(CPUArchState *env, abi_ptr ptr)
101
- tb_page_add(p, tb, 0, phys_pc & TARGET_PAGE_MASK);
137
{
102
+ tb_page_add(p, tb, 0, phys_pc);
138
+ MemOpIdx oi = make_memop_idx(MO_BEUW, MMU_USER_IDX);
103
if (p2) {
139
+ uint16_t meminfo = trace_mem_get_info(oi, false);
104
tb_page_add(p2, tb, 1, phys_page2);
140
uint32_t ret;
105
} else {
141
- uint16_t meminfo = trace_mem_get_info(MO_BEUW, MMU_USER_IDX, false);
106
@@ -XXX,XX +XXX,XX @@ tb_invalidate_phys_page_range__locked(struct page_collection *pages,
142
107
if (n == 0) {
143
trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
108
/* NOTE: tb_end may be after the end of the page, but
144
ret = lduw_be_p(g2h(env_cpu(env), ptr));
109
it is not a problem */
145
@@ -XXX,XX +XXX,XX @@ int cpu_ldsw_be_data(CPUArchState *env, abi_ptr ptr)
110
- tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
146
111
+ tb_start = tb->page_addr[0];
147
uint32_t cpu_ldl_be_data(CPUArchState *env, abi_ptr ptr)
112
tb_end = tb_start + tb->size;
148
{
113
} else {
149
+ MemOpIdx oi = make_memop_idx(MO_BEUL, MMU_USER_IDX);
114
tb_start = tb->page_addr[1];
150
+ uint16_t meminfo = trace_mem_get_info(oi, false);
115
- tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
151
uint32_t ret;
116
+ tb_end = tb_start + ((tb->page_addr[0] + tb->size)
152
- uint16_t meminfo = trace_mem_get_info(MO_BEUL, MMU_USER_IDX, false);
117
+ & ~TARGET_PAGE_MASK);
153
118
}
154
trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
119
if (!(tb_end <= start || tb_start >= end)) {
155
ret = ldl_be_p(g2h(env_cpu(env), ptr));
120
#ifdef TARGET_HAS_PRECISE_SMC
156
@@ -XXX,XX +XXX,XX @@ uint32_t cpu_ldl_be_data(CPUArchState *env, abi_ptr ptr)
157
158
uint64_t cpu_ldq_be_data(CPUArchState *env, abi_ptr ptr)
159
{
160
+ MemOpIdx oi = make_memop_idx(MO_BEQ, MMU_USER_IDX);
161
+ uint16_t meminfo = trace_mem_get_info(oi, false);
162
uint64_t ret;
163
- uint16_t meminfo = trace_mem_get_info(MO_BEQ, MMU_USER_IDX, false);
164
165
trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
166
ret = ldq_be_p(g2h(env_cpu(env), ptr));
167
@@ -XXX,XX +XXX,XX @@ uint64_t cpu_ldq_be_data(CPUArchState *env, abi_ptr ptr)
168
169
uint32_t cpu_lduw_le_data(CPUArchState *env, abi_ptr ptr)
170
{
171
+ MemOpIdx oi = make_memop_idx(MO_LEUW, MMU_USER_IDX);
172
+ uint16_t meminfo = trace_mem_get_info(oi, false);
173
uint32_t ret;
174
- uint16_t meminfo = trace_mem_get_info(MO_LEUW, MMU_USER_IDX, false);
175
176
trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
177
ret = lduw_le_p(g2h(env_cpu(env), ptr));
178
@@ -XXX,XX +XXX,XX @@ int cpu_ldsw_le_data(CPUArchState *env, abi_ptr ptr)
179
180
uint32_t cpu_ldl_le_data(CPUArchState *env, abi_ptr ptr)
181
{
182
+ MemOpIdx oi = make_memop_idx(MO_LEUL, MMU_USER_IDX);
183
+ uint16_t meminfo = trace_mem_get_info(oi, false);
184
uint32_t ret;
185
- uint16_t meminfo = trace_mem_get_info(MO_LEUL, MMU_USER_IDX, false);
186
187
trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
188
ret = ldl_le_p(g2h(env_cpu(env), ptr));
189
@@ -XXX,XX +XXX,XX @@ uint32_t cpu_ldl_le_data(CPUArchState *env, abi_ptr ptr)
190
191
uint64_t cpu_ldq_le_data(CPUArchState *env, abi_ptr ptr)
192
{
193
+ MemOpIdx oi = make_memop_idx(MO_LEQ, MMU_USER_IDX);
194
+ uint16_t meminfo = trace_mem_get_info(oi, false);
195
uint64_t ret;
196
- uint16_t meminfo = trace_mem_get_info(MO_LEQ, MMU_USER_IDX, false);
197
198
trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
199
ret = ldq_le_p(g2h(env_cpu(env), ptr));
200
@@ -XXX,XX +XXX,XX @@ uint64_t cpu_ldq_le_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t retaddr)
201
202
void cpu_stb_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
203
{
204
- uint16_t meminfo = trace_mem_get_info(MO_UB, MMU_USER_IDX, true);
205
+ MemOpIdx oi = make_memop_idx(MO_UB, MMU_USER_IDX);
206
+ uint16_t meminfo = trace_mem_get_info(oi, true);
207
208
trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
209
stb_p(g2h(env_cpu(env), ptr), val);
210
@@ -XXX,XX +XXX,XX @@ void cpu_stb_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
211
212
void cpu_stw_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
213
{
214
- uint16_t meminfo = trace_mem_get_info(MO_BEUW, MMU_USER_IDX, true);
215
+ MemOpIdx oi = make_memop_idx(MO_BEUW, MMU_USER_IDX);
216
+ uint16_t meminfo = trace_mem_get_info(oi, true);
217
218
trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
219
stw_be_p(g2h(env_cpu(env), ptr), val);
220
@@ -XXX,XX +XXX,XX @@ void cpu_stw_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
221
222
void cpu_stl_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
223
{
224
- uint16_t meminfo = trace_mem_get_info(MO_BEUL, MMU_USER_IDX, true);
+ MemOpIdx oi = make_memop_idx(MO_BEUL, MMU_USER_IDX);
+ uint16_t meminfo = trace_mem_get_info(oi, true);

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stl_be_p(g2h(env_cpu(env), ptr), val);
@@ -XXX,XX +XXX,XX @@ void cpu_stl_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)

void cpu_stq_be_data(CPUArchState *env, abi_ptr ptr, uint64_t val)
{
- uint16_t meminfo = trace_mem_get_info(MO_BEQ, MMU_USER_IDX, true);
+ MemOpIdx oi = make_memop_idx(MO_BEQ, MMU_USER_IDX);
+ uint16_t meminfo = trace_mem_get_info(oi, true);

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stq_be_p(g2h(env_cpu(env), ptr), val);
@@ -XXX,XX +XXX,XX @@ void cpu_stq_be_data(CPUArchState *env, abi_ptr ptr, uint64_t val)

void cpu_stw_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
{
- uint16_t meminfo = trace_mem_get_info(MO_LEUW, MMU_USER_IDX, true);
+ MemOpIdx oi = make_memop_idx(MO_LEUW, MMU_USER_IDX);
+ uint16_t meminfo = trace_mem_get_info(oi, true);

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stw_le_p(g2h(env_cpu(env), ptr), val);
@@ -XXX,XX +XXX,XX @@ void cpu_stw_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)

void cpu_stl_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
{
- uint16_t meminfo = trace_mem_get_info(MO_LEUL, MMU_USER_IDX, true);
+ MemOpIdx oi = make_memop_idx(MO_LEUL, MMU_USER_IDX);
+ uint16_t meminfo = trace_mem_get_info(oi, true);

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stl_le_p(g2h(env_cpu(env), ptr), val);
@@ -XXX,XX +XXX,XX @@ void cpu_stl_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)

void cpu_stq_le_data(CPUArchState *env, abi_ptr ptr, uint64_t val)
{
- uint16_t meminfo = trace_mem_get_info(MO_LEQ, MMU_USER_IDX, true);
+ MemOpIdx oi = make_memop_idx(MO_LEQ, MMU_USER_IDX);
+ uint16_t meminfo = trace_mem_get_info(oi, true);

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stq_le_p(g2h(env_cpu(env), ptr), val);
diff --git a/tcg/tcg-op.c b/tcg/tcg-op.c
index XXXXXXX..XXXXXXX 100644
--- a/tcg/tcg-op.c
+++ b/tcg/tcg-op.c
@@ -XXX,XX +XXX,XX @@ static inline void plugin_gen_mem_callbacks(TCGv vaddr, uint16_t info)
void tcg_gen_qemu_ld_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
{
MemOp orig_memop;
- uint16_t info = trace_mem_get_info(memop, idx, 0);
+ uint16_t info = trace_mem_get_info(make_memop_idx(memop, idx), 0);

tcg_gen_req_mo(TCG_MO_LD_LD | TCG_MO_ST_LD);
memop = tcg_canonicalize_memop(memop, 0, 0);
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
void tcg_gen_qemu_st_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
{
TCGv_i32 swap = NULL;
- uint16_t info = trace_mem_get_info(memop, idx, 1);
+ uint16_t info = trace_mem_get_info(make_memop_idx(memop, idx), 1);

tcg_gen_req_mo(TCG_MO_LD_ST | TCG_MO_ST_ST);
memop = tcg_canonicalize_memop(memop, 0, 1);
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)

tcg_gen_req_mo(TCG_MO_LD_LD | TCG_MO_ST_LD);
memop = tcg_canonicalize_memop(memop, 1, 0);
- info = trace_mem_get_info(memop, idx, 0);
+ info = trace_mem_get_info(make_memop_idx(memop, idx), 0);
trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);

orig_memop = memop;
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_st_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)

tcg_gen_req_mo(TCG_MO_LD_ST | TCG_MO_ST_ST);
memop = tcg_canonicalize_memop(memop, 1, 1);
- info = trace_mem_get_info(memop, idx, 1);
+ info = trace_mem_get_info(make_memop_idx(memop, idx), 1);
trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);

if (!TCG_TARGET_HAS_MEMORY_BSWAP && (memop & MO_BSWAP)) {
diff --git a/accel/tcg/atomic_common.c.inc b/accel/tcg/atomic_common.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/atomic_common.c.inc
+++ b/accel/tcg/atomic_common.c.inc
@@ -XXX,XX +XXX,XX @@ static uint16_t atomic_trace_rmw_pre(CPUArchState *env, target_ulong addr,
MemOpIdx oi)
{
CPUState *cpu = env_cpu(env);
- uint16_t info = trace_mem_get_info(get_memop(oi), get_mmuidx(oi), false);
+ uint16_t info = trace_mem_get_info(oi, false);

trace_guest_mem_before_exec(cpu, addr, info);
trace_guest_mem_before_exec(cpu, addr, info | TRACE_MEM_ST);
@@ -XXX,XX +XXX,XX @@ static void atomic_trace_rmw_post(CPUArchState *env, target_ulong addr,
static uint16_t atomic_trace_ld_pre(CPUArchState *env, target_ulong addr,
MemOpIdx oi)
{
- uint16_t info = trace_mem_get_info(get_memop(oi), get_mmuidx(oi), false);
+ uint16_t info = trace_mem_get_info(oi, false);

trace_guest_mem_before_exec(env_cpu(env), addr, info);

@@ -XXX,XX +XXX,XX @@ static void atomic_trace_ld_post(CPUArchState *env, target_ulong addr,
static uint16_t atomic_trace_st_pre(CPUArchState *env, target_ulong addr,
MemOpIdx oi)
{
- uint16_t info = trace_mem_get_info(get_memop(oi), get_mmuidx(oi), true);
+ uint16_t info = trace_mem_get_info(oi, true);

trace_guest_mem_before_exec(env_cpu(env), addr, info);

-- 
2.25.1

-- 
2.34.1
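As a quick reference for the trace_mem_get_info() conversion above: the two
values it now consumes travel in a single MemOpIdx. Below is a minimal,
standalone sketch of that packing; the helper bodies mirror the definitions
introduced by this series, while MO_VALUE and MMU_IDX are made-up stand-ins
rather than real QEMU constants.

    #include <assert.h>
    #include <stdint.h>

    typedef uint32_t MemOpIdx;

    /* Pack a memory op and a 4-bit mmu index, as make_memop_idx does. */
    static inline MemOpIdx make_memop_idx(unsigned op, unsigned idx)
    {
        assert(idx <= 15);
        return (op << 4) | idx;
    }

    static inline unsigned get_memop(MemOpIdx oi) { return oi >> 4; }
    static inline unsigned get_mmuidx(MemOpIdx oi) { return oi & 15; }

    int main(void)
    {
        enum { MO_VALUE = 0x16, MMU_IDX = 3 }; /* stand-in values */
        MemOpIdx oi = make_memop_idx(MO_VALUE, MMU_IDX);

        assert(get_memop(oi) == MO_VALUE);   /* round-trips cleanly */
        assert(get_mmuidx(oi) == MMU_IDX);
        return 0;
    }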
Use the MemOpIdx directly, rather than the rearrangement
of the same bits currently done by the trace infrastructure.
Pass in enum qemu_plugin_mem_rw so that we are able to treat
read-modify-write operations as a single operation.

Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
include/qemu/plugin.h | 26 ++++++++++++++++++++++++--
accel/tcg/cputlb.c | 4 ++--
accel/tcg/plugin-gen.c | 5 ++---
accel/tcg/user-exec.c | 28 ++++++++++++++--------------
plugins/api.c | 19 +++++++++++--------
plugins/core.c | 10 +++++-----
tcg/tcg-op.c | 30 +++++++++++++++++++++---------
accel/tcg/atomic_common.c.inc | 13 +++----------
8 files changed, 82 insertions(+), 53 deletions(-)

diff --git a/include/qemu/plugin.h b/include/qemu/plugin.h
index XXXXXXX..XXXXXXX 100644
--- a/include/qemu/plugin.h
+++ b/include/qemu/plugin.h
@@ -XXX,XX +XXX,XX @@
#include "qemu/error-report.h"
#include "qemu/queue.h"
#include "qemu/option.h"
+#include "exec/memopidx.h"

/*
* Events that plugins can subscribe to.
@@ -XXX,XX +XXX,XX @@ enum qemu_plugin_event {
struct qemu_plugin_desc;
typedef QTAILQ_HEAD(, qemu_plugin_desc) QemuPluginList;

+/*
+ * Construct a qemu_plugin_meminfo_t.
+ */
+static inline qemu_plugin_meminfo_t
+make_plugin_meminfo(MemOpIdx oi, enum qemu_plugin_mem_rw rw)
+{
+ return oi | (rw << 16);
+}
+
+/*
+ * Extract the memory operation direction from a qemu_plugin_meminfo_t.
+ * Other portions may be extracted via get_memop and get_mmuidx.
+ */
+static inline enum qemu_plugin_mem_rw
+get_plugin_meminfo_rw(qemu_plugin_meminfo_t i)
+{
+ return i >> 16;
+}
+
#ifdef CONFIG_PLUGIN
extern QemuOptsList qemu_plugin_opts;

@@ -XXX,XX +XXX,XX @@ qemu_plugin_vcpu_syscall(CPUState *cpu, int64_t num, uint64_t a1,
uint64_t a6, uint64_t a7, uint64_t a8);
void qemu_plugin_vcpu_syscall_ret(CPUState *cpu, int64_t num, int64_t ret);

-void qemu_plugin_vcpu_mem_cb(CPUState *cpu, uint64_t vaddr, uint32_t meminfo);
+void qemu_plugin_vcpu_mem_cb(CPUState *cpu, uint64_t vaddr,
+ MemOpIdx oi, enum qemu_plugin_mem_rw rw);

void qemu_plugin_flush_cb(void);

@@ -XXX,XX +XXX,XX @@ void qemu_plugin_vcpu_syscall_ret(CPUState *cpu, int64_t num, int64_t ret)
{ }

static inline void qemu_plugin_vcpu_mem_cb(CPUState *cpu, uint64_t vaddr,
- uint32_t meminfo)
+ MemOpIdx oi,
+ enum qemu_plugin_mem_rw rw)
{ }

static inline void qemu_plugin_flush_cb(void)
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ static inline uint64_t cpu_load_helper(CPUArchState *env, abi_ptr addr,

ret = full_load(env, addr, oi, retaddr);

- qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, oi, QEMU_PLUGIN_MEM_R);

return ret;
}
@@ -XXX,XX +XXX,XX @@ cpu_store_helper(CPUArchState *env, target_ulong addr, uint64_t val,

store_helper(env, addr, val, oi, retaddr, op);

- qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, oi, QEMU_PLUGIN_MEM_W);
}

void cpu_stb_mmuidx_ra(CPUArchState *env, target_ulong addr, uint32_t val,
diff --git a/accel/tcg/plugin-gen.c b/accel/tcg/plugin-gen.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/plugin-gen.c
+++ b/accel/tcg/plugin-gen.c
@@ -XXX,XX +XXX,XX @@
#include "qemu/osdep.h"
#include "tcg/tcg.h"
#include "tcg/tcg-op.h"
-#include "trace/mem.h"
#include "exec/exec-all.h"
#include "exec/plugin-gen.h"
#include "exec/translator.h"
@@ -XXX,XX +XXX,XX @@ static void gen_mem_wrapped(enum plugin_gen_cb type,
const union mem_gen_fn *f, TCGv addr,
uint32_t info, bool is_mem)
{
- int wr = !!(info & TRACE_MEM_ST);
+ enum qemu_plugin_mem_rw rw = get_plugin_meminfo_rw(info);

- gen_plugin_cb_start(PLUGIN_GEN_FROM_MEM, type, wr);
+ gen_plugin_cb_start(PLUGIN_GEN_FROM_MEM, type, rw);
if (is_mem) {
f->mem_fn(addr, info);
} else {
diff --git a/accel/tcg/user-exec.c b/accel/tcg/user-exec.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/user-exec.c
+++ b/accel/tcg/user-exec.c
@@ -XXX,XX +XXX,XX @@ uint32_t cpu_ldub_data(CPUArchState *env, abi_ptr ptr)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
ret = ldub_p(g2h(env_cpu(env), ptr));
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
}

@@ -XXX,XX +XXX,XX @@ uint32_t cpu_lduw_be_data(CPUArchState *env, abi_ptr ptr)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
ret = lduw_be_p(g2h(env_cpu(env), ptr));
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
}

@@ -XXX,XX +XXX,XX @@ uint32_t cpu_ldl_be_data(CPUArchState *env, abi_ptr ptr)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
ret = ldl_be_p(g2h(env_cpu(env), ptr));
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
}

@@ -XXX,XX +XXX,XX @@ uint64_t cpu_ldq_be_data(CPUArchState *env, abi_ptr ptr)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
ret = ldq_be_p(g2h(env_cpu(env), ptr));
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
}

@@ -XXX,XX +XXX,XX @@ uint32_t cpu_lduw_le_data(CPUArchState *env, abi_ptr ptr)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
ret = lduw_le_p(g2h(env_cpu(env), ptr));
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
}

@@ -XXX,XX +XXX,XX @@ uint32_t cpu_ldl_le_data(CPUArchState *env, abi_ptr ptr)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
ret = ldl_le_p(g2h(env_cpu(env), ptr));
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
}

@@ -XXX,XX +XXX,XX @@ uint64_t cpu_ldq_le_data(CPUArchState *env, abi_ptr ptr)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
ret = ldq_le_p(g2h(env_cpu(env), ptr));
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_R);
return ret;
}

@@ -XXX,XX +XXX,XX @@ void cpu_stb_data(CPUArchState *env, abi_ptr ptr, uint32_t val)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stb_p(g2h(env_cpu(env), ptr), val);
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}

void cpu_stw_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
@@ -XXX,XX +XXX,XX @@ void cpu_stw_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stw_be_p(g2h(env_cpu(env), ptr), val);
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}

void cpu_stl_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
@@ -XXX,XX +XXX,XX @@ void cpu_stl_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stl_be_p(g2h(env_cpu(env), ptr), val);
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}

void cpu_stq_be_data(CPUArchState *env, abi_ptr ptr, uint64_t val)
@@ -XXX,XX +XXX,XX @@ void cpu_stq_be_data(CPUArchState *env, abi_ptr ptr, uint64_t val)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stq_be_p(g2h(env_cpu(env), ptr), val);
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}

void cpu_stw_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
@@ -XXX,XX +XXX,XX @@ void cpu_stw_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stw_le_p(g2h(env_cpu(env), ptr), val);
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}

void cpu_stl_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)
@@ -XXX,XX +XXX,XX @@ void cpu_stl_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stl_le_p(g2h(env_cpu(env), ptr), val);
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}

void cpu_stq_le_data(CPUArchState *env, abi_ptr ptr, uint64_t val)
@@ -XXX,XX +XXX,XX @@ void cpu_stq_le_data(CPUArchState *env, abi_ptr ptr, uint64_t val)

trace_guest_mem_before_exec(env_cpu(env), ptr, meminfo);
stq_le_p(g2h(env_cpu(env), ptr), val);
- qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, meminfo);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), ptr, oi, QEMU_PLUGIN_MEM_W);
}

void cpu_stb_data_ra(CPUArchState *env, abi_ptr ptr,
diff --git a/plugins/api.c b/plugins/api.c
index XXXXXXX..XXXXXXX 100644
--- a/plugins/api.c
+++ b/plugins/api.c
@@ -XXX,XX +XXX,XX @@
#include "qemu/plugin-memory.h"
#include "hw/boards.h"
#endif
-#include "trace/mem.h"

/* Uninstall and Reset handlers */

@@ -XXX,XX +XXX,XX @@ const char *qemu_plugin_insn_symbol(const struct qemu_plugin_insn *insn)

unsigned qemu_plugin_mem_size_shift(qemu_plugin_meminfo_t info)
{
- return info & TRACE_MEM_SZ_SHIFT_MASK;
+ MemOp op = get_memop(info);
+ return op & MO_SIZE;
}

bool qemu_plugin_mem_is_sign_extended(qemu_plugin_meminfo_t info)
{
- return !!(info & TRACE_MEM_SE);
+ MemOp op = get_memop(info);
+ return op & MO_SIGN;
}

bool qemu_plugin_mem_is_big_endian(qemu_plugin_meminfo_t info)
{
- return !!(info & TRACE_MEM_BE);
+ MemOp op = get_memop(info);
+ return (op & MO_BSWAP) == MO_BE;
}

bool qemu_plugin_mem_is_store(qemu_plugin_meminfo_t info)
{
- return !!(info & TRACE_MEM_ST);
+ return get_plugin_meminfo_rw(info) & QEMU_PLUGIN_MEM_W;
}

/*
@@ -XXX,XX +XXX,XX @@ struct qemu_plugin_hwaddr *qemu_plugin_get_hwaddr(qemu_plugin_meminfo_t info,
{
#ifdef CONFIG_SOFTMMU
CPUState *cpu = current_cpu;
- unsigned int mmu_idx = info >> TRACE_MEM_MMU_SHIFT;
- hwaddr_info.is_store = info & TRACE_MEM_ST;
+ unsigned int mmu_idx = get_mmuidx(info);
+ enum qemu_plugin_mem_rw rw = get_plugin_meminfo_rw(info);
+ hwaddr_info.is_store = (rw & QEMU_PLUGIN_MEM_W) != 0;

if (!tlb_plugin_lookup(cpu, vaddr, mmu_idx,
- info & TRACE_MEM_ST, &hwaddr_info)) {
+ hwaddr_info.is_store, &hwaddr_info)) {
error_report("invalid use of qemu_plugin_get_hwaddr");
return NULL;
}
diff --git a/plugins/core.c b/plugins/core.c
index XXXXXXX..XXXXXXX 100644
--- a/plugins/core.c
+++ b/plugins/core.c
@@ -XXX,XX +XXX,XX @@
#include "exec/helper-proto.h"
#include "tcg/tcg.h"
#include "tcg/tcg-op.h"
-#include "trace/mem.h" /* mem_info macros */
#include "plugin.h"
#include "qemu/compiler.h"

@@ -XXX,XX +XXX,XX @@ void exec_inline_op(struct qemu_plugin_dyn_cb *cb)
}
}

-void qemu_plugin_vcpu_mem_cb(CPUState *cpu, uint64_t vaddr, uint32_t info)
+void qemu_plugin_vcpu_mem_cb(CPUState *cpu, uint64_t vaddr,
+ MemOpIdx oi, enum qemu_plugin_mem_rw rw)
{
GArray *arr = cpu->plugin_mem_cbs;
size_t i;
@@ -XXX,XX +XXX,XX @@ void qemu_plugin_vcpu_mem_cb(CPUState *cpu, uint64_t vaddr, uint32_t info)
for (i = 0; i < arr->len; i++) {
struct qemu_plugin_dyn_cb *cb =
&g_array_index(arr, struct qemu_plugin_dyn_cb, i);
- int w = !!(info & TRACE_MEM_ST) + 1;

- if (!(w & cb->rw)) {
+ if (!(rw & cb->rw)) {
break;
}
switch (cb->type) {
case PLUGIN_CB_REGULAR:
- cb->f.vcpu_mem(cpu->cpu_index, info, vaddr, cb->userp);
+ cb->f.vcpu_mem(cpu->cpu_index, make_plugin_meminfo(oi, rw),
+ vaddr, cb->userp);
break;
case PLUGIN_CB_INLINE:
exec_inline_op(cb);
diff --git a/tcg/tcg-op.c b/tcg/tcg-op.c
index XXXXXXX..XXXXXXX 100644
--- a/tcg/tcg-op.c
+++ b/tcg/tcg-op.c
@@ -XXX,XX +XXX,XX @@ static inline TCGv plugin_prep_mem_callbacks(TCGv vaddr)
return vaddr;
}

-static inline void plugin_gen_mem_callbacks(TCGv vaddr, uint16_t info)
+static void plugin_gen_mem_callbacks(TCGv vaddr, MemOpIdx oi,
+ enum qemu_plugin_mem_rw rw)
{
#ifdef CONFIG_PLUGIN
if (tcg_ctx->plugin_insn != NULL) {
+ qemu_plugin_meminfo_t info = make_plugin_meminfo(oi, rw);
plugin_gen_empty_mem_callback(vaddr, info);
tcg_temp_free(vaddr);
}
@@ -XXX,XX +XXX,XX @@ static inline void plugin_gen_mem_callbacks(TCGv vaddr, uint16_t info)
void tcg_gen_qemu_ld_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
{
MemOp orig_memop;
- uint16_t info = trace_mem_get_info(make_memop_idx(memop, idx), 0);
+ MemOpIdx oi;
+ uint16_t info;

tcg_gen_req_mo(TCG_MO_LD_LD | TCG_MO_ST_LD);
memop = tcg_canonicalize_memop(memop, 0, 0);
+ oi = make_memop_idx(memop, idx);
+ info = trace_mem_get_info(oi, 0);
trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);

orig_memop = memop;
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)

addr = plugin_prep_mem_callbacks(addr);
gen_ldst_i32(INDEX_op_qemu_ld_i32, val, addr, memop, idx);
- plugin_gen_mem_callbacks(addr, info);
+ plugin_gen_mem_callbacks(addr, oi, QEMU_PLUGIN_MEM_R);

if ((orig_memop ^ memop) & MO_BSWAP) {
switch (orig_memop & MO_SIZE) {
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
void tcg_gen_qemu_st_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
{
TCGv_i32 swap = NULL;
- uint16_t info = trace_mem_get_info(make_memop_idx(memop, idx), 1);
+ MemOpIdx oi;
+ uint16_t info;

tcg_gen_req_mo(TCG_MO_LD_ST | TCG_MO_ST_ST);
memop = tcg_canonicalize_memop(memop, 0, 1);
+ oi = make_memop_idx(memop, idx);
+ info = trace_mem_get_info(oi, 1);
trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);

if (!TCG_TARGET_HAS_MEMORY_BSWAP && (memop & MO_BSWAP)) {
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_st_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
} else {
gen_ldst_i32(INDEX_op_qemu_st_i32, val, addr, memop, idx);
}
- plugin_gen_mem_callbacks(addr, info);
+ plugin_gen_mem_callbacks(addr, oi, QEMU_PLUGIN_MEM_W);

if (swap) {
tcg_temp_free_i32(swap);
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_st_i32(TCGv_i32 val, TCGv addr, TCGArg idx, MemOp memop)
void tcg_gen_qemu_ld_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)
{
MemOp orig_memop;
+ MemOpIdx oi;
uint16_t info;

if (TCG_TARGET_REG_BITS == 32 && (memop & MO_SIZE) < MO_64) {
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)

tcg_gen_req_mo(TCG_MO_LD_LD | TCG_MO_ST_LD);
memop = tcg_canonicalize_memop(memop, 1, 0);
- info = trace_mem_get_info(make_memop_idx(memop, idx), 0);
+ oi = make_memop_idx(memop, idx);
+ info = trace_mem_get_info(oi, 0);
trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);

orig_memop = memop;
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)

addr = plugin_prep_mem_callbacks(addr);
gen_ldst_i64(INDEX_op_qemu_ld_i64, val, addr, memop, idx);
- plugin_gen_mem_callbacks(addr, info);
+ plugin_gen_mem_callbacks(addr, oi, QEMU_PLUGIN_MEM_R);

if ((orig_memop ^ memop) & MO_BSWAP) {
int flags = (orig_memop & MO_SIGN
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_ld_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)
void tcg_gen_qemu_st_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)
{
TCGv_i64 swap = NULL;
+ MemOpIdx oi;
uint16_t info;

if (TCG_TARGET_REG_BITS == 32 && (memop & MO_SIZE) < MO_64) {
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_st_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)

tcg_gen_req_mo(TCG_MO_LD_ST | TCG_MO_ST_ST);
memop = tcg_canonicalize_memop(memop, 1, 1);
- info = trace_mem_get_info(make_memop_idx(memop, idx), 1);
+ oi = make_memop_idx(memop, idx);
+ info = trace_mem_get_info(oi, 1);
trace_guest_mem_before_tcg(tcg_ctx->cpu, cpu_env, addr, info);

if (!TCG_TARGET_HAS_MEMORY_BSWAP && (memop & MO_BSWAP)) {
@@ -XXX,XX +XXX,XX @@ void tcg_gen_qemu_st_i64(TCGv_i64 val, TCGv addr, TCGArg idx, MemOp memop)

addr = plugin_prep_mem_callbacks(addr);
gen_ldst_i64(INDEX_op_qemu_st_i64, val, addr, memop, idx);
- plugin_gen_mem_callbacks(addr, info);
+ plugin_gen_mem_callbacks(addr, oi, QEMU_PLUGIN_MEM_W);

if (swap) {
tcg_temp_free_i64(swap);
diff --git a/accel/tcg/atomic_common.c.inc b/accel/tcg/atomic_common.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/atomic_common.c.inc
+++ b/accel/tcg/atomic_common.c.inc
@@ -XXX,XX +XXX,XX @@ static void atomic_trace_rmw_pre(CPUArchState *env, target_ulong addr,
static void atomic_trace_rmw_post(CPUArchState *env, target_ulong addr,
MemOpIdx oi)
{
- uint16_t info = trace_mem_get_info(oi, false);
-
- qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, info);
- qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, info | TRACE_MEM_ST);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, oi, QEMU_PLUGIN_MEM_RW);
}

#if HAVE_ATOMIC128
@@ -XXX,XX +XXX,XX @@ static void atomic_trace_ld_pre(CPUArchState *env, target_ulong addr,
static void atomic_trace_ld_post(CPUArchState *env, target_ulong addr,
MemOpIdx oi)
{
- uint16_t info = trace_mem_get_info(oi, false);
-
- qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, info);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, oi, QEMU_PLUGIN_MEM_R);
}

static void atomic_trace_st_pre(CPUArchState *env, target_ulong addr,
@@ -XXX,XX +XXX,XX @@ static void atomic_trace_st_pre(CPUArchState *env, target_ulong addr,
static void atomic_trace_st_post(CPUArchState *env, target_ulong addr,
MemOpIdx oi)
{
- uint16_t info = trace_mem_get_info(oi, false);
-
- qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, info);
+ qemu_plugin_vcpu_mem_cb(env_cpu(env), addr, oi, QEMU_PLUGIN_MEM_W);
}
#endif

-- 
2.25.1

This function has two users, who use it incompatibly.
In tlb_flush_page_by_mmuidx_async_0, when flushing a
single page, we need to flush exactly two pages.
In tlb_flush_range_by_mmuidx_async_0, when flushing a
range of pages, we need to flush N+1 pages.

This avoids double-flushing of jmp cache pages in a range.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
accel/tcg/cputlb.c | 25 ++++++++++++++-----------
1 file changed, 14 insertions(+), 11 deletions(-)

diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ static void tb_jmp_cache_clear_page(CPUState *cpu, target_ulong page_addr)
}
}

-static void tb_flush_jmp_cache(CPUState *cpu, target_ulong addr)
-{
- /* Discard jump cache entries for any tb which might potentially
- overlap the flushed page. */
- tb_jmp_cache_clear_page(cpu, addr - TARGET_PAGE_SIZE);
- tb_jmp_cache_clear_page(cpu, addr);
-}
-
/**
* tlb_mmu_resize_locked() - perform TLB resize bookkeeping; resize if necessary
* @desc: The CPUTLBDesc portion of the TLB
@@ -XXX,XX +XXX,XX @@ static void tlb_flush_page_by_mmuidx_async_0(CPUState *cpu,
}
qemu_spin_unlock(&env_tlb(env)->c.lock);

- tb_flush_jmp_cache(cpu, addr);
+ /*
+ * Discard jump cache entries for any tb which might potentially
+ * overlap the flushed page, which includes the previous.
+ */
+ tb_jmp_cache_clear_page(cpu, addr - TARGET_PAGE_SIZE);
+ tb_jmp_cache_clear_page(cpu, addr);
}

/**
@@ -XXX,XX +XXX,XX @@ static void tlb_flush_range_by_mmuidx_async_0(CPUState *cpu,
return;
}

- for (target_ulong i = 0; i < d.len; i += TARGET_PAGE_SIZE) {
- tb_flush_jmp_cache(cpu, d.addr + i);
+ /*
+ * Discard jump cache entries for any tb which might potentially
+ * overlap the flushed pages, which includes the previous.
+ */
+ d.addr -= TARGET_PAGE_SIZE;
+ for (target_ulong i = 0, n = d.len / TARGET_PAGE_SIZE + 1; i < n; i++) {
+ tb_jmp_cache_clear_page(cpu, d.addr);
+ d.addr += TARGET_PAGE_SIZE;
}
}

-- 
2.34.1
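To see how the new plugin callback arguments recombine into the
qemu_plugin_meminfo_t that plugins receive, here is a minimal standalone
sketch; the helper bodies mirror the ones added to include/qemu/plugin.h
above, and the QEMU_PLUGIN_MEM_* values are assumed to match qemu-plugin.h.

    #include <assert.h>
    #include <stdint.h>

    typedef uint32_t qemu_plugin_meminfo_t;
    typedef uint32_t MemOpIdx;

    enum qemu_plugin_mem_rw {
        QEMU_PLUGIN_MEM_R  = 1,
        QEMU_PLUGIN_MEM_W  = 2,
        QEMU_PLUGIN_MEM_RW = 3,
    };

    /* Mirrors make_plugin_meminfo: MemOpIdx in the low bits, rw above. */
    static qemu_plugin_meminfo_t
    make_plugin_meminfo(MemOpIdx oi, enum qemu_plugin_mem_rw rw)
    {
        return oi | (rw << 16);
    }

    static enum qemu_plugin_mem_rw
    get_plugin_meminfo_rw(qemu_plugin_meminfo_t i)
    {
        return i >> 16;
    }

    int main(void)
    {
        qemu_plugin_meminfo_t info =
            make_plugin_meminfo(0x123, QEMU_PLUGIN_MEM_RW);

        /* A read-modify-write access reports both directions at once. */
        assert(get_plugin_meminfo_rw(info) & QEMU_PLUGIN_MEM_R);
        assert(get_plugin_meminfo_rw(info) & QEMU_PLUGIN_MEM_W);
        return 0;
    }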
Move this code from tcg/tcg.h to its own header.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
include/exec/memopidx.h | 55 +++++++++++++++++++++++++++++++++++++++++
include/tcg/tcg.h | 39 +----------------------------
2 files changed, 56 insertions(+), 38 deletions(-)
create mode 100644 include/exec/memopidx.h

diff --git a/include/exec/memopidx.h b/include/exec/memopidx.h
new file mode 100644
index XXXXXXX..XXXXXXX
--- /dev/null
+++ b/include/exec/memopidx.h
@@ -XXX,XX +XXX,XX @@
+/*
+ * Combine the MemOp and mmu_idx parameters into a single value.
+ *
+ * Authors:
+ *  Richard Henderson <rth@twiddle.net>
+ *
+ * This work is licensed under the terms of the GNU GPL, version 2 or later.
+ * See the COPYING file in the top-level directory.
+ */
+
+#ifndef EXEC_MEMOPIDX_H
+#define EXEC_MEMOPIDX_H 1
+
+#include "exec/memop.h"
+
+typedef uint32_t MemOpIdx;
+
+/**
+ * make_memop_idx
+ * @op: memory operation
+ * @idx: mmu index
+ *
+ * Encode these values into a single parameter.
+ */
+static inline MemOpIdx make_memop_idx(MemOp op, unsigned idx)
+{
+#ifdef CONFIG_DEBUG_TCG
+ assert(idx <= 15);
+#endif
+ return (op << 4) | idx;
+}
+
+/**
+ * get_memop
+ * @oi: combined op/idx parameter
+ *
+ * Extract the memory operation from the combined value.
+ */
+static inline MemOp get_memop(MemOpIdx oi)
+{
+ return oi >> 4;
+}
+
+/**
+ * get_mmuidx
+ * @oi: combined op/idx parameter
+ *
+ * Extract the mmu index from the combined value.
+ */
+static inline unsigned get_mmuidx(MemOpIdx oi)
+{
+ return oi & 15;
+}
+
+#endif
diff --git a/include/tcg/tcg.h b/include/tcg/tcg.h
index XXXXXXX..XXXXXXX 100644
--- a/include/tcg/tcg.h
+++ b/include/tcg/tcg.h
@@ -XXX,XX +XXX,XX @@

#include "cpu.h"
#include "exec/memop.h"
+#include "exec/memopidx.h"
#include "qemu/bitops.h"
#include "qemu/plugin.h"
#include "qemu/queue.h"
@@ -XXX,XX +XXX,XX @@ static inline size_t tcg_current_code_size(TCGContext *s)
return tcg_ptr_byte_diff(s->code_ptr, s->code_buf);
}

-/* Combine the MemOp and mmu_idx parameters into a single value. */
-typedef uint32_t MemOpIdx;
-
-
-/**
- * make_memop_idx
- * @op: memory operation
- * @idx: mmu index
- *
- * Encode these values into a single parameter.
- */
-static inline MemOpIdx make_memop_idx(MemOp op, unsigned idx)
-{
- tcg_debug_assert(idx <= 15);
- return (op << 4) | idx;
-}
-
-/**
- * get_memop
- * @oi: combined op/idx parameter
- *
- * Extract the memory operation from the combined value.
- */
-static inline MemOp get_memop(MemOpIdx oi)
-{
- return oi >> 4;
-}
-
-/**
- * get_mmuidx
- * @oi: combined op/idx parameter
- *
- * Extract the mmu index from the combined value.
- */
-static inline unsigned get_mmuidx(MemOpIdx oi)
-{
- return oi & 15;
-}
-
/**
 * tcg_qemu_tb_exec:
 * @env: pointer to CPUArchState for the CPU
-- 
2.25.1

Wrap the bare TranslationBlock pointer into a structure.

Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
accel/tcg/tb-hash.h | 1 +
accel/tcg/tb-jmp-cache.h | 24 ++++++++++++++++++++++++
include/exec/cpu-common.h | 1 +
include/hw/core/cpu.h | 15 +--------------
include/qemu/typedefs.h | 1 +
accel/stubs/tcg-stub.c | 4 ++++
accel/tcg/cpu-exec.c | 10 +++++++---
accel/tcg/cputlb.c | 9 +++++----
accel/tcg/translate-all.c | 28 +++++++++++++++++++++++++---
hw/core/cpu-common.c | 3 +--
plugins/core.c | 2 +-
trace/control-target.c | 2 +-
12 files changed, 72 insertions(+), 28 deletions(-)
create mode 100644 accel/tcg/tb-jmp-cache.h

diff --git a/accel/tcg/tb-hash.h b/accel/tcg/tb-hash.h
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/tb-hash.h
+++ b/accel/tcg/tb-hash.h
@@ -XXX,XX +XXX,XX @@
#include "exec/cpu-defs.h"
#include "exec/exec-all.h"
#include "qemu/xxhash.h"
+#include "tb-jmp-cache.h"

#ifdef CONFIG_SOFTMMU

diff --git a/accel/tcg/tb-jmp-cache.h b/accel/tcg/tb-jmp-cache.h
new file mode 100644
index XXXXXXX..XXXXXXX
--- /dev/null
+++ b/accel/tcg/tb-jmp-cache.h
@@ -XXX,XX +XXX,XX @@
+/*
+ * The per-CPU TranslationBlock jump cache.
+ *
+ * Copyright (c) 2003 Fabrice Bellard
+ *
+ * SPDX-License-Identifier: GPL-2.0-or-later
+ */
+
+#ifndef ACCEL_TCG_TB_JMP_CACHE_H
+#define ACCEL_TCG_TB_JMP_CACHE_H
+
+#define TB_JMP_CACHE_BITS 12
+#define TB_JMP_CACHE_SIZE (1 << TB_JMP_CACHE_BITS)
+
+/*
+ * Accessed in parallel; all accesses to 'tb' must be atomic.
+ */
+struct CPUJumpCache {
+ struct {
+ TranslationBlock *tb;
+ } array[TB_JMP_CACHE_SIZE];
+};
+
+#endif /* ACCEL_TCG_TB_JMP_CACHE_H */
diff --git a/include/exec/cpu-common.h b/include/exec/cpu-common.h
index XXXXXXX..XXXXXXX 100644
--- a/include/exec/cpu-common.h
+++ b/include/exec/cpu-common.h
@@ -XXX,XX +XXX,XX @@ void cpu_list_unlock(void);
unsigned int cpu_list_generation_id_get(void);

void tcg_flush_softmmu_tlb(CPUState *cs);
+void tcg_flush_jmp_cache(CPUState *cs);

void tcg_iommu_init_notifier_list(CPUState *cpu);
void tcg_iommu_free_notifier_list(CPUState *cpu);
diff --git a/include/hw/core/cpu.h b/include/hw/core/cpu.h
index XXXXXXX..XXXXXXX 100644
--- a/include/hw/core/cpu.h
+++ b/include/hw/core/cpu.h
@@ -XXX,XX +XXX,XX @@ struct kvm_run;
struct hax_vcpu_state;
struct hvf_vcpu_state;

-#define TB_JMP_CACHE_BITS 12
-#define TB_JMP_CACHE_SIZE (1 << TB_JMP_CACHE_BITS)
-
/* work queue */

/* The union type allows passing of 64 bit target pointers on 32 bit
@@ -XXX,XX +XXX,XX @@ struct CPUState {
CPUArchState *env_ptr;
IcountDecr *icount_decr_ptr;

- /* Accessed in parallel; all accesses must be atomic */
- TranslationBlock *tb_jmp_cache[TB_JMP_CACHE_SIZE];
+ CPUJumpCache *tb_jmp_cache;

struct GDBRegisterState *gdb_regs;
int gdb_num_regs;
@@ -XXX,XX +XXX,XX @@ extern CPUTailQ cpus;

extern __thread CPUState *current_cpu;

-static inline void cpu_tb_jmp_cache_clear(CPUState *cpu)
-{
- unsigned int i;
-
- for (i = 0; i < TB_JMP_CACHE_SIZE; i++) {
- qatomic_set(&cpu->tb_jmp_cache[i], NULL);
- }
-}
-
/**
 * qemu_tcg_mttcg_enabled:
 * Check whether we are running MultiThread TCG or not.
diff --git a/include/qemu/typedefs.h b/include/qemu/typedefs.h
index XXXXXXX..XXXXXXX 100644
--- a/include/qemu/typedefs.h
+++ b/include/qemu/typedefs.h
@@ -XXX,XX +XXX,XX @@ typedef struct CoMutex CoMutex;
typedef struct ConfidentialGuestSupport ConfidentialGuestSupport;
typedef struct CPUAddressSpace CPUAddressSpace;
typedef struct CPUArchState CPUArchState;
+typedef struct CPUJumpCache CPUJumpCache;
typedef struct CPUState CPUState;
typedef struct CPUTLBEntryFull CPUTLBEntryFull;
typedef struct DeviceListener DeviceListener;
diff --git a/accel/stubs/tcg-stub.c b/accel/stubs/tcg-stub.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/stubs/tcg-stub.c
+++ b/accel/stubs/tcg-stub.c
@@ -XXX,XX +XXX,XX @@ void tlb_set_dirty(CPUState *cpu, target_ulong vaddr)
{
}

+void tcg_flush_jmp_cache(CPUState *cpu)
+{
+}
+
int probe_access_flags(CPUArchState *env, target_ulong addr,
MMUAccessType access_type, int mmu_idx,
bool nonfault, void **phost, uintptr_t retaddr)
diff --git a/accel/tcg/cpu-exec.c b/accel/tcg/cpu-exec.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cpu-exec.c
+++ b/accel/tcg/cpu-exec.c
@@ -XXX,XX +XXX,XX @@
#include "sysemu/replay.h"
#include "sysemu/tcg.h"
#include "exec/helper-proto.h"
+#include "tb-jmp-cache.h"
#include "tb-hash.h"
#include "tb-context.h"
#include "internal.h"
@@ -XXX,XX +XXX,XX @@ static inline TranslationBlock *tb_lookup(CPUState *cpu, target_ulong pc,
tcg_debug_assert(!(cflags & CF_INVALID));

hash = tb_jmp_cache_hash_func(pc);
- tb = qatomic_rcu_read(&cpu->tb_jmp_cache[hash]);
+ tb = qatomic_rcu_read(&cpu->tb_jmp_cache->array[hash].tb);

if (likely(tb &&
tb->pc == pc &&
@@ -XXX,XX +XXX,XX @@ static inline TranslationBlock *tb_lookup(CPUState *cpu, target_ulong pc,
if (tb == NULL) {
return NULL;
}
- qatomic_set(&cpu->tb_jmp_cache[hash], tb);
+ qatomic_set(&cpu->tb_jmp_cache->array[hash].tb, tb);
return tb;
}

@@ -XXX,XX +XXX,XX @@ int cpu_exec(CPUState *cpu)

tb = tb_lookup(cpu, pc, cs_base, flags, cflags);
if (tb == NULL) {
+ uint32_t h;
+
mmap_lock();
tb = tb_gen_code(cpu, pc, cs_base, flags, cflags);
mmap_unlock();
@@ -XXX,XX +XXX,XX @@ int cpu_exec(CPUState *cpu)
* We add the TB in the virtual pc hash table
* for the fast lookup
*/
- qatomic_set(&cpu->tb_jmp_cache[tb_jmp_cache_hash_func(pc)], tb);
+ h = tb_jmp_cache_hash_func(pc);
+ qatomic_set(&cpu->tb_jmp_cache->array[h].tb, tb);
}

#ifndef CONFIG_USER_ONLY
diff --git a/accel/tcg/cputlb.c b/accel/tcg/cputlb.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cputlb.c
+++ b/accel/tcg/cputlb.c
@@ -XXX,XX +XXX,XX @@ static void tlb_window_reset(CPUTLBDesc *desc, int64_t ns,

static void tb_jmp_cache_clear_page(CPUState *cpu, target_ulong page_addr)
{
- unsigned int i, i0 = tb_jmp_cache_hash_page(page_addr);
+ int i, i0 = tb_jmp_cache_hash_page(page_addr);
+ CPUJumpCache *jc = cpu->tb_jmp_cache;

for (i = 0; i < TB_JMP_PAGE_SIZE; i++) {
- qatomic_set(&cpu->tb_jmp_cache[i0 + i], NULL);
+ qatomic_set(&jc->array[i0 + i].tb, NULL);
}
}

@@ -XXX,XX +XXX,XX @@ static void tlb_flush_by_mmuidx_async_work(CPUState *cpu, run_on_cpu_data data)

qemu_spin_unlock(&env_tlb(env)->c.lock);

- cpu_tb_jmp_cache_clear(cpu);
+ tcg_flush_jmp_cache(cpu);

if (to_clean == ALL_MMUIDX_BITS) {
qatomic_set(&env_tlb(env)->c.full_flush_count,
@@ -XXX,XX +XXX,XX @@ static void tlb_flush_range_by_mmuidx_async_0(CPUState *cpu,
* longer to clear each entry individually than it will to clear it all.
*/
if (d.len >= (TARGET_PAGE_SIZE * TB_JMP_CACHE_SIZE)) {
- cpu_tb_jmp_cache_clear(cpu);
+ tcg_flush_jmp_cache(cpu);
return;
}

diff --git a/accel/tcg/translate-all.c b/accel/tcg/translate-all.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/translate-all.c
+++ b/accel/tcg/translate-all.c
@@ -XXX,XX +XXX,XX @@
#include "sysemu/tcg.h"
#include "qapi/error.h"
#include "hw/core/tcg-cpu-ops.h"
+#include "tb-jmp-cache.h"
#include "tb-hash.h"
#include "tb-context.h"
#include "internal.h"
@@ -XXX,XX +XXX,XX @@ static void do_tb_flush(CPUState *cpu, run_on_cpu_data tb_flush_count)
}

CPU_FOREACH(cpu) {
- cpu_tb_jmp_cache_clear(cpu);
+ tcg_flush_jmp_cache(cpu);
}

qht_reset_size(&tb_ctx.htable, CODE_GEN_HTABLE_SIZE);
@@ -XXX,XX +XXX,XX @@ static void do_tb_phys_invalidate(TranslationBlock *tb, bool rm_from_page_list)
/* remove the TB from the hash list */
h = tb_jmp_cache_hash_func(tb->pc);
CPU_FOREACH(cpu) {
- if (qatomic_read(&cpu->tb_jmp_cache[h]) == tb) {
- qatomic_set(&cpu->tb_jmp_cache[h], NULL);
+ CPUJumpCache *jc = cpu->tb_jmp_cache;
+ if (qatomic_read(&jc->array[h].tb) == tb) {
+ qatomic_set(&jc->array[h].tb, NULL);
}
}

@@ -XXX,XX +XXX,XX @@ int page_unprotect(target_ulong address, uintptr_t pc)
}
#endif /* CONFIG_USER_ONLY */

+/*
+ * Called by generic code at e.g. cpu reset after cpu creation,
+ * therefore we must be prepared to allocate the jump cache.
+ */
+void tcg_flush_jmp_cache(CPUState *cpu)
+{
+ CPUJumpCache *jc = cpu->tb_jmp_cache;
+
+ if (likely(jc)) {
+ for (int i = 0; i < TB_JMP_CACHE_SIZE; i++) {
+ qatomic_set(&jc->array[i].tb, NULL);
+ }
+ } else {
+ /* This should happen once during realize, and thus never race. */
+ jc = g_new0(CPUJumpCache, 1);
+ jc = qatomic_xchg(&cpu->tb_jmp_cache, jc);
+ assert(jc == NULL);
+ }
+}
+
/* This is a wrapper for common code that can not use CONFIG_SOFTMMU */
void tcg_flush_softmmu_tlb(CPUState *cs)
{
diff --git a/hw/core/cpu-common.c b/hw/core/cpu-common.c
index XXXXXXX..XXXXXXX 100644
--- a/hw/core/cpu-common.c
+++ b/hw/core/cpu-common.c
@@ -XXX,XX +XXX,XX @@ static void cpu_common_reset(DeviceState *dev)
cpu->cflags_next_tb = -1;

if (tcg_enabled()) {
- cpu_tb_jmp_cache_clear(cpu);
-
+ tcg_flush_jmp_cache(cpu);
tcg_flush_softmmu_tlb(cpu);
}
}
diff --git a/plugins/core.c b/plugins/core.c
index XXXXXXX..XXXXXXX 100644
--- a/plugins/core.c
+++ b/plugins/core.c
@@ -XXX,XX +XXX,XX @@ struct qemu_plugin_ctx *plugin_id_to_ctx_locked(qemu_plugin_id_t id)
static void plugin_cpu_update__async(CPUState *cpu, run_on_cpu_data data)
{
bitmap_copy(cpu->plugin_mask, &data.host_ulong, QEMU_PLUGIN_EV_MAX);
- cpu_tb_jmp_cache_clear(cpu);
+ tcg_flush_jmp_cache(cpu);
}

static void plugin_cpu_update__locked(gpointer k, gpointer v, gpointer udata)
diff --git a/trace/control-target.c b/trace/control-target.c
index XXXXXXX..XXXXXXX 100644
--- a/trace/control-target.c
+++ b/trace/control-target.c
@@ -XXX,XX +XXX,XX @@ static void trace_event_synchronize_vcpu_state_dynamic(
{
bitmap_copy(vcpu->trace_dstate, vcpu->trace_dstate_delayed,
CPU_TRACE_DSTATE_MAX_EVENTS);
- cpu_tb_jmp_cache_clear(vcpu);
+ tcg_flush_jmp_cache(vcpu);
}

void trace_event_set_vcpu_state_dynamic(CPUState *vcpu,
-- 
2.34.1
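A rough standalone model of the CPUJumpCache introduced above, with QEMU's
qatomic_*() reduced to C11 atomics purely for illustration; the size macros
and struct layout follow the new tb-jmp-cache.h, but this is a sketch, not
the in-tree code.

    #include <stdatomic.h>
    #include <stddef.h>

    #define TB_JMP_CACHE_BITS 12
    #define TB_JMP_CACHE_SIZE (1 << TB_JMP_CACHE_BITS)

    typedef struct TranslationBlock TranslationBlock;

    /* Accessed in parallel; all accesses to 'tb' must be atomic. */
    struct CPUJumpCache {
        struct {
            TranslationBlock *_Atomic tb;
        } array[TB_JMP_CACHE_SIZE];
    };

    /* Clear every entry, as tcg_flush_jmp_cache does once allocated. */
    static void jmp_cache_flush(struct CPUJumpCache *jc)
    {
        for (int i = 0; i < TB_JMP_CACHE_SIZE; i++) {
            atomic_store_explicit(&jc->array[i].tb, NULL,
                                  memory_order_relaxed);
        }
    }

    int main(void)
    {
        static struct CPUJumpCache jc; /* zero-initialized, like g_new0 */
        jmp_cache_flush(&jc);
        return 0;
    }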
1
Reviewed-by: David Hildenbrand <david@redhat.com>
1
Populate this new method for all targets. Always match
2
the result that would be given by cpu_get_tb_cpu_state,
3
as we will want these values to correspond in the logs.
4
5
Reviewed-by: Taylor Simpson <tsimpson@quicinc.com>
6
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
7
Reviewed-by: Mark Cave-Ayland <mark.cave-ayland@ilande.co.uk> (target/sparc)
2
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
8
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
3
---
9
---
4
tcg/s390x/tcg-target.c.inc | 132 +++++++++++++++++++++++++++++++++----
10
Cc: Eduardo Habkost <eduardo@habkost.net> (supporter:Machine core)
5
1 file changed, 120 insertions(+), 12 deletions(-)
11
Cc: Marcel Apfelbaum <marcel.apfelbaum@gmail.com> (supporter:Machine core)
12
Cc: "Philippe Mathieu-Daudé" <f4bug@amsat.org> (reviewer:Machine core)
13
Cc: Yanan Wang <wangyanan55@huawei.com> (reviewer:Machine core)
14
Cc: Michael Rolnik <mrolnik@gmail.com> (maintainer:AVR TCG CPUs)
15
Cc: "Edgar E. Iglesias" <edgar.iglesias@gmail.com> (maintainer:CRIS TCG CPUs)
16
Cc: Taylor Simpson <tsimpson@quicinc.com> (supporter:Hexagon TCG CPUs)
17
Cc: Song Gao <gaosong@loongson.cn> (maintainer:LoongArch TCG CPUs)
18
Cc: Xiaojuan Yang <yangxiaojuan@loongson.cn> (maintainer:LoongArch TCG CPUs)
19
Cc: Laurent Vivier <laurent@vivier.eu> (maintainer:M68K TCG CPUs)
20
Cc: Jiaxun Yang <jiaxun.yang@flygoat.com> (reviewer:MIPS TCG CPUs)
21
Cc: Aleksandar Rikalo <aleksandar.rikalo@syrmia.com> (reviewer:MIPS TCG CPUs)
22
Cc: Chris Wulff <crwulff@gmail.com> (maintainer:NiosII TCG CPUs)
23
Cc: Marek Vasut <marex@denx.de> (maintainer:NiosII TCG CPUs)
24
Cc: Stafford Horne <shorne@gmail.com> (odd fixer:OpenRISC TCG CPUs)
25
Cc: Yoshinori Sato <ysato@users.sourceforge.jp> (reviewer:RENESAS RX CPUs)
26
Cc: Mark Cave-Ayland <mark.cave-ayland@ilande.co.uk> (maintainer:SPARC TCG CPUs)
27
Cc: Bastian Koppelmann <kbastian@mail.uni-paderborn.de> (maintainer:TriCore TCG CPUs)
28
Cc: Max Filippov <jcmvbkbc@gmail.com> (maintainer:Xtensa TCG CPUs)
29
Cc: qemu-arm@nongnu.org (open list:ARM TCG CPUs)
30
Cc: qemu-ppc@nongnu.org (open list:PowerPC TCG CPUs)
31
Cc: qemu-riscv@nongnu.org (open list:RISC-V TCG CPUs)
32
Cc: qemu-s390x@nongnu.org (open list:S390 TCG CPUs)
33
---
34
include/hw/core/cpu.h | 3 +++
35
target/alpha/cpu.c | 9 +++++++++
36
target/arm/cpu.c | 13 +++++++++++++
37
target/avr/cpu.c | 8 ++++++++
38
target/cris/cpu.c | 8 ++++++++
39
target/hexagon/cpu.c | 8 ++++++++
40
target/hppa/cpu.c | 8 ++++++++
41
target/i386/cpu.c | 9 +++++++++
42
target/loongarch/cpu.c | 9 +++++++++
43
target/m68k/cpu.c | 8 ++++++++
44
target/microblaze/cpu.c | 8 ++++++++
45
target/mips/cpu.c | 8 ++++++++
46
target/nios2/cpu.c | 9 +++++++++
47
target/openrisc/cpu.c | 8 ++++++++
48
target/ppc/cpu_init.c | 8 ++++++++
49
target/riscv/cpu.c | 13 +++++++++++++
50
target/rx/cpu.c | 8 ++++++++
51
target/s390x/cpu.c | 8 ++++++++
52
target/sh4/cpu.c | 8 ++++++++
53
target/sparc/cpu.c | 8 ++++++++
54
target/tricore/cpu.c | 9 +++++++++
55
target/xtensa/cpu.c | 8 ++++++++
56
22 files changed, 186 insertions(+)
6
57
7
diff --git a/tcg/s390x/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
58
diff --git a/include/hw/core/cpu.h b/include/hw/core/cpu.h
8
index XXXXXXX..XXXXXXX 100644
59
index XXXXXXX..XXXXXXX 100644
9
--- a/tcg/s390x/tcg-target.c.inc
60
--- a/include/hw/core/cpu.h
10
+++ b/tcg/s390x/tcg-target.c.inc
61
+++ b/include/hw/core/cpu.h
11
@@ -XXX,XX +XXX,XX @@ typedef enum S390Opcode {
62
@@ -XXX,XX +XXX,XX @@ struct SysemuCPUOps;
12
RX_STC = 0x42,
63
* If the target behaviour here is anything other than "set
13
RX_STH = 0x40,
64
* the PC register to the value passed in" then the target must
14
65
* also implement the synchronize_from_tb hook.
15
+ VRX_VL = 0xe706,
66
+ * @get_pc: Callback for getting the Program Counter register.
16
+ VRX_VLLEZ = 0xe704,
67
+ * As above, with the semantics of the target architecture.
17
+ VRX_VST = 0xe70e,
68
* @gdb_read_register: Callback for letting GDB read a register.
18
+ VRX_VSTEF = 0xe70b,
69
* @gdb_write_register: Callback for letting GDB write a register.
19
+ VRX_VSTEG = 0xe70a,
70
* @gdb_adjust_breakpoint: Callback for adjusting the address of a
20
+
71
@@ -XXX,XX +XXX,XX @@ struct CPUClass {
21
NOP = 0x0707,
72
void (*dump_state)(CPUState *cpu, FILE *, int flags);
22
} S390Opcode;
73
int64_t (*get_arch_id)(CPUState *cpu);
23
74
void (*set_pc)(CPUState *cpu, vaddr value);
24
@@ -XXX,XX +XXX,XX @@ static void * const qemu_st_helpers[(MO_SIZE | MO_BSWAP) + 1] = {
75
+ vaddr (*get_pc)(CPUState *cpu);
25
static const tcg_insn_unit *tb_ret_addr;
76
int (*gdb_read_register)(CPUState *cpu, GByteArray *buf, int reg);
26
uint64_t s390_facilities[3];
77
int (*gdb_write_register)(CPUState *cpu, uint8_t *buf, int reg);
27
78
vaddr (*gdb_adjust_breakpoint)(CPUState *cpu, vaddr addr);
28
+static inline bool is_general_reg(TCGReg r)
79
diff --git a/target/alpha/cpu.c b/target/alpha/cpu.c
29
+{
80
index XXXXXXX..XXXXXXX 100644
30
+ return r <= TCG_REG_R15;
81
--- a/target/alpha/cpu.c
31
+}
82
+++ b/target/alpha/cpu.c
32
+
83
@@ -XXX,XX +XXX,XX @@ static void alpha_cpu_set_pc(CPUState *cs, vaddr value)
33
+static inline bool is_vector_reg(TCGReg r)
84
cpu->env.pc = value;
34
+{
85
}
35
+ return r >= TCG_REG_V0 && r <= TCG_REG_V31;
86
36
+}
87
+static vaddr alpha_cpu_get_pc(CPUState *cs)
37
+
88
+{
38
static bool patch_reloc(tcg_insn_unit *src_rw, int type,
89
+ AlphaCPU *cpu = ALPHA_CPU(cs);
39
intptr_t value, intptr_t addend)
90
+
40
{
91
+ return cpu->env.pc;
41
@@ -XXX,XX +XXX,XX @@ static void tcg_out_insn_RSY(TCGContext *s, S390Opcode op, TCGReg r1,
92
+}
42
#define tcg_out_insn_RX tcg_out_insn_RS
93
+
43
#define tcg_out_insn_RXY tcg_out_insn_RSY
94
+
44
95
static bool alpha_cpu_has_work(CPUState *cs)
45
+static int RXB(TCGReg v1, TCGReg v2, TCGReg v3, TCGReg v4)
96
{
46
+{
97
/* Here we are checking to see if the CPU should wake up from HALT.
47
+ /*
98
@@ -XXX,XX +XXX,XX @@ static void alpha_cpu_class_init(ObjectClass *oc, void *data)
48
+ * Shift bit 4 of each regno to its corresponding bit of RXB.
99
cc->has_work = alpha_cpu_has_work;
49
+ * RXB itself begins at bit 8 of the instruction so 8 - 4 = 4
100
cc->dump_state = alpha_cpu_dump_state;
50
+ * is the left-shift of the 4th operand.
101
cc->set_pc = alpha_cpu_set_pc;
51
+ */
102
+ cc->get_pc = alpha_cpu_get_pc;
52
+ return ((v1 & 0x10) << (4 + 3))
103
cc->gdb_read_register = alpha_cpu_gdb_read_register;
53
+ | ((v2 & 0x10) << (4 + 2))
104
cc->gdb_write_register = alpha_cpu_gdb_write_register;
54
+ | ((v3 & 0x10) << (4 + 1))
105
#ifndef CONFIG_USER_ONLY
55
+ | ((v4 & 0x10) << (4 + 0));
106
diff --git a/target/arm/cpu.c b/target/arm/cpu.c
56
+}
107
index XXXXXXX..XXXXXXX 100644
57
+
108
--- a/target/arm/cpu.c
58
+static void tcg_out_insn_VRX(TCGContext *s, S390Opcode op, TCGReg v1,
109
+++ b/target/arm/cpu.c
59
+ TCGReg b2, TCGReg x2, intptr_t d2, int m3)
110
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_set_pc(CPUState *cs, vaddr value)
60
+{
61
+ tcg_debug_assert(is_vector_reg(v1));
62
+ tcg_debug_assert(d2 >= 0 && d2 <= 0xfff);
63
+ tcg_debug_assert(is_general_reg(x2));
64
+ tcg_debug_assert(is_general_reg(b2));
65
+ tcg_out16(s, (op & 0xff00) | ((v1 & 0xf) << 4) | x2);
66
+ tcg_out16(s, (b2 << 12) | d2);
67
+ tcg_out16(s, (op & 0x00ff) | RXB(v1, 0, 0, 0) | (m3 << 12));
68
+}
69
+
70
/* Emit an opcode with "type-checking" of the format. */
71
#define tcg_out_insn(S, FMT, OP, ...) \
72
glue(tcg_out_insn_,FMT)(S, glue(glue(FMT,_),OP), ## __VA_ARGS__)
73
@@ -XXX,XX +XXX,XX @@ static void tcg_out_mem(TCGContext *s, S390Opcode opc_rx, S390Opcode opc_rxy,
74
}
111
}
75
}
112
}
76
113
77
+static void tcg_out_vrx_mem(TCGContext *s, S390Opcode opc_vrx,
114
+static vaddr arm_cpu_get_pc(CPUState *cs)
78
+ TCGReg data, TCGReg base, TCGReg index,
115
+{
79
+ tcg_target_long ofs, int m3)
116
+ ARMCPU *cpu = ARM_CPU(cs);
80
+{
117
+ CPUARMState *env = &cpu->env;
81
+ if (ofs < 0 || ofs >= 0x1000) {
118
+
82
+ if (ofs >= -0x80000 && ofs < 0x80000) {
119
+ if (is_a64(env)) {
83
+ tcg_out_insn(s, RXY, LAY, TCG_TMP0, base, index, ofs);
120
+ return env->pc;
84
+ base = TCG_TMP0;
121
+ } else {
85
+ index = TCG_REG_NONE;
122
+ return env->regs[15];
86
+ ofs = 0;
87
+ } else {
88
+ tcg_out_movi(s, TCG_TYPE_PTR, TCG_TMP0, ofs);
89
+ if (index != TCG_REG_NONE) {
90
+ tcg_out_insn(s, RRE, AGR, TCG_TMP0, index);
91
+ }
92
+ index = TCG_TMP0;
93
+ ofs = 0;
94
+ }
95
+ }
123
+ }
96
+ tcg_out_insn_VRX(s, opc_vrx, data, base, index, ofs, m3);
124
+}
97
+}
125
+
98
126
#ifdef CONFIG_TCG
99
/* load data without address translation or endianness conversion */
127
void arm_cpu_synchronize_from_tb(CPUState *cs,
100
-static inline void tcg_out_ld(TCGContext *s, TCGType type, TCGReg data,
128
const TranslationBlock *tb)
101
- TCGReg base, intptr_t ofs)
129
@@ -XXX,XX +XXX,XX @@ static void arm_cpu_class_init(ObjectClass *oc, void *data)
102
+static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg data,
130
cc->has_work = arm_cpu_has_work;
103
+ TCGReg base, intptr_t ofs)
131
cc->dump_state = arm_cpu_dump_state;
104
{
132
cc->set_pc = arm_cpu_set_pc;
105
- if (type == TCG_TYPE_I32) {
133
+ cc->get_pc = arm_cpu_get_pc;
106
- tcg_out_mem(s, RX_L, RXY_LY, data, base, TCG_REG_NONE, ofs);
134
cc->gdb_read_register = arm_cpu_gdb_read_register;
107
- } else {
135
cc->gdb_write_register = arm_cpu_gdb_write_register;
108
- tcg_out_mem(s, 0, RXY_LG, data, base, TCG_REG_NONE, ofs);
136
#ifndef CONFIG_USER_ONLY
109
+ switch (type) {
137
diff --git a/target/avr/cpu.c b/target/avr/cpu.c
110
+ case TCG_TYPE_I32:
138
index XXXXXXX..XXXXXXX 100644
111
+ if (likely(is_general_reg(data))) {
139
--- a/target/avr/cpu.c
112
+ tcg_out_mem(s, RX_L, RXY_LY, data, base, TCG_REG_NONE, ofs);
140
+++ b/target/avr/cpu.c
113
+ break;
141
@@ -XXX,XX +XXX,XX @@ static void avr_cpu_set_pc(CPUState *cs, vaddr value)
114
+ }
142
cpu->env.pc_w = value / 2; /* internally PC points to words */
115
+ tcg_out_vrx_mem(s, VRX_VLLEZ, data, base, TCG_REG_NONE, ofs, MO_32);
143
}
116
+ break;
144
117
+
145
+static vaddr avr_cpu_get_pc(CPUState *cs)
118
+ case TCG_TYPE_I64:
146
+{
119
+ if (likely(is_general_reg(data))) {
147
+ AVRCPU *cpu = AVR_CPU(cs);
120
+ tcg_out_mem(s, 0, RXY_LG, data, base, TCG_REG_NONE, ofs);
148
+
121
+ break;
149
+ return cpu->env.pc_w * 2;
122
+ }
150
+}
123
+ /* fallthru */
151
+
124
+
152
static bool avr_cpu_has_work(CPUState *cs)
125
+ case TCG_TYPE_V64:
153
{
126
+ tcg_out_vrx_mem(s, VRX_VLLEZ, data, base, TCG_REG_NONE, ofs, MO_64);
154
AVRCPU *cpu = AVR_CPU(cs);
127
+ break;
155
@@ -XXX,XX +XXX,XX @@ static void avr_cpu_class_init(ObjectClass *oc, void *data)
128
+
156
cc->has_work = avr_cpu_has_work;
129
+ case TCG_TYPE_V128:
157
cc->dump_state = avr_cpu_dump_state;
130
+ /* Hint quadword aligned. */
158
cc->set_pc = avr_cpu_set_pc;
131
+ tcg_out_vrx_mem(s, VRX_VL, data, base, TCG_REG_NONE, ofs, 4);
159
+ cc->get_pc = avr_cpu_get_pc;
132
+ break;
160
dc->vmsd = &vms_avr_cpu;
133
+
161
cc->sysemu_ops = &avr_sysemu_ops;
134
+ default:
162
cc->disas_set_info = avr_cpu_disas_set_info;
135
+ g_assert_not_reached();
163
diff --git a/target/cris/cpu.c b/target/cris/cpu.c
164
index XXXXXXX..XXXXXXX 100644
165
--- a/target/cris/cpu.c
166
+++ b/target/cris/cpu.c
167
@@ -XXX,XX +XXX,XX @@ static void cris_cpu_set_pc(CPUState *cs, vaddr value)
168
cpu->env.pc = value;
169
}
170
171
+static vaddr cris_cpu_get_pc(CPUState *cs)
172
+{
173
+ CRISCPU *cpu = CRIS_CPU(cs);
174
+
175
+ return cpu->env.pc;
176
+}
177
+
178
static bool cris_cpu_has_work(CPUState *cs)
179
{
180
return cs->interrupt_request & (CPU_INTERRUPT_HARD | CPU_INTERRUPT_NMI);
181
@@ -XXX,XX +XXX,XX @@ static void cris_cpu_class_init(ObjectClass *oc, void *data)
182
cc->has_work = cris_cpu_has_work;
183
cc->dump_state = cris_cpu_dump_state;
184
cc->set_pc = cris_cpu_set_pc;
185
+ cc->get_pc = cris_cpu_get_pc;
186
cc->gdb_read_register = cris_cpu_gdb_read_register;
187
cc->gdb_write_register = cris_cpu_gdb_write_register;
188
#ifndef CONFIG_USER_ONLY
189
diff --git a/target/hexagon/cpu.c b/target/hexagon/cpu.c
190
index XXXXXXX..XXXXXXX 100644
191
--- a/target/hexagon/cpu.c
192
+++ b/target/hexagon/cpu.c
193
@@ -XXX,XX +XXX,XX @@ static void hexagon_cpu_set_pc(CPUState *cs, vaddr value)
194
env->gpr[HEX_REG_PC] = value;
195
}
196
197
+static vaddr hexagon_cpu_get_pc(CPUState *cs)
198
+{
199
+ HexagonCPU *cpu = HEXAGON_CPU(cs);
200
+ CPUHexagonState *env = &cpu->env;
201
+ return env->gpr[HEX_REG_PC];
202
+}
203
+
204
static void hexagon_cpu_synchronize_from_tb(CPUState *cs,
205
const TranslationBlock *tb)
206
{
207
@@ -XXX,XX +XXX,XX @@ static void hexagon_cpu_class_init(ObjectClass *c, void *data)
208
cc->has_work = hexagon_cpu_has_work;
209
cc->dump_state = hexagon_dump_state;
210
cc->set_pc = hexagon_cpu_set_pc;
211
+ cc->get_pc = hexagon_cpu_get_pc;
212
cc->gdb_read_register = hexagon_gdb_read_register;
213
cc->gdb_write_register = hexagon_gdb_write_register;
214
cc->gdb_num_core_regs = TOTAL_PER_THREAD_REGS + NUM_VREGS + NUM_QREGS;
215
diff --git a/target/hppa/cpu.c b/target/hppa/cpu.c
216
index XXXXXXX..XXXXXXX 100644
217
--- a/target/hppa/cpu.c
218
+++ b/target/hppa/cpu.c
219
@@ -XXX,XX +XXX,XX @@ static void hppa_cpu_set_pc(CPUState *cs, vaddr value)
220
cpu->env.iaoq_b = value + 4;
221
}
222
223
+static vaddr hppa_cpu_get_pc(CPUState *cs)
224
+{
225
+ HPPACPU *cpu = HPPA_CPU(cs);
226
+
227
+ return cpu->env.iaoq_f;
228
+}
229
+
230
static void hppa_cpu_synchronize_from_tb(CPUState *cs,
231
const TranslationBlock *tb)
232
{
233
@@ -XXX,XX +XXX,XX @@ static void hppa_cpu_class_init(ObjectClass *oc, void *data)
234
cc->has_work = hppa_cpu_has_work;
235
cc->dump_state = hppa_cpu_dump_state;
236
cc->set_pc = hppa_cpu_set_pc;
237
+ cc->get_pc = hppa_cpu_get_pc;
238
cc->gdb_read_register = hppa_cpu_gdb_read_register;
239
cc->gdb_write_register = hppa_cpu_gdb_write_register;
240
#ifndef CONFIG_USER_ONLY
241
diff --git a/target/i386/cpu.c b/target/i386/cpu.c
242
index XXXXXXX..XXXXXXX 100644
243
--- a/target/i386/cpu.c
244
+++ b/target/i386/cpu.c
245
@@ -XXX,XX +XXX,XX @@ static void x86_cpu_set_pc(CPUState *cs, vaddr value)
246
cpu->env.eip = value;
247
}
248
249
+static vaddr x86_cpu_get_pc(CPUState *cs)
250
+{
251
+ X86CPU *cpu = X86_CPU(cs);
252
+
253
+ /* Match cpu_get_tb_cpu_state. */
254
+ return cpu->env.eip + cpu->env.segs[R_CS].base;
255
+}
256
+
257
int x86_cpu_pending_interrupt(CPUState *cs, int interrupt_request)
258
{
259
X86CPU *cpu = X86_CPU(cs);
260
@@ -XXX,XX +XXX,XX @@ static void x86_cpu_common_class_init(ObjectClass *oc, void *data)
261
cc->has_work = x86_cpu_has_work;
262
cc->dump_state = x86_cpu_dump_state;
263
cc->set_pc = x86_cpu_set_pc;
264
+ cc->get_pc = x86_cpu_get_pc;
265
cc->gdb_read_register = x86_cpu_gdb_read_register;
266
cc->gdb_write_register = x86_cpu_gdb_write_register;
267
cc->get_arch_id = x86_cpu_get_arch_id;
268
diff --git a/target/loongarch/cpu.c b/target/loongarch/cpu.c
269
index XXXXXXX..XXXXXXX 100644
270
--- a/target/loongarch/cpu.c
271
+++ b/target/loongarch/cpu.c
272
@@ -XXX,XX +XXX,XX @@ static void loongarch_cpu_set_pc(CPUState *cs, vaddr value)
273
env->pc = value;
274
}
275
276
+static vaddr loongarch_cpu_get_pc(CPUState *cs)
277
+{
278
+ LoongArchCPU *cpu = LOONGARCH_CPU(cs);
279
+ CPULoongArchState *env = &cpu->env;
280
+
281
+ return env->pc;
282
+}
283
+
284
#ifndef CONFIG_USER_ONLY
285
#include "hw/loongarch/virt.h"

@@ -XXX,XX +XXX,XX @@ static void loongarch_cpu_class_init(ObjectClass *c, void *data)
cc->has_work = loongarch_cpu_has_work;
cc->dump_state = loongarch_cpu_dump_state;
cc->set_pc = loongarch_cpu_set_pc;
+ cc->get_pc = loongarch_cpu_get_pc;
#ifndef CONFIG_USER_ONLY
dc->vmsd = &vmstate_loongarch_cpu;
cc->sysemu_ops = &loongarch_sysemu_ops;
diff --git a/target/m68k/cpu.c b/target/m68k/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/m68k/cpu.c
+++ b/target/m68k/cpu.c
@@ -XXX,XX +XXX,XX @@ static void m68k_cpu_set_pc(CPUState *cs, vaddr value)
cpu->env.pc = value;
}

+static vaddr m68k_cpu_get_pc(CPUState *cs)
+{
+ M68kCPU *cpu = M68K_CPU(cs);
+
+ return cpu->env.pc;
+}
+
static bool m68k_cpu_has_work(CPUState *cs)
{
return cs->interrupt_request & CPU_INTERRUPT_HARD;
@@ -XXX,XX +XXX,XX @@ static void m68k_cpu_class_init(ObjectClass *c, void *data)
cc->has_work = m68k_cpu_has_work;
cc->dump_state = m68k_cpu_dump_state;
cc->set_pc = m68k_cpu_set_pc;
+ cc->get_pc = m68k_cpu_get_pc;
cc->gdb_read_register = m68k_cpu_gdb_read_register;
cc->gdb_write_register = m68k_cpu_gdb_write_register;
#if defined(CONFIG_SOFTMMU)
diff --git a/target/microblaze/cpu.c b/target/microblaze/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/microblaze/cpu.c
+++ b/target/microblaze/cpu.c
@@ -XXX,XX +XXX,XX @@ static void mb_cpu_set_pc(CPUState *cs, vaddr value)
cpu->env.iflags = 0;
}

+static vaddr mb_cpu_get_pc(CPUState *cs)
+{
+ MicroBlazeCPU *cpu = MICROBLAZE_CPU(cs);
+
+ return cpu->env.pc;
+}
+
static void mb_cpu_synchronize_from_tb(CPUState *cs,
const TranslationBlock *tb)
{
@@ -XXX,XX +XXX,XX @@ static void mb_cpu_class_init(ObjectClass *oc, void *data)

cc->dump_state = mb_cpu_dump_state;
cc->set_pc = mb_cpu_set_pc;
+ cc->get_pc = mb_cpu_get_pc;
cc->gdb_read_register = mb_cpu_gdb_read_register;
cc->gdb_write_register = mb_cpu_gdb_write_register;

diff --git a/target/mips/cpu.c b/target/mips/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/mips/cpu.c
+++ b/target/mips/cpu.c
@@ -XXX,XX +XXX,XX @@ static void mips_cpu_set_pc(CPUState *cs, vaddr value)
mips_env_set_pc(&cpu->env, value);
}

+static vaddr mips_cpu_get_pc(CPUState *cs)
+{
+ MIPSCPU *cpu = MIPS_CPU(cs);
+
+ return cpu->env.active_tc.PC;
+}
+
static bool mips_cpu_has_work(CPUState *cs)
{
MIPSCPU *cpu = MIPS_CPU(cs);
@@ -XXX,XX +XXX,XX @@ static void mips_cpu_class_init(ObjectClass *c, void *data)
cc->has_work = mips_cpu_has_work;
cc->dump_state = mips_cpu_dump_state;
cc->set_pc = mips_cpu_set_pc;
+ cc->get_pc = mips_cpu_get_pc;
cc->gdb_read_register = mips_cpu_gdb_read_register;
cc->gdb_write_register = mips_cpu_gdb_write_register;
#ifndef CONFIG_USER_ONLY
diff --git a/target/nios2/cpu.c b/target/nios2/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/nios2/cpu.c
+++ b/target/nios2/cpu.c
@@ -XXX,XX +XXX,XX @@ static void nios2_cpu_set_pc(CPUState *cs, vaddr value)
env->pc = value;
}

+static vaddr nios2_cpu_get_pc(CPUState *cs)
+{
+ Nios2CPU *cpu = NIOS2_CPU(cs);
+ CPUNios2State *env = &cpu->env;
+
+ return env->pc;
+}
+
static bool nios2_cpu_has_work(CPUState *cs)
{
return cs->interrupt_request & CPU_INTERRUPT_HARD;
@@ -XXX,XX +XXX,XX @@ static void nios2_cpu_class_init(ObjectClass *oc, void *data)
cc->has_work = nios2_cpu_has_work;
cc->dump_state = nios2_cpu_dump_state;
cc->set_pc = nios2_cpu_set_pc;
+ cc->get_pc = nios2_cpu_get_pc;
cc->disas_set_info = nios2_cpu_disas_set_info;
#ifndef CONFIG_USER_ONLY
cc->sysemu_ops = &nios2_sysemu_ops;
diff --git a/target/openrisc/cpu.c b/target/openrisc/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/openrisc/cpu.c
+++ b/target/openrisc/cpu.c
@@ -XXX,XX +XXX,XX @@ static void openrisc_cpu_set_pc(CPUState *cs, vaddr value)
cpu->env.dflag = 0;
}

+static vaddr openrisc_cpu_get_pc(CPUState *cs)
+{
+ OpenRISCCPU *cpu = OPENRISC_CPU(cs);
+
+ return cpu->env.pc;
+}
+
static void openrisc_cpu_synchronize_from_tb(CPUState *cs,
const TranslationBlock *tb)
{
@@ -XXX,XX +XXX,XX @@ static void openrisc_cpu_class_init(ObjectClass *oc, void *data)
cc->has_work = openrisc_cpu_has_work;
cc->dump_state = openrisc_cpu_dump_state;
cc->set_pc = openrisc_cpu_set_pc;
+ cc->get_pc = openrisc_cpu_get_pc;
cc->gdb_read_register = openrisc_cpu_gdb_read_register;
cc->gdb_write_register = openrisc_cpu_gdb_write_register;
#ifndef CONFIG_USER_ONLY
diff --git a/target/ppc/cpu_init.c b/target/ppc/cpu_init.c
index XXXXXXX..XXXXXXX 100644
--- a/target/ppc/cpu_init.c
+++ b/target/ppc/cpu_init.c
@@ -XXX,XX +XXX,XX @@ static void ppc_cpu_set_pc(CPUState *cs, vaddr value)
cpu->env.nip = value;
}

+static vaddr ppc_cpu_get_pc(CPUState *cs)
+{
+ PowerPCCPU *cpu = POWERPC_CPU(cs);
+
+ return cpu->env.nip;
+}
+
static bool ppc_cpu_has_work(CPUState *cs)
{
PowerPCCPU *cpu = POWERPC_CPU(cs);
@@ -XXX,XX +XXX,XX @@ static void ppc_cpu_class_init(ObjectClass *oc, void *data)
cc->has_work = ppc_cpu_has_work;
cc->dump_state = ppc_cpu_dump_state;
cc->set_pc = ppc_cpu_set_pc;
+ cc->get_pc = ppc_cpu_get_pc;
cc->gdb_read_register = ppc_cpu_gdb_read_register;
cc->gdb_write_register = ppc_cpu_gdb_write_register;
#ifndef CONFIG_USER_ONLY
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/riscv/cpu.c
+++ b/target/riscv/cpu.c
@@ -XXX,XX +XXX,XX @@ static void riscv_cpu_set_pc(CPUState *cs, vaddr value)
}
}

+static vaddr riscv_cpu_get_pc(CPUState *cs)
+{
+ RISCVCPU *cpu = RISCV_CPU(cs);
+ CPURISCVState *env = &cpu->env;
+
+ /* Match cpu_get_tb_cpu_state. */
+ if (env->xl == MXL_RV32) {
+ return env->pc & UINT32_MAX;
+ }
+ return env->pc;
+}
+
static void riscv_cpu_synchronize_from_tb(CPUState *cs,
const TranslationBlock *tb)
{
@@ -XXX,XX +XXX,XX @@ static void riscv_cpu_class_init(ObjectClass *c, void *data)
cc->has_work = riscv_cpu_has_work;
cc->dump_state = riscv_cpu_dump_state;
cc->set_pc = riscv_cpu_set_pc;
+ cc->get_pc = riscv_cpu_get_pc;
cc->gdb_read_register = riscv_cpu_gdb_read_register;
cc->gdb_write_register = riscv_cpu_gdb_write_register;
cc->gdb_num_core_regs = 33;
diff --git a/target/rx/cpu.c b/target/rx/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/rx/cpu.c
+++ b/target/rx/cpu.c
@@ -XXX,XX +XXX,XX @@ static void rx_cpu_set_pc(CPUState *cs, vaddr value)
cpu->env.pc = value;
}

+static vaddr rx_cpu_get_pc(CPUState *cs)
+{
+ RXCPU *cpu = RX_CPU(cs);
+
+ return cpu->env.pc;
+}
+
static void rx_cpu_synchronize_from_tb(CPUState *cs,
const TranslationBlock *tb)
{
@@ -XXX,XX +XXX,XX @@ static void rx_cpu_class_init(ObjectClass *klass, void *data)
cc->has_work = rx_cpu_has_work;
cc->dump_state = rx_cpu_dump_state;
cc->set_pc = rx_cpu_set_pc;
+ cc->get_pc = rx_cpu_get_pc;

#ifndef CONFIG_USER_ONLY
cc->sysemu_ops = &rx_sysemu_ops;
diff --git a/target/s390x/cpu.c b/target/s390x/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/s390x/cpu.c
+++ b/target/s390x/cpu.c
@@ -XXX,XX +XXX,XX @@ static void s390_cpu_set_pc(CPUState *cs, vaddr value)
cpu->env.psw.addr = value;
}

+static vaddr s390_cpu_get_pc(CPUState *cs)
+{
+ S390CPU *cpu = S390_CPU(cs);
+
+ return cpu->env.psw.addr;
+}
+
static bool s390_cpu_has_work(CPUState *cs)
{
S390CPU *cpu = S390_CPU(cs);
@@ -XXX,XX +XXX,XX @@ static void s390_cpu_class_init(ObjectClass *oc, void *data)
cc->has_work = s390_cpu_has_work;
cc->dump_state = s390_cpu_dump_state;
cc->set_pc = s390_cpu_set_pc;
+ cc->get_pc = s390_cpu_get_pc;
cc->gdb_read_register = s390_cpu_gdb_read_register;
cc->gdb_write_register = s390_cpu_gdb_write_register;
#ifndef CONFIG_USER_ONLY
diff --git a/target/sh4/cpu.c b/target/sh4/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/sh4/cpu.c
+++ b/target/sh4/cpu.c
@@ -XXX,XX +XXX,XX @@ static void superh_cpu_set_pc(CPUState *cs, vaddr value)
cpu->env.pc = value;
}

+static vaddr superh_cpu_get_pc(CPUState *cs)
+{
+ SuperHCPU *cpu = SUPERH_CPU(cs);
+
+ return cpu->env.pc;
+}
+
static void superh_cpu_synchronize_from_tb(CPUState *cs,
const TranslationBlock *tb)
{
@@ -XXX,XX +XXX,XX @@ static void superh_cpu_class_init(ObjectClass *oc, void *data)
cc->has_work = superh_cpu_has_work;
cc->dump_state = superh_cpu_dump_state;
cc->set_pc = superh_cpu_set_pc;
+ cc->get_pc = superh_cpu_get_pc;
cc->gdb_read_register = superh_cpu_gdb_read_register;
cc->gdb_write_register = superh_cpu_gdb_write_register;
#ifndef CONFIG_USER_ONLY
diff --git a/target/sparc/cpu.c b/target/sparc/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/sparc/cpu.c
+++ b/target/sparc/cpu.c
@@ -XXX,XX +XXX,XX @@ static void sparc_cpu_set_pc(CPUState *cs, vaddr value)
cpu->env.npc = value + 4;
}

+static vaddr sparc_cpu_get_pc(CPUState *cs)
+{
+ SPARCCPU *cpu = SPARC_CPU(cs);
+
+ return cpu->env.pc;
+}
+
static void sparc_cpu_synchronize_from_tb(CPUState *cs,
const TranslationBlock *tb)
{
@@ -XXX,XX +XXX,XX @@ static void sparc_cpu_class_init(ObjectClass *oc, void *data)
cc->memory_rw_debug = sparc_cpu_memory_rw_debug;
#endif
cc->set_pc = sparc_cpu_set_pc;
+ cc->get_pc = sparc_cpu_get_pc;
cc->gdb_read_register = sparc_cpu_gdb_read_register;
cc->gdb_write_register = sparc_cpu_gdb_write_register;
#ifndef CONFIG_USER_ONLY
diff --git a/target/tricore/cpu.c b/target/tricore/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/tricore/cpu.c
+++ b/target/tricore/cpu.c
@@ -XXX,XX +XXX,XX @@ static void tricore_cpu_set_pc(CPUState *cs, vaddr value)
env->PC = value & ~(target_ulong)1;
}

+static vaddr tricore_cpu_get_pc(CPUState *cs)
+{
+ TriCoreCPU *cpu = TRICORE_CPU(cs);
+ CPUTriCoreState *env = &cpu->env;
+
+ return env->PC;
+}
+
static void tricore_cpu_synchronize_from_tb(CPUState *cs,
const TranslationBlock *tb)
{
@@ -XXX,XX +XXX,XX @@ static void tricore_cpu_class_init(ObjectClass *c, void *data)

cc->dump_state = tricore_cpu_dump_state;
cc->set_pc = tricore_cpu_set_pc;
+ cc->get_pc = tricore_cpu_get_pc;
cc->sysemu_ops = &tricore_sysemu_ops;
cc->tcg_ops = &tricore_tcg_ops;
}
diff --git a/target/xtensa/cpu.c b/target/xtensa/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/xtensa/cpu.c
+++ b/target/xtensa/cpu.c
@@ -XXX,XX +XXX,XX @@ static void xtensa_cpu_set_pc(CPUState *cs, vaddr value)
cpu->env.pc = value;
}

+static vaddr xtensa_cpu_get_pc(CPUState *cs)
+{
+ XtensaCPU *cpu = XTENSA_CPU(cs);
+
+ return cpu->env.pc;
+}
+
static bool xtensa_cpu_has_work(CPUState *cs)
{
#ifndef CONFIG_USER_ONLY
@@ -XXX,XX +XXX,XX @@ static void xtensa_cpu_class_init(ObjectClass *oc, void *data)
cc->has_work = xtensa_cpu_has_work;
cc->dump_state = xtensa_cpu_dump_state;
cc->set_pc = xtensa_cpu_set_pc;
+ cc->get_pc = xtensa_cpu_get_pc;
cc->gdb_read_register = xtensa_cpu_gdb_read_register;
cc->gdb_write_register = xtensa_cpu_gdb_write_register;
cc->gdb_stop_before_watchpoint = true;
--
2.34.1

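As a sketch of how a generic caller might use the hook installed above — cpu_get_pc is a hypothetical wrapper name, not something this patch adds:

    /* Minimal sketch, assuming every target installs cc->get_pc as above. */
    static inline vaddr cpu_get_pc(CPUState *cs)
    {
        CPUClass *cc = CPU_GET_CLASS(cs);

        assert(cc->get_pc != NULL);
        return cc->get_pc(cs);
    }
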
The availability of tb->pc will shortly be conditional.
Introduce accessor functions to minimize ifdefs.

Pass around a known pc to places like tcg_gen_code,
where the caller must already have the value.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
accel/tcg/internal.h | 6 ++++
include/exec/exec-all.h | 6 ++++
include/tcg/tcg.h | 2 +-
accel/tcg/cpu-exec.c | 46 ++++++++++++++-----------
accel/tcg/translate-all.c | 37 +++++++++++---------
target/arm/cpu.c | 4 +--
target/avr/cpu.c | 2 +-
target/hexagon/cpu.c | 2 +-
target/hppa/cpu.c | 4 +--
target/i386/tcg/tcg-cpu.c | 2 +-
target/loongarch/cpu.c | 2 +-
target/microblaze/cpu.c | 2 +-
target/mips/tcg/exception.c | 2 +-
target/mips/tcg/sysemu/special_helper.c | 2 +-
target/openrisc/cpu.c | 2 +-
target/riscv/cpu.c | 4 +--
target/rx/cpu.c | 2 +-
target/sh4/cpu.c | 4 +--
target/sparc/cpu.c | 2 +-
target/tricore/cpu.c | 2 +-
tcg/tcg.c | 8 ++---
21 files changed, 82 insertions(+), 61 deletions(-)

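Before the diff itself, a sketch of the accessor idiom this prepares: once every reader goes through tb_pc(), a configuration that has no tb->pc field can turn the read into a build-time error instead of requiring an audit of every use site. This is exactly what the following patch in the series does:

    /* Sketch only; the real definition appears in the diff below and is
     * extended by the next patch. */
    static inline target_ulong tb_pc(const TranslationBlock *tb)
    {
    #if TARGET_TB_PCREL
        qemu_build_not_reached();   /* compile-time poison: no pc stored */
    #else
        return tb->pc;
    #endif
    }
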
diff --git a/accel/tcg/internal.h b/accel/tcg/internal.h
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/internal.h
+++ b/accel/tcg/internal.h
@@ -XXX,XX +XXX,XX @@ G_NORETURN void cpu_io_recompile(CPUState *cpu, uintptr_t retaddr);
void page_init(void);
void tb_htable_init(void);

+/* Return the current PC from CPU, which may be cached in TB. */
+static inline target_ulong log_pc(CPUState *cpu, const TranslationBlock *tb)
+{
+ return tb_pc(tb);
+}
+
#endif /* ACCEL_TCG_INTERNAL_H */
diff --git a/include/exec/exec-all.h b/include/exec/exec-all.h
index XXXXXXX..XXXXXXX 100644
--- a/include/exec/exec-all.h
+++ b/include/exec/exec-all.h
@@ -XXX,XX +XXX,XX @@ struct TranslationBlock {
uintptr_t jmp_dest[2];
};

+/* Hide the read to avoid ifdefs for TARGET_TB_PCREL. */
+static inline target_ulong tb_pc(const TranslationBlock *tb)
+{
+ return tb->pc;
+}
+
/* Hide the qatomic_read to make code a little easier on the eyes */
static inline uint32_t tb_cflags(const TranslationBlock *tb)
{
diff --git a/include/tcg/tcg.h b/include/tcg/tcg.h
index XXXXXXX..XXXXXXX 100644
--- a/include/tcg/tcg.h
+++ b/include/tcg/tcg.h
@@ -XXX,XX +XXX,XX @@ void tcg_register_thread(void);
void tcg_prologue_init(TCGContext *s);
void tcg_func_start(TCGContext *s);

-int tcg_gen_code(TCGContext *s, TranslationBlock *tb);
+int tcg_gen_code(TCGContext *s, TranslationBlock *tb, target_ulong pc_start);

void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size);

diff --git a/accel/tcg/cpu-exec.c b/accel/tcg/cpu-exec.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cpu-exec.c
+++ b/accel/tcg/cpu-exec.c
@@ -XXX,XX +XXX,XX @@ static bool tb_lookup_cmp(const void *p, const void *d)
const TranslationBlock *tb = p;
const struct tb_desc *desc = d;

- if (tb->pc == desc->pc &&
+ if (tb_pc(tb) == desc->pc &&
tb->page_addr[0] == desc->page_addr0 &&
tb->cs_base == desc->cs_base &&
tb->flags == desc->flags &&
@@ -XXX,XX +XXX,XX @@ static inline TranslationBlock *tb_lookup(CPUState *cpu, target_ulong pc,
return tb;
}

-static inline void log_cpu_exec(target_ulong pc, CPUState *cpu,
- const TranslationBlock *tb)
+static void log_cpu_exec(target_ulong pc, CPUState *cpu,
+ const TranslationBlock *tb)
{
- if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_CPU | CPU_LOG_EXEC))
- && qemu_log_in_addr_range(pc)) {
-
+ if (qemu_log_in_addr_range(pc)) {
qemu_log_mask(CPU_LOG_EXEC,
"Trace %d: %p [" TARGET_FMT_lx
"/" TARGET_FMT_lx "/%08x/%08x] %s\n",
@@ -XXX,XX +XXX,XX @@ const void *HELPER(lookup_tb_ptr)(CPUArchState *env)
return tcg_code_gen_epilogue;
}

- log_cpu_exec(pc, cpu, tb);
+ if (qemu_loglevel_mask(CPU_LOG_TB_CPU | CPU_LOG_EXEC)) {
+ log_cpu_exec(pc, cpu, tb);
+ }

return tb->tc.ptr;
}
@@ -XXX,XX +XXX,XX @@ cpu_tb_exec(CPUState *cpu, TranslationBlock *itb, int *tb_exit)
TranslationBlock *last_tb;
const void *tb_ptr = itb->tc.ptr;

- log_cpu_exec(itb->pc, cpu, itb);
+ if (qemu_loglevel_mask(CPU_LOG_TB_CPU | CPU_LOG_EXEC)) {
+ log_cpu_exec(log_pc(cpu, itb), cpu, itb);
+ }

qemu_thread_jit_execute();
ret = tcg_qemu_tb_exec(env, tb_ptr);
@@ -XXX,XX +XXX,XX @@ cpu_tb_exec(CPUState *cpu, TranslationBlock *itb, int *tb_exit)
* of the start of the TB.
*/
CPUClass *cc = CPU_GET_CLASS(cpu);
- qemu_log_mask_and_addr(CPU_LOG_EXEC, last_tb->pc,
- "Stopped execution of TB chain before %p ["
- TARGET_FMT_lx "] %s\n",
- last_tb->tc.ptr, last_tb->pc,
- lookup_symbol(last_tb->pc));
+
if (cc->tcg_ops->synchronize_from_tb) {
cc->tcg_ops->synchronize_from_tb(cpu, last_tb);
} else {
assert(cc->set_pc);
- cc->set_pc(cpu, last_tb->pc);
+ cc->set_pc(cpu, tb_pc(last_tb));
+ }
+ if (qemu_loglevel_mask(CPU_LOG_EXEC)) {
+ target_ulong pc = log_pc(cpu, last_tb);
+ if (qemu_log_in_addr_range(pc)) {
+ qemu_log("Stopped execution of TB chain before %p ["
+ TARGET_FMT_lx "] %s\n",
+ last_tb->tc.ptr, pc, lookup_symbol(pc));
+ }
}
}

@@ -XXX,XX +XXX,XX @@ static inline void tb_add_jump(TranslationBlock *tb, int n,

qemu_spin_unlock(&tb_next->jmp_lock);

- qemu_log_mask_and_addr(CPU_LOG_EXEC, tb->pc,
- "Linking TBs %p [" TARGET_FMT_lx
- "] index %d -> %p [" TARGET_FMT_lx "]\n",
- tb->tc.ptr, tb->pc, n,
- tb_next->tc.ptr, tb_next->pc);
+ qemu_log_mask(CPU_LOG_EXEC, "Linking TBs %p index %d -> %p\n",
+ tb->tc.ptr, n, tb_next->tc.ptr);
return;

out_unlock_next:
@@ -XXX,XX +XXX,XX @@ static inline bool cpu_handle_interrupt(CPUState *cpu,
}

static inline void cpu_loop_exec_tb(CPUState *cpu, TranslationBlock *tb,
+ target_ulong pc,
TranslationBlock **last_tb, int *tb_exit)
{
int32_t insns_left;

- trace_exec_tb(tb, tb->pc);
+ trace_exec_tb(tb, pc);
tb = cpu_tb_exec(cpu, tb, tb_exit);
if (*tb_exit != TB_EXIT_REQUESTED) {
*last_tb = tb;
@@ -XXX,XX +XXX,XX @@ int cpu_exec(CPUState *cpu)
tb_add_jump(last_tb, tb_exit, tb);
}

- cpu_loop_exec_tb(cpu, tb, &last_tb, &tb_exit);
+ cpu_loop_exec_tb(cpu, tb, pc, &last_tb, &tb_exit);

/* Try to align the host and virtual clocks
if the guest is in advance */
diff --git a/accel/tcg/translate-all.c b/accel/tcg/translate-all.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/translate-all.c
+++ b/accel/tcg/translate-all.c
@@ -XXX,XX +XXX,XX @@ static int encode_search(TranslationBlock *tb, uint8_t *block)

for (j = 0; j < TARGET_INSN_START_WORDS; ++j) {
if (i == 0) {
- prev = (j == 0 ? tb->pc : 0);
+ prev = (j == 0 ? tb_pc(tb) : 0);
} else {
prev = tcg_ctx->gen_insn_data[i - 1][j];
}
@@ -XXX,XX +XXX,XX @@ static int encode_search(TranslationBlock *tb, uint8_t *block)
static int cpu_restore_state_from_tb(CPUState *cpu, TranslationBlock *tb,
uintptr_t searched_pc, bool reset_icount)
{
- target_ulong data[TARGET_INSN_START_WORDS] = { tb->pc };
+ target_ulong data[TARGET_INSN_START_WORDS] = { tb_pc(tb) };
uintptr_t host_pc = (uintptr_t)tb->tc.ptr;
CPUArchState *env = cpu->env_ptr;
const uint8_t *p = tb->tc.ptr + tb->tc.size;
@@ -XXX,XX +XXX,XX @@ static bool tb_cmp(const void *ap, const void *bp)
const TranslationBlock *a = ap;
const TranslationBlock *b = bp;

- return a->pc == b->pc &&
+ return tb_pc(a) == tb_pc(b) &&
a->cs_base == b->cs_base &&
a->flags == b->flags &&
(tb_cflags(a) & ~CF_INVALID) == (tb_cflags(b) & ~CF_INVALID) &&
@@ -XXX,XX +XXX,XX @@ static void do_tb_invalidate_check(void *p, uint32_t hash, void *userp)
TranslationBlock *tb = p;
target_ulong addr = *(target_ulong *)userp;

- if (!(addr + TARGET_PAGE_SIZE <= tb->pc || addr >= tb->pc + tb->size)) {
+ if (!(addr + TARGET_PAGE_SIZE <= tb_pc(tb) ||
+ addr >= tb_pc(tb) + tb->size)) {
printf("ERROR invalidate: address=" TARGET_FMT_lx
- " PC=%08lx size=%04x\n", addr, (long)tb->pc, tb->size);
+ " PC=%08lx size=%04x\n", addr, (long)tb_pc(tb), tb->size);
}
}

@@ -XXX,XX +XXX,XX @@ static void do_tb_page_check(void *p, uint32_t hash, void *userp)
TranslationBlock *tb = p;
int flags1, flags2;

- flags1 = page_get_flags(tb->pc);
- flags2 = page_get_flags(tb->pc + tb->size - 1);
+ flags1 = page_get_flags(tb_pc(tb));
+ flags2 = page_get_flags(tb_pc(tb) + tb->size - 1);
if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
- (long)tb->pc, tb->size, flags1, flags2);
+ (long)tb_pc(tb), tb->size, flags1, flags2);
}
}

@@ -XXX,XX +XXX,XX @@ static void do_tb_phys_invalidate(TranslationBlock *tb, bool rm_from_page_list)

/* remove the TB from the hash list */
phys_pc = tb->page_addr[0];
- h = tb_hash_func(phys_pc, tb->pc, tb->flags, orig_cflags,
+ h = tb_hash_func(phys_pc, tb_pc(tb), tb->flags, orig_cflags,
tb->trace_vcpu_dstate);
if (!qht_remove(&tb_ctx.htable, tb, h)) {
return;
@@ -XXX,XX +XXX,XX @@ tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
}

/* add in the hash table */
- h = tb_hash_func(phys_pc, tb->pc, tb->flags, tb->cflags,
+ h = tb_hash_func(phys_pc, tb_pc(tb), tb->flags, tb->cflags,
tb->trace_vcpu_dstate);
qht_insert(&tb_ctx.htable, tb, h, &existing_tb);

@@ -XXX,XX +XXX,XX @@ TranslationBlock *tb_gen_code(CPUState *cpu,
tcg_ctx->cpu = NULL;
max_insns = tb->icount;

- trace_translate_block(tb, tb->pc, tb->tc.ptr);
+ trace_translate_block(tb, pc, tb->tc.ptr);

/* generate machine code */
tb->jmp_reset_offset[0] = TB_JMP_RESET_OFFSET_INVALID;
@@ -XXX,XX +XXX,XX @@ TranslationBlock *tb_gen_code(CPUState *cpu,
ti = profile_getclock();
#endif

- gen_code_size = tcg_gen_code(tcg_ctx, tb);
+ gen_code_size = tcg_gen_code(tcg_ctx, tb, pc);
if (unlikely(gen_code_size < 0)) {
error_return:
switch (gen_code_size) {
@@ -XXX,XX +XXX,XX @@ TranslationBlock *tb_gen_code(CPUState *cpu,

#ifdef DEBUG_DISAS
if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM) &&
- qemu_log_in_addr_range(tb->pc)) {
+ qemu_log_in_addr_range(pc)) {
FILE *logfile = qemu_log_trylock();
if (logfile) {
int code_size, data_size;
@@ -XXX,XX +XXX,XX @@ void cpu_io_recompile(CPUState *cpu, uintptr_t retaddr)
*/
cpu->cflags_next_tb = curr_cflags(cpu) | CF_MEMI_ONLY | CF_LAST_IO | n;

- qemu_log_mask_and_addr(CPU_LOG_EXEC, tb->pc,
- "cpu_io_recompile: rewound execution of TB to "
- TARGET_FMT_lx "\n", tb->pc);
+ if (qemu_loglevel_mask(CPU_LOG_EXEC)) {
+ target_ulong pc = log_pc(cpu, tb);
+ if (qemu_log_in_addr_range(pc)) {
+ qemu_log("cpu_io_recompile: rewound execution of TB to "
+ TARGET_FMT_lx "\n", pc);
+ }
+ }

cpu_loop_exit_noexc(cpu);
}
diff --git a/target/arm/cpu.c b/target/arm/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/arm/cpu.c
+++ b/target/arm/cpu.c
@@ -XXX,XX +XXX,XX @@ void arm_cpu_synchronize_from_tb(CPUState *cs,
* never possible for an AArch64 TB to chain to an AArch32 TB.
*/
if (is_a64(env)) {
- env->pc = tb->pc;
+ env->pc = tb_pc(tb);
} else {
- env->regs[15] = tb->pc;
+ env->regs[15] = tb_pc(tb);
}
}
#endif /* CONFIG_TCG */
diff --git a/target/avr/cpu.c b/target/avr/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/avr/cpu.c
+++ b/target/avr/cpu.c
@@ -XXX,XX +XXX,XX @@ static void avr_cpu_synchronize_from_tb(CPUState *cs,
AVRCPU *cpu = AVR_CPU(cs);
CPUAVRState *env = &cpu->env;

- env->pc_w = tb->pc / 2; /* internally PC points to words */
+ env->pc_w = tb_pc(tb) / 2; /* internally PC points to words */
}

static void avr_cpu_reset(DeviceState *ds)
diff --git a/target/hexagon/cpu.c b/target/hexagon/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/hexagon/cpu.c
+++ b/target/hexagon/cpu.c
@@ -XXX,XX +XXX,XX @@ static void hexagon_cpu_synchronize_from_tb(CPUState *cs,
{
HexagonCPU *cpu = HEXAGON_CPU(cs);
CPUHexagonState *env = &cpu->env;
- env->gpr[HEX_REG_PC] = tb->pc;
+ env->gpr[HEX_REG_PC] = tb_pc(tb);
}

static bool hexagon_cpu_has_work(CPUState *cs)
diff --git a/target/hppa/cpu.c b/target/hppa/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/hppa/cpu.c
+++ b/target/hppa/cpu.c
@@ -XXX,XX +XXX,XX @@ static void hppa_cpu_synchronize_from_tb(CPUState *cs,
HPPACPU *cpu = HPPA_CPU(cs);

#ifdef CONFIG_USER_ONLY
- cpu->env.iaoq_f = tb->pc;
+ cpu->env.iaoq_f = tb_pc(tb);
cpu->env.iaoq_b = tb->cs_base;
#else
/* Recover the IAOQ values from the GVA + PRIV. */
@@ -XXX,XX +XXX,XX @@ static void hppa_cpu_synchronize_from_tb(CPUState *cs,
int32_t diff = cs_base;

cpu->env.iasq_f = iasq_f;
- cpu->env.iaoq_f = (tb->pc & ~iasq_f) + priv;
+ cpu->env.iaoq_f = (tb_pc(tb) & ~iasq_f) + priv;
if (diff) {
cpu->env.iaoq_b = cpu->env.iaoq_f + diff;
}
diff --git a/target/i386/tcg/tcg-cpu.c b/target/i386/tcg/tcg-cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/i386/tcg/tcg-cpu.c
+++ b/target/i386/tcg/tcg-cpu.c
@@ -XXX,XX +XXX,XX @@ static void x86_cpu_synchronize_from_tb(CPUState *cs,
{
X86CPU *cpu = X86_CPU(cs);

- cpu->env.eip = tb->pc - tb->cs_base;
+ cpu->env.eip = tb_pc(tb) - tb->cs_base;
}

#ifndef CONFIG_USER_ONLY
diff --git a/target/loongarch/cpu.c b/target/loongarch/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/loongarch/cpu.c
+++ b/target/loongarch/cpu.c
@@ -XXX,XX +XXX,XX @@ static void loongarch_cpu_synchronize_from_tb(CPUState *cs,
LoongArchCPU *cpu = LOONGARCH_CPU(cs);
CPULoongArchState *env = &cpu->env;

- env->pc = tb->pc;
+ env->pc = tb_pc(tb);
}
#endif /* CONFIG_TCG */

diff --git a/target/microblaze/cpu.c b/target/microblaze/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/microblaze/cpu.c
+++ b/target/microblaze/cpu.c
@@ -XXX,XX +XXX,XX @@ static void mb_cpu_synchronize_from_tb(CPUState *cs,
{
MicroBlazeCPU *cpu = MICROBLAZE_CPU(cs);

- cpu->env.pc = tb->pc;
+ cpu->env.pc = tb_pc(tb);
cpu->env.iflags = tb->flags & IFLAGS_TB_MASK;
}

diff --git a/target/mips/tcg/exception.c b/target/mips/tcg/exception.c
index XXXXXXX..XXXXXXX 100644
--- a/target/mips/tcg/exception.c
+++ b/target/mips/tcg/exception.c
@@ -XXX,XX +XXX,XX @@ void mips_cpu_synchronize_from_tb(CPUState *cs, const TranslationBlock *tb)
MIPSCPU *cpu = MIPS_CPU(cs);
CPUMIPSState *env = &cpu->env;

- env->active_tc.PC = tb->pc;
+ env->active_tc.PC = tb_pc(tb);
env->hflags &= ~MIPS_HFLAG_BMASK;
env->hflags |= tb->flags & MIPS_HFLAG_BMASK;
}
diff --git a/target/mips/tcg/sysemu/special_helper.c b/target/mips/tcg/sysemu/special_helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/mips/tcg/sysemu/special_helper.c
+++ b/target/mips/tcg/sysemu/special_helper.c
@@ -XXX,XX +XXX,XX @@ bool mips_io_recompile_replay_branch(CPUState *cs, const TranslationBlock *tb)
CPUMIPSState *env = &cpu->env;

if ((env->hflags & MIPS_HFLAG_BMASK) != 0
- && env->active_tc.PC != tb->pc) {
+ && env->active_tc.PC != tb_pc(tb)) {
env->active_tc.PC -= (env->hflags & MIPS_HFLAG_B16 ? 2 : 4);
env->hflags &= ~MIPS_HFLAG_BMASK;
return true;
diff --git a/target/openrisc/cpu.c b/target/openrisc/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/openrisc/cpu.c
+++ b/target/openrisc/cpu.c
@@ -XXX,XX +XXX,XX @@ static void openrisc_cpu_synchronize_from_tb(CPUState *cs,
{
OpenRISCCPU *cpu = OPENRISC_CPU(cs);

- cpu->env.pc = tb->pc;
+ cpu->env.pc = tb_pc(tb);
}


diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/riscv/cpu.c
+++ b/target/riscv/cpu.c
@@ -XXX,XX +XXX,XX @@ static void riscv_cpu_synchronize_from_tb(CPUState *cs,
RISCVMXL xl = FIELD_EX32(tb->flags, TB_FLAGS, XL);

if (xl == MXL_RV32) {
- env->pc = (int32_t)tb->pc;
+ env->pc = (int32_t)tb_pc(tb);
} else {
- env->pc = tb->pc;
+ env->pc = tb_pc(tb);
}
}

diff --git a/target/rx/cpu.c b/target/rx/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/rx/cpu.c
+++ b/target/rx/cpu.c
@@ -XXX,XX +XXX,XX @@ static void rx_cpu_synchronize_from_tb(CPUState *cs,
{
RXCPU *cpu = RX_CPU(cs);

- cpu->env.pc = tb->pc;
+ cpu->env.pc = tb_pc(tb);
}

static bool rx_cpu_has_work(CPUState *cs)
diff --git a/target/sh4/cpu.c b/target/sh4/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/sh4/cpu.c
+++ b/target/sh4/cpu.c
@@ -XXX,XX +XXX,XX @@ static void superh_cpu_synchronize_from_tb(CPUState *cs,
{
SuperHCPU *cpu = SUPERH_CPU(cs);

- cpu->env.pc = tb->pc;
+ cpu->env.pc = tb_pc(tb);
cpu->env.flags = tb->flags & TB_FLAG_ENVFLAGS_MASK;
}

@@ -XXX,XX +XXX,XX @@ static bool superh_io_recompile_replay_branch(CPUState *cs,
CPUSH4State *env = &cpu->env;

if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
- && env->pc != tb->pc) {
+ && env->pc != tb_pc(tb)) {
env->pc -= 2;
env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
return true;
diff --git a/target/sparc/cpu.c b/target/sparc/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/sparc/cpu.c
+++ b/target/sparc/cpu.c
@@ -XXX,XX +XXX,XX @@ static void sparc_cpu_synchronize_from_tb(CPUState *cs,
{
SPARCCPU *cpu = SPARC_CPU(cs);

- cpu->env.pc = tb->pc;
+ cpu->env.pc = tb_pc(tb);
cpu->env.npc = tb->cs_base;
}

diff --git a/target/tricore/cpu.c b/target/tricore/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/tricore/cpu.c
+++ b/target/tricore/cpu.c
@@ -XXX,XX +XXX,XX @@ static void tricore_cpu_synchronize_from_tb(CPUState *cs,
TriCoreCPU *cpu = TRICORE_CPU(cs);
CPUTriCoreState *env = &cpu->env;

- env->PC = tb->pc;
+ env->PC = tb_pc(tb);
}

static void tricore_cpu_reset(DeviceState *dev)
diff --git a/tcg/tcg.c b/tcg/tcg.c
index XXXXXXX..XXXXXXX 100644
--- a/tcg/tcg.c
+++ b/tcg/tcg.c
@@ -XXX,XX +XXX,XX @@ int64_t tcg_cpu_exec_time(void)
#endif


-int tcg_gen_code(TCGContext *s, TranslationBlock *tb)
+int tcg_gen_code(TCGContext *s, TranslationBlock *tb, target_ulong pc_start)
{
#ifdef CONFIG_PROFILER
TCGProfile *prof = &s->prof;
@@ -XXX,XX +XXX,XX @@ int tcg_gen_code(TCGContext *s, TranslationBlock *tb)

#ifdef DEBUG_DISAS
if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP)
- && qemu_log_in_addr_range(tb->pc))) {
+ && qemu_log_in_addr_range(pc_start))) {
FILE *logfile = qemu_log_trylock();
if (logfile) {
fprintf(logfile, "OP:\n");
@@ -XXX,XX +XXX,XX @@ int tcg_gen_code(TCGContext *s, TranslationBlock *tb)
if (s->nb_indirects > 0) {
#ifdef DEBUG_DISAS
if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND)
- && qemu_log_in_addr_range(tb->pc))) {
+ && qemu_log_in_addr_range(pc_start))) {
FILE *logfile = qemu_log_trylock();
if (logfile) {
fprintf(logfile, "OP before indirect lowering:\n");
@@ -XXX,XX +XXX,XX @@ int tcg_gen_code(TCGContext *s, TranslationBlock *tb)

#ifdef DEBUG_DISAS
if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT)
- && qemu_log_in_addr_range(tb->pc))) {
+ && qemu_log_in_addr_range(pc_start))) {
FILE *logfile = qemu_log_trylock();
if (logfile) {
fprintf(logfile, "OP after optimization and liveness analysis:\n");
--
2.34.1

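One pattern worth noting from the patch above: qemu_log_mask_and_addr() needed the guest pc up front, so every call site paid for the pc read even with logging disabled. The rewritten sites test the log mask first and compute the pc only when needed. A reduced sketch of the shape, with the format string elided:

    if (qemu_loglevel_mask(CPU_LOG_EXEC)) {
        target_ulong pc = log_pc(cpu, tb);   /* possibly expensive */
        if (qemu_log_in_addr_range(pc)) {
            qemu_log("...: " TARGET_FMT_lx "\n", pc);
        }
    }
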
Prepare for targets to be able to produce TBs that can
run in more than one virtual context.

Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
accel/tcg/internal.h | 4 +++
accel/tcg/tb-jmp-cache.h | 41 +++++++++++++++++++++++++
include/exec/cpu-defs.h | 3 ++
include/exec/exec-all.h | 32 ++++++++++++++++++--
accel/tcg/cpu-exec.c | 16 ++++++----
accel/tcg/translate-all.c | 64 ++++++++++++++++++++++++++-------------
6 files changed, 131 insertions(+), 29 deletions(-)

diff --git a/accel/tcg/internal.h b/accel/tcg/internal.h
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/internal.h
+++ b/accel/tcg/internal.h
@@ -XXX,XX +XXX,XX @@ void tb_htable_init(void);
/* Return the current PC from CPU, which may be cached in TB. */
static inline target_ulong log_pc(CPUState *cpu, const TranslationBlock *tb)
{
+#if TARGET_TB_PCREL
+ return cpu->cc->get_pc(cpu);
+#else
return tb_pc(tb);
+#endif
}

#endif /* ACCEL_TCG_INTERNAL_H */
diff --git a/accel/tcg/tb-jmp-cache.h b/accel/tcg/tb-jmp-cache.h
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/tb-jmp-cache.h
+++ b/accel/tcg/tb-jmp-cache.h
@@ -XXX,XX +XXX,XX @@

/*
* Accessed in parallel; all accesses to 'tb' must be atomic.
+ * For TARGET_TB_PCREL, accesses to 'pc' must be protected by
+ * a load_acquire/store_release to 'tb'.
*/
struct CPUJumpCache {
struct {
TranslationBlock *tb;
+#if TARGET_TB_PCREL
+ target_ulong pc;
+#endif
} array[TB_JMP_CACHE_SIZE];
};

+static inline TranslationBlock *
+tb_jmp_cache_get_tb(CPUJumpCache *jc, uint32_t hash)
+{
+#if TARGET_TB_PCREL
+ /* Use acquire to ensure current load of pc from jc. */
+ return qatomic_load_acquire(&jc->array[hash].tb);
+#else
+ /* Use rcu_read to ensure current load of pc from *tb. */
+ return qatomic_rcu_read(&jc->array[hash].tb);
+#endif
+}
+
+static inline target_ulong
+tb_jmp_cache_get_pc(CPUJumpCache *jc, uint32_t hash, TranslationBlock *tb)
+{
+#if TARGET_TB_PCREL
+ return jc->array[hash].pc;
+#else
+ return tb_pc(tb);
+#endif
+}
+
+static inline void
+tb_jmp_cache_set(CPUJumpCache *jc, uint32_t hash,
+ TranslationBlock *tb, target_ulong pc)
+{
+#if TARGET_TB_PCREL
+ jc->array[hash].pc = pc;
+ /* Use store_release on tb to ensure pc is written first. */
+ qatomic_store_release(&jc->array[hash].tb, tb);
+#else
+ /* Use the pc value already stored in tb->pc. */
+ qatomic_set(&jc->array[hash].tb, tb);
+#endif
+}
+
#endif /* ACCEL_TCG_TB_JMP_CACHE_H */
diff --git a/include/exec/cpu-defs.h b/include/exec/cpu-defs.h
index XXXXXXX..XXXXXXX 100644
--- a/include/exec/cpu-defs.h
+++ b/include/exec/cpu-defs.h
@@ -XXX,XX +XXX,XX @@
# error TARGET_PAGE_BITS must be defined in cpu-param.h
# endif
#endif
+#ifndef TARGET_TB_PCREL
+# define TARGET_TB_PCREL 0
+#endif

#define TARGET_LONG_SIZE (TARGET_LONG_BITS / 8)

diff --git a/include/exec/exec-all.h b/include/exec/exec-all.h
index XXXXXXX..XXXXXXX 100644
--- a/include/exec/exec-all.h
+++ b/include/exec/exec-all.h
@@ -XXX,XX +XXX,XX @@ struct tb_tc {
};

struct TranslationBlock {
- target_ulong pc; /* simulated PC corresponding to this block (EIP + CS base) */
- target_ulong cs_base; /* CS base for this block */
+#if !TARGET_TB_PCREL
+ /*
+ * Guest PC corresponding to this block. This must be the true
+ * virtual address. Therefore e.g. x86 stores EIP + CS_BASE, and
+ * targets like Arm, MIPS, HP-PA, which reuse low bits for ISA or
+ * privilege, must store those bits elsewhere.
+ *
+ * If TARGET_TB_PCREL, the opcodes for the TranslationBlock are
+ * written such that the TB is associated only with the physical
+ * page and may be run in any virtual address context. In this case,
+ * PC must always be taken from ENV in a target-specific manner.
+ * Unwind information is taken as offsets from the page, to be
+ * deposited into the "current" PC.
+ */
+ target_ulong pc;
+#endif
+
+ /*
+ * Target-specific data associated with the TranslationBlock, e.g.:
+ * x86: the original user, the Code Segment virtual base,
+ * arm: an extension of tb->flags,
+ * s390x: instruction data for EXECUTE,
+ * sparc: the next pc of the instruction queue (for delay slots).
+ */
+ target_ulong cs_base;
+
uint32_t flags; /* flags defining in which context the code was generated */
uint32_t cflags; /* compile flags */

@@ -XXX,XX +XXX,XX @@ struct TranslationBlock {
/* Hide the read to avoid ifdefs for TARGET_TB_PCREL. */
static inline target_ulong tb_pc(const TranslationBlock *tb)
{
+#if TARGET_TB_PCREL
+ qemu_build_not_reached();
+#else
return tb->pc;
+#endif
}

/* Hide the qatomic_read to make code a little easier on the eyes */
diff --git a/accel/tcg/cpu-exec.c b/accel/tcg/cpu-exec.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/cpu-exec.c
+++ b/accel/tcg/cpu-exec.c
@@ -XXX,XX +XXX,XX @@ static bool tb_lookup_cmp(const void *p, const void *d)
const TranslationBlock *tb = p;
const struct tb_desc *desc = d;

- if (tb_pc(tb) == desc->pc &&
+ if ((TARGET_TB_PCREL || tb_pc(tb) == desc->pc) &&
tb->page_addr[0] == desc->page_addr0 &&
tb->cs_base == desc->cs_base &&
tb->flags == desc->flags &&
@@ -XXX,XX +XXX,XX @@ static TranslationBlock *tb_htable_lookup(CPUState *cpu, target_ulong pc,
return NULL;
}
desc.page_addr0 = phys_pc;
- h = tb_hash_func(phys_pc, pc, flags, cflags, *cpu->trace_dstate);
+ h = tb_hash_func(phys_pc, (TARGET_TB_PCREL ? 0 : pc),
+ flags, cflags, *cpu->trace_dstate);
return qht_lookup_custom(&tb_ctx.htable, &desc, h, tb_lookup_cmp);
}

@@ -XXX,XX +XXX,XX @@ static inline TranslationBlock *tb_lookup(CPUState *cpu, target_ulong pc,
uint32_t flags, uint32_t cflags)
{
TranslationBlock *tb;
+ CPUJumpCache *jc;
uint32_t hash;

/* we should never be trying to look up an INVALID tb */
tcg_debug_assert(!(cflags & CF_INVALID));

hash = tb_jmp_cache_hash_func(pc);
- tb = qatomic_rcu_read(&cpu->tb_jmp_cache->array[hash].tb);
+ jc = cpu->tb_jmp_cache;
+ tb = tb_jmp_cache_get_tb(jc, hash);

if (likely(tb &&
- tb->pc == pc &&
+ tb_jmp_cache_get_pc(jc, hash, tb) == pc &&
tb->cs_base == cs_base &&
tb->flags == flags &&
tb->trace_vcpu_dstate == *cpu->trace_dstate &&
@@ -XXX,XX +XXX,XX @@ static inline TranslationBlock *tb_lookup(CPUState *cpu, target_ulong pc,
if (tb == NULL) {
return NULL;
}
- qatomic_set(&cpu->tb_jmp_cache->array[hash].tb, tb);
+ tb_jmp_cache_set(jc, hash, tb, pc);
return tb;
}

@@ -XXX,XX +XXX,XX @@ cpu_tb_exec(CPUState *cpu, TranslationBlock *itb, int *tb_exit)
if (cc->tcg_ops->synchronize_from_tb) {
cc->tcg_ops->synchronize_from_tb(cpu, last_tb);
} else {
+ assert(!TARGET_TB_PCREL);
assert(cc->set_pc);
cc->set_pc(cpu, tb_pc(last_tb));
}
@@ -XXX,XX +XXX,XX @@ int cpu_exec(CPUState *cpu)
* for the fast lookup
*/
h = tb_jmp_cache_hash_func(pc);
- qatomic_set(&cpu->tb_jmp_cache->array[h].tb, tb);
+ tb_jmp_cache_set(cpu->tb_jmp_cache, h, tb, pc);
}

#ifndef CONFIG_USER_ONLY
diff --git a/accel/tcg/translate-all.c b/accel/tcg/translate-all.c
index XXXXXXX..XXXXXXX 100644
--- a/accel/tcg/translate-all.c
+++ b/accel/tcg/translate-all.c
@@ -XXX,XX +XXX,XX @@ static int encode_search(TranslationBlock *tb, uint8_t *block)

for (j = 0; j < TARGET_INSN_START_WORDS; ++j) {
if (i == 0) {
- prev = (j == 0 ? tb_pc(tb) : 0);
+ prev = (!TARGET_TB_PCREL && j == 0 ? tb_pc(tb) : 0);
} else {
prev = tcg_ctx->gen_insn_data[i - 1][j];
}
@@ -XXX,XX +XXX,XX @@ static int encode_search(TranslationBlock *tb, uint8_t *block)
static int cpu_restore_state_from_tb(CPUState *cpu, TranslationBlock *tb,
uintptr_t searched_pc, bool reset_icount)
{
- target_ulong data[TARGET_INSN_START_WORDS] = { tb_pc(tb) };
+ target_ulong data[TARGET_INSN_START_WORDS];
uintptr_t host_pc = (uintptr_t)tb->tc.ptr;
CPUArchState *env = cpu->env_ptr;
const uint8_t *p = tb->tc.ptr + tb->tc.size;
@@ -XXX,XX +XXX,XX @@ static int cpu_restore_state_from_tb(CPUState *cpu, TranslationBlock *tb,
return -1;
}

+ memset(data, 0, sizeof(data));
+ if (!TARGET_TB_PCREL) {
+ data[0] = tb_pc(tb);
+ }
+
/* Reconstruct the stored insn data while looking for the point at
which the end of the insn exceeds the searched_pc. */
for (i = 0; i < num_insns; ++i) {
@@ -XXX,XX +XXX,XX @@ static bool tb_cmp(const void *ap, const void *bp)
const TranslationBlock *a = ap;
const TranslationBlock *b = bp;

- return tb_pc(a) == tb_pc(b) &&
- a->cs_base == b->cs_base &&
- a->flags == b->flags &&
- (tb_cflags(a) & ~CF_INVALID) == (tb_cflags(b) & ~CF_INVALID) &&
- a->trace_vcpu_dstate == b->trace_vcpu_dstate &&
- a->page_addr[0] == b->page_addr[0] &&
- a->page_addr[1] == b->page_addr[1];
+ return ((TARGET_TB_PCREL || tb_pc(a) == tb_pc(b)) &&
+ a->cs_base == b->cs_base &&
+ a->flags == b->flags &&
+ (tb_cflags(a) & ~CF_INVALID) == (tb_cflags(b) & ~CF_INVALID) &&
+ a->trace_vcpu_dstate == b->trace_vcpu_dstate &&
+ a->page_addr[0] == b->page_addr[0] &&
+ a->page_addr[1] == b->page_addr[1]);
}

void tb_htable_init(void)
@@ -XXX,XX +XXX,XX @@ static inline void tb_jmp_unlink(TranslationBlock *dest)
qemu_spin_unlock(&dest->jmp_lock);
}

+static void tb_jmp_cache_inval_tb(TranslationBlock *tb)
+{
+ CPUState *cpu;
+
+ if (TARGET_TB_PCREL) {
+ /* A TB may be at any virtual address */
+ CPU_FOREACH(cpu) {
+ tcg_flush_jmp_cache(cpu);
+ }
+ } else {
+ uint32_t h = tb_jmp_cache_hash_func(tb_pc(tb));
+
+ CPU_FOREACH(cpu) {
+ CPUJumpCache *jc = cpu->tb_jmp_cache;
+
+ if (qatomic_read(&jc->array[h].tb) == tb) {
+ qatomic_set(&jc->array[h].tb, NULL);
+ }
+ }
+ }
+}
+
/*
* In user-mode, call with mmap_lock held.
* In !user-mode, if @rm_from_page_list is set, call with the TB's pages'
@@ -XXX,XX +XXX,XX @@ static inline void tb_jmp_unlink(TranslationBlock *dest)
*/
static void do_tb_phys_invalidate(TranslationBlock *tb, bool rm_from_page_list)
{
- CPUState *cpu;
PageDesc *p;
uint32_t h;
tb_page_addr_t phys_pc;
@@ -XXX,XX +XXX,XX @@ static void do_tb_phys_invalidate(TranslationBlock *tb, bool rm_from_page_list)

/* remove the TB from the hash list */
phys_pc = tb->page_addr[0];
- h = tb_hash_func(phys_pc, tb_pc(tb), tb->flags, orig_cflags,
- tb->trace_vcpu_dstate);
+ h = tb_hash_func(phys_pc, (TARGET_TB_PCREL ? 0 : tb_pc(tb)),
+ tb->flags, orig_cflags, tb->trace_vcpu_dstate);
if (!qht_remove(&tb_ctx.htable, tb, h)) {
return;
}
@@ -XXX,XX +XXX,XX @@ static void do_tb_phys_invalidate(TranslationBlock *tb, bool rm_from_page_list)
}

/* remove the TB from the hash list */
- h = tb_jmp_cache_hash_func(tb->pc);
- CPU_FOREACH(cpu) {
- CPUJumpCache *jc = cpu->tb_jmp_cache;
- if (qatomic_read(&jc->array[h].tb) == tb) {
- qatomic_set(&jc->array[h].tb, NULL);
- }
- }
+ tb_jmp_cache_inval_tb(tb);

/* suppress this TB from the two jump lists */
tb_remove_from_jmp_list(tb, 0);
@@ -XXX,XX +XXX,XX @@ tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
}

/* add in the hash table */
- h = tb_hash_func(phys_pc, tb_pc(tb), tb->flags, tb->cflags,
- tb->trace_vcpu_dstate);
+ h = tb_hash_func(phys_pc, (TARGET_TB_PCREL ? 0 : tb_pc(tb)),
+ tb->flags, tb->cflags, tb->trace_vcpu_dstate);
qht_insert(&tb_ctx.htable, tb, h, &existing_tb);

/* remove TB from the page(s) if we couldn't insert it */
@@ -XXX,XX +XXX,XX @@ TranslationBlock *tb_gen_code(CPUState *cpu,

gen_code_buf = tcg_ctx->code_gen_ptr;
tb->tc.ptr = tcg_splitwx_to_rx(gen_code_buf);
+#if !TARGET_TB_PCREL
tb->pc = pc;
+#endif
tb->cs_base = cs_base;
tb->flags = flags;
tb->cflags = cflags;
--
2.34.1

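The jump-cache change above relies on a standard publish/consume pairing: the writer stores pc before releasing tb, so a reader that observes tb through a load-acquire is guaranteed to see the matching pc. Isolated from the #ifdefs, a reduced sketch of that contract:

    /* writer */
    jc->array[hash].pc = pc;                         /* plain store */
    qatomic_store_release(&jc->array[hash].tb, tb);  /* publish tb  */

    /* reader */
    tb = qatomic_load_acquire(&jc->array[hash].tb);
    if (tb != NULL) {
        pc = jc->array[hash].pc;   /* ordered after the acquire */
    }
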
From: Leandro Lupori <leandro.lupori@eldorado.org.br>

PowerPC64 processors handle direct branches better than indirect
ones, resulting in fewer stalled cycles and branch misses.

However, PPC's tb_target_set_jmp_target() was only using direct
branches for 16-bit jumps, while PowerPC64's unconditional branch
instructions are able to handle displacements of up to 26 bits.
To take advantage of this, jumps whose displacements fit between
17 and 26 bits are now also converted to direct branches.

Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Signed-off-by: Leandro Lupori <leandro.lupori@eldorado.org.br>
[rth: Expanded some commentary.]
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/ppc/tcg-target.c.inc | 119 +++++++++++++++++++++++++++++----------
1 file changed, 88 insertions(+), 31 deletions(-)

diff --git a/tcg/ppc/tcg-target.c.inc b/tcg/ppc/tcg-target.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/tcg/ppc/tcg-target.c.inc
+++ b/tcg/ppc/tcg-target.c.inc
@@ -XXX,XX +XXX,XX @@ static void tcg_out_mb(TCGContext *s, TCGArg a0)
tcg_out32(s, insn);
}

+static inline uint64_t make_pair(tcg_insn_unit i1, tcg_insn_unit i2)
+{
+ if (HOST_BIG_ENDIAN) {
+ return (uint64_t)i1 << 32 | i2;
+ }
+ return (uint64_t)i2 << 32 | i1;
+}
+
+static inline void ppc64_replace2(uintptr_t rx, uintptr_t rw,
+ tcg_insn_unit i0, tcg_insn_unit i1)
+{
+#if TCG_TARGET_REG_BITS == 64
+ qatomic_set((uint64_t *)rw, make_pair(i0, i1));
+ flush_idcache_range(rx, rw, 8);
+#else
+ qemu_build_not_reached();
+#endif
+}
+
+static inline void ppc64_replace4(uintptr_t rx, uintptr_t rw,
+ tcg_insn_unit i0, tcg_insn_unit i1,
+ tcg_insn_unit i2, tcg_insn_unit i3)
+{
+ uint64_t p[2];
+
+ p[!HOST_BIG_ENDIAN] = make_pair(i0, i1);
+ p[HOST_BIG_ENDIAN] = make_pair(i2, i3);
+
+ /*
+ * There's no convenient way to get the compiler to allocate a pair
+ * of registers at an even index, so copy into r6/r7 and clobber.
+ */
+ asm("mr %%r6, %1\n\t"
+ "mr %%r7, %2\n\t"
+ "stq %%r6, %0"
+ : "=Q"(*(__int128 *)rw) : "r"(p[0]), "r"(p[1]) : "r6", "r7");
+ flush_idcache_range(rx, rw, 16);
+}
+
void tb_target_set_jmp_target(uintptr_t tc_ptr, uintptr_t jmp_rx,
uintptr_t jmp_rw, uintptr_t addr)
{
- if (TCG_TARGET_REG_BITS == 64) {
- tcg_insn_unit i1, i2;
70
- if (TCG_TARGET_REG_BITS == 64) {
249
@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
71
- tcg_insn_unit i1, i2;
250
? C_O2_I4(r, r, 0, 1, rA, r)
72
- intptr_t tb_diff = addr - tc_ptr;
251
: C_O2_I4(r, r, 0, 1, r, r));
73
- intptr_t br_diff = addr - (jmp_rx + 4);
252
74
- uint64_t pair;
253
+ case INDEX_op_st_vec:
75
+ tcg_insn_unit i0, i1, i2, i3;
254
+ return C_O0_I2(v, r);
76
+ intptr_t tb_diff = addr - tc_ptr;
255
+ case INDEX_op_ld_vec:
77
+ intptr_t br_diff = addr - (jmp_rx + 4);
256
+ case INDEX_op_dupm_vec:
78
+ intptr_t lo, hi;
257
+ return C_O1_I1(v, r);
79
258
+ case INDEX_op_dup_vec:
80
- /* This does not exercise the range of the branch, but we do
259
+ return C_O1_I1(v, vr);
81
- still need to be able to load the new value of TCG_REG_TB.
260
+ case INDEX_op_add_vec:
82
- But this does still happen quite often. */
261
+ case INDEX_op_sub_vec:
83
- if (tb_diff == (int16_t)tb_diff) {
262
+ case INDEX_op_and_vec:
84
- i1 = ADDI | TAI(TCG_REG_TB, TCG_REG_TB, tb_diff);
263
+ case INDEX_op_or_vec:
85
- i2 = B | (br_diff & 0x3fffffc);
264
+ case INDEX_op_xor_vec:
86
- } else {
265
+ case INDEX_op_cmp_vec:
87
- intptr_t lo = (int16_t)tb_diff;
266
+ return C_O1_I2(v, v, v);
88
- intptr_t hi = (int32_t)(tb_diff - lo);
267
+
89
- assert(tb_diff == hi + lo);
268
default:
90
- i1 = ADDIS | TAI(TCG_REG_TB, TCG_REG_TB, hi >> 16);
269
g_assert_not_reached();
91
- i2 = ADDI | TAI(TCG_REG_TB, TCG_REG_TB, lo);
270
}
92
- }
271
}
93
-#if HOST_BIG_ENDIAN
272
94
- pair = (uint64_t)i1 << 32 | i2;
273
+/*
95
-#else
274
+ * Mainline glibc added HWCAP_S390_VX before it was kernel abi.
96
- pair = (uint64_t)i2 << 32 | i1;
275
+ * Some distros have fixed this up locally, others have not.
97
-#endif
276
+ */
98
-
277
+#ifndef HWCAP_S390_VXRS
99
- /* As per the enclosing if, this is ppc64. Avoid the _Static_assert
278
+#define HWCAP_S390_VXRS 2048
100
- within qatomic_set that would fail to build a ppc32 host. */
279
+#endif
101
- qatomic_set__nocheck((uint64_t *)jmp_rw, pair);
280
+
102
- flush_idcache_range(jmp_rx, jmp_rw, 8);
281
static void query_s390_facilities(void)
103
- } else {
282
{
104
+ if (TCG_TARGET_REG_BITS == 32) {
283
unsigned long hwcap = qemu_getauxval(AT_HWCAP);
105
intptr_t diff = addr - jmp_rx;
284
@@ -XXX,XX +XXX,XX @@ static void query_s390_facilities(void)
106
tcg_debug_assert(in_range_b(diff));
285
asm volatile(".word 0xb2b0,0x1000"
107
qatomic_set((uint32_t *)jmp_rw, B | (diff & 0x3fffffc));
286
: "=r"(r0) : "r"(r0), "r"(r1) : "memory", "cc");
108
flush_idcache_range(jmp_rx, jmp_rw, 4);
109
+ return;
287
}
110
}
288
+
111
+
289
+ /*
112
+ /*
290
+ * Use of vector registers requires os support beyond the facility bit.
113
+ * For 16-bit displacements, we can use a single add + branch.
291
+ * If the kernel does not advertise support, disable the facility bits.
114
+ * This happens quite often.
292
+ * There is nothing else we currently care about in the 3rd word, so
293
+ * disable VECTOR with one store.
294
+ */
115
+ */
295
+ if (1 || !(hwcap & HWCAP_S390_VXRS)) {
116
+ if (tb_diff == (int16_t)tb_diff) {
296
+ s390_facilities[2] = 0;
117
+ i0 = ADDI | TAI(TCG_REG_TB, TCG_REG_TB, tb_diff);
118
+ i1 = B | (br_diff & 0x3fffffc);
119
+ ppc64_replace2(jmp_rx, jmp_rw, i0, i1);
120
+ return;
297
+ }
121
+ }
122
+
123
+ lo = (int16_t)tb_diff;
124
+ hi = (int32_t)(tb_diff - lo);
125
+ assert(tb_diff == hi + lo);
126
+ i0 = ADDIS | TAI(TCG_REG_TB, TCG_REG_TB, hi >> 16);
127
+ i1 = ADDI | TAI(TCG_REG_TB, TCG_REG_TB, lo);
128
+
129
+ /*
130
+ * Without stq from 2.07, we can only update two insns,
131
+ * and those must be the ones that load the target address.
132
+ */
133
+ if (!have_isa_2_07) {
134
+ ppc64_replace2(jmp_rx, jmp_rw, i0, i1);
135
+ return;
136
+ }
137
+
138
+ /*
139
+ * For 26-bit displacements, we can use a direct branch.
140
+ * Otherwise we still need the indirect branch, which we
141
+ * must restore after a potential direct branch write.
142
+ */
143
+ br_diff -= 4;
144
+ if (in_range_b(br_diff)) {
145
+ i2 = B | (br_diff & 0x3fffffc);
146
+ i3 = NOP;
147
+ } else {
148
+ i2 = MTSPR | RS(TCG_REG_TB) | CTR;
149
+ i3 = BCCTR | BO_ALWAYS;
150
+ }
151
+ ppc64_replace4(jmp_rx, jmp_rw, i0, i1, i2, i3);
298
}
152
}
299
153
300
static void tcg_target_init(TCGContext *s)
154
static void tcg_out_call_int(TCGContext *s, int lk,
301
@@ -XXX,XX +XXX,XX @@ static void tcg_target_init(TCGContext *s)
155
@@ -XXX,XX +XXX,XX @@ static void tcg_out_op(TCGContext *s, TCGOpcode opc,
302
156
if (s->tb_jmp_insn_offset) {
303
tcg_target_available_regs[TCG_TYPE_I32] = 0xffff;
157
/* Direct jump. */
304
tcg_target_available_regs[TCG_TYPE_I64] = 0xffff;
158
if (TCG_TARGET_REG_BITS == 64) {
305
+ if (HAVE_FACILITY(VECTOR)) {
159
- /* Ensure the next insns are 8-byte aligned. */
306
+ tcg_target_available_regs[TCG_TYPE_V64] = 0xffffffff00000000ull;
160
- if ((uintptr_t)s->code_ptr & 7) {
307
+ tcg_target_available_regs[TCG_TYPE_V128] = 0xffffffff00000000ull;
161
+ /* Ensure the next insns are 8 or 16-byte aligned. */
308
+ }
162
+ while ((uintptr_t)s->code_ptr & (have_isa_2_07 ? 15 : 7)) {
309
163
tcg_out32(s, NOP);
310
tcg_target_call_clobber_regs = 0;
164
}
311
tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_R0);
165
s->tb_jmp_insn_offset[args[0]] = tcg_current_code_size(s);
312
@@ -XXX,XX +XXX,XX @@ static void tcg_target_init(TCGContext *s)
313
/* The return register can be considered call-clobbered. */
314
tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_R14);
315
316
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V0);
317
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V1);
318
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V2);
319
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V3);
320
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V4);
321
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V5);
322
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V6);
323
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V7);
324
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V16);
325
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V17);
326
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V18);
327
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V19);
328
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V20);
329
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V21);
330
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V22);
331
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V23);
332
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V24);
333
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V25);
334
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V26);
335
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V27);
336
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V28);
337
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V29);
338
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V30);
339
+ tcg_regset_set_reg(tcg_target_call_clobber_regs, TCG_REG_V31);
340
+
341
s->reserved_regs = 0;
342
tcg_regset_set_reg(s->reserved_regs, TCG_TMP0);
343
/* XXX many insns can't be used with R0, so we better avoid it for now */
344
--
166
--
345
2.25.1
167
2.34.1
346
347
diff view generated by jsdifflib
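[Two standalone C sketches, for illustration only; they are not part of
either patch above, and every name in them is local to the example.]

First, the facility macro from the s390x patch. STFLE stores the facility
list most-significant-bit first within each 64-bit word, so facility 129
lands in word 129 / 64 = 2 at host bit 63 - (129 % 64) = 62, which is why
the array grows to three words:

    #include <stdint.h>
    #include <stdio.h>

    static uint64_t s390_facilities[3];

    #define FACILITY_VECTOR 129
    #define HAVE_FACILITY(X) \
        ((s390_facilities[FACILITY_##X / 64] >> (63 - FACILITY_##X % 64)) & 1)

    int main(void)
    {
        s390_facilities[2] = 1ull << 62;  /* pretend STFLE reported bit 129 */
        printf("%d\n", (int)HAVE_FACILITY(VECTOR));  /* prints 1 */
        s390_facilities[2] = 0;           /* what the VXRS fallback does */
        printf("%d\n", (int)HAVE_FACILITY(VECTOR));  /* prints 0 */
        return 0;
    }

Second, the lo/hi split used before emitting ADDIS/ADDI in the ppc patch:
lo is the sign-extended low 16 bits of the displacement, so the remainder
has its low 16 bits clear and fits the shifted ADDIS immediate:

    #include <assert.h>
    #include <stdint.h>

    int main(void)
    {
        /* Sample displacements across the range the TB jump may span. */
        for (int64_t d = -0x7fff0000ll; d <= 0x7fff0000ll; d += 0x8765) {
            intptr_t lo = (int16_t)d;        /* sign-extended low 16 bits */
            intptr_t hi = (int32_t)(d - lo); /* low 16 bits are zero */
            assert(d == hi + lo);
            assert((hi & 0xffff) == 0);      /* ADDIS immediate is hi >> 16 */
            assert(lo >= -0x8000 && lo <= 0x7fff);  /* fits ADDI */
        }
        return 0;
    }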
For usadd, we only have to consider overflow. Since ~B + B == -1,
the maximum value for A that saturates is ~B.

For ussub, we only have to consider underflow. The minimum value
that saturates to 0 from A - B is B.

Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/tcg-op-vec.c | 37 +++++++++++++++++++++++++++++++++++--
1 file changed, 35 insertions(+), 2 deletions(-)

diff --git a/tcg/tcg-op-vec.c b/tcg/tcg-op-vec.c
index XXXXXXX..XXXXXXX 100644
--- a/tcg/tcg-op-vec.c
+++ b/tcg/tcg-op-vec.c
@@ -XXX,XX +XXX,XX @@ bool tcg_can_emit_vecop_list(const TCGOpcode *list,
             continue;
         }
         break;
+    case INDEX_op_usadd_vec:
+        if (tcg_can_emit_vec_op(INDEX_op_umin_vec, type, vece) ||
+            tcg_can_emit_vec_op(INDEX_op_cmp_vec, type, vece)) {
+            continue;
+        }
+        break;
+    case INDEX_op_ussub_vec:
+        if (tcg_can_emit_vec_op(INDEX_op_umax_vec, type, vece) ||
+            tcg_can_emit_vec_op(INDEX_op_cmp_vec, type, vece)) {
+            continue;
+        }
+        break;
     case INDEX_op_cmpsel_vec:
     case INDEX_op_smin_vec:
     case INDEX_op_smax_vec:
@@ -XXX,XX +XXX,XX @@ void tcg_gen_ssadd_vec(unsigned vece, TCGv_vec r, TCGv_vec a, TCGv_vec b)

 void tcg_gen_usadd_vec(unsigned vece, TCGv_vec r, TCGv_vec a, TCGv_vec b)
 {
-    do_op3_nofail(vece, r, a, b, INDEX_op_usadd_vec);
+    if (!do_op3(vece, r, a, b, INDEX_op_usadd_vec)) {
+        const TCGOpcode *hold_list = tcg_swap_vecop_list(NULL);
+        TCGv_vec t = tcg_temp_new_vec_matching(r);
+
+        /* usadd(a, b) = min(a, ~b) + b */
+        tcg_gen_not_vec(vece, t, b);
+        tcg_gen_umin_vec(vece, t, t, a);
+        tcg_gen_add_vec(vece, r, t, b);
+
+        tcg_temp_free_vec(t);
+        tcg_swap_vecop_list(hold_list);
+    }
 }

 void tcg_gen_sssub_vec(unsigned vece, TCGv_vec r, TCGv_vec a, TCGv_vec b)
@@ -XXX,XX +XXX,XX @@ void tcg_gen_sssub_vec(unsigned vece, TCGv_vec r, TCGv_vec a, TCGv_vec b)

 void tcg_gen_ussub_vec(unsigned vece, TCGv_vec r, TCGv_vec a, TCGv_vec b)
 {
-    do_op3_nofail(vece, r, a, b, INDEX_op_ussub_vec);
+    if (!do_op3(vece, r, a, b, INDEX_op_ussub_vec)) {
+        const TCGOpcode *hold_list = tcg_swap_vecop_list(NULL);
+        TCGv_vec t = tcg_temp_new_vec_matching(r);
+
+        /* ussub(a, b) = max(a, b) - b */
+        tcg_gen_umax_vec(vece, t, a, b);
+        tcg_gen_sub_vec(vece, r, t, b);
+
+        tcg_temp_free_vec(t);
+        tcg_swap_vecop_list(hold_list);
+    }
 }

 static void do_minmax(unsigned vece, TCGv_vec r, TCGv_vec a,
--
2.25.1

diff view generated by jsdifflib
The value previously chosen overlaps GUSA_MASK.

Rename all DELAY_SLOT_* and GUSA_* defines to emphasize
that they are included in TB_FLAGS. Add aliases for the
FPSCR and SR bits that are included in TB_FLAGS, so that
we don't accidentally reassign those bits.

Fixes: 4da06fb3062 ("target/sh4: Implement prctl_unalign_sigbus")
Resolves: https://gitlab.com/qemu-project/qemu/-/issues/856
Reviewed-by: Yoshinori Sato <ysato@users.sourceforge.jp>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
target/sh4/cpu.h | 56 +++++++++++++------------
linux-user/sh4/signal.c | 6 +--
target/sh4/cpu.c | 6 +--
target/sh4/helper.c | 6 +--
target/sh4/translate.c | 90 ++++++++++++++++++++++-------------------
5 files changed, 88 insertions(+), 76 deletions(-)

diff --git a/target/sh4/cpu.h b/target/sh4/cpu.h
index XXXXXXX..XXXXXXX 100644
--- a/target/sh4/cpu.h
+++ b/target/sh4/cpu.h
@@ -XXX,XX +XXX,XX @@
 #define FPSCR_RM_NEAREST (0 << 0)
 #define FPSCR_RM_ZERO (1 << 0)

-#define DELAY_SLOT_MASK 0x7
-#define DELAY_SLOT (1 << 0)
-#define DELAY_SLOT_CONDITIONAL (1 << 1)
-#define DELAY_SLOT_RTE (1 << 2)
+#define TB_FLAG_DELAY_SLOT (1 << 0)
+#define TB_FLAG_DELAY_SLOT_COND (1 << 1)
+#define TB_FLAG_DELAY_SLOT_RTE (1 << 2)
+#define TB_FLAG_PENDING_MOVCA (1 << 3)
+#define TB_FLAG_GUSA_SHIFT 4 /* [11:4] */
+#define TB_FLAG_GUSA_EXCLUSIVE (1 << 12)
+#define TB_FLAG_UNALIGN (1 << 13)
+#define TB_FLAG_SR_FD (1 << SR_FD) /* 15 */
+#define TB_FLAG_FPSCR_PR FPSCR_PR /* 19 */
+#define TB_FLAG_FPSCR_SZ FPSCR_SZ /* 20 */
+#define TB_FLAG_FPSCR_FR FPSCR_FR /* 21 */
+#define TB_FLAG_SR_RB (1 << SR_RB) /* 29 */
+#define TB_FLAG_SR_MD (1 << SR_MD) /* 30 */

-#define TB_FLAG_PENDING_MOVCA (1 << 3)
-#define TB_FLAG_UNALIGN (1 << 4)
-
-#define GUSA_SHIFT 4
-#ifdef CONFIG_USER_ONLY
-#define GUSA_EXCLUSIVE (1 << 12)
-#define GUSA_MASK ((0xff << GUSA_SHIFT) | GUSA_EXCLUSIVE)
-#else
-/* Provide dummy versions of the above to allow tests against tbflags
-   to be elided while avoiding ifdefs. */
-#define GUSA_EXCLUSIVE 0
-#define GUSA_MASK 0
-#endif
-
-#define TB_FLAG_ENVFLAGS_MASK (DELAY_SLOT_MASK | GUSA_MASK)
+#define TB_FLAG_DELAY_SLOT_MASK (TB_FLAG_DELAY_SLOT | \
+                                 TB_FLAG_DELAY_SLOT_COND | \
+                                 TB_FLAG_DELAY_SLOT_RTE)
+#define TB_FLAG_GUSA_MASK ((0xff << TB_FLAG_GUSA_SHIFT) | \
+                           TB_FLAG_GUSA_EXCLUSIVE)
+#define TB_FLAG_FPSCR_MASK (TB_FLAG_FPSCR_PR | \
+                            TB_FLAG_FPSCR_SZ | \
+                            TB_FLAG_FPSCR_FR)
+#define TB_FLAG_SR_MASK (TB_FLAG_SR_FD | \
+                         TB_FLAG_SR_RB | \
+                         TB_FLAG_SR_MD)
+#define TB_FLAG_ENVFLAGS_MASK (TB_FLAG_DELAY_SLOT_MASK | \
+                               TB_FLAG_GUSA_MASK)

 typedef struct tlb_t {
     uint32_t vpn;        /* virtual page number */
@@ -XXX,XX +XXX,XX @@ static inline int cpu_mmu_index (CPUSH4State *env, bool ifetch)
 {
     /* The instruction in a RTE delay slot is fetched in privileged
        mode, but executed in user mode. */
-    if (ifetch && (env->flags & DELAY_SLOT_RTE)) {
+    if (ifetch && (env->flags & TB_FLAG_DELAY_SLOT_RTE)) {
         return 0;
     } else {
         return (env->sr & (1u << SR_MD)) == 0 ? 1 : 0;
@@ -XXX,XX +XXX,XX @@ static inline void cpu_get_tb_cpu_state(CPUSH4State *env, target_ulong *pc,
 {
     *pc = env->pc;
     /* For a gUSA region, notice the end of the region. */
-    *cs_base = env->flags & GUSA_MASK ? env->gregs[0] : 0;
-    *flags = env->flags /* TB_FLAG_ENVFLAGS_MASK: bits 0-2, 4-12 */
-            | (env->fpscr & (FPSCR_FR | FPSCR_SZ | FPSCR_PR)) /* Bits 19-21 */
-            | (env->sr & ((1u << SR_MD) | (1u << SR_RB))) /* Bits 29-30 */
-            | (env->sr & (1u << SR_FD)) /* Bit 15 */
+    *cs_base = env->flags & TB_FLAG_GUSA_MASK ? env->gregs[0] : 0;
+    *flags = env->flags
+            | (env->fpscr & TB_FLAG_FPSCR_MASK)
+            | (env->sr & TB_FLAG_SR_MASK)
             | (env->movcal_backup ? TB_FLAG_PENDING_MOVCA : 0); /* Bit 3 */
 #ifdef CONFIG_USER_ONLY
     *flags |= TB_FLAG_UNALIGN * !env_cpu(env)->prctl_unalign_sigbus;
diff --git a/linux-user/sh4/signal.c b/linux-user/sh4/signal.c
index XXXXXXX..XXXXXXX 100644
--- a/linux-user/sh4/signal.c
+++ b/linux-user/sh4/signal.c
@@ -XXX,XX +XXX,XX @@ static void restore_sigcontext(CPUSH4State *regs, struct target_sigcontext *sc)
     __get_user(regs->fpul, &sc->sc_fpul);

     regs->tra = -1; /* disable syscall checks */
-    regs->flags &= ~(DELAY_SLOT_MASK | GUSA_MASK);
+    regs->flags = 0;
 }

 void setup_frame(int sig, struct target_sigaction *ka,
@@ -XXX,XX +XXX,XX @@ void setup_frame(int sig, struct target_sigaction *ka,
     regs->gregs[5] = 0;
     regs->gregs[6] = frame_addr += offsetof(typeof(*frame), sc);
     regs->pc = (unsigned long) ka->_sa_handler;
-    regs->flags &= ~(DELAY_SLOT_MASK | GUSA_MASK);
+    regs->flags &= ~(TB_FLAG_DELAY_SLOT_MASK | TB_FLAG_GUSA_MASK);

     unlock_user_struct(frame, frame_addr, 1);
     return;
@@ -XXX,XX +XXX,XX @@ void setup_rt_frame(int sig, struct target_sigaction *ka,
     regs->gregs[5] = frame_addr + offsetof(typeof(*frame), info);
     regs->gregs[6] = frame_addr + offsetof(typeof(*frame), uc);
     regs->pc = (unsigned long) ka->_sa_handler;
-    regs->flags &= ~(DELAY_SLOT_MASK | GUSA_MASK);
+    regs->flags &= ~(TB_FLAG_DELAY_SLOT_MASK | TB_FLAG_GUSA_MASK);

     unlock_user_struct(frame, frame_addr, 1);
     return;
diff --git a/target/sh4/cpu.c b/target/sh4/cpu.c
index XXXXXXX..XXXXXXX 100644
--- a/target/sh4/cpu.c
+++ b/target/sh4/cpu.c
@@ -XXX,XX +XXX,XX @@ static void superh_cpu_synchronize_from_tb(CPUState *cs,
     SuperHCPU *cpu = SUPERH_CPU(cs);

     cpu->env.pc = tb_pc(tb);
-    cpu->env.flags = tb->flags & TB_FLAG_ENVFLAGS_MASK;
+    cpu->env.flags = tb->flags;
 }

 #ifndef CONFIG_USER_ONLY
@@ -XXX,XX +XXX,XX @@ static bool superh_io_recompile_replay_branch(CPUState *cs,
     SuperHCPU *cpu = SUPERH_CPU(cs);
     CPUSH4State *env = &cpu->env;

-    if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
+    if ((env->flags & (TB_FLAG_DELAY_SLOT | TB_FLAG_DELAY_SLOT_COND))
         && env->pc != tb_pc(tb)) {
         env->pc -= 2;
-        env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
+        env->flags &= ~(TB_FLAG_DELAY_SLOT | TB_FLAG_DELAY_SLOT_COND);
         return true;
     }
     return false;
diff --git a/target/sh4/helper.c b/target/sh4/helper.c
index XXXXXXX..XXXXXXX 100644
--- a/target/sh4/helper.c
+++ b/target/sh4/helper.c
@@ -XXX,XX +XXX,XX @@ void superh_cpu_do_interrupt(CPUState *cs)
     env->sr |= (1u << SR_BL) | (1u << SR_MD) | (1u << SR_RB);
     env->lock_addr = -1;

-    if (env->flags & DELAY_SLOT_MASK) {
+    if (env->flags & TB_FLAG_DELAY_SLOT_MASK) {
         /* Branch instruction should be executed again before delay slot. */
         env->spc -= 2;
         /* Clear flags for exception/interrupt routine. */
-        env->flags &= ~DELAY_SLOT_MASK;
+        env->flags &= ~TB_FLAG_DELAY_SLOT_MASK;
     }

     if (do_exp) {
@@ -XXX,XX +XXX,XX @@ bool superh_cpu_exec_interrupt(CPUState *cs, int interrupt_request)
     CPUSH4State *env = &cpu->env;

     /* Delay slots are indivisible, ignore interrupts */
-    if (env->flags & DELAY_SLOT_MASK) {
+    if (env->flags & TB_FLAG_DELAY_SLOT_MASK) {
         return false;
     } else {
         superh_cpu_do_interrupt(cs);
diff --git a/target/sh4/translate.c b/target/sh4/translate.c
index XXXXXXX..XXXXXXX 100644
--- a/target/sh4/translate.c
+++ b/target/sh4/translate.c
@@ -XXX,XX +XXX,XX @@ void superh_cpu_dump_state(CPUState *cs, FILE *f, int flags)
              i, env->gregs[i], i + 1, env->gregs[i + 1],
              i + 2, env->gregs[i + 2], i + 3, env->gregs[i + 3]);
     }
-    if (env->flags & DELAY_SLOT) {
+    if (env->flags & TB_FLAG_DELAY_SLOT) {
         qemu_printf("in delay slot (delayed_pc=0x%08x)\n",
                     env->delayed_pc);
-    } else if (env->flags & DELAY_SLOT_CONDITIONAL) {
+    } else if (env->flags & TB_FLAG_DELAY_SLOT_COND) {
         qemu_printf("in conditional delay slot (delayed_pc=0x%08x)\n",
                     env->delayed_pc);
-    } else if (env->flags & DELAY_SLOT_RTE) {
+    } else if (env->flags & TB_FLAG_DELAY_SLOT_RTE) {
         qemu_fprintf(f, "in rte delay slot (delayed_pc=0x%08x)\n",
                      env->delayed_pc);
     }
@@ -XXX,XX +XXX,XX @@ static inline void gen_save_cpu_state(DisasContext *ctx, bool save_pc)

 static inline bool use_exit_tb(DisasContext *ctx)
 {
-    return (ctx->tbflags & GUSA_EXCLUSIVE) != 0;
+    return (ctx->tbflags & TB_FLAG_GUSA_EXCLUSIVE) != 0;
 }

 static bool use_goto_tb(DisasContext *ctx, target_ulong dest)
@@ -XXX,XX +XXX,XX @@ static void gen_conditional_jump(DisasContext *ctx, target_ulong dest,
     TCGLabel *l1 = gen_new_label();
     TCGCond cond_not_taken = jump_if_true ? TCG_COND_EQ : TCG_COND_NE;

-    if (ctx->tbflags & GUSA_EXCLUSIVE) {
+    if (ctx->tbflags & TB_FLAG_GUSA_EXCLUSIVE) {
         /* When in an exclusive region, we must continue to the end.
            Therefore, exit the region on a taken branch, but otherwise
            fall through to the next instruction. */
         tcg_gen_brcondi_i32(cond_not_taken, cpu_sr_t, 0, l1);
-        tcg_gen_movi_i32(cpu_flags, ctx->envflags & ~GUSA_MASK);
+        tcg_gen_movi_i32(cpu_flags, ctx->envflags & ~TB_FLAG_GUSA_MASK);
         /* Note that this won't actually use a goto_tb opcode because we
            disallow it in use_goto_tb, but it handles exit + singlestep. */
         gen_goto_tb(ctx, 0, dest);
@@ -XXX,XX +XXX,XX @@ static void gen_delayed_conditional_jump(DisasContext * ctx)
     tcg_gen_mov_i32(ds, cpu_delayed_cond);
     tcg_gen_discard_i32(cpu_delayed_cond);

-    if (ctx->tbflags & GUSA_EXCLUSIVE) {
+    if (ctx->tbflags & TB_FLAG_GUSA_EXCLUSIVE) {
         /* When in an exclusive region, we must continue to the end.
            Therefore, exit the region on a taken branch, but otherwise
            fall through to the next instruction. */
         tcg_gen_brcondi_i32(TCG_COND_EQ, ds, 0, l1);

         /* Leave the gUSA region. */
-        tcg_gen_movi_i32(cpu_flags, ctx->envflags & ~GUSA_MASK);
+        tcg_gen_movi_i32(cpu_flags, ctx->envflags & ~TB_FLAG_GUSA_MASK);
         gen_jump(ctx);

         gen_set_label(l1);
@@ -XXX,XX +XXX,XX @@ static inline void gen_store_fpr64(DisasContext *ctx, TCGv_i64 t, int reg)
 #define XHACK(x) ((((x) & 1 ) << 4) | ((x) & 0xe))

 #define CHECK_NOT_DELAY_SLOT \
-    if (ctx->envflags & DELAY_SLOT_MASK) { \
-        goto do_illegal_slot; \
+    if (ctx->envflags & TB_FLAG_DELAY_SLOT_MASK) { \
+        goto do_illegal_slot; \
     }

 #define CHECK_PRIVILEGED \
@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)
     case 0x000b:        /* rts */
         CHECK_NOT_DELAY_SLOT
         tcg_gen_mov_i32(cpu_delayed_pc, cpu_pr);
-        ctx->envflags |= DELAY_SLOT;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT;
         ctx->delayed_pc = (uint32_t) - 1;
         return;
     case 0x0028:        /* clrmac */
@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)
         CHECK_NOT_DELAY_SLOT
         gen_write_sr(cpu_ssr);
         tcg_gen_mov_i32(cpu_delayed_pc, cpu_spc);
-        ctx->envflags |= DELAY_SLOT_RTE;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT_RTE;
         ctx->delayed_pc = (uint32_t) - 1;
         ctx->base.is_jmp = DISAS_STOP;
         return;
@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)
         return;
     case 0xe000:        /* mov #imm,Rn */
 #ifdef CONFIG_USER_ONLY
-        /* Detect the start of a gUSA region. If so, update envflags
-           and end the TB. This will allow us to see the end of the
-           region (stored in R0) in the next TB. */
+        /*
+         * Detect the start of a gUSA region (mov #-n, r15).
+         * If so, update envflags and end the TB. This will allow us
+         * to see the end of the region (stored in R0) in the next TB.
+         */
         if (B11_8 == 15 && B7_0s < 0 &&
             (tb_cflags(ctx->base.tb) & CF_PARALLEL)) {
-            ctx->envflags = deposit32(ctx->envflags, GUSA_SHIFT, 8, B7_0s);
+            ctx->envflags =
+                deposit32(ctx->envflags, TB_FLAG_GUSA_SHIFT, 8, B7_0s);
             ctx->base.is_jmp = DISAS_STOP;
         }
 #endif
@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)
     case 0xa000:        /* bra disp */
         CHECK_NOT_DELAY_SLOT
         ctx->delayed_pc = ctx->base.pc_next + 4 + B11_0s * 2;
-        ctx->envflags |= DELAY_SLOT;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT;
         return;
     case 0xb000:        /* bsr disp */
         CHECK_NOT_DELAY_SLOT
         tcg_gen_movi_i32(cpu_pr, ctx->base.pc_next + 4);
         ctx->delayed_pc = ctx->base.pc_next + 4 + B11_0s * 2;
-        ctx->envflags |= DELAY_SLOT;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT;
         return;
     }

@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)
         CHECK_NOT_DELAY_SLOT
         tcg_gen_xori_i32(cpu_delayed_cond, cpu_sr_t, 1);
         ctx->delayed_pc = ctx->base.pc_next + 4 + B7_0s * 2;
-        ctx->envflags |= DELAY_SLOT_CONDITIONAL;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT_COND;
         return;
     case 0x8900:        /* bt label */
         CHECK_NOT_DELAY_SLOT
@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)
         CHECK_NOT_DELAY_SLOT
         tcg_gen_mov_i32(cpu_delayed_cond, cpu_sr_t);
         ctx->delayed_pc = ctx->base.pc_next + 4 + B7_0s * 2;
-        ctx->envflags |= DELAY_SLOT_CONDITIONAL;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT_COND;
         return;
     case 0x8800:        /* cmp/eq #imm,R0 */
         tcg_gen_setcondi_i32(TCG_COND_EQ, cpu_sr_t, REG(0), B7_0s);
@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)
     case 0x0023:        /* braf Rn */
         CHECK_NOT_DELAY_SLOT
         tcg_gen_addi_i32(cpu_delayed_pc, REG(B11_8), ctx->base.pc_next + 4);
-        ctx->envflags |= DELAY_SLOT;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT;
         ctx->delayed_pc = (uint32_t) - 1;
         return;
     case 0x0003:        /* bsrf Rn */
         CHECK_NOT_DELAY_SLOT
         tcg_gen_movi_i32(cpu_pr, ctx->base.pc_next + 4);
         tcg_gen_add_i32(cpu_delayed_pc, REG(B11_8), cpu_pr);
-        ctx->envflags |= DELAY_SLOT;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT;
         ctx->delayed_pc = (uint32_t) - 1;
         return;
     case 0x4015:        /* cmp/pl Rn */
@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)
     case 0x402b:        /* jmp @Rn */
         CHECK_NOT_DELAY_SLOT
         tcg_gen_mov_i32(cpu_delayed_pc, REG(B11_8));
-        ctx->envflags |= DELAY_SLOT;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT;
         ctx->delayed_pc = (uint32_t) - 1;
         return;
     case 0x400b:        /* jsr @Rn */
         CHECK_NOT_DELAY_SLOT
         tcg_gen_movi_i32(cpu_pr, ctx->base.pc_next + 4);
         tcg_gen_mov_i32(cpu_delayed_pc, REG(B11_8));
-        ctx->envflags |= DELAY_SLOT;
+        ctx->envflags |= TB_FLAG_DELAY_SLOT;
         ctx->delayed_pc = (uint32_t) - 1;
         return;
     case 0x400e:        /* ldc Rm,SR */
@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)
     fflush(stderr);
 #endif
 do_illegal:
-    if (ctx->envflags & DELAY_SLOT_MASK) {
+    if (ctx->envflags & TB_FLAG_DELAY_SLOT_MASK) {
 do_illegal_slot:
         gen_save_cpu_state(ctx, true);
         gen_helper_raise_slot_illegal_instruction(cpu_env);
@@ -XXX,XX +XXX,XX @@ static void _decode_opc(DisasContext * ctx)

 do_fpu_disabled:
     gen_save_cpu_state(ctx, true);
-    if (ctx->envflags & DELAY_SLOT_MASK) {
+    if (ctx->envflags & TB_FLAG_DELAY_SLOT_MASK) {
         gen_helper_raise_slot_fpu_disable(cpu_env);
     } else {
         gen_helper_raise_fpu_disable(cpu_env);
@@ -XXX,XX +XXX,XX @@ static void decode_opc(DisasContext * ctx)

     _decode_opc(ctx);

-    if (old_flags & DELAY_SLOT_MASK) {
+    if (old_flags & TB_FLAG_DELAY_SLOT_MASK) {
         /* go out of the delay slot */
-        ctx->envflags &= ~DELAY_SLOT_MASK;
+        ctx->envflags &= ~TB_FLAG_DELAY_SLOT_MASK;

         /* When in an exclusive region, we must continue to the end
            for conditional branches. */
-        if (ctx->tbflags & GUSA_EXCLUSIVE
-            && old_flags & DELAY_SLOT_CONDITIONAL) {
+        if (ctx->tbflags & TB_FLAG_GUSA_EXCLUSIVE
+            && old_flags & TB_FLAG_DELAY_SLOT_COND) {
             gen_delayed_conditional_jump(ctx);
             return;
         }
         /* Otherwise this is probably an invalid gUSA region.
            Drop the GUSA bits so the next TB doesn't see them. */
-        ctx->envflags &= ~GUSA_MASK;
+        ctx->envflags &= ~TB_FLAG_GUSA_MASK;

         tcg_gen_movi_i32(cpu_flags, ctx->envflags);
-        if (old_flags & DELAY_SLOT_CONDITIONAL) {
+        if (old_flags & TB_FLAG_DELAY_SLOT_COND) {
             gen_delayed_conditional_jump(ctx);
         } else {
             gen_jump(ctx);
@@ -XXX,XX +XXX,XX @@ static void decode_gusa(DisasContext *ctx, CPUSH4State *env)
     }

     /* The entire region has been translated. */
-    ctx->envflags &= ~GUSA_MASK;
+    ctx->envflags &= ~TB_FLAG_GUSA_MASK;
     ctx->base.pc_next = pc_end;
     ctx->base.num_insns += max_insns - 1;
     return;
@@ -XXX,XX +XXX,XX @@ static void decode_gusa(DisasContext *ctx, CPUSH4State *env)

     /* Restart with the EXCLUSIVE bit set, within a TB run via
        cpu_exec_step_atomic holding the exclusive lock. */
-    ctx->envflags |= GUSA_EXCLUSIVE;
+    ctx->envflags |= TB_FLAG_GUSA_EXCLUSIVE;
     gen_save_cpu_state(ctx, false);
     gen_helper_exclusive(cpu_env);
     ctx->base.is_jmp = DISAS_NORETURN;
@@ -XXX,XX +XXX,XX @@ static void sh4_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs)
                   (tbflags & (1 << SR_RB))) * 0x10;
     ctx->fbank = tbflags & FPSCR_FR ? 0x10 : 0;

-    if (tbflags & GUSA_MASK) {
+#ifdef CONFIG_USER_ONLY
+    if (tbflags & TB_FLAG_GUSA_MASK) {
+        /* In gUSA exclusive region. */
         uint32_t pc = ctx->base.pc_next;
         uint32_t pc_end = ctx->base.tb->cs_base;
-        int backup = sextract32(ctx->tbflags, GUSA_SHIFT, 8);
+        int backup = sextract32(ctx->tbflags, TB_FLAG_GUSA_SHIFT, 8);
         int max_insns = (pc_end - pc) / 2;

         if (pc != pc_end + backup || max_insns < 2) {
             /* This is a malformed gUSA region. Don't do anything special,
                since the interpreter is likely to get confused. */
-            ctx->envflags &= ~GUSA_MASK;
-        } else if (tbflags & GUSA_EXCLUSIVE) {
+            ctx->envflags &= ~TB_FLAG_GUSA_MASK;
+        } else if (tbflags & TB_FLAG_GUSA_EXCLUSIVE) {
             /* Regardless of single-stepping or the end of the page,
                we must complete execution of the gUSA region while
                holding the exclusive lock. */
@@ -XXX,XX +XXX,XX @@ static void sh4_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs)
             return;
         }
     }
+#endif

     /* Since the ISA is fixed-width, we can bound by the number
        of instructions remaining on the page. */
@@ -XXX,XX +XXX,XX @@ static void sh4_tr_translate_insn(DisasContextBase *dcbase, CPUState *cs)
     DisasContext *ctx = container_of(dcbase, DisasContext, base);

 #ifdef CONFIG_USER_ONLY
-    if (unlikely(ctx->envflags & GUSA_MASK)
-        && !(ctx->envflags & GUSA_EXCLUSIVE)) {
+    if (unlikely(ctx->envflags & TB_FLAG_GUSA_MASK)
+        && !(ctx->envflags & TB_FLAG_GUSA_EXCLUSIVE)) {
         /* We're in an gUSA region, and we have not already fallen
            back on using an exclusive region. Attempt to parse the
            region into a single supported atomic operation. Failure
@@ -XXX,XX +XXX,XX @@ static void sh4_tr_tb_stop(DisasContextBase *dcbase, CPUState *cs)
 {
     DisasContext *ctx = container_of(dcbase, DisasContext, base);

-    if (ctx->tbflags & GUSA_EXCLUSIVE) {
+    if (ctx->tbflags & TB_FLAG_GUSA_EXCLUSIVE) {
         /* Ending the region of exclusivity. Clear the bits. */
-        ctx->envflags &= ~GUSA_MASK;
+        ctx->envflags &= ~TB_FLAG_GUSA_MASK;
     }

     switch (ctx->base.is_jmp) {
--
2.34.1

diff view generated by jsdifflib
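[Two standalone C sketches for the patches above, again illustration
only; the constants are copied from the diffs, everything else is local
to the examples.]

The usadd/ussub identities can be checked exhaustively for 8-bit lanes:

    #include <assert.h>
    #include <stdint.h>

    int main(void)
    {
        for (int a = 0; a < 256; a++) {
            for (int b = 0; b < 256; b++) {
                uint8_t nb = ~b;                              /* ~B */
                uint8_t sat_add = a + b > 255 ? 255 : a + b;
                uint8_t sat_sub = a - b < 0 ? 0 : a - b;
                /* usadd(a, b) == min(a, ~b) + b */
                assert((uint8_t)((a < nb ? a : nb) + b) == sat_add);
                /* ussub(a, b) == max(a, b) - b */
                assert((uint8_t)((a > b ? a : b) - b) == sat_sub);
            }
        }
        return 0;
    }

And the sh4 flag collision that motivated the renaming: the old
TB_FLAG_UNALIGN value (1 << 4) sat inside the 8-bit gUSA field at bits
[11:4], while the new bit 13 is outside the whole gUSA mask:

    #include <assert.h>

    #define GUSA_SHIFT          4
    #define GUSA_EXCLUSIVE      (1 << 12)
    #define GUSA_MASK           ((0xff << GUSA_SHIFT) | GUSA_EXCLUSIVE)
    #define OLD_TB_FLAG_UNALIGN (1 << 4)     /* value before the patch */
    #define NEW_TB_FLAG_UNALIGN (1 << 13)    /* value after the patch */

    int main(void)
    {
        assert(OLD_TB_FLAG_UNALIGN & GUSA_MASK);     /* overlap */
        assert(!(NEW_TB_FLAG_UNALIGN & GUSA_MASK));  /* disjoint */
        return 0;
    }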
Deleted patch
This emphasizes that we don't support s390, only 64-bit s390x hosts.

Reviewed-by: Thomas Huth <thuth@redhat.com>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Reviewed-by: David Hildenbrand <david@redhat.com>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
meson.build | 2 --
tcg/{s390 => s390x}/tcg-target-con-set.h | 0
tcg/{s390 => s390x}/tcg-target-con-str.h | 0
tcg/{s390 => s390x}/tcg-target.h | 0
tcg/{s390 => s390x}/tcg-target.c.inc | 0
5 files changed, 2 deletions(-)
rename tcg/{s390 => s390x}/tcg-target-con-set.h (100%)
rename tcg/{s390 => s390x}/tcg-target-con-str.h (100%)
rename tcg/{s390 => s390x}/tcg-target.h (100%)
rename tcg/{s390 => s390x}/tcg-target.c.inc (100%)

diff --git a/meson.build b/meson.build
index XXXXXXX..XXXXXXX 100644
--- a/meson.build
+++ b/meson.build
@@ -XXX,XX +XXX,XX @@ if not get_option('tcg').disabled()
     tcg_arch = 'tci'
   elif config_host['ARCH'] == 'sparc64'
     tcg_arch = 'sparc'
-  elif config_host['ARCH'] == 's390x'
-    tcg_arch = 's390'
   elif config_host['ARCH'] in ['x86_64', 'x32']
     tcg_arch = 'i386'
   elif config_host['ARCH'] == 'ppc64'
diff --git a/tcg/s390/tcg-target-con-set.h b/tcg/s390x/tcg-target-con-set.h
similarity index 100%
rename from tcg/s390/tcg-target-con-set.h
rename to tcg/s390x/tcg-target-con-set.h
diff --git a/tcg/s390/tcg-target-con-str.h b/tcg/s390x/tcg-target-con-str.h
similarity index 100%
rename from tcg/s390/tcg-target-con-str.h
rename to tcg/s390x/tcg-target-con-str.h
diff --git a/tcg/s390/tcg-target.h b/tcg/s390x/tcg-target.h
similarity index 100%
rename from tcg/s390/tcg-target.h
rename to tcg/s390x/tcg-target.h
diff --git a/tcg/s390/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
similarity index 100%
rename from tcg/s390/tcg-target.c.inc
rename to tcg/s390x/tcg-target.c.inc
--
2.25.1

diff view generated by jsdifflib
Deleted patch
They are rightly values in the same enumeration.

Reviewed-by: David Hildenbrand <david@redhat.com>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/s390x/tcg-target.h | 28 +++++++---------------------
1 file changed, 7 insertions(+), 21 deletions(-)

diff --git a/tcg/s390x/tcg-target.h b/tcg/s390x/tcg-target.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.h
+++ b/tcg/s390x/tcg-target.h
@@ -XXX,XX +XXX,XX @@
 #define MAX_CODE_GEN_BUFFER_SIZE (3 * GiB)

 typedef enum TCGReg {
-    TCG_REG_R0 = 0,
-    TCG_REG_R1,
-    TCG_REG_R2,
-    TCG_REG_R3,
-    TCG_REG_R4,
-    TCG_REG_R5,
-    TCG_REG_R6,
-    TCG_REG_R7,
-    TCG_REG_R8,
-    TCG_REG_R9,
-    TCG_REG_R10,
-    TCG_REG_R11,
-    TCG_REG_R12,
-    TCG_REG_R13,
-    TCG_REG_R14,
-    TCG_REG_R15
+    TCG_REG_R0, TCG_REG_R1, TCG_REG_R2, TCG_REG_R3,
+    TCG_REG_R4, TCG_REG_R5, TCG_REG_R6, TCG_REG_R7,
+    TCG_REG_R8, TCG_REG_R9, TCG_REG_R10, TCG_REG_R11,
+    TCG_REG_R12, TCG_REG_R13, TCG_REG_R14, TCG_REG_R15,
+
+    TCG_AREG0 = TCG_REG_R10,
+    TCG_REG_CALL_STACK = TCG_REG_R15
 } TCGReg;

 #define TCG_TARGET_NB_REGS 16
@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities[1];
 #define TCG_TARGET_HAS_mulsh_i64 0

 /* used for function call generation */
-#define TCG_REG_CALL_STACK TCG_REG_R15
 #define TCG_TARGET_STACK_ALIGN 8
 #define TCG_TARGET_CALL_STACK_OFFSET 160

@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities[1];

 #define TCG_TARGET_DEFAULT_MO (TCG_MO_ALL & ~TCG_MO_ST_LD)

-enum {
-    TCG_AREG0 = TCG_REG_R10,
-};
-
 static inline void tb_target_set_jmp_target(uintptr_t tc_ptr, uintptr_t jmp_rx,
                                             uintptr_t jmp_rw, uintptr_t addr)
 {
--
2.25.1

diff view generated by jsdifflib
Deleted patch
These logical and arithmetic operations are optional but trivial.

Reviewed-by: David Hildenbrand <david@redhat.com>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/s390x/tcg-target-con-set.h | 1 +
tcg/s390x/tcg-target.h | 11 ++++++-----
tcg/s390x/tcg-target.c.inc | 32 ++++++++++++++++++++++++++++++++
3 files changed, 39 insertions(+), 5 deletions(-)

diff --git a/tcg/s390x/tcg-target-con-set.h b/tcg/s390x/tcg-target-con-set.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target-con-set.h
+++ b/tcg/s390x/tcg-target-con-set.h
@@ -XXX,XX +XXX,XX @@ C_O0_I2(v, r)
 C_O1_I1(r, L)
 C_O1_I1(r, r)
 C_O1_I1(v, r)
+C_O1_I1(v, v)
 C_O1_I1(v, vr)
 C_O1_I2(r, 0, ri)
 C_O1_I2(r, 0, rI)
diff --git a/tcg/s390x/tcg-target.h b/tcg/s390x/tcg-target.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.h
+++ b/tcg/s390x/tcg-target.h
@@ -XXX,XX +XXX,XX @@ typedef enum TCGReg {
 #define FACILITY_DISTINCT_OPS FACILITY_LOAD_ON_COND
 #define FACILITY_LOAD_ON_COND2 53
 #define FACILITY_VECTOR 129
+#define FACILITY_VECTOR_ENH1 135

 extern uint64_t s390_facilities[3];

@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities[3];
 #define TCG_TARGET_HAS_v128 HAVE_FACILITY(VECTOR)
 #define TCG_TARGET_HAS_v256 0

-#define TCG_TARGET_HAS_andc_vec 0
-#define TCG_TARGET_HAS_orc_vec 0
-#define TCG_TARGET_HAS_not_vec 0
-#define TCG_TARGET_HAS_neg_vec 0
-#define TCG_TARGET_HAS_abs_vec 0
+#define TCG_TARGET_HAS_andc_vec 1
+#define TCG_TARGET_HAS_orc_vec HAVE_FACILITY(VECTOR_ENH1)
+#define TCG_TARGET_HAS_not_vec 1
+#define TCG_TARGET_HAS_neg_vec 1
+#define TCG_TARGET_HAS_abs_vec 1
 #define TCG_TARGET_HAS_roti_vec 0
 #define TCG_TARGET_HAS_rots_vec 0
 #define TCG_TARGET_HAS_rotv_vec 0
diff --git a/tcg/s390x/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.c.inc
+++ b/tcg/s390x/tcg-target.c.inc
@@ -XXX,XX +XXX,XX @@ typedef enum S390Opcode {
     VRIb_VGM = 0xe746,
     VRIc_VREP = 0xe74d,

+    VRRa_VLC = 0xe7de,
+    VRRa_VLP = 0xe7df,
     VRRa_VLR = 0xe756,
     VRRc_VA = 0xe7f3,
     VRRc_VCEQ = 0xe7f8, /* we leave the m5 cs field 0 */
     VRRc_VCH = 0xe7fb, /* " */
     VRRc_VCHL = 0xe7f9, /* " */
     VRRc_VN = 0xe768,
+    VRRc_VNC = 0xe769,
+    VRRc_VNO = 0xe76b,
     VRRc_VO = 0xe76a,
+    VRRc_VOC = 0xe76f,
     VRRc_VS = 0xe7f7,
     VRRc_VX = 0xe76d,
     VRRf_VLVGP = 0xe762,
@@ -XXX,XX +XXX,XX @@ static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc,
         tcg_out_dupm_vec(s, type, vece, a0, a1, a2);
         break;

+    case INDEX_op_abs_vec:
+        tcg_out_insn(s, VRRa, VLP, a0, a1, vece);
+        break;
+    case INDEX_op_neg_vec:
+        tcg_out_insn(s, VRRa, VLC, a0, a1, vece);
+        break;
+    case INDEX_op_not_vec:
+        tcg_out_insn(s, VRRc, VNO, a0, a1, a1, 0);
+        break;
+
     case INDEX_op_add_vec:
         tcg_out_insn(s, VRRc, VA, a0, a1, a2, vece);
         break;
@@ -XXX,XX +XXX,XX @@ static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc,
     case INDEX_op_and_vec:
         tcg_out_insn(s, VRRc, VN, a0, a1, a2, 0);
         break;
+    case INDEX_op_andc_vec:
+        tcg_out_insn(s, VRRc, VNC, a0, a1, a2, 0);
+        break;
     case INDEX_op_or_vec:
         tcg_out_insn(s, VRRc, VO, a0, a1, a2, 0);
         break;
+    case INDEX_op_orc_vec:
+        tcg_out_insn(s, VRRc, VOC, a0, a1, a2, 0);
+        break;
     case INDEX_op_xor_vec:
         tcg_out_insn(s, VRRc, VX, a0, a1, a2, 0);
         break;
@@ -XXX,XX +XXX,XX @@ static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc,
 int tcg_can_emit_vec_op(TCGOpcode opc, TCGType type, unsigned vece)
 {
     switch (opc) {
+    case INDEX_op_abs_vec:
     case INDEX_op_add_vec:
     case INDEX_op_and_vec:
+    case INDEX_op_andc_vec:
+    case INDEX_op_neg_vec:
+    case INDEX_op_not_vec:
     case INDEX_op_or_vec:
+    case INDEX_op_orc_vec:
     case INDEX_op_sub_vec:
     case INDEX_op_xor_vec:
         return 1;
@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
         return C_O1_I1(v, r);
     case INDEX_op_dup_vec:
         return C_O1_I1(v, vr);
+    case INDEX_op_abs_vec:
+    case INDEX_op_neg_vec:
+    case INDEX_op_not_vec:
+        return C_O1_I1(v, v);
     case INDEX_op_add_vec:
     case INDEX_op_sub_vec:
     case INDEX_op_and_vec:
+    case INDEX_op_andc_vec:
     case INDEX_op_or_vec:
+    case INDEX_op_orc_vec:
     case INDEX_op_xor_vec:
     case INDEX_op_cmp_vec:
         return C_O1_I2(v, v, v);
--
2.25.1

diff view generated by jsdifflib
Deleted patch
Reviewed-by: David Hildenbrand <david@redhat.com>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/s390x/tcg-target.h | 2 +-
tcg/s390x/tcg-target.c.inc | 7 +++++++
2 files changed, 8 insertions(+), 1 deletion(-)

diff --git a/tcg/s390x/tcg-target.h b/tcg/s390x/tcg-target.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.h
+++ b/tcg/s390x/tcg-target.h
@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities[3];
 #define TCG_TARGET_HAS_shi_vec 0
 #define TCG_TARGET_HAS_shs_vec 0
 #define TCG_TARGET_HAS_shv_vec 0
-#define TCG_TARGET_HAS_mul_vec 0
+#define TCG_TARGET_HAS_mul_vec 1
 #define TCG_TARGET_HAS_sat_vec 0
 #define TCG_TARGET_HAS_minmax_vec 0
 #define TCG_TARGET_HAS_bitsel_vec 0
diff --git a/tcg/s390x/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.c.inc
+++ b/tcg/s390x/tcg-target.c.inc
@@ -XXX,XX +XXX,XX @@ typedef enum S390Opcode {
     VRRc_VCEQ = 0xe7f8, /* we leave the m5 cs field 0 */
     VRRc_VCH = 0xe7fb, /* " */
     VRRc_VCHL = 0xe7f9, /* " */
+    VRRc_VML = 0xe7a2,
     VRRc_VN = 0xe768,
     VRRc_VNC = 0xe769,
     VRRc_VNO = 0xe76b,
@@ -XXX,XX +XXX,XX @@ static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc,
     case INDEX_op_andc_vec:
         tcg_out_insn(s, VRRc, VNC, a0, a1, a2, 0);
         break;
+    case INDEX_op_mul_vec:
+        tcg_out_insn(s, VRRc, VML, a0, a1, a2, vece);
+        break;
     case INDEX_op_or_vec:
         tcg_out_insn(s, VRRc, VO, a0, a1, a2, 0);
         break;
@@ -XXX,XX +XXX,XX @@ int tcg_can_emit_vec_op(TCGOpcode opc, TCGType type, unsigned vece)
         return 1;
     case INDEX_op_cmp_vec:
         return -1;
+    case INDEX_op_mul_vec:
+        return vece < MO_64;
     default:
         return 0;
     }
@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
     case INDEX_op_orc_vec:
     case INDEX_op_xor_vec:
     case INDEX_op_cmp_vec:
+    case INDEX_op_mul_vec:
         return C_O1_I2(v, v, v);

     default:
--
2.25.1

diff view generated by jsdifflib
Deleted patch
Reviewed-by: David Hildenbrand <david@redhat.com>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/s390x/tcg-target-con-set.h | 1 +
tcg/s390x/tcg-target.h | 12 ++---
tcg/s390x/tcg-target.c.inc | 93 +++++++++++++++++++++++++++++++++-
3 files changed, 99 insertions(+), 7 deletions(-)

diff --git a/tcg/s390x/tcg-target-con-set.h b/tcg/s390x/tcg-target-con-set.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target-con-set.h
+++ b/tcg/s390x/tcg-target-con-set.h
@@ -XXX,XX +XXX,XX @@ C_O1_I2(r, 0, rI)
 C_O1_I2(r, 0, rJ)
 C_O1_I2(r, r, ri)
 C_O1_I2(r, rZ, r)
+C_O1_I2(v, v, r)
 C_O1_I2(v, v, v)
 C_O1_I4(r, r, ri, r, 0)
 C_O1_I4(r, r, ri, rI, 0)
diff --git a/tcg/s390x/tcg-target.h b/tcg/s390x/tcg-target.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.h
+++ b/tcg/s390x/tcg-target.h
@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities[3];
 #define TCG_TARGET_HAS_not_vec 1
 #define TCG_TARGET_HAS_neg_vec 1
 #define TCG_TARGET_HAS_abs_vec 1
-#define TCG_TARGET_HAS_roti_vec 0
-#define TCG_TARGET_HAS_rots_vec 0
-#define TCG_TARGET_HAS_rotv_vec 0
-#define TCG_TARGET_HAS_shi_vec 0
-#define TCG_TARGET_HAS_shs_vec 0
-#define TCG_TARGET_HAS_shv_vec 0
+#define TCG_TARGET_HAS_roti_vec 1
+#define TCG_TARGET_HAS_rots_vec 1
+#define TCG_TARGET_HAS_rotv_vec 1
+#define TCG_TARGET_HAS_shi_vec 1
+#define TCG_TARGET_HAS_shs_vec 1
+#define TCG_TARGET_HAS_shv_vec 1
 #define TCG_TARGET_HAS_mul_vec 1
 #define TCG_TARGET_HAS_sat_vec 0
 #define TCG_TARGET_HAS_minmax_vec 0
diff --git a/tcg/s390x/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.c.inc
+++ b/tcg/s390x/tcg-target.c.inc
@@ -XXX,XX +XXX,XX @@ typedef enum S390Opcode {
     VRRc_VCEQ = 0xe7f8, /* we leave the m5 cs field 0 */
     VRRc_VCH = 0xe7fb, /* " */
     VRRc_VCHL = 0xe7f9, /* " */
+    VRRc_VERLLV = 0xe773,
+    VRRc_VESLV = 0xe770,
+    VRRc_VESRAV = 0xe77a,
+    VRRc_VESRLV = 0xe778,
     VRRc_VML = 0xe7a2,
     VRRc_VN = 0xe768,
     VRRc_VNC = 0xe769,
@@ -XXX,XX +XXX,XX @@ typedef enum S390Opcode {
     VRRc_VX = 0xe76d,
     VRRf_VLVGP = 0xe762,

+    VRSa_VERLL = 0xe733,
+    VRSa_VESL = 0xe730,
+    VRSa_VESRA = 0xe73a,
+    VRSa_VESRL = 0xe738,
     VRSb_VLVG = 0xe722,
     VRSc_VLGV = 0xe721,

@@ -XXX,XX +XXX,XX @@ static void tcg_out_insn_VRRf(TCGContext *s, S390Opcode op,
     tcg_out16(s, (op & 0x00ff) | RXB(v1, 0, 0, 0));
 }

+static void tcg_out_insn_VRSa(TCGContext *s, S390Opcode op, TCGReg v1,
+                              intptr_t d2, TCGReg b2, TCGReg v3, int m4)
+{
+    tcg_debug_assert(is_vector_reg(v1));
+    tcg_debug_assert(d2 >= 0 && d2 <= 0xfff);
+    tcg_debug_assert(is_general_reg(b2));
+    tcg_debug_assert(is_vector_reg(v3));
+    tcg_out16(s, (op & 0xff00) | ((v1 & 0xf) << 4) | (v3 & 0xf));
+    tcg_out16(s, b2 << 12 | d2);
+    tcg_out16(s, (op & 0x00ff) | RXB(v1, 0, v3, 0) | (m4 << 12));
+}
+
 static void tcg_out_insn_VRSb(TCGContext *s, S390Opcode op, TCGReg v1,
                               intptr_t d2, TCGReg b2, TCGReg r3, int m4)
 {
@@ -XXX,XX +XXX,XX @@ static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc,
         tcg_out_insn(s, VRRc, VX, a0, a1, a2, 0);
         break;

+    case INDEX_op_shli_vec:
+        tcg_out_insn(s, VRSa, VESL, a0, a2, TCG_REG_NONE, a1, vece);
+        break;
+    case INDEX_op_shri_vec:
+        tcg_out_insn(s, VRSa, VESRL, a0, a2, TCG_REG_NONE, a1, vece);
+        break;
+    case INDEX_op_sari_vec:
+        tcg_out_insn(s, VRSa, VESRA, a0, a2, TCG_REG_NONE, a1, vece);
+        break;
+    case INDEX_op_rotli_vec:
+        tcg_out_insn(s, VRSa, VERLL, a0, a2, TCG_REG_NONE, a1, vece);
+        break;
+    case INDEX_op_shls_vec:
+        tcg_out_insn(s, VRSa, VESL, a0, 0, a2, a1, vece);
+        break;
+    case INDEX_op_shrs_vec:
+        tcg_out_insn(s, VRSa, VESRL, a0, 0, a2, a1, vece);
+        break;
+    case INDEX_op_sars_vec:
+        tcg_out_insn(s, VRSa, VESRA, a0, 0, a2, a1, vece);
+        break;
+    case INDEX_op_rotls_vec:
+        tcg_out_insn(s, VRSa, VERLL, a0, 0, a2, a1, vece);
+        break;
+    case INDEX_op_shlv_vec:
+        tcg_out_insn(s, VRRc, VESLV, a0, a1, a2, vece);
+        break;
+    case INDEX_op_shrv_vec:
+        tcg_out_insn(s, VRRc, VESRLV, a0, a1, a2, vece);
+        break;
+    case INDEX_op_sarv_vec:
+        tcg_out_insn(s, VRRc, VESRAV, a0, a1, a2, vece);
+        break;
+    case INDEX_op_rotlv_vec:
+        tcg_out_insn(s, VRRc, VERLLV, a0, a1, a2, vece);
+        break;
+
     case INDEX_op_cmp_vec:
         switch ((TCGCond)args[3]) {
         case TCG_COND_EQ:
@@ -XXX,XX +XXX,XX @@ int tcg_can_emit_vec_op(TCGOpcode opc, TCGType type, unsigned vece)
     case INDEX_op_not_vec:
     case INDEX_op_or_vec:
     case INDEX_op_orc_vec:
+    case INDEX_op_rotli_vec:
+    case INDEX_op_rotls_vec:
+    case INDEX_op_rotlv_vec:
+    case INDEX_op_sari_vec:
+    case INDEX_op_sars_vec:
+    case INDEX_op_sarv_vec:
+    case INDEX_op_shli_vec:
+    case INDEX_op_shls_vec:
+    case INDEX_op_shlv_vec:
+    case INDEX_op_shri_vec:
+    case INDEX_op_shrs_vec:
+    case INDEX_op_shrv_vec:
     case INDEX_op_sub_vec:
     case INDEX_op_xor_vec:
         return 1;
     case INDEX_op_cmp_vec:
+    case INDEX_op_rotrv_vec:
         return -1;
     case INDEX_op_mul_vec:
         return vece < MO_64;
@@ -XXX,XX +XXX,XX @@ void tcg_expand_vec_op(TCGOpcode opc, TCGType type, unsigned vece,
                        TCGArg a0, ...)
 {
     va_list va;
-    TCGv_vec v0, v1, v2;
+    TCGv_vec v0, v1, v2, t0;

     va_start(va, a0);
     v0 = temp_tcgv_vec(arg_temp(a0));
@@ -XXX,XX +XXX,XX @@ void tcg_expand_vec_op(TCGOpcode opc, TCGType type, unsigned vece,
         expand_vec_cmp(type, vece, v0, v1, v2, va_arg(va, TCGArg));
         break;

+    case INDEX_op_rotrv_vec:
+        t0 = tcg_temp_new_vec(type);
+        tcg_gen_neg_vec(vece, t0, v2);
+        tcg_gen_rotlv_vec(vece, v0, v1, t0);
+        tcg_temp_free_vec(t0);
+        break;
+
     default:
         g_assert_not_reached();
     }
@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
     case INDEX_op_abs_vec:
     case INDEX_op_neg_vec:
     case INDEX_op_not_vec:
+    case INDEX_op_rotli_vec:
+    case INDEX_op_sari_vec:
+    case INDEX_op_shli_vec:
+    case INDEX_op_shri_vec:
         return C_O1_I1(v, v);
     case INDEX_op_add_vec:
     case INDEX_op_sub_vec:
@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
     case INDEX_op_xor_vec:
     case INDEX_op_cmp_vec:
     case INDEX_op_mul_vec:
+    case INDEX_op_rotlv_vec:
+    case INDEX_op_rotrv_vec:
+    case INDEX_op_shlv_vec:
+    case INDEX_op_shrv_vec:
+    case INDEX_op_sarv_vec:
         return C_O1_I2(v, v, v);
+    case INDEX_op_rotls_vec:
+    case INDEX_op_shls_vec:
+    case INDEX_op_shrs_vec:
+    case INDEX_op_sars_vec:
+        return C_O1_I2(v, v, r);

     default:
         g_assert_not_reached();
--
2.25.1

diff view generated by jsdifflib
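[The rotrv_vec expansion in the shift patch above relies on rotate
counts being taken modulo the element width, so rotate-right by n equals
rotate-left by -n. A standalone 32-bit C sketch of that identity,
illustration only:]

    #include <assert.h>
    #include <stdint.h>

    static uint32_t rotl32(uint32_t x, unsigned n)
    {
        n &= 31;                    /* count is modulo the element width */
        return n ? (x << n) | (x >> (32 - n)) : x;
    }

    static uint32_t rotr32(uint32_t x, unsigned n)
    {
        n &= 31;
        return n ? (x >> n) | (x << (32 - n)) : x;
    }

    int main(void)
    {
        for (unsigned n = 0; n < 64; n++) {
            /* rotr(x, n) == rotl(x, -n), even for out-of-range counts */
            assert(rotr32(0xdeadbeef, n) == rotl32(0xdeadbeef, -n));
        }
        return 0;
    }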
Deleted patch
Reviewed-by: David Hildenbrand <david@redhat.com>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
tcg/s390x/tcg-target.h | 2 +-
tcg/s390x/tcg-target.c.inc | 25 +++++++++++++++++++++++++
2 files changed, 26 insertions(+), 1 deletion(-)

diff --git a/tcg/s390x/tcg-target.h b/tcg/s390x/tcg-target.h
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.h
+++ b/tcg/s390x/tcg-target.h
@@ -XXX,XX +XXX,XX @@ extern uint64_t s390_facilities[3];
 #define TCG_TARGET_HAS_shv_vec 1
 #define TCG_TARGET_HAS_mul_vec 1
 #define TCG_TARGET_HAS_sat_vec 0
-#define TCG_TARGET_HAS_minmax_vec 0
+#define TCG_TARGET_HAS_minmax_vec 1
 #define TCG_TARGET_HAS_bitsel_vec 0
 #define TCG_TARGET_HAS_cmpsel_vec 0

diff --git a/tcg/s390x/tcg-target.c.inc b/tcg/s390x/tcg-target.c.inc
index XXXXXXX..XXXXXXX 100644
--- a/tcg/s390x/tcg-target.c.inc
+++ b/tcg/s390x/tcg-target.c.inc
@@ -XXX,XX +XXX,XX @@ typedef enum S390Opcode {
     VRRc_VESRAV = 0xe77a,
     VRRc_VESRLV = 0xe778,
     VRRc_VML = 0xe7a2,
+    VRRc_VMN = 0xe7fe,
+    VRRc_VMNL = 0xe7fc,
+    VRRc_VMX = 0xe7ff,
+    VRRc_VMXL = 0xe7fd,
     VRRc_VN = 0xe768,
     VRRc_VNC = 0xe769,
     VRRc_VNO = 0xe76b,
@@ -XXX,XX +XXX,XX @@ static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc,
         tcg_out_insn(s, VRRc, VERLLV, a0, a1, a2, vece);
         break;

+    case INDEX_op_smin_vec:
+        tcg_out_insn(s, VRRc, VMN, a0, a1, a2, vece);
+        break;
+    case INDEX_op_smax_vec:
+        tcg_out_insn(s, VRRc, VMX, a0, a1, a2, vece);
+        break;
+    case INDEX_op_umin_vec:
+        tcg_out_insn(s, VRRc, VMNL, a0, a1, a2, vece);
+        break;
+    case INDEX_op_umax_vec:
+        tcg_out_insn(s, VRRc, VMXL, a0, a1, a2, vece);
+        break;
+
     case INDEX_op_cmp_vec:
         switch ((TCGCond)args[3]) {
         case TCG_COND_EQ:
@@ -XXX,XX +XXX,XX @@ int tcg_can_emit_vec_op(TCGOpcode opc, TCGType type, unsigned vece)
     case INDEX_op_shri_vec:
     case INDEX_op_shrs_vec:
     case INDEX_op_shrv_vec:
+    case INDEX_op_smax_vec:
+    case INDEX_op_smin_vec:
     case INDEX_op_sub_vec:
+    case INDEX_op_umax_vec:
+    case INDEX_op_umin_vec:
     case INDEX_op_xor_vec:
         return 1;
     case INDEX_op_cmp_vec:
@@ -XXX,XX +XXX,XX @@ static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
     case INDEX_op_shlv_vec:
     case INDEX_op_shrv_vec:
     case INDEX_op_sarv_vec:
+    case INDEX_op_smax_vec:
+    case INDEX_op_smin_vec:
+    case INDEX_op_umax_vec:
+    case INDEX_op_umin_vec:
         return C_O1_I2(v, v, v);
     case INDEX_op_rotls_vec:
     case INDEX_op_shls_vec:
--
2.25.1
diff view generated by jsdifflib