1
The following changes since commit e18e5501d8ac692d32657a3e1ef545b14e72b730:
1
V2 replaces the tcg const temp overflow patch.
2
2
3
Merge remote-tracking branch 'remotes/dgilbert-gitlab/tags/pull-virtiofs-20200210' into staging (2020-02-10 18:09:14 +0000)
3
4
r~
5
6
7
The following changes since commit 0e32462630687a18039464511bd0447ada5709c3:
8
9
Merge remote-tracking branch 'remotes/vivier2/tags/linux-user-for-6.0-pull-request' into staging (2021-01-22 10:35:55 +0000)
4
10
5
are available in the Git repository at:
11
are available in the Git repository at:
6
12
7
https://github.com/rth7680/qemu.git tags/pull-tcg-20200212
13
https://gitlab.com/rth7680/qemu.git tags/pull-tcg-20210124
8
14
9
for you to fetch changes up to 2445971604c1cfd3ec484457159f4ac300fb04d2:
15
for you to fetch changes up to ae30e86661b0f48562cd95918d37cbeec5d02262:
10
16
11
tcg: Add tcg_gen_gvec_5_ptr (2020-02-12 14:58:36 -0800)
17
tcg: Restart code generation when we run out of temps (2021-01-24 08:03:27 -1000)
12
18
13
----------------------------------------------------------------
19
----------------------------------------------------------------
14
Fix breakpoint invalidation.
20
Fix tcg constant temp overflow.
15
Add support for tcg helpers with 7 arguments.
21
Fix running during atomic single-step.
16
Add support for gvec helpers with 5 arguments.
22
Partial support for apple silicon.
23
Cleanups for accel/tcg.
17
24
18
----------------------------------------------------------------
25
----------------------------------------------------------------
19
Max Filippov (1):
26
Douglas Crosher (1):
20
exec: flush CPU TB cache in breakpoint_invalidate
27
tcg: update the cpu running flag in cpu_exec_step_atomic
21
28
22
Richard Henderson (1):
29
Philippe Mathieu-Daudé (4):
23
tcg: Add tcg_gen_gvec_5_ptr
30
accel/tcg: Make cpu_gen_init() static
31
accel/tcg: Restrict tb_gen_code() from other accelerators
32
accel/tcg: Declare missing cpu_loop_exit*() stubs
33
accel/tcg: Restrict cpu_io_recompile() from other accelerators
24
34
25
Taylor Simpson (1):
35
Richard Henderson (4):
26
tcg: Add support for a helper with 7 arguments
36
qemu/compiler: Split out qemu_build_not_reached_always
37
tcg: Optimize inline dup_const for MO_64
38
accel/tcg: Move tb_flush_jmp_cache() to cputlb.c
39
tcg: Restart code generation when we run out of temps
27
40
28
include/exec/helper-gen.h | 13 +++++++++++++
41
Roman Bolshakov (1):
29
include/exec/helper-head.h | 2 ++
42
tcg: Toggle page execution for Apple Silicon
30
include/exec/helper-proto.h | 6 ++++++
31
include/exec/helper-tcg.h | 7 +++++++
32
include/tcg/tcg-op-gvec.h | 7 +++++++
33
exec.c | 15 +++++++--------
34
tcg/tcg-op-gvec.c | 32 ++++++++++++++++++++++++++++++++
35
7 files changed, 74 insertions(+), 8 deletions(-)
36
43
44
accel/tcg/internal.h | 20 ++++++++++++++++++++
45
include/exec/exec-all.h | 11 -----------
46
include/qemu/compiler.h | 5 +++--
47
include/qemu/osdep.h | 28 ++++++++++++++++++++++++++++
48
include/tcg/tcg.h | 6 +++++-
49
accel/stubs/tcg-stub.c | 10 ++++++++++
50
accel/tcg/cpu-exec.c | 7 +++++++
51
accel/tcg/cputlb.c | 19 +++++++++++++++++++
52
accel/tcg/translate-all.c | 38 +++++++++++++++++++-------------------
53
tcg/tcg.c | 12 +++++++++---
54
10 files changed, 120 insertions(+), 36 deletions(-)
55
create mode 100644 accel/tcg/internal.h
56
diff view generated by jsdifflib
Deleted patch
1
From: Max Filippov <jcmvbkbc@gmail.com>
2
1
3
When a breakpoint is inserted at location for which there's currently no
4
virtual to physical translation no action is taken on CPU TB cache. If a
5
TB for that virtual address already exists but is not visible ATM the
6
breakpoint won't be hit next time an instruction at that address will be
7
executed.
8
9
Flush entire CPU TB cache in breakpoint_invalidate to force
10
re-translation of all TBs for the breakpoint address.
11
12
This change fixes the following scenario:
13
- linux user application is running
14
- a breakpoint is inserted from QEMU gdbstub for a user address that is
15
not currently present in the target CPU TLB
16
- an instruction at that address is executed, but the external debugger
17
doesn't get control.
18
19
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
20
Signed-off-by: Max Filippov <jcmvbkbc@gmail.com>
21
Message-Id: <20191127220602.10827-2-jcmvbkbc@gmail.com>
22
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
23
---
24
exec.c | 15 +++++++--------
25
1 file changed, 7 insertions(+), 8 deletions(-)
26
27
diff --git a/exec.c b/exec.c
28
index XXXXXXX..XXXXXXX 100644
29
--- a/exec.c
30
+++ b/exec.c
31
@@ -XXX,XX +XXX,XX @@ void tb_invalidate_phys_addr(AddressSpace *as, hwaddr addr, MemTxAttrs attrs)
32
33
static void breakpoint_invalidate(CPUState *cpu, target_ulong pc)
34
{
35
- MemTxAttrs attrs;
36
- hwaddr phys = cpu_get_phys_page_attrs_debug(cpu, pc, &attrs);
37
- int asidx = cpu_asidx_from_attrs(cpu, attrs);
38
- if (phys != -1) {
39
- /* Locks grabbed by tb_invalidate_phys_addr */
40
- tb_invalidate_phys_addr(cpu->cpu_ases[asidx].as,
41
- phys | (pc & ~TARGET_PAGE_MASK), attrs);
42
- }
43
+ /*
44
+ * There may not be a virtual to physical translation for the pc
45
+ * right now, but there may exist cached TB for this pc.
46
+ * Flush the whole TB cache to force re-translation of such TBs.
47
+ * This is heavyweight, but we're debugging anyway.
48
+ */
49
+ tb_flush(cpu);
50
}
51
#endif
52
53
--
54
2.20.1
55
56
diff view generated by jsdifflib
Deleted patch
1
From: Taylor Simpson <tsimpson@quicinc.com>
2
1
3
Currently, helpers can only take up to 6 arguments. This patch adds the
4
capability for up to 7 arguments. I have tested it with the Hexagon port
5
that I am preparing for submission.
6
7
Signed-off-by: Taylor Simpson <tsimpson@quicinc.com>
8
Message-Id: <1580942510-2820-1-git-send-email-tsimpson@quicinc.com>
9
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
10
---
11
include/exec/helper-gen.h | 13 +++++++++++++
12
include/exec/helper-head.h | 2 ++
13
include/exec/helper-proto.h | 6 ++++++
14
include/exec/helper-tcg.h | 7 +++++++
15
4 files changed, 28 insertions(+)
16
17
diff --git a/include/exec/helper-gen.h b/include/exec/helper-gen.h
18
index XXXXXXX..XXXXXXX 100644
19
--- a/include/exec/helper-gen.h
20
+++ b/include/exec/helper-gen.h
21
@@ -XXX,XX +XXX,XX @@ static inline void glue(gen_helper_, name)(dh_retvar_decl(ret) \
22
tcg_gen_callN(HELPER(name), dh_retvar(ret), 6, args); \
23
}
24
25
+#define DEF_HELPER_FLAGS_7(name, flags, ret, t1, t2, t3, t4, t5, t6, t7)\
26
+static inline void glue(gen_helper_, name)(dh_retvar_decl(ret) \
27
+ dh_arg_decl(t1, 1), dh_arg_decl(t2, 2), dh_arg_decl(t3, 3), \
28
+ dh_arg_decl(t4, 4), dh_arg_decl(t5, 5), dh_arg_decl(t6, 6), \
29
+ dh_arg_decl(t7, 7)) \
30
+{ \
31
+ TCGTemp *args[7] = { dh_arg(t1, 1), dh_arg(t2, 2), dh_arg(t3, 3), \
32
+ dh_arg(t4, 4), dh_arg(t5, 5), dh_arg(t6, 6), \
33
+ dh_arg(t7, 7) }; \
34
+ tcg_gen_callN(HELPER(name), dh_retvar(ret), 7, args); \
35
+}
36
+
37
#include "helper.h"
38
#include "trace/generated-helpers.h"
39
#include "trace/generated-helpers-wrappers.h"
40
@@ -XXX,XX +XXX,XX @@ static inline void glue(gen_helper_, name)(dh_retvar_decl(ret) \
41
#undef DEF_HELPER_FLAGS_4
42
#undef DEF_HELPER_FLAGS_5
43
#undef DEF_HELPER_FLAGS_6
44
+#undef DEF_HELPER_FLAGS_7
45
#undef GEN_HELPER
46
47
#endif /* HELPER_GEN_H */
48
diff --git a/include/exec/helper-head.h b/include/exec/helper-head.h
49
index XXXXXXX..XXXXXXX 100644
50
--- a/include/exec/helper-head.h
51
+++ b/include/exec/helper-head.h
52
@@ -XXX,XX +XXX,XX @@
53
DEF_HELPER_FLAGS_5(name, 0, ret, t1, t2, t3, t4, t5)
54
#define DEF_HELPER_6(name, ret, t1, t2, t3, t4, t5, t6) \
55
DEF_HELPER_FLAGS_6(name, 0, ret, t1, t2, t3, t4, t5, t6)
56
+#define DEF_HELPER_7(name, ret, t1, t2, t3, t4, t5, t6, t7) \
57
+ DEF_HELPER_FLAGS_7(name, 0, ret, t1, t2, t3, t4, t5, t6, t7)
58
59
/* MAX_OPC_PARAM_IARGS must be set to n if last entry is DEF_HELPER_FLAGS_n. */
60
61
diff --git a/include/exec/helper-proto.h b/include/exec/helper-proto.h
62
index XXXXXXX..XXXXXXX 100644
63
--- a/include/exec/helper-proto.h
64
+++ b/include/exec/helper-proto.h
65
@@ -XXX,XX +XXX,XX @@ dh_ctype(ret) HELPER(name) (dh_ctype(t1), dh_ctype(t2), dh_ctype(t3), \
66
dh_ctype(ret) HELPER(name) (dh_ctype(t1), dh_ctype(t2), dh_ctype(t3), \
67
dh_ctype(t4), dh_ctype(t5), dh_ctype(t6));
68
69
+#define DEF_HELPER_FLAGS_7(name, flags, ret, t1, t2, t3, t4, t5, t6, t7) \
70
+dh_ctype(ret) HELPER(name) (dh_ctype(t1), dh_ctype(t2), dh_ctype(t3), \
71
+ dh_ctype(t4), dh_ctype(t5), dh_ctype(t6), \
72
+ dh_ctype(t7));
73
+
74
#include "helper.h"
75
#include "trace/generated-helpers.h"
76
#include "tcg-runtime.h"
77
@@ -XXX,XX +XXX,XX @@ dh_ctype(ret) HELPER(name) (dh_ctype(t1), dh_ctype(t2), dh_ctype(t3), \
78
#undef DEF_HELPER_FLAGS_4
79
#undef DEF_HELPER_FLAGS_5
80
#undef DEF_HELPER_FLAGS_6
81
+#undef DEF_HELPER_FLAGS_7
82
83
#endif /* HELPER_PROTO_H */
84
diff --git a/include/exec/helper-tcg.h b/include/exec/helper-tcg.h
85
index XXXXXXX..XXXXXXX 100644
86
--- a/include/exec/helper-tcg.h
87
+++ b/include/exec/helper-tcg.h
88
@@ -XXX,XX +XXX,XX @@
89
| dh_sizemask(t2, 2) | dh_sizemask(t3, 3) | dh_sizemask(t4, 4) \
90
| dh_sizemask(t5, 5) | dh_sizemask(t6, 6) },
91
92
+#define DEF_HELPER_FLAGS_7(NAME, FLAGS, ret, t1, t2, t3, t4, t5, t6, t7) \
93
+ { .func = HELPER(NAME), .name = str(NAME), .flags = FLAGS, \
94
+ .sizemask = dh_sizemask(ret, 0) | dh_sizemask(t1, 1) \
95
+ | dh_sizemask(t2, 2) | dh_sizemask(t3, 3) | dh_sizemask(t4, 4) \
96
+ | dh_sizemask(t5, 5) | dh_sizemask(t6, 6) | dh_sizemask(t7, 7) },
97
+
98
#include "helper.h"
99
#include "trace/generated-helpers.h"
100
#include "tcg-runtime.h"
101
@@ -XXX,XX +XXX,XX @@
102
#undef DEF_HELPER_FLAGS_4
103
#undef DEF_HELPER_FLAGS_5
104
#undef DEF_HELPER_FLAGS_6
105
+#undef DEF_HELPER_FLAGS_7
106
107
#endif /* HELPER_TCG_H */
108
--
109
2.20.1
110
111
diff view generated by jsdifflib
1
Extend the vector generator infrastructure to handle
1
Some large translation blocks can generate so many unique
2
5 vector arguments.
2
constants that we run out of temps to hold them. In this
3
case, longjmp back to the start of code generation and
4
restart with a smaller translation block.
3
5
4
Reviewed-by: Philippe Mathieu-Daudé <philmd@redhat.com>
6
Buglink: https://bugs.launchpad.net/bugs/1912065
5
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
7
Tested-by: BALATON Zoltan <balaton@eik.bme.hu>
6
Reviewed-by: Taylor Simpson <tsimpson@quicinc.com>
8
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
7
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
9
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
8
---
10
---
9
include/tcg/tcg-op-gvec.h | 7 +++++++
11
include/tcg/tcg.h | 3 +++
10
tcg/tcg-op-gvec.c | 32 ++++++++++++++++++++++++++++++++
12
accel/tcg/translate-all.c | 15 ++++++++++++++-
11
2 files changed, 39 insertions(+)
13
tcg/tcg.c | 11 ++++++++---
14
3 files changed, 25 insertions(+), 4 deletions(-)
12
15
13
diff --git a/include/tcg/tcg-op-gvec.h b/include/tcg/tcg-op-gvec.h
16
diff --git a/include/tcg/tcg.h b/include/tcg/tcg.h
14
index XXXXXXX..XXXXXXX 100644
17
index XXXXXXX..XXXXXXX 100644
15
--- a/include/tcg/tcg-op-gvec.h
18
--- a/include/tcg/tcg.h
16
+++ b/include/tcg/tcg-op-gvec.h
19
+++ b/include/tcg/tcg.h
17
@@ -XXX,XX +XXX,XX @@ void tcg_gen_gvec_4_ptr(uint32_t dofs, uint32_t aofs, uint32_t bofs,
20
@@ -XXX,XX +XXX,XX @@ struct TCGContext {
18
uint32_t maxsz, int32_t data,
21
19
gen_helper_gvec_4_ptr *fn);
22
uint16_t gen_insn_end_off[TCG_MAX_INSNS];
20
23
target_ulong gen_insn_data[TCG_MAX_INSNS][TARGET_INSN_START_WORDS];
21
+typedef void gen_helper_gvec_5_ptr(TCGv_ptr, TCGv_ptr, TCGv_ptr, TCGv_ptr,
22
+ TCGv_ptr, TCGv_ptr, TCGv_i32);
23
+void tcg_gen_gvec_5_ptr(uint32_t dofs, uint32_t aofs, uint32_t bofs,
24
+ uint32_t cofs, uint32_t eofs, TCGv_ptr ptr,
25
+ uint32_t oprsz, uint32_t maxsz, int32_t data,
26
+ gen_helper_gvec_5_ptr *fn);
27
+
24
+
28
/* Expand a gvec operation. Either inline or out-of-line depending on
25
+ /* Exit to translator on overflow. */
29
the actual vector size and the operations supported by the host. */
26
+ sigjmp_buf jmp_trans;
30
typedef struct {
27
};
31
diff --git a/tcg/tcg-op-gvec.c b/tcg/tcg-op-gvec.c
28
29
static inline bool temp_readonly(TCGTemp *ts)
30
diff --git a/accel/tcg/translate-all.c b/accel/tcg/translate-all.c
32
index XXXXXXX..XXXXXXX 100644
31
index XXXXXXX..XXXXXXX 100644
33
--- a/tcg/tcg-op-gvec.c
32
--- a/accel/tcg/translate-all.c
34
+++ b/tcg/tcg-op-gvec.c
33
+++ b/accel/tcg/translate-all.c
35
@@ -XXX,XX +XXX,XX @@ void tcg_gen_gvec_4_ptr(uint32_t dofs, uint32_t aofs, uint32_t bofs,
34
@@ -XXX,XX +XXX,XX @@ TranslationBlock *tb_gen_code(CPUState *cpu,
36
tcg_temp_free_i32(desc);
35
ti = profile_getclock();
36
#endif
37
38
+ gen_code_size = sigsetjmp(tcg_ctx->jmp_trans, 0);
39
+ if (unlikely(gen_code_size != 0)) {
40
+ goto error_return;
41
+ }
42
+
43
tcg_func_start(tcg_ctx);
44
45
tcg_ctx->cpu = env_cpu(env);
46
gen_intermediate_code(cpu, tb, max_insns);
47
tcg_ctx->cpu = NULL;
48
+ max_insns = tb->icount;
49
50
trace_translate_block(tb, tb->pc, tb->tc.ptr);
51
52
@@ -XXX,XX +XXX,XX @@ TranslationBlock *tb_gen_code(CPUState *cpu,
53
54
gen_code_size = tcg_gen_code(tcg_ctx, tb);
55
if (unlikely(gen_code_size < 0)) {
56
+ error_return:
57
switch (gen_code_size) {
58
case -1:
59
/*
60
@@ -XXX,XX +XXX,XX @@ TranslationBlock *tb_gen_code(CPUState *cpu,
61
* flush the TBs, allocate a new TB, re-initialize it per
62
* above, and re-do the actual code generation.
63
*/
64
+ qemu_log_mask(CPU_LOG_TB_OP | CPU_LOG_TB_OP_OPT,
65
+ "Restarting code generation for "
66
+ "code_gen_buffer overflow\n");
67
goto buffer_overflow;
68
69
case -2:
70
@@ -XXX,XX +XXX,XX @@ TranslationBlock *tb_gen_code(CPUState *cpu,
71
* Try again with half as many insns as we attempted this time.
72
* If a single insn overflows, there's a bug somewhere...
73
*/
74
- max_insns = tb->icount;
75
assert(max_insns > 1);
76
max_insns /= 2;
77
+ qemu_log_mask(CPU_LOG_TB_OP | CPU_LOG_TB_OP_OPT,
78
+ "Restarting code generation with "
79
+ "smaller translation block (max %d insns)\n",
80
+ max_insns);
81
goto tb_overflow;
82
83
default:
84
diff --git a/tcg/tcg.c b/tcg/tcg.c
85
index XXXXXXX..XXXXXXX 100644
86
--- a/tcg/tcg.c
87
+++ b/tcg/tcg.c
88
@@ -XXX,XX +XXX,XX @@ void tcg_func_start(TCGContext *s)
89
QSIMPLEQ_INIT(&s->labels);
37
}
90
}
38
91
39
+/* Generate a call to a gvec-style helper with five vector operands
92
-static inline TCGTemp *tcg_temp_alloc(TCGContext *s)
40
+ and an extra pointer operand. */
93
+static TCGTemp *tcg_temp_alloc(TCGContext *s)
41
+void tcg_gen_gvec_5_ptr(uint32_t dofs, uint32_t aofs, uint32_t bofs,
94
{
42
+ uint32_t cofs, uint32_t eofs, TCGv_ptr ptr,
95
int n = s->nb_temps++;
43
+ uint32_t oprsz, uint32_t maxsz, int32_t data,
96
- tcg_debug_assert(n < TCG_MAX_TEMPS);
44
+ gen_helper_gvec_5_ptr *fn)
45
+{
46
+ TCGv_ptr a0, a1, a2, a3, a4;
47
+ TCGv_i32 desc = tcg_const_i32(simd_desc(oprsz, maxsz, data));
48
+
97
+
49
+ a0 = tcg_temp_new_ptr();
98
+ if (n >= TCG_MAX_TEMPS) {
50
+ a1 = tcg_temp_new_ptr();
99
+ /* Signal overflow, starting over with fewer guest insns. */
51
+ a2 = tcg_temp_new_ptr();
100
+ siglongjmp(s->jmp_trans, -2);
52
+ a3 = tcg_temp_new_ptr();
101
+ }
53
+ a4 = tcg_temp_new_ptr();
102
return memset(&s->temps[n], 0, sizeof(TCGTemp));
54
+
103
}
55
+ tcg_gen_addi_ptr(a0, cpu_env, dofs);
104
56
+ tcg_gen_addi_ptr(a1, cpu_env, aofs);
105
-static inline TCGTemp *tcg_global_alloc(TCGContext *s)
57
+ tcg_gen_addi_ptr(a2, cpu_env, bofs);
106
+static TCGTemp *tcg_global_alloc(TCGContext *s)
58
+ tcg_gen_addi_ptr(a3, cpu_env, cofs);
107
{
59
+ tcg_gen_addi_ptr(a4, cpu_env, eofs);
108
TCGTemp *ts;
60
+
109
61
+ fn(a0, a1, a2, a3, a4, ptr, desc);
110
tcg_debug_assert(s->nb_globals == s->nb_temps);
62
+
111
+ tcg_debug_assert(s->nb_globals < TCG_MAX_TEMPS);
63
+ tcg_temp_free_ptr(a0);
112
s->nb_globals++;
64
+ tcg_temp_free_ptr(a1);
113
ts = tcg_temp_alloc(s);
65
+ tcg_temp_free_ptr(a2);
114
ts->kind = TEMP_GLOBAL;
66
+ tcg_temp_free_ptr(a3);
67
+ tcg_temp_free_ptr(a4);
68
+ tcg_temp_free_i32(desc);
69
+}
70
+
71
/* Return true if we want to implement something of OPRSZ bytes
72
in units of LNSZ. This limits the expansion of inline code. */
73
static inline bool check_size_impl(uint32_t oprsz, uint32_t lnsz)
74
--
115
--
75
2.20.1
116
2.25.1
76
117
77
118
diff view generated by jsdifflib