1
The following changes since commit 7774e403f2ac58b3e87bfe8d2f77676501ba893e:
1
The following changes since commit c5ea91da443b458352c1b629b490ee6631775cb4:
2
2
3
Merge remote-tracking branch 'remotes/kraxel/tags/fixes-20200825-pull-request' into staging (2020-08-25 10:54:51 +0100)
3
Merge tag 'pull-trivial-patches' of https://gitlab.com/mjt0k/qemu into staging (2023-09-08 10:06:25 -0400)
4
4
5
are available in the Git repository at:
5
are available in the Git repository at:
6
6
7
git@github.com:alistair23/qemu.git tags/pull-riscv-to-apply-20200825
7
https://github.com/alistair23/qemu.git tags/pull-riscv-to-apply-20230911
8
8
9
for you to fetch changes up to e39a8320b088dd5efc9ebaafe387e52b3d962665:
9
for you to fetch changes up to e7a03409f29e2da59297d55afbaec98c96e43e3a:
10
10
11
target/riscv: Support the Virtual Instruction fault (2020-08-25 09:11:36 -0700)
11
target/riscv: don't read CSR in riscv_csrrw_do64 (2023-09-11 11:45:55 +1000)
12
12
13
----------------------------------------------------------------
13
----------------------------------------------------------------
14
This pull request first adds support for multi-socket NUMA RISC-V
14
First RISC-V PR for 8.2
15
machines. The Spike and Virt machines both support NUMA sockets.
16
15
17
This PR also updates the current experimental Hypervisor support to the
16
* Remove 'host' CPU from TCG
18
v0.6.1 spec.
17
* riscv_htif Fixup printing on big endian hosts
18
* Add zmmul isa string
19
* Add smepmp isa string
20
* Fix page_check_range use in fault-only-first
21
* Use existing lookup tables for MixColumns
22
* Add RISC-V vector cryptographic instruction set support
23
* Implement WARL behaviour for mcountinhibit/mcounteren
24
* Add Zihintntl extension ISA string to DTS
25
* Fix zfa fleq.d and fltq.d
26
* Fix upper/lower mtime write calculation
27
* Make rtc variable names consistent
28
* Use abi type for linux-user target_ucontext
29
* Add RISC-V KVM AIA Support
30
* Fix riscv,pmu DT node path in the virt machine
31
* Update CSR bits name for svadu extension
32
* Mark zicond non-experimental
33
* Fix satp_mode_finalize() when satp_mode.supported = 0
34
* Fix non-KVM --enable-debug build
35
* Add new extensions to hwprobe
36
* Use accelerated helper for AES64KS1I
37
* Allocate itrigger timers only once
38
* Respect mseccfg.RLB for pmpaddrX changes
39
* Align the AIA model to v1.0 ratified spec
40
* Don't read the CSR in riscv_csrrw_do64
19
41
20
----------------------------------------------------------------
42
----------------------------------------------------------------
21
Alistair Francis (13):
43
Akihiko Odaki (1):
22
target/riscv: Allow setting a two-stage lookup in the virt status
44
target/riscv: Allocate itrigger timers only once
23
target/riscv: Allow generating hlv/hlvx/hsv instructions
24
target/riscv: Do two-stage lookups on hlv/hlvx/hsv instructions
25
target/riscv: Don't allow guest to write to htinst
26
target/riscv: Convert MSTATUS MTL to GVA
27
target/riscv: Fix the interrupt cause code
28
target/riscv: Update the Hypervisor trap return/entry
29
target/riscv: Update the CSRs to the v0.6 Hyp extension
30
target/riscv: Only support a single VSXL length
31
target/riscv: Only support little endian guests
32
target/riscv: Support the v0.6 Hypervisor extension CRSs
33
target/riscv: Return the exception from invalid CSR accesses
34
target/riscv: Support the Virtual Instruction fault
35
45
36
Anup Patel (5):
46
Ard Biesheuvel (2):
37
hw/riscv: Allow creating multiple instances of CLINT
47
target/riscv: Use existing lookup tables for MixColumns
38
hw/riscv: Allow creating multiple instances of PLIC
48
target/riscv: Use accelerated helper for AES64KS1I
39
hw/riscv: Add helpers for RISC-V multi-socket NUMA machines
40
hw/riscv: spike: Allow creating multiple NUMA sockets
41
hw/riscv: virt: Allow creating multiple NUMA sockets
42
49
43
include/hw/riscv/numa.h | 113 +++++++
50
Conor Dooley (1):
44
include/hw/riscv/sifive_clint.h | 7 +-
51
hw/riscv: virt: Fix riscv,pmu DT node path
45
include/hw/riscv/sifive_plic.h | 12 +-
46
include/hw/riscv/spike.h | 11 +-
47
include/hw/riscv/virt.h | 9 +-
48
target/riscv/cpu.h | 2 +
49
target/riscv/cpu_bits.h | 25 +-
50
target/riscv/helper.h | 4 +
51
target/riscv/insn32-64.decode | 5 +
52
target/riscv/insn32.decode | 11 +
53
hw/riscv/numa.c | 242 +++++++++++++++
54
hw/riscv/sifive_clint.c | 20 +-
55
hw/riscv/sifive_e.c | 4 +-
56
hw/riscv/sifive_plic.c | 24 +-
57
hw/riscv/sifive_u.c | 4 +-
58
hw/riscv/spike.c | 232 +++++++++-----
59
hw/riscv/virt.c | 526 ++++++++++++++++++--------------
60
target/riscv/cpu_helper.c | 123 ++++----
61
target/riscv/csr.c | 171 +++++++++--
62
target/riscv/op_helper.c | 176 ++++++++++-
63
target/riscv/translate.c | 10 -
64
hw/riscv/meson.build | 1 +
65
target/riscv/insn_trans/trans_rvh.c.inc | 342 ++++++++++++++++++++-
66
23 files changed, 1630 insertions(+), 444 deletions(-)
67
create mode 100644 include/hw/riscv/numa.h
68
create mode 100644 hw/riscv/numa.c
69
52
53
Daniel Henrique Barboza (6):
54
target/riscv/cpu.c: do not run 'host' CPU with TCG
55
target/riscv/cpu.c: add zmmul isa string
56
target/riscv/cpu.c: add smepmp isa string
57
target/riscv: fix satp_mode_finalize() when satp_mode.supported = 0
58
hw/riscv/virt.c: fix non-KVM --enable-debug build
59
hw/intc/riscv_aplic.c fix non-KVM --enable-debug build
60
61
Dickon Hood (2):
62
target/riscv: Refactor translation of vector-widening instruction
63
target/riscv: Add Zvbb ISA extension support
64
65
Jason Chien (3):
66
target/riscv: Add Zihintntl extension ISA string to DTS
67
hw/intc: Fix upper/lower mtime write calculation
68
hw/intc: Make rtc variable names consistent
69
70
Kiran Ostrolenk (4):
71
target/riscv: Refactor some of the generic vector functionality
72
target/riscv: Refactor vector-vector translation macro
73
target/riscv: Refactor some of the generic vector functionality
74
target/riscv: Add Zvknh ISA extension support
75
76
LIU Zhiwei (3):
77
target/riscv: Fix page_check_range use in fault-only-first
78
target/riscv: Fix zfa fleq.d and fltq.d
79
linux-user/riscv: Use abi type for target_ucontext
80
81
Lawrence Hunter (2):
82
target/riscv: Add Zvbc ISA extension support
83
target/riscv: Add Zvksh ISA extension support
84
85
Leon Schuermann (1):
86
target/riscv/pmp.c: respect mseccfg.RLB for pmpaddrX changes
87
88
Max Chou (3):
89
crypto: Create sm4_subword
90
crypto: Add SM4 constant parameter CK
91
target/riscv: Add Zvksed ISA extension support
92
93
Nazar Kazakov (4):
94
target/riscv: Remove redundant "cpu_vl == 0" checks
95
target/riscv: Move vector translation checks
96
target/riscv: Add Zvkned ISA extension support
97
target/riscv: Add Zvkg ISA extension support
98
99
Nikita Shubin (1):
100
target/riscv: don't read CSR in riscv_csrrw_do64
101
102
Rob Bradford (1):
103
target/riscv: Implement WARL behaviour for mcountinhibit/mcounteren
104
105
Robbin Ehn (1):
106
linux-user/riscv: Add new extensions to hwprobe
107
108
Thomas Huth (2):
109
hw/char/riscv_htif: Fix printing of console characters on big endian hosts
110
hw/char/riscv_htif: Fix the console syscall on big endian hosts
111
112
Tommy Wu (1):
113
target/riscv: Align the AIA model to v1.0 ratified spec
114
115
Vineet Gupta (1):
116
riscv: zicond: make non-experimental
117
118
Weiwei Li (1):
119
target/riscv: Update CSR bits name for svadu extension
120
121
Yong-Xuan Wang (5):
122
target/riscv: support the AIA device emulation with KVM enabled
123
target/riscv: check the in-kernel irqchip support
124
target/riscv: Create an KVM AIA irqchip
125
target/riscv: update APLIC and IMSIC to support KVM AIA
126
target/riscv: select KVM AIA in riscv virt machine
127
128
include/crypto/aes.h | 7 +
129
include/crypto/sm4.h | 9 +
130
target/riscv/cpu_bits.h | 8 +-
131
target/riscv/cpu_cfg.h | 9 +
132
target/riscv/debug.h | 3 +-
133
target/riscv/helper.h | 98 +++
134
target/riscv/kvm_riscv.h | 5 +
135
target/riscv/vector_internals.h | 228 +++++++
136
target/riscv/insn32.decode | 58 ++
137
crypto/aes.c | 4 +-
138
crypto/sm4.c | 10 +
139
hw/char/riscv_htif.c | 12 +-
140
hw/intc/riscv_aclint.c | 11 +-
141
hw/intc/riscv_aplic.c | 52 +-
142
hw/intc/riscv_imsic.c | 25 +-
143
hw/riscv/virt.c | 374 ++++++------
144
linux-user/riscv/signal.c | 4 +-
145
linux-user/syscall.c | 14 +-
146
target/arm/tcg/crypto_helper.c | 10 +-
147
target/riscv/cpu.c | 83 ++-
148
target/riscv/cpu_helper.c | 6 +-
149
target/riscv/crypto_helper.c | 51 +-
150
target/riscv/csr.c | 54 +-
151
target/riscv/debug.c | 15 +-
152
target/riscv/kvm.c | 201 ++++++-
153
target/riscv/pmp.c | 4 +
154
target/riscv/translate.c | 1 +
155
target/riscv/vcrypto_helper.c | 970 ++++++++++++++++++++++++++++++
156
target/riscv/vector_helper.c | 245 +-------
157
target/riscv/vector_internals.c | 81 +++
158
target/riscv/insn_trans/trans_rvv.c.inc | 171 +++---
159
target/riscv/insn_trans/trans_rvvk.c.inc | 606 +++++++++++++++++++
160
target/riscv/insn_trans/trans_rvzfa.c.inc | 4 +-
161
target/riscv/meson.build | 4 +-
162
34 files changed, 2785 insertions(+), 652 deletions(-)
163
create mode 100644 target/riscv/vector_internals.h
164
create mode 100644 target/riscv/vcrypto_helper.c
165
create mode 100644 target/riscv/vector_internals.c
166
create mode 100644 target/riscv/insn_trans/trans_rvvk.c.inc
diff view generated by jsdifflib
1
From: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
2
3
The 'host' CPU is available in a CONFIG_KVM build and it's currently
4
available for all accels, but is a KVM only CPU. This means that in a
5
RISC-V KVM capable host we can do things like this:
6
7
$ ./build/qemu-system-riscv64 -M virt,accel=tcg -cpu host --nographic
8
qemu-system-riscv64: H extension requires priv spec 1.12.0
9
10
This CPU does not have a priv spec because we don't filter its extensions
11
via priv spec. We shouldn't be reaching riscv_cpu_realize_tcg() at all
12
with the 'host' CPU.
13
14
We don't have a way to filter the 'host' CPU out of the available CPU
15
options (-cpu help) if the build includes both KVM and TCG. What we can
16
do is to error out during riscv_cpu_realize_tcg() if the user chooses
17
the 'host' CPU with accel=tcg:
18
19
$ ./build/qemu-system-riscv64 -M virt,accel=tcg -cpu host --nographic
20
qemu-system-riscv64: 'host' CPU is not compatible with TCG acceleration
21
22
Signed-off-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
23
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
24
Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org>
25
Message-Id: <20230721133411.474105-1-dbarboza@ventanamicro.com>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
26
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: 08cdefb171b1bdb0c9e3151c509aaadefc3dcd3e.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <08cdefb171b1bdb0c9e3151c509aaadefc3dcd3e.1597259519.git.alistair.francis@wdc.com>
4
---
27
---
5
target/riscv/cpu.h | 2 ++
28
target/riscv/cpu.c | 5 +++++
6
target/riscv/cpu_bits.h | 1 +
29
1 file changed, 5 insertions(+)
7
target/riscv/cpu_helper.c | 18 ++++++++++++++++++
8
3 files changed, 21 insertions(+)
9
30
10
diff --git a/target/riscv/cpu.h b/target/riscv/cpu.h
31
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
11
index XXXXXXX..XXXXXXX 100644
32
index XXXXXXX..XXXXXXX 100644
12
--- a/target/riscv/cpu.h
33
--- a/target/riscv/cpu.c
13
+++ b/target/riscv/cpu.h
34
+++ b/target/riscv/cpu.c
14
@@ -XXX,XX +XXX,XX @@ bool riscv_cpu_virt_enabled(CPURISCVState *env);
35
@@ -XXX,XX +XXX,XX @@ static void riscv_cpu_realize_tcg(DeviceState *dev, Error **errp)
15
void riscv_cpu_set_virt_enabled(CPURISCVState *env, bool enable);
36
CPURISCVState *env = &cpu->env;
16
bool riscv_cpu_force_hs_excep_enabled(CPURISCVState *env);
37
Error *local_err = NULL;
17
void riscv_cpu_set_force_hs_excep(CPURISCVState *env, bool enable);
38
18
+bool riscv_cpu_two_stage_lookup(CPURISCVState *env);
39
+ if (object_dynamic_cast(OBJECT(dev), TYPE_RISCV_CPU_HOST)) {
19
+void riscv_cpu_set_two_stage_lookup(CPURISCVState *env, bool enable);
40
+ error_setg(errp, "'host' CPU is not compatible with TCG acceleration");
20
int riscv_cpu_mmu_index(CPURISCVState *env, bool ifetch);
21
hwaddr riscv_cpu_get_phys_page_debug(CPUState *cpu, vaddr addr);
22
void riscv_cpu_do_unaligned_access(CPUState *cs, vaddr addr,
23
diff --git a/target/riscv/cpu_bits.h b/target/riscv/cpu_bits.h
24
index XXXXXXX..XXXXXXX 100644
25
--- a/target/riscv/cpu_bits.h
26
+++ b/target/riscv/cpu_bits.h
27
@@ -XXX,XX +XXX,XX @@
28
* page table fault.
29
*/
30
#define FORCE_HS_EXCEP 2
31
+#define HS_TWO_STAGE 4
32
33
/* RV32 satp CSR field masks */
34
#define SATP32_MODE 0x80000000
35
diff --git a/target/riscv/cpu_helper.c b/target/riscv/cpu_helper.c
36
index XXXXXXX..XXXXXXX 100644
37
--- a/target/riscv/cpu_helper.c
38
+++ b/target/riscv/cpu_helper.c
39
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_set_force_hs_excep(CPURISCVState *env, bool enable)
40
env->virt = set_field(env->virt, FORCE_HS_EXCEP, enable);
41
}
42
43
+bool riscv_cpu_two_stage_lookup(CPURISCVState *env)
44
+{
45
+ if (!riscv_has_ext(env, RVH)) {
46
+ return false;
47
+ }
48
+
49
+ return get_field(env->virt, HS_TWO_STAGE);
50
+}
51
+
52
+void riscv_cpu_set_two_stage_lookup(CPURISCVState *env, bool enable)
53
+{
54
+ if (!riscv_has_ext(env, RVH)) {
55
+ return;
41
+ return;
56
+ }
42
+ }
57
+
43
+
58
+ env->virt = set_field(env->virt, HS_TWO_STAGE, enable);
44
riscv_cpu_validate_misa_mxl(cpu, &local_err);
59
+}
45
if (local_err != NULL) {
60
+
46
error_propagate(errp, local_err);
61
int riscv_cpu_claim_interrupts(RISCVCPU *cpu, uint32_t interrupts)
62
{
63
CPURISCVState *env = &cpu->env;
64
--
47
--
65
2.28.0
48
2.41.0
66
49
67
50
diff view generated by jsdifflib
New patch
1
From: Thomas Huth <thuth@redhat.com>
1
2
3
The character that should be printed is stored in the 64 bit "payload"
4
variable. The code currently tries to print it by taking the address
5
of the variable and passing this pointer to qemu_chr_fe_write(). However,
6
this only works on little endian hosts where the least significant bits
7
are stored on the lowest address. To do this in a portable way, we have
8
to store the value in an uint8_t variable instead.
9
10
Fixes: 5033606780 ("RISC-V HTIF Console")
11
Signed-off-by: Thomas Huth <thuth@redhat.com>
12
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
13
Reviewed-by: Bin Meng <bmeng@tinylab.org>
14
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
15
Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org>
16
Message-Id: <20230721094720.902454-2-thuth@redhat.com>
17
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
18
---
19
hw/char/riscv_htif.c | 3 ++-
20
1 file changed, 2 insertions(+), 1 deletion(-)
21
22
diff --git a/hw/char/riscv_htif.c b/hw/char/riscv_htif.c
23
index XXXXXXX..XXXXXXX 100644
24
--- a/hw/char/riscv_htif.c
25
+++ b/hw/char/riscv_htif.c
26
@@ -XXX,XX +XXX,XX @@ static void htif_handle_tohost_write(HTIFState *s, uint64_t val_written)
27
s->tohost = 0; /* clear to indicate we read */
28
return;
29
} else if (cmd == HTIF_CONSOLE_CMD_PUTC) {
30
- qemu_chr_fe_write(&s->chr, (uint8_t *)&payload, 1);
31
+ uint8_t ch = (uint8_t)payload;
32
+ qemu_chr_fe_write(&s->chr, &ch, 1);
33
resp = 0x100 | (uint8_t)payload;
34
} else {
35
qemu_log("HTIF device %d: unknown command\n", device);
36
--
37
2.41.0
38
39
diff view generated by jsdifflib
New patch
1
From: Thomas Huth <thuth@redhat.com>
1
2
3
Values that have been read via cpu_physical_memory_read() from the
4
guest's memory have to be swapped in case the host endianess differs
5
from the guest.
6
7
Fixes: a6e13e31d5 ("riscv_htif: Support console output via proxy syscall")
8
Signed-off-by: Thomas Huth <thuth@redhat.com>
9
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
10
Reviewed-by: Bin Meng <bmeng@tinylab.org>
11
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
12
Message-Id: <20230721094720.902454-3-thuth@redhat.com>
13
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
14
---
15
hw/char/riscv_htif.c | 9 +++++----
16
1 file changed, 5 insertions(+), 4 deletions(-)
17
18
diff --git a/hw/char/riscv_htif.c b/hw/char/riscv_htif.c
19
index XXXXXXX..XXXXXXX 100644
20
--- a/hw/char/riscv_htif.c
21
+++ b/hw/char/riscv_htif.c
22
@@ -XXX,XX +XXX,XX @@
23
#include "qemu/timer.h"
24
#include "qemu/error-report.h"
25
#include "exec/address-spaces.h"
26
+#include "exec/tswap.h"
27
#include "sysemu/dma.h"
28
29
#define RISCV_DEBUG_HTIF 0
30
@@ -XXX,XX +XXX,XX @@ static void htif_handle_tohost_write(HTIFState *s, uint64_t val_written)
31
} else {
32
uint64_t syscall[8];
33
cpu_physical_memory_read(payload, syscall, sizeof(syscall));
34
- if (syscall[0] == PK_SYS_WRITE &&
35
- syscall[1] == HTIF_DEV_CONSOLE &&
36
- syscall[3] == HTIF_CONSOLE_CMD_PUTC) {
37
+ if (tswap64(syscall[0]) == PK_SYS_WRITE &&
38
+ tswap64(syscall[1]) == HTIF_DEV_CONSOLE &&
39
+ tswap64(syscall[3]) == HTIF_CONSOLE_CMD_PUTC) {
40
uint8_t ch;
41
- cpu_physical_memory_read(syscall[2], &ch, 1);
42
+ cpu_physical_memory_read(tswap64(syscall[2]), &ch, 1);
43
qemu_chr_fe_write(&s->chr, &ch, 1);
44
resp = 0x100 | (uint8_t)payload;
45
} else {
46
--
47
2.41.0
diff view generated by jsdifflib
New patch
1
From: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
1
2
3
zmmul was promoted from experimental to ratified in commit 6d00ffad4e95.
4
Add a riscv,isa string for it.
5
6
Fixes: 6d00ffad4e95 ("target/riscv: move zmmul out of the experimental properties")
7
Signed-off-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
8
Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn>
9
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
10
Message-Id: <20230720132424.371132-2-dbarboza@ventanamicro.com>
11
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
12
---
13
target/riscv/cpu.c | 1 +
14
1 file changed, 1 insertion(+)
15
16
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
17
index XXXXXXX..XXXXXXX 100644
18
--- a/target/riscv/cpu.c
19
+++ b/target/riscv/cpu.c
20
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
21
ISA_EXT_DATA_ENTRY(zicsr, PRIV_VERSION_1_10_0, ext_icsr),
22
ISA_EXT_DATA_ENTRY(zifencei, PRIV_VERSION_1_10_0, ext_ifencei),
23
ISA_EXT_DATA_ENTRY(zihintpause, PRIV_VERSION_1_10_0, ext_zihintpause),
24
+ ISA_EXT_DATA_ENTRY(zmmul, PRIV_VERSION_1_12_0, ext_zmmul),
25
ISA_EXT_DATA_ENTRY(zawrs, PRIV_VERSION_1_12_0, ext_zawrs),
26
ISA_EXT_DATA_ENTRY(zfa, PRIV_VERSION_1_12_0, ext_zfa),
27
ISA_EXT_DATA_ENTRY(zfbfmin, PRIV_VERSION_1_12_0, ext_zfbfmin),
28
--
29
2.41.0
diff view generated by jsdifflib
New patch
1
From: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
1
2
3
The cpu->cfg.epmp extension is still experimental, but it already has a
4
'smepmp' riscv,isa string. Add it.
5
6
Signed-off-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
7
Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn>
8
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
9
Message-Id: <20230720132424.371132-3-dbarboza@ventanamicro.com>
10
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
11
---
12
target/riscv/cpu.c | 1 +
13
1 file changed, 1 insertion(+)
14
15
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
16
index XXXXXXX..XXXXXXX 100644
17
--- a/target/riscv/cpu.c
18
+++ b/target/riscv/cpu.c
19
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
20
ISA_EXT_DATA_ENTRY(zhinx, PRIV_VERSION_1_12_0, ext_zhinx),
21
ISA_EXT_DATA_ENTRY(zhinxmin, PRIV_VERSION_1_12_0, ext_zhinxmin),
22
ISA_EXT_DATA_ENTRY(smaia, PRIV_VERSION_1_12_0, ext_smaia),
23
+ ISA_EXT_DATA_ENTRY(smepmp, PRIV_VERSION_1_12_0, epmp),
24
ISA_EXT_DATA_ENTRY(smstateen, PRIV_VERSION_1_12_0, ext_smstateen),
25
ISA_EXT_DATA_ENTRY(ssaia, PRIV_VERSION_1_12_0, ext_ssaia),
26
ISA_EXT_DATA_ENTRY(sscofpmf, PRIV_VERSION_1_12_0, ext_sscofpmf),
27
--
28
2.41.0
diff view generated by jsdifflib
New patch
1
From: LIU Zhiwei <zhiwei_liu@linux.alibaba.com>
1
2
3
Commit bef6f008b98(accel/tcg: Return bool from page_check_range) converts
4
integer return value to bool type. However, it wrongly converted the use
5
of the API in riscv fault-only-first, where page_check_range < = 0, should
6
be converted to !page_check_range.
7
8
Signed-off-by: LIU Zhiwei <zhiwei_liu@linux.alibaba.com>
9
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
10
Message-ID: <20230729031618.821-1-zhiwei_liu@linux.alibaba.com>
11
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
12
---
13
target/riscv/vector_helper.c | 2 +-
14
1 file changed, 1 insertion(+), 1 deletion(-)
15
16
diff --git a/target/riscv/vector_helper.c b/target/riscv/vector_helper.c
17
index XXXXXXX..XXXXXXX 100644
18
--- a/target/riscv/vector_helper.c
19
+++ b/target/riscv/vector_helper.c
20
@@ -XXX,XX +XXX,XX @@ vext_ldff(void *vd, void *v0, target_ulong base,
21
cpu_mmu_index(env, false));
22
if (host) {
23
#ifdef CONFIG_USER_ONLY
24
- if (page_check_range(addr, offset, PAGE_READ)) {
25
+ if (!page_check_range(addr, offset, PAGE_READ)) {
26
vl = i;
27
goto ProbeSuccess;
28
}
29
--
30
2.41.0
diff view generated by jsdifflib
1
From: Ard Biesheuvel <ardb@kernel.org>
2
3
The AES MixColumns and InvMixColumns operations are relatively
4
expensive 4x4 matrix multiplications in GF(2^8), which is why C
5
implementations usually rely on precomputed lookup tables rather than
6
performing the calculations on demand.
7
8
Given that we already carry those tables in QEMU, we can just grab the
9
right value in the implementation of the RISC-V AES32 instructions. Note
10
that the tables in question are permuted according to the respective
11
Sbox, so we can omit the Sbox lookup as well in this case.
12
13
Cc: Richard Henderson <richard.henderson@linaro.org>
14
Cc: Philippe Mathieu-Daudé <philmd@linaro.org>
15
Cc: Zewen Ye <lustrew@foxmail.com>
16
Cc: Weiwei Li <liweiwei@iscas.ac.cn>
17
Cc: Junqiang Wang <wangjunqiang@iscas.ac.cn>
18
Signed-off-by: Ard Biesheuvel <ardb@kernel.org>
19
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
20
Message-ID: <20230731084043.1791984-1-ardb@kernel.org>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
21
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: 024ad8a594fb2feaf0950fbfad1508cfa82ce7f0.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <024ad8a594fb2feaf0950fbfad1508cfa82ce7f0.1597259519.git.alistair.francis@wdc.com>
4
---
22
---
5
target/riscv/cpu_helper.c | 60 ++++++++++++++++-----------------------
23
include/crypto/aes.h | 7 +++++++
6
1 file changed, 25 insertions(+), 35 deletions(-)
24
crypto/aes.c | 4 ++--
25
target/riscv/crypto_helper.c | 34 ++++------------------------------
26
3 files changed, 13 insertions(+), 32 deletions(-)
7
27
8
diff --git a/target/riscv/cpu_helper.c b/target/riscv/cpu_helper.c
28
diff --git a/include/crypto/aes.h b/include/crypto/aes.h
9
index XXXXXXX..XXXXXXX 100644
29
index XXXXXXX..XXXXXXX 100644
10
--- a/target/riscv/cpu_helper.c
30
--- a/include/crypto/aes.h
11
+++ b/target/riscv/cpu_helper.c
31
+++ b/include/crypto/aes.h
12
@@ -XXX,XX +XXX,XX @@ static int get_physical_address(CPURISCVState *env, hwaddr *physical,
32
@@ -XXX,XX +XXX,XX @@ void AES_decrypt(const unsigned char *in, unsigned char *out,
13
* was called. Background registers will be used if the guest has
33
extern const uint8_t AES_sbox[256];
14
* forced a two stage translation to be on (in HS or M mode).
34
extern const uint8_t AES_isbox[256];
15
*/
35
16
+ if (riscv_cpu_two_stage_lookup(env) && access_type != MMU_INST_FETCH) {
36
+/*
17
+ use_background = true;
37
+AES_Te0[x] = S [x].[02, 01, 01, 03];
18
+ }
38
+AES_Td0[x] = Si[x].[0e, 09, 0d, 0b];
39
+*/
19
+
40
+
20
if (mode == PRV_M && access_type != MMU_INST_FETCH) {
41
+extern const uint32_t AES_Te0[256], AES_Td0[256];
21
if (get_field(env->mstatus, MSTATUS_MPRV)) {
42
+
22
mode = get_field(env->mstatus, MSTATUS_MPP);
43
#endif
44
diff --git a/crypto/aes.c b/crypto/aes.c
45
index XXXXXXX..XXXXXXX 100644
46
--- a/crypto/aes.c
47
+++ b/crypto/aes.c
48
@@ -XXX,XX +XXX,XX @@ AES_Td3[x] = Si[x].[09, 0d, 0b, 0e];
49
AES_Td4[x] = Si[x].[01, 01, 01, 01];
50
*/
51
52
-static const uint32_t AES_Te0[256] = {
53
+const uint32_t AES_Te0[256] = {
54
0xc66363a5U, 0xf87c7c84U, 0xee777799U, 0xf67b7b8dU,
55
0xfff2f20dU, 0xd66b6bbdU, 0xde6f6fb1U, 0x91c5c554U,
56
0x60303050U, 0x02010103U, 0xce6767a9U, 0x562b2b7dU,
57
@@ -XXX,XX +XXX,XX @@ static const uint32_t AES_Te4[256] = {
58
0xb0b0b0b0U, 0x54545454U, 0xbbbbbbbbU, 0x16161616U,
59
};
60
61
-static const uint32_t AES_Td0[256] = {
62
+const uint32_t AES_Td0[256] = {
63
0x51f4a750U, 0x7e416553U, 0x1a17a4c3U, 0x3a275e96U,
64
0x3bab6bcbU, 0x1f9d45f1U, 0xacfa58abU, 0x4be30393U,
65
0x2030fa55U, 0xad766df6U, 0x88cc7691U, 0xf5024c25U,
66
diff --git a/target/riscv/crypto_helper.c b/target/riscv/crypto_helper.c
67
index XXXXXXX..XXXXXXX 100644
68
--- a/target/riscv/crypto_helper.c
69
+++ b/target/riscv/crypto_helper.c
70
@@ -XXX,XX +XXX,XX @@
71
#include "crypto/aes-round.h"
72
#include "crypto/sm4.h"
73
74
-#define AES_XTIME(a) \
75
- ((a << 1) ^ ((a & 0x80) ? 0x1b : 0))
23
-
76
-
24
- if (riscv_has_ext(env, RVH) &&
77
-#define AES_GFMUL(a, b) (( \
25
- MSTATUS_MPV_ISSET(env)) {
78
- (((b) & 0x1) ? (a) : 0) ^ \
26
- use_background = true;
79
- (((b) & 0x2) ? AES_XTIME(a) : 0) ^ \
27
- }
80
- (((b) & 0x4) ? AES_XTIME(AES_XTIME(a)) : 0) ^ \
28
- }
81
- (((b) & 0x8) ? AES_XTIME(AES_XTIME(AES_XTIME(a))) : 0)) & 0xFF)
82
-
83
-static inline uint32_t aes_mixcolumn_byte(uint8_t x, bool fwd)
84
-{
85
- uint32_t u;
86
-
87
- if (fwd) {
88
- u = (AES_GFMUL(x, 3) << 24) | (x << 16) | (x << 8) |
89
- (AES_GFMUL(x, 2) << 0);
90
- } else {
91
- u = (AES_GFMUL(x, 0xb) << 24) | (AES_GFMUL(x, 0xd) << 16) |
92
- (AES_GFMUL(x, 0x9) << 8) | (AES_GFMUL(x, 0xe) << 0);
29
- }
93
- }
94
- return u;
95
-}
30
-
96
-
31
- if (mode == PRV_S && access_type != MMU_INST_FETCH &&
97
#define sext32_xlen(x) (target_ulong)(int32_t)(x)
32
- riscv_has_ext(env, RVH) && !riscv_cpu_virt_enabled(env)) {
98
33
- if (get_field(env->hstatus, HSTATUS_SPRV)) {
99
static inline target_ulong aes32_operation(target_ulong shamt,
34
- mode = get_field(env->mstatus, SSTATUS_SPP);
100
@@ -XXX,XX +XXX,XX @@ static inline target_ulong aes32_operation(target_ulong shamt,
35
- use_background = true;
101
bool enc, bool mix)
102
{
103
uint8_t si = rs2 >> shamt;
104
- uint8_t so;
105
uint32_t mixed;
106
target_ulong res;
107
108
if (enc) {
109
- so = AES_sbox[si];
110
if (mix) {
111
- mixed = aes_mixcolumn_byte(so, true);
112
+ mixed = be32_to_cpu(AES_Te0[si]);
113
} else {
114
- mixed = so;
115
+ mixed = AES_sbox[si];
116
}
117
} else {
118
- so = AES_isbox[si];
119
if (mix) {
120
- mixed = aes_mixcolumn_byte(so, false);
121
+ mixed = be32_to_cpu(AES_Td0[si]);
122
} else {
123
- mixed = so;
124
+ mixed = AES_isbox[si];
36
}
125
}
37
}
126
}
38
127
mixed = rol32(mixed, shamt);
39
@@ -XXX,XX +XXX,XX @@ static void raise_mmu_exception(CPURISCVState *env, target_ulong address,
40
}
41
break;
42
case MMU_DATA_LOAD:
43
- if (riscv_cpu_virt_enabled(env) && !first_stage) {
44
+ if ((riscv_cpu_virt_enabled(env) || riscv_cpu_two_stage_lookup(env)) &&
45
+ !first_stage) {
46
cs->exception_index = RISCV_EXCP_LOAD_GUEST_ACCESS_FAULT;
47
} else {
48
cs->exception_index = page_fault_exceptions ?
49
@@ -XXX,XX +XXX,XX @@ static void raise_mmu_exception(CPURISCVState *env, target_ulong address,
50
}
51
break;
52
case MMU_DATA_STORE:
53
- if (riscv_cpu_virt_enabled(env) && !first_stage) {
54
+ if ((riscv_cpu_virt_enabled(env) || riscv_cpu_two_stage_lookup(env)) &&
55
+ !first_stage) {
56
cs->exception_index = RISCV_EXCP_STORE_GUEST_AMO_ACCESS_FAULT;
57
} else {
58
cs->exception_index = page_fault_exceptions ?
59
@@ -XXX,XX +XXX,XX @@ bool riscv_cpu_tlb_fill(CPUState *cs, vaddr address, int size,
60
hwaddr pa = 0;
61
int prot, prot2;
62
bool pmp_violation = false;
63
- bool m_mode_two_stage = false;
64
- bool hs_mode_two_stage = false;
65
bool first_stage_error = true;
66
int ret = TRANSLATE_FAIL;
67
int mode = mmu_idx;
68
@@ -XXX,XX +XXX,XX @@ bool riscv_cpu_tlb_fill(CPUState *cs, vaddr address, int size,
69
qemu_log_mask(CPU_LOG_MMU, "%s ad %" VADDR_PRIx " rw %d mmu_idx %d\n",
70
__func__, address, access_type, mmu_idx);
71
72
- /*
73
- * Determine if we are in M mode and MPRV is set or in HS mode and SPRV is
74
- * set and we want to access a virtulisation address.
75
- */
76
- if (riscv_has_ext(env, RVH)) {
77
- m_mode_two_stage = env->priv == PRV_M &&
78
- access_type != MMU_INST_FETCH &&
79
- get_field(env->mstatus, MSTATUS_MPRV) &&
80
- MSTATUS_MPV_ISSET(env);
81
-
82
- hs_mode_two_stage = env->priv == PRV_S &&
83
- !riscv_cpu_virt_enabled(env) &&
84
- access_type != MMU_INST_FETCH &&
85
- get_field(env->hstatus, HSTATUS_SPRV) &&
86
- get_field(env->hstatus, HSTATUS_SPV);
87
- }
88
-
89
if (mode == PRV_M && access_type != MMU_INST_FETCH) {
90
if (get_field(env->mstatus, MSTATUS_MPRV)) {
91
mode = get_field(env->mstatus, MSTATUS_MPP);
92
}
93
}
94
95
- if (riscv_cpu_virt_enabled(env) || m_mode_two_stage || hs_mode_two_stage) {
96
+ if (riscv_has_ext(env, RVH) && env->priv == PRV_M &&
97
+ access_type != MMU_INST_FETCH &&
98
+ get_field(env->mstatus, MSTATUS_MPRV) &&
99
+ MSTATUS_MPV_ISSET(env)) {
100
+ riscv_cpu_set_two_stage_lookup(env, true);
101
+ }
102
+
103
+ if (riscv_cpu_virt_enabled(env) ||
104
+ (riscv_cpu_two_stage_lookup(env) && access_type != MMU_INST_FETCH)) {
105
/* Two stage lookup */
106
ret = get_physical_address(env, &pa, &prot, address, access_type,
107
mmu_idx, true, true);
108
@@ -XXX,XX +XXX,XX @@ bool riscv_cpu_tlb_fill(CPUState *cs, vaddr address, int size,
109
__func__, address, ret, pa, prot);
110
}
111
112
+ /* We did the two stage lookup based on MPRV, unset the lookup */
113
+ if (riscv_has_ext(env, RVH) && env->priv == PRV_M &&
114
+ access_type != MMU_INST_FETCH &&
115
+ get_field(env->mstatus, MSTATUS_MPRV) &&
116
+ MSTATUS_MPV_ISSET(env)) {
117
+ riscv_cpu_set_two_stage_lookup(env, false);
118
+ }
119
+
120
if (riscv_feature(env, RISCV_FEATURE_PMP) &&
121
(ret == TRANSLATE_SUCCESS) &&
122
!pmp_hart_has_privs(env, pa, size, 1 << access_type, mode)) {
123
--
128
--
124
2.28.0
129
2.41.0
125
130
126
131
diff view generated by jsdifflib
1
From: Anup Patel <anup.patel@wdc.com>
1
From: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
2
2
3
We add common helper routines which can be shared by RISC-V
3
Take some functions/macros out of `vector_helper` and put them in a new
4
multi-socket NUMA machines.
4
module called `vector_internals`. This ensures they can be used by both
5
vector and vector-crypto helpers (latter implemented in proceeding
6
commits).
5
7
6
We have two types of helpers:
8
Signed-off-by: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
7
1. riscv_socket_xyz() - These helper assist managing multiple
9
Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn>
8
sockets irrespective whether QEMU NUMA is enabled/disabled
10
Signed-off-by: Max Chou <max.chou@sifive.com>
9
2. riscv_numa_xyz() - These helpers assist in providing
11
Acked-by: Alistair Francis <alistair.francis@wdc.com>
10
necessary QEMU machine callbacks for QEMU NUMA emulation
12
Message-ID: <20230711165917.2629866-2-max.chou@sifive.com>
11
12
Signed-off-by: Anup Patel <anup.patel@wdc.com>
13
Reviewed-by: Atish Patra <atish.patra@wdc.com>
14
Message-Id: <20200616032229.766089-4-anup.patel@wdc.com>
15
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
13
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
16
---
14
---
17
include/hw/riscv/numa.h | 113 +++++++++++++++++++
15
target/riscv/vector_internals.h | 182 +++++++++++++++++++++++++++++
18
hw/riscv/numa.c | 242 ++++++++++++++++++++++++++++++++++++++++
16
target/riscv/vector_helper.c | 201 +-------------------------------
19
hw/riscv/meson.build | 1 +
17
target/riscv/vector_internals.c | 81 +++++++++++++
20
3 files changed, 356 insertions(+)
18
target/riscv/meson.build | 1 +
21
create mode 100644 include/hw/riscv/numa.h
19
4 files changed, 265 insertions(+), 200 deletions(-)
22
create mode 100644 hw/riscv/numa.c
20
create mode 100644 target/riscv/vector_internals.h
21
create mode 100644 target/riscv/vector_internals.c
23
22
24
diff --git a/include/hw/riscv/numa.h b/include/hw/riscv/numa.h
23
diff --git a/target/riscv/vector_internals.h b/target/riscv/vector_internals.h
25
new file mode 100644
24
new file mode 100644
26
index XXXXXXX..XXXXXXX
25
index XXXXXXX..XXXXXXX
27
--- /dev/null
26
--- /dev/null
28
+++ b/include/hw/riscv/numa.h
27
+++ b/target/riscv/vector_internals.h
29
@@ -XXX,XX +XXX,XX @@
28
@@ -XXX,XX +XXX,XX @@
30
+/*
29
+/*
31
+ * QEMU RISC-V NUMA Helper
30
+ * RISC-V Vector Extension Internals
32
+ *
31
+ *
33
+ * Copyright (c) 2020 Western Digital Corporation or its affiliates.
32
+ * Copyright (c) 2020 T-Head Semiconductor Co., Ltd. All rights reserved.
34
+ *
33
+ *
35
+ * This program is free software; you can redistribute it and/or modify it
34
+ * This program is free software; you can redistribute it and/or modify it
36
+ * under the terms and conditions of the GNU General Public License,
35
+ * under the terms and conditions of the GNU General Public License,
37
+ * version 2 or later, as published by the Free Software Foundation.
36
+ * version 2 or later, as published by the Free Software Foundation.
38
+ *
37
+ *
...
...
43
+ *
42
+ *
44
+ * You should have received a copy of the GNU General Public License along with
43
+ * You should have received a copy of the GNU General Public License along with
45
+ * this program. If not, see <http://www.gnu.org/licenses/>.
44
+ * this program. If not, see <http://www.gnu.org/licenses/>.
46
+ */
45
+ */
47
+
46
+
48
+#ifndef RISCV_NUMA_H
47
+#ifndef TARGET_RISCV_VECTOR_INTERNALS_H
49
+#define RISCV_NUMA_H
48
+#define TARGET_RISCV_VECTOR_INTERNALS_H
50
+
49
+
51
+#include "hw/sysbus.h"
50
+#include "qemu/osdep.h"
52
+#include "sysemu/numa.h"
51
+#include "qemu/bitops.h"
53
+
52
+#include "cpu.h"
54
+/**
53
+#include "tcg/tcg-gvec-desc.h"
55
+ * riscv_socket_count:
54
+#include "internals.h"
56
+ * @ms: pointer to machine state
55
+
57
+ *
56
+static inline uint32_t vext_nf(uint32_t desc)
58
+ * Returns: number of sockets for a numa system and 1 for a non-numa system
57
+{
59
+ */
58
+ return FIELD_EX32(simd_data(desc), VDATA, NF);
60
+int riscv_socket_count(const MachineState *ms);
59
+}
61
+
60
+
62
+/**
61
+/*
63
+ * riscv_socket_first_hartid:
62
+ * Note that vector data is stored in host-endian 64-bit chunks,
64
+ * @ms: pointer to machine state
63
+ * so addressing units smaller than that needs a host-endian fixup.
65
+ * @socket_id: socket index
64
+ */
66
+ *
65
+#if HOST_BIG_ENDIAN
67
+ * Returns: first hartid for a valid socket and -1 for an invalid socket
66
+#define H1(x) ((x) ^ 7)
68
+ */
67
+#define H1_2(x) ((x) ^ 6)
69
+int riscv_socket_first_hartid(const MachineState *ms, int socket_id);
68
+#define H1_4(x) ((x) ^ 4)
70
+
69
+#define H2(x) ((x) ^ 3)
71
+/**
70
+#define H4(x) ((x) ^ 1)
72
+ * riscv_socket_last_hartid:
71
+#define H8(x) ((x))
73
+ * @ms: pointer to machine state
72
+#else
74
+ * @socket_id: socket index
73
+#define H1(x) (x)
75
+ *
74
+#define H1_2(x) (x)
76
+ * Returns: last hartid for a valid socket and -1 for an invalid socket
75
+#define H1_4(x) (x)
77
+ */
76
+#define H2(x) (x)
78
+int riscv_socket_last_hartid(const MachineState *ms, int socket_id);
77
+#define H4(x) (x)
79
+
78
+#define H8(x) (x)
80
+/**
79
+#endif
81
+ * riscv_socket_hart_count:
80
+
82
+ * @ms: pointer to machine state
81
+/*
83
+ * @socket_id: socket index
82
+ * Encode LMUL to lmul as following:
84
+ *
83
+ * LMUL vlmul lmul
85
+ * Returns: number of harts for a valid socket and -1 for an invalid socket
84
+ * 1 000 0
86
+ */
85
+ * 2 001 1
87
+int riscv_socket_hart_count(const MachineState *ms, int socket_id);
86
+ * 4 010 2
88
+
87
+ * 8 011 3
89
+/**
88
+ * - 100 -
90
+ * riscv_socket_mem_offset:
89
+ * 1/8 101 -3
91
+ * @ms: pointer to machine state
90
+ * 1/4 110 -2
92
+ * @socket_id: socket index
91
+ * 1/2 111 -1
93
+ *
92
+ */
94
+ * Returns: offset of ram belonging to given socket
93
+static inline int32_t vext_lmul(uint32_t desc)
95
+ */
94
+{
96
+uint64_t riscv_socket_mem_offset(const MachineState *ms, int socket_id);
95
+ return sextract32(FIELD_EX32(simd_data(desc), VDATA, LMUL), 0, 3);
97
+
96
+}
98
+/**
97
+
99
+ * riscv_socket_mem_size:
98
+static inline uint32_t vext_vm(uint32_t desc)
100
+ * @ms: pointer to machine state
99
+{
101
+ * @socket_id: socket index
100
+ return FIELD_EX32(simd_data(desc), VDATA, VM);
102
+ *
101
+}
103
+ * Returns: size of ram belonging to given socket
102
+
104
+ */
103
+static inline uint32_t vext_vma(uint32_t desc)
105
+uint64_t riscv_socket_mem_size(const MachineState *ms, int socket_id);
104
+{
106
+
105
+ return FIELD_EX32(simd_data(desc), VDATA, VMA);
107
+/**
106
+}
108
+ * riscv_socket_check_hartids:
107
+
109
+ * @ms: pointer to machine state
108
+static inline uint32_t vext_vta(uint32_t desc)
110
+ * @socket_id: socket index
109
+{
111
+ *
110
+ return FIELD_EX32(simd_data(desc), VDATA, VTA);
112
+ * Returns: true if hardids belonging to given socket are contiguous else false
111
+}
113
+ */
112
+
114
+bool riscv_socket_check_hartids(const MachineState *ms, int socket_id);
113
+static inline uint32_t vext_vta_all_1s(uint32_t desc)
115
+
114
+{
116
+/**
115
+ return FIELD_EX32(simd_data(desc), VDATA, VTA_ALL_1S);
117
+ * riscv_socket_fdt_write_id:
116
+}
118
+ * @ms: pointer to machine state
117
+
119
+ * @socket_id: socket index
118
+/*
120
+ *
119
+ * Earlier designs (pre-0.9) had a varying number of bits
121
+ * Write NUMA node-id FDT property for given FDT node
120
+ * per mask value (MLEN). In the 0.9 design, MLEN=1.
122
+ */
121
+ * (Section 4.5)
123
+void riscv_socket_fdt_write_id(const MachineState *ms, void *fdt,
122
+ */
124
+ const char *node_name, int socket_id);
123
+static inline int vext_elem_mask(void *v0, int index)
125
+
124
+{
126
+/**
125
+ int idx = index / 64;
127
+ * riscv_socket_fdt_write_distance_matrix:
126
+ int pos = index % 64;
128
+ * @ms: pointer to machine state
127
+ return (((uint64_t *)v0)[idx] >> pos) & 1;
129
+ * @socket_id: socket index
128
+}
130
+ *
129
+
131
+ * Write NUMA distance matrix in FDT for given machine
130
+/*
132
+ */
131
+ * Get number of total elements, including prestart, body and tail elements.
133
+void riscv_socket_fdt_write_distance_matrix(const MachineState *ms, void *fdt);
132
+ * Note that when LMUL < 1, the tail includes the elements past VLMAX that
134
+
133
+ * are held in the same vector register.
135
+CpuInstanceProperties
134
+ */
136
+riscv_numa_cpu_index_to_props(MachineState *ms, unsigned cpu_index);
135
+static inline uint32_t vext_get_total_elems(CPURISCVState *env, uint32_t desc,
137
+
136
+ uint32_t esz)
138
+int64_t riscv_numa_get_default_cpu_node_id(const MachineState *ms, int idx);
137
+{
139
+
138
+ uint32_t vlenb = simd_maxsz(desc);
140
+const CPUArchIdList *riscv_numa_possible_cpu_arch_ids(MachineState *ms);
139
+ uint32_t sew = 1 << FIELD_EX64(env->vtype, VTYPE, VSEW);
141
+
140
+ int8_t emul = ctzl(esz) - ctzl(sew) + vext_lmul(desc) < 0 ? 0 :
142
+#endif /* RISCV_NUMA_H */
141
+ ctzl(esz) - ctzl(sew) + vext_lmul(desc);
143
diff --git a/hw/riscv/numa.c b/hw/riscv/numa.c
142
+ return (vlenb << emul) / esz;
143
+}
144
+
145
+/* set agnostic elements to 1s */
146
+void vext_set_elems_1s(void *base, uint32_t is_agnostic, uint32_t cnt,
147
+ uint32_t tot);
148
+
149
+/* expand macro args before macro */
150
+#define RVVCALL(macro, ...) macro(__VA_ARGS__)
151
+
152
+/* (TD, T1, T2, TX1, TX2) */
153
+#define OP_UUU_B uint8_t, uint8_t, uint8_t, uint8_t, uint8_t
154
+#define OP_UUU_H uint16_t, uint16_t, uint16_t, uint16_t, uint16_t
155
+#define OP_UUU_W uint32_t, uint32_t, uint32_t, uint32_t, uint32_t
156
+#define OP_UUU_D uint64_t, uint64_t, uint64_t, uint64_t, uint64_t
157
+
158
+/* operation of two vector elements */
159
+typedef void opivv2_fn(void *vd, void *vs1, void *vs2, int i);
160
+
161
+#define OPIVV2(NAME, TD, T1, T2, TX1, TX2, HD, HS1, HS2, OP) \
162
+static void do_##NAME(void *vd, void *vs1, void *vs2, int i) \
163
+{ \
164
+ TX1 s1 = *((T1 *)vs1 + HS1(i)); \
165
+ TX2 s2 = *((T2 *)vs2 + HS2(i)); \
166
+ *((TD *)vd + HD(i)) = OP(s2, s1); \
167
+}
168
+
169
+void do_vext_vv(void *vd, void *v0, void *vs1, void *vs2,
170
+ CPURISCVState *env, uint32_t desc,
171
+ opivv2_fn *fn, uint32_t esz);
172
+
173
+/* generate the helpers for OPIVV */
174
+#define GEN_VEXT_VV(NAME, ESZ) \
175
+void HELPER(NAME)(void *vd, void *v0, void *vs1, \
176
+ void *vs2, CPURISCVState *env, \
177
+ uint32_t desc) \
178
+{ \
179
+ do_vext_vv(vd, v0, vs1, vs2, env, desc, \
180
+ do_##NAME, ESZ); \
181
+}
182
+
183
+typedef void opivx2_fn(void *vd, target_long s1, void *vs2, int i);
184
+
185
+/*
186
+ * (T1)s1 gives the real operator type.
187
+ * (TX1)(T1)s1 expands the operator type of widen or narrow operations.
188
+ */
189
+#define OPIVX2(NAME, TD, T1, T2, TX1, TX2, HD, HS2, OP) \
190
+static void do_##NAME(void *vd, target_long s1, void *vs2, int i) \
191
+{ \
192
+ TX2 s2 = *((T2 *)vs2 + HS2(i)); \
193
+ *((TD *)vd + HD(i)) = OP(s2, (TX1)(T1)s1); \
194
+}
195
+
196
+void do_vext_vx(void *vd, void *v0, target_long s1, void *vs2,
197
+ CPURISCVState *env, uint32_t desc,
198
+ opivx2_fn fn, uint32_t esz);
199
+
200
+/* generate the helpers for OPIVX */
201
+#define GEN_VEXT_VX(NAME, ESZ) \
202
+void HELPER(NAME)(void *vd, void *v0, target_ulong s1, \
203
+ void *vs2, CPURISCVState *env, \
204
+ uint32_t desc) \
205
+{ \
206
+ do_vext_vx(vd, v0, s1, vs2, env, desc, \
207
+ do_##NAME, ESZ); \
208
+}
209
+
210
+#endif /* TARGET_RISCV_VECTOR_INTERNALS_H */
211
diff --git a/target/riscv/vector_helper.c b/target/riscv/vector_helper.c
212
index XXXXXXX..XXXXXXX 100644
213
--- a/target/riscv/vector_helper.c
214
+++ b/target/riscv/vector_helper.c
215
@@ -XXX,XX +XXX,XX @@
216
#include "fpu/softfloat.h"
217
#include "tcg/tcg-gvec-desc.h"
218
#include "internals.h"
219
+#include "vector_internals.h"
220
#include <math.h>
221
222
target_ulong HELPER(vsetvl)(CPURISCVState *env, target_ulong s1,
223
@@ -XXX,XX +XXX,XX @@ target_ulong HELPER(vsetvl)(CPURISCVState *env, target_ulong s1,
224
return vl;
225
}
226
227
-/*
228
- * Note that vector data is stored in host-endian 64-bit chunks,
229
- * so addressing units smaller than that needs a host-endian fixup.
230
- */
231
-#if HOST_BIG_ENDIAN
232
-#define H1(x) ((x) ^ 7)
233
-#define H1_2(x) ((x) ^ 6)
234
-#define H1_4(x) ((x) ^ 4)
235
-#define H2(x) ((x) ^ 3)
236
-#define H4(x) ((x) ^ 1)
237
-#define H8(x) ((x))
238
-#else
239
-#define H1(x) (x)
240
-#define H1_2(x) (x)
241
-#define H1_4(x) (x)
242
-#define H2(x) (x)
243
-#define H4(x) (x)
244
-#define H8(x) (x)
245
-#endif
246
-
247
-static inline uint32_t vext_nf(uint32_t desc)
248
-{
249
- return FIELD_EX32(simd_data(desc), VDATA, NF);
250
-}
251
-
252
-static inline uint32_t vext_vm(uint32_t desc)
253
-{
254
- return FIELD_EX32(simd_data(desc), VDATA, VM);
255
-}
256
-
257
-/*
258
- * Encode LMUL to lmul as following:
259
- * LMUL vlmul lmul
260
- * 1 000 0
261
- * 2 001 1
262
- * 4 010 2
263
- * 8 011 3
264
- * - 100 -
265
- * 1/8 101 -3
266
- * 1/4 110 -2
267
- * 1/2 111 -1
268
- */
269
-static inline int32_t vext_lmul(uint32_t desc)
270
-{
271
- return sextract32(FIELD_EX32(simd_data(desc), VDATA, LMUL), 0, 3);
272
-}
273
-
274
-static inline uint32_t vext_vta(uint32_t desc)
275
-{
276
- return FIELD_EX32(simd_data(desc), VDATA, VTA);
277
-}
278
-
279
-static inline uint32_t vext_vma(uint32_t desc)
280
-{
281
- return FIELD_EX32(simd_data(desc), VDATA, VMA);
282
-}
283
-
284
-static inline uint32_t vext_vta_all_1s(uint32_t desc)
285
-{
286
- return FIELD_EX32(simd_data(desc), VDATA, VTA_ALL_1S);
287
-}
288
-
289
/*
290
* Get the maximum number of elements can be operated.
291
*
292
@@ -XXX,XX +XXX,XX @@ static inline uint32_t vext_max_elems(uint32_t desc, uint32_t log2_esz)
293
return scale < 0 ? vlenb >> -scale : vlenb << scale;
294
}
295
296
-/*
297
- * Get number of total elements, including prestart, body and tail elements.
298
- * Note that when LMUL < 1, the tail includes the elements past VLMAX that
299
- * are held in the same vector register.
300
- */
301
-static inline uint32_t vext_get_total_elems(CPURISCVState *env, uint32_t desc,
302
- uint32_t esz)
303
-{
304
- uint32_t vlenb = simd_maxsz(desc);
305
- uint32_t sew = 1 << FIELD_EX64(env->vtype, VTYPE, VSEW);
306
- int8_t emul = ctzl(esz) - ctzl(sew) + vext_lmul(desc) < 0 ? 0 :
307
- ctzl(esz) - ctzl(sew) + vext_lmul(desc);
308
- return (vlenb << emul) / esz;
309
-}
310
-
311
static inline target_ulong adjust_addr(CPURISCVState *env, target_ulong addr)
312
{
313
return (addr & ~env->cur_pmmask) | env->cur_pmbase;
314
@@ -XXX,XX +XXX,XX @@ static void probe_pages(CPURISCVState *env, target_ulong addr,
315
}
316
}
317
318
-/* set agnostic elements to 1s */
319
-static void vext_set_elems_1s(void *base, uint32_t is_agnostic, uint32_t cnt,
320
- uint32_t tot)
321
-{
322
- if (is_agnostic == 0) {
323
- /* policy undisturbed */
324
- return;
325
- }
326
- if (tot - cnt == 0) {
327
- return;
328
- }
329
- memset(base + cnt, -1, tot - cnt);
330
-}
331
-
332
static inline void vext_set_elem_mask(void *v0, int index,
333
uint8_t value)
334
{
335
@@ -XXX,XX +XXX,XX @@ static inline void vext_set_elem_mask(void *v0, int index,
336
((uint64_t *)v0)[idx] = deposit64(old, pos, 1, value);
337
}
338
339
-/*
340
- * Earlier designs (pre-0.9) had a varying number of bits
341
- * per mask value (MLEN). In the 0.9 design, MLEN=1.
342
- * (Section 4.5)
343
- */
344
-static inline int vext_elem_mask(void *v0, int index)
345
-{
346
- int idx = index / 64;
347
- int pos = index % 64;
348
- return (((uint64_t *)v0)[idx] >> pos) & 1;
349
-}
350
-
351
/* elements operations for load and store */
352
typedef void vext_ldst_elem_fn(CPURISCVState *env, abi_ptr addr,
353
uint32_t idx, void *vd, uintptr_t retaddr);
354
@@ -XXX,XX +XXX,XX @@ GEN_VEXT_ST_WHOLE(vs8r_v, int8_t, ste_b)
355
* Vector Integer Arithmetic Instructions
356
*/
357
358
-/* expand macro args before macro */
359
-#define RVVCALL(macro, ...) macro(__VA_ARGS__)
360
-
361
/* (TD, T1, T2, TX1, TX2) */
362
#define OP_SSS_B int8_t, int8_t, int8_t, int8_t, int8_t
363
#define OP_SSS_H int16_t, int16_t, int16_t, int16_t, int16_t
364
#define OP_SSS_W int32_t, int32_t, int32_t, int32_t, int32_t
365
#define OP_SSS_D int64_t, int64_t, int64_t, int64_t, int64_t
366
-#define OP_UUU_B uint8_t, uint8_t, uint8_t, uint8_t, uint8_t
367
-#define OP_UUU_H uint16_t, uint16_t, uint16_t, uint16_t, uint16_t
368
-#define OP_UUU_W uint32_t, uint32_t, uint32_t, uint32_t, uint32_t
369
-#define OP_UUU_D uint64_t, uint64_t, uint64_t, uint64_t, uint64_t
370
#define OP_SUS_B int8_t, uint8_t, int8_t, uint8_t, int8_t
371
#define OP_SUS_H int16_t, uint16_t, int16_t, uint16_t, int16_t
372
#define OP_SUS_W int32_t, uint32_t, int32_t, uint32_t, int32_t
373
@@ -XXX,XX +XXX,XX @@ GEN_VEXT_ST_WHOLE(vs8r_v, int8_t, ste_b)
374
#define NOP_UUU_H uint16_t, uint16_t, uint32_t, uint16_t, uint32_t
375
#define NOP_UUU_W uint32_t, uint32_t, uint64_t, uint32_t, uint64_t
376
377
-/* operation of two vector elements */
378
-typedef void opivv2_fn(void *vd, void *vs1, void *vs2, int i);
379
-
380
-#define OPIVV2(NAME, TD, T1, T2, TX1, TX2, HD, HS1, HS2, OP) \
381
-static void do_##NAME(void *vd, void *vs1, void *vs2, int i) \
382
-{ \
383
- TX1 s1 = *((T1 *)vs1 + HS1(i)); \
384
- TX2 s2 = *((T2 *)vs2 + HS2(i)); \
385
- *((TD *)vd + HD(i)) = OP(s2, s1); \
386
-}
387
#define DO_SUB(N, M) (N - M)
388
#define DO_RSUB(N, M) (M - N)
389
390
@@ -XXX,XX +XXX,XX @@ RVVCALL(OPIVV2, vsub_vv_h, OP_SSS_H, H2, H2, H2, DO_SUB)
391
RVVCALL(OPIVV2, vsub_vv_w, OP_SSS_W, H4, H4, H4, DO_SUB)
392
RVVCALL(OPIVV2, vsub_vv_d, OP_SSS_D, H8, H8, H8, DO_SUB)
393
394
-static void do_vext_vv(void *vd, void *v0, void *vs1, void *vs2,
395
- CPURISCVState *env, uint32_t desc,
396
- opivv2_fn *fn, uint32_t esz)
397
-{
398
- uint32_t vm = vext_vm(desc);
399
- uint32_t vl = env->vl;
400
- uint32_t total_elems = vext_get_total_elems(env, desc, esz);
401
- uint32_t vta = vext_vta(desc);
402
- uint32_t vma = vext_vma(desc);
403
- uint32_t i;
404
-
405
- for (i = env->vstart; i < vl; i++) {
406
- if (!vm && !vext_elem_mask(v0, i)) {
407
- /* set masked-off elements to 1s */
408
- vext_set_elems_1s(vd, vma, i * esz, (i + 1) * esz);
409
- continue;
410
- }
411
- fn(vd, vs1, vs2, i);
412
- }
413
- env->vstart = 0;
414
- /* set tail elements to 1s */
415
- vext_set_elems_1s(vd, vta, vl * esz, total_elems * esz);
416
-}
417
-
418
-/* generate the helpers for OPIVV */
419
-#define GEN_VEXT_VV(NAME, ESZ) \
420
-void HELPER(NAME)(void *vd, void *v0, void *vs1, \
421
- void *vs2, CPURISCVState *env, \
422
- uint32_t desc) \
423
-{ \
424
- do_vext_vv(vd, v0, vs1, vs2, env, desc, \
425
- do_##NAME, ESZ); \
426
-}
427
-
428
GEN_VEXT_VV(vadd_vv_b, 1)
429
GEN_VEXT_VV(vadd_vv_h, 2)
430
GEN_VEXT_VV(vadd_vv_w, 4)
431
@@ -XXX,XX +XXX,XX @@ GEN_VEXT_VV(vsub_vv_h, 2)
432
GEN_VEXT_VV(vsub_vv_w, 4)
433
GEN_VEXT_VV(vsub_vv_d, 8)
434
435
-typedef void opivx2_fn(void *vd, target_long s1, void *vs2, int i);
436
-
437
-/*
438
- * (T1)s1 gives the real operator type.
439
- * (TX1)(T1)s1 expands the operator type of widen or narrow operations.
440
- */
441
-#define OPIVX2(NAME, TD, T1, T2, TX1, TX2, HD, HS2, OP) \
442
-static void do_##NAME(void *vd, target_long s1, void *vs2, int i) \
443
-{ \
444
- TX2 s2 = *((T2 *)vs2 + HS2(i)); \
445
- *((TD *)vd + HD(i)) = OP(s2, (TX1)(T1)s1); \
446
-}
447
448
RVVCALL(OPIVX2, vadd_vx_b, OP_SSS_B, H1, H1, DO_ADD)
449
RVVCALL(OPIVX2, vadd_vx_h, OP_SSS_H, H2, H2, DO_ADD)
450
@@ -XXX,XX +XXX,XX @@ RVVCALL(OPIVX2, vrsub_vx_h, OP_SSS_H, H2, H2, DO_RSUB)
451
RVVCALL(OPIVX2, vrsub_vx_w, OP_SSS_W, H4, H4, DO_RSUB)
452
RVVCALL(OPIVX2, vrsub_vx_d, OP_SSS_D, H8, H8, DO_RSUB)
453
454
-static void do_vext_vx(void *vd, void *v0, target_long s1, void *vs2,
455
- CPURISCVState *env, uint32_t desc,
456
- opivx2_fn fn, uint32_t esz)
457
-{
458
- uint32_t vm = vext_vm(desc);
459
- uint32_t vl = env->vl;
460
- uint32_t total_elems = vext_get_total_elems(env, desc, esz);
461
- uint32_t vta = vext_vta(desc);
462
- uint32_t vma = vext_vma(desc);
463
- uint32_t i;
464
-
465
- for (i = env->vstart; i < vl; i++) {
466
- if (!vm && !vext_elem_mask(v0, i)) {
467
- /* set masked-off elements to 1s */
468
- vext_set_elems_1s(vd, vma, i * esz, (i + 1) * esz);
469
- continue;
470
- }
471
- fn(vd, s1, vs2, i);
472
- }
473
- env->vstart = 0;
474
- /* set tail elements to 1s */
475
- vext_set_elems_1s(vd, vta, vl * esz, total_elems * esz);
476
-}
477
-
478
-/* generate the helpers for OPIVX */
479
-#define GEN_VEXT_VX(NAME, ESZ) \
480
-void HELPER(NAME)(void *vd, void *v0, target_ulong s1, \
481
- void *vs2, CPURISCVState *env, \
482
- uint32_t desc) \
483
-{ \
484
- do_vext_vx(vd, v0, s1, vs2, env, desc, \
485
- do_##NAME, ESZ); \
486
-}
487
-
488
GEN_VEXT_VX(vadd_vx_b, 1)
489
GEN_VEXT_VX(vadd_vx_h, 2)
490
GEN_VEXT_VX(vadd_vx_w, 4)
491
diff --git a/target/riscv/vector_internals.c b/target/riscv/vector_internals.c
144
new file mode 100644
492
new file mode 100644
145
index XXXXXXX..XXXXXXX
493
index XXXXXXX..XXXXXXX
146
--- /dev/null
494
--- /dev/null
147
+++ b/hw/riscv/numa.c
495
+++ b/target/riscv/vector_internals.c
148
@@ -XXX,XX +XXX,XX @@
496
@@ -XXX,XX +XXX,XX @@
149
+/*
497
+/*
150
+ * QEMU RISC-V NUMA Helper
498
+ * RISC-V Vector Extension Internals
151
+ *
499
+ *
152
+ * Copyright (c) 2020 Western Digital Corporation or its affiliates.
500
+ * Copyright (c) 2020 T-Head Semiconductor Co., Ltd. All rights reserved.
153
+ *
501
+ *
154
+ * This program is free software; you can redistribute it and/or modify it
502
+ * This program is free software; you can redistribute it and/or modify it
155
+ * under the terms and conditions of the GNU General Public License,
503
+ * under the terms and conditions of the GNU General Public License,
156
+ * version 2 or later, as published by the Free Software Foundation.
504
+ * version 2 or later, as published by the Free Software Foundation.
157
+ *
505
+ *
...
...
162
+ *
510
+ *
163
+ * You should have received a copy of the GNU General Public License along with
511
+ * You should have received a copy of the GNU General Public License along with
164
+ * this program. If not, see <http://www.gnu.org/licenses/>.
512
+ * this program. If not, see <http://www.gnu.org/licenses/>.
165
+ */
513
+ */
166
+
514
+
167
+#include "qemu/osdep.h"
515
+#include "vector_internals.h"
168
+#include "qemu/units.h"
516
+
169
+#include "qemu/log.h"
517
+/* set agnostic elements to 1s */
170
+#include "qemu/error-report.h"
518
+void vext_set_elems_1s(void *base, uint32_t is_agnostic, uint32_t cnt,
171
+#include "qapi/error.h"
519
+ uint32_t tot)
172
+#include "hw/boards.h"
520
+{
173
+#include "hw/qdev-properties.h"
521
+ if (is_agnostic == 0) {
174
+#include "hw/riscv/numa.h"
522
+ /* policy undisturbed */
175
+#include "sysemu/device_tree.h"
523
+ return;
176
+
177
+static bool numa_enabled(const MachineState *ms)
178
+{
179
+ return (ms->numa_state && ms->numa_state->num_nodes) ? true : false;
180
+}
181
+
182
+int riscv_socket_count(const MachineState *ms)
183
+{
184
+ return (numa_enabled(ms)) ? ms->numa_state->num_nodes : 1;
185
+}
186
+
187
+int riscv_socket_first_hartid(const MachineState *ms, int socket_id)
188
+{
189
+ int i, first_hartid = ms->smp.cpus;
190
+
191
+ if (!numa_enabled(ms)) {
192
+ return (!socket_id) ? 0 : -1;
193
+ }
524
+ }
194
+
525
+ if (tot - cnt == 0) {
195
+ for (i = 0; i < ms->smp.cpus; i++) {
526
+ return ;
196
+ if (ms->possible_cpus->cpus[i].props.node_id != socket_id) {
527
+ }
528
+ memset(base + cnt, -1, tot - cnt);
529
+}
530
+
531
+void do_vext_vv(void *vd, void *v0, void *vs1, void *vs2,
532
+ CPURISCVState *env, uint32_t desc,
533
+ opivv2_fn *fn, uint32_t esz)
534
+{
535
+ uint32_t vm = vext_vm(desc);
536
+ uint32_t vl = env->vl;
537
+ uint32_t total_elems = vext_get_total_elems(env, desc, esz);
538
+ uint32_t vta = vext_vta(desc);
539
+ uint32_t vma = vext_vma(desc);
540
+ uint32_t i;
541
+
542
+ for (i = env->vstart; i < vl; i++) {
543
+ if (!vm && !vext_elem_mask(v0, i)) {
544
+ /* set masked-off elements to 1s */
545
+ vext_set_elems_1s(vd, vma, i * esz, (i + 1) * esz);
197
+ continue;
546
+ continue;
198
+ }
547
+ }
199
+ if (i < first_hartid) {
548
+ fn(vd, vs1, vs2, i);
200
+ first_hartid = i;
201
+ }
202
+ }
549
+ }
203
+
550
+ env->vstart = 0;
204
+ return (first_hartid < ms->smp.cpus) ? first_hartid : -1;
551
+ /* set tail elements to 1s */
205
+}
552
+ vext_set_elems_1s(vd, vta, vl * esz, total_elems * esz);
206
+
553
+}
207
+int riscv_socket_last_hartid(const MachineState *ms, int socket_id)
554
+
208
+{
555
+void do_vext_vx(void *vd, void *v0, target_long s1, void *vs2,
209
+ int i, last_hartid = -1;
556
+ CPURISCVState *env, uint32_t desc,
210
+
557
+ opivx2_fn fn, uint32_t esz)
211
+ if (!numa_enabled(ms)) {
558
+{
212
+ return (!socket_id) ? ms->smp.cpus - 1 : -1;
559
+ uint32_t vm = vext_vm(desc);
213
+ }
560
+ uint32_t vl = env->vl;
214
+
561
+ uint32_t total_elems = vext_get_total_elems(env, desc, esz);
215
+ for (i = 0; i < ms->smp.cpus; i++) {
562
+ uint32_t vta = vext_vta(desc);
216
+ if (ms->possible_cpus->cpus[i].props.node_id != socket_id) {
563
+ uint32_t vma = vext_vma(desc);
564
+ uint32_t i;
565
+
566
+ for (i = env->vstart; i < vl; i++) {
567
+ if (!vm && !vext_elem_mask(v0, i)) {
568
+ /* set masked-off elements to 1s */
569
+ vext_set_elems_1s(vd, vma, i * esz, (i + 1) * esz);
217
+ continue;
570
+ continue;
218
+ }
571
+ }
219
+ if (i > last_hartid) {
572
+ fn(vd, s1, vs2, i);
220
+ last_hartid = i;
221
+ }
222
+ }
573
+ }
223
+
574
+ env->vstart = 0;
224
+ return (last_hartid < ms->smp.cpus) ? last_hartid : -1;
575
+ /* set tail elements to 1s */
225
+}
576
+ vext_set_elems_1s(vd, vta, vl * esz, total_elems * esz);
226
+
577
+}
227
+int riscv_socket_hart_count(const MachineState *ms, int socket_id)
578
diff --git a/target/riscv/meson.build b/target/riscv/meson.build
228
+{
229
+ int first_hartid, last_hartid;
230
+
231
+ if (!numa_enabled(ms)) {
232
+ return (!socket_id) ? ms->smp.cpus : -1;
233
+ }
234
+
235
+ first_hartid = riscv_socket_first_hartid(ms, socket_id);
236
+ if (first_hartid < 0) {
237
+ return -1;
238
+ }
239
+
240
+ last_hartid = riscv_socket_last_hartid(ms, socket_id);
241
+ if (last_hartid < 0) {
242
+ return -1;
243
+ }
244
+
245
+ if (first_hartid > last_hartid) {
246
+ return -1;
247
+ }
248
+
249
+ return last_hartid - first_hartid + 1;
250
+}
251
+
252
+bool riscv_socket_check_hartids(const MachineState *ms, int socket_id)
253
+{
254
+ int i, first_hartid, last_hartid;
255
+
256
+ if (!numa_enabled(ms)) {
257
+ return (!socket_id) ? true : false;
258
+ }
259
+
260
+ first_hartid = riscv_socket_first_hartid(ms, socket_id);
261
+ if (first_hartid < 0) {
262
+ return false;
263
+ }
264
+
265
+ last_hartid = riscv_socket_last_hartid(ms, socket_id);
266
+ if (last_hartid < 0) {
267
+ return false;
268
+ }
269
+
270
+ for (i = first_hartid; i <= last_hartid; i++) {
271
+ if (ms->possible_cpus->cpus[i].props.node_id != socket_id) {
272
+ return false;
273
+ }
274
+ }
275
+
276
+ return true;
277
+}
278
+
279
+uint64_t riscv_socket_mem_offset(const MachineState *ms, int socket_id)
280
+{
281
+ int i;
282
+ uint64_t mem_offset = 0;
283
+
284
+ if (!numa_enabled(ms)) {
285
+ return 0;
286
+ }
287
+
288
+ for (i = 0; i < ms->numa_state->num_nodes; i++) {
289
+ if (i == socket_id) {
290
+ break;
291
+ }
292
+ mem_offset += ms->numa_state->nodes[i].node_mem;
293
+ }
294
+
295
+ return (i == socket_id) ? mem_offset : 0;
296
+}
297
+
298
+uint64_t riscv_socket_mem_size(const MachineState *ms, int socket_id)
299
+{
300
+ if (!numa_enabled(ms)) {
301
+ return (!socket_id) ? ms->ram_size : 0;
302
+ }
303
+
304
+ return (socket_id < ms->numa_state->num_nodes) ?
305
+ ms->numa_state->nodes[socket_id].node_mem : 0;
306
+}
307
+
308
+void riscv_socket_fdt_write_id(const MachineState *ms, void *fdt,
309
+ const char *node_name, int socket_id)
310
+{
311
+ if (numa_enabled(ms)) {
312
+ qemu_fdt_setprop_cell(fdt, node_name, "numa-node-id", socket_id);
313
+ }
314
+}
315
+
316
+void riscv_socket_fdt_write_distance_matrix(const MachineState *ms, void *fdt)
317
+{
318
+ int i, j, idx;
319
+ uint32_t *dist_matrix, dist_matrix_size;
320
+
321
+ if (numa_enabled(ms) && ms->numa_state->have_numa_distance) {
322
+ dist_matrix_size = riscv_socket_count(ms) * riscv_socket_count(ms);
323
+ dist_matrix_size *= (3 * sizeof(uint32_t));
324
+ dist_matrix = g_malloc0(dist_matrix_size);
325
+
326
+ for (i = 0; i < riscv_socket_count(ms); i++) {
327
+ for (j = 0; j < riscv_socket_count(ms); j++) {
328
+ idx = (i * riscv_socket_count(ms) + j) * 3;
329
+ dist_matrix[idx + 0] = cpu_to_be32(i);
330
+ dist_matrix[idx + 1] = cpu_to_be32(j);
331
+ dist_matrix[idx + 2] =
332
+ cpu_to_be32(ms->numa_state->nodes[i].distance[j]);
333
+ }
334
+ }
335
+
336
+ qemu_fdt_add_subnode(fdt, "/distance-map");
337
+ qemu_fdt_setprop_string(fdt, "/distance-map", "compatible",
338
+ "numa-distance-map-v1");
339
+ qemu_fdt_setprop(fdt, "/distance-map", "distance-matrix",
340
+ dist_matrix, dist_matrix_size);
341
+ g_free(dist_matrix);
342
+ }
343
+}
344
+
345
+CpuInstanceProperties
346
+riscv_numa_cpu_index_to_props(MachineState *ms, unsigned cpu_index)
347
+{
348
+ MachineClass *mc = MACHINE_GET_CLASS(ms);
349
+ const CPUArchIdList *possible_cpus = mc->possible_cpu_arch_ids(ms);
350
+
351
+ assert(cpu_index < possible_cpus->len);
352
+ return possible_cpus->cpus[cpu_index].props;
353
+}
354
+
355
+int64_t riscv_numa_get_default_cpu_node_id(const MachineState *ms, int idx)
356
+{
357
+ int64_t nidx = 0;
358
+
359
+ if (ms->numa_state->num_nodes) {
360
+ nidx = idx / (ms->smp.cpus / ms->numa_state->num_nodes);
361
+ if (ms->numa_state->num_nodes <= nidx) {
362
+ nidx = ms->numa_state->num_nodes - 1;
363
+ }
364
+ }
365
+
366
+ return nidx;
367
+}
368
+
369
+const CPUArchIdList *riscv_numa_possible_cpu_arch_ids(MachineState *ms)
370
+{
371
+ int n;
372
+ unsigned int max_cpus = ms->smp.max_cpus;
373
+
374
+ if (ms->possible_cpus) {
375
+ assert(ms->possible_cpus->len == max_cpus);
376
+ return ms->possible_cpus;
377
+ }
378
+
379
+ ms->possible_cpus = g_malloc0(sizeof(CPUArchIdList) +
380
+ sizeof(CPUArchId) * max_cpus);
381
+ ms->possible_cpus->len = max_cpus;
382
+ for (n = 0; n < ms->possible_cpus->len; n++) {
383
+ ms->possible_cpus->cpus[n].type = ms->cpu_type;
384
+ ms->possible_cpus->cpus[n].arch_id = n;
385
+ ms->possible_cpus->cpus[n].props.has_core_id = true;
386
+ ms->possible_cpus->cpus[n].props.core_id = n;
387
+ }
388
+
389
+ return ms->possible_cpus;
390
+}
391
diff --git a/hw/riscv/meson.build b/hw/riscv/meson.build
392
index XXXXXXX..XXXXXXX 100644
579
index XXXXXXX..XXXXXXX 100644
393
--- a/hw/riscv/meson.build
580
--- a/target/riscv/meson.build
394
+++ b/hw/riscv/meson.build
581
+++ b/target/riscv/meson.build
395
@@ -XXX,XX +XXX,XX @@
582
@@ -XXX,XX +XXX,XX @@ riscv_ss.add(files(
396
riscv_ss = ss.source_set()
583
'gdbstub.c',
397
riscv_ss.add(files('boot.c'))
584
'op_helper.c',
398
+riscv_ss.add(files('numa.c'))
585
'vector_helper.c',
399
riscv_ss.add(when: 'CONFIG_HART', if_true: files('riscv_hart.c'))
586
+ 'vector_internals.c',
400
riscv_ss.add(when: 'CONFIG_OPENTITAN', if_true: files('opentitan.c'))
587
'bitmanip_helper.c',
401
riscv_ss.add(when: 'CONFIG_RISCV_VIRT', if_true: files('virt.c'))
588
'translate.c',
589
'm128_helper.c',
402
--
590
--
403
2.28.0
591
2.41.0
404
405
diff view generated by jsdifflib
New patch
1
From: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
1
2
3
Refactor the non SEW-specific stuff out of `GEN_OPIVV_TRANS` into
4
function `opivv_trans` (similar to `opivi_trans`). `opivv_trans` will be
5
used in proceeding vector-crypto commits.
6
7
Signed-off-by: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
9
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
10
Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn>
11
Signed-off-by: Max Chou <max.chou@sifive.com>
12
Message-ID: <20230711165917.2629866-3-max.chou@sifive.com>
13
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
14
---
15
target/riscv/insn_trans/trans_rvv.c.inc | 62 +++++++++++++------------
16
1 file changed, 32 insertions(+), 30 deletions(-)
17
18
diff --git a/target/riscv/insn_trans/trans_rvv.c.inc b/target/riscv/insn_trans/trans_rvv.c.inc
19
index XXXXXXX..XXXXXXX 100644
20
--- a/target/riscv/insn_trans/trans_rvv.c.inc
21
+++ b/target/riscv/insn_trans/trans_rvv.c.inc
22
@@ -XXX,XX +XXX,XX @@ GEN_OPIWX_WIDEN_TRANS(vwadd_wx)
23
GEN_OPIWX_WIDEN_TRANS(vwsubu_wx)
24
GEN_OPIWX_WIDEN_TRANS(vwsub_wx)
25
26
+static bool opivv_trans(uint32_t vd, uint32_t vs1, uint32_t vs2, uint32_t vm,
27
+ gen_helper_gvec_4_ptr *fn, DisasContext *s)
28
+{
29
+ uint32_t data = 0;
30
+ TCGLabel *over = gen_new_label();
31
+ tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
32
+ tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
33
+
34
+ data = FIELD_DP32(data, VDATA, VM, vm);
35
+ data = FIELD_DP32(data, VDATA, LMUL, s->lmul);
36
+ data = FIELD_DP32(data, VDATA, VTA, s->vta);
37
+ data = FIELD_DP32(data, VDATA, VTA_ALL_1S, s->cfg_vta_all_1s);
38
+ data = FIELD_DP32(data, VDATA, VMA, s->vma);
39
+ tcg_gen_gvec_4_ptr(vreg_ofs(s, vd), vreg_ofs(s, 0), vreg_ofs(s, vs1),
40
+ vreg_ofs(s, vs2), cpu_env, s->cfg_ptr->vlen / 8,
41
+ s->cfg_ptr->vlen / 8, data, fn);
42
+ mark_vs_dirty(s);
43
+ gen_set_label(over);
44
+ return true;
45
+}
46
+
47
/* Vector Integer Add-with-Carry / Subtract-with-Borrow Instructions */
48
/* OPIVV without GVEC IR */
49
-#define GEN_OPIVV_TRANS(NAME, CHECK) \
50
-static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
51
-{ \
52
- if (CHECK(s, a)) { \
53
- uint32_t data = 0; \
54
- static gen_helper_gvec_4_ptr * const fns[4] = { \
55
- gen_helper_##NAME##_b, gen_helper_##NAME##_h, \
56
- gen_helper_##NAME##_w, gen_helper_##NAME##_d, \
57
- }; \
58
- TCGLabel *over = gen_new_label(); \
59
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
60
- tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
61
- \
62
- data = FIELD_DP32(data, VDATA, VM, a->vm); \
63
- data = FIELD_DP32(data, VDATA, LMUL, s->lmul); \
64
- data = FIELD_DP32(data, VDATA, VTA, s->vta); \
65
- data = \
66
- FIELD_DP32(data, VDATA, VTA_ALL_1S, s->cfg_vta_all_1s);\
67
- data = FIELD_DP32(data, VDATA, VMA, s->vma); \
68
- tcg_gen_gvec_4_ptr(vreg_ofs(s, a->rd), vreg_ofs(s, 0), \
69
- vreg_ofs(s, a->rs1), \
70
- vreg_ofs(s, a->rs2), cpu_env, \
71
- s->cfg_ptr->vlen / 8, \
72
- s->cfg_ptr->vlen / 8, data, \
73
- fns[s->sew]); \
74
- mark_vs_dirty(s); \
75
- gen_set_label(over); \
76
- return true; \
77
- } \
78
- return false; \
79
+#define GEN_OPIVV_TRANS(NAME, CHECK) \
80
+static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
81
+{ \
82
+ if (CHECK(s, a)) { \
83
+ static gen_helper_gvec_4_ptr * const fns[4] = { \
84
+ gen_helper_##NAME##_b, gen_helper_##NAME##_h, \
85
+ gen_helper_##NAME##_w, gen_helper_##NAME##_d, \
86
+ }; \
87
+ return opivv_trans(a->rd, a->rs1, a->rs2, a->vm, fns[s->sew], s);\
88
+ } \
89
+ return false; \
90
}
91
92
/*
93
--
94
2.41.0
diff view generated by jsdifflib
New patch
1
From: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
1
2
3
Remove the redundant "vl == 0" check which is already included within the vstart >= vl check, when vl == 0.
4
5
Signed-off-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
6
Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn>
7
Signed-off-by: Max Chou <max.chou@sifive.com>
8
Acked-by: Alistair Francis <alistair.francis@wdc.com>
9
Message-ID: <20230711165917.2629866-4-max.chou@sifive.com>
10
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
11
---
12
target/riscv/insn_trans/trans_rvv.c.inc | 31 +------------------------
13
1 file changed, 1 insertion(+), 30 deletions(-)
14
15
diff --git a/target/riscv/insn_trans/trans_rvv.c.inc b/target/riscv/insn_trans/trans_rvv.c.inc
16
index XXXXXXX..XXXXXXX 100644
17
--- a/target/riscv/insn_trans/trans_rvv.c.inc
18
+++ b/target/riscv/insn_trans/trans_rvv.c.inc
19
@@ -XXX,XX +XXX,XX @@ static bool ldst_us_trans(uint32_t vd, uint32_t rs1, uint32_t data,
20
TCGv_i32 desc;
21
22
TCGLabel *over = gen_new_label();
23
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
24
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
25
26
dest = tcg_temp_new_ptr();
27
@@ -XXX,XX +XXX,XX @@ static bool ldst_stride_trans(uint32_t vd, uint32_t rs1, uint32_t rs2,
28
TCGv_i32 desc;
29
30
TCGLabel *over = gen_new_label();
31
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
32
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
33
34
dest = tcg_temp_new_ptr();
35
@@ -XXX,XX +XXX,XX @@ static bool ldst_index_trans(uint32_t vd, uint32_t rs1, uint32_t vs2,
36
TCGv_i32 desc;
37
38
TCGLabel *over = gen_new_label();
39
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
40
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
41
42
dest = tcg_temp_new_ptr();
43
@@ -XXX,XX +XXX,XX @@ static bool ldff_trans(uint32_t vd, uint32_t rs1, uint32_t data,
44
TCGv_i32 desc;
45
46
TCGLabel *over = gen_new_label();
47
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
48
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
49
50
dest = tcg_temp_new_ptr();
51
@@ -XXX,XX +XXX,XX @@ do_opivv_gvec(DisasContext *s, arg_rmrr *a, GVecGen3Fn *gvec_fn,
52
return false;
53
}
54
55
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
56
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
57
58
if (a->vm && s->vl_eq_vlmax && !(s->vta && s->lmul < 0)) {
59
@@ -XXX,XX +XXX,XX @@ static bool opivx_trans(uint32_t vd, uint32_t rs1, uint32_t vs2, uint32_t vm,
60
uint32_t data = 0;
61
62
TCGLabel *over = gen_new_label();
63
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
64
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
65
66
dest = tcg_temp_new_ptr();
67
@@ -XXX,XX +XXX,XX @@ static bool opivi_trans(uint32_t vd, uint32_t imm, uint32_t vs2, uint32_t vm,
68
uint32_t data = 0;
69
70
TCGLabel *over = gen_new_label();
71
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
72
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
73
74
dest = tcg_temp_new_ptr();
75
@@ -XXX,XX +XXX,XX @@ static bool do_opivv_widen(DisasContext *s, arg_rmrr *a,
76
if (checkfn(s, a)) {
77
uint32_t data = 0;
78
TCGLabel *over = gen_new_label();
79
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
80
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
81
82
data = FIELD_DP32(data, VDATA, VM, a->vm);
83
@@ -XXX,XX +XXX,XX @@ static bool do_opiwv_widen(DisasContext *s, arg_rmrr *a,
84
if (opiwv_widen_check(s, a)) {
85
uint32_t data = 0;
86
TCGLabel *over = gen_new_label();
87
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
88
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
89
90
data = FIELD_DP32(data, VDATA, VM, a->vm);
91
@@ -XXX,XX +XXX,XX @@ static bool opivv_trans(uint32_t vd, uint32_t vs1, uint32_t vs2, uint32_t vm,
92
{
93
uint32_t data = 0;
94
TCGLabel *over = gen_new_label();
95
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
96
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
97
98
data = FIELD_DP32(data, VDATA, VM, vm);
99
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
100
gen_helper_##NAME##_w, \
101
}; \
102
TCGLabel *over = gen_new_label(); \
103
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
104
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
105
\
106
data = FIELD_DP32(data, VDATA, VM, a->vm); \
107
@@ -XXX,XX +XXX,XX @@ static bool trans_vmv_v_v(DisasContext *s, arg_vmv_v_v *a)
108
gen_helper_vmv_v_v_w, gen_helper_vmv_v_v_d,
109
};
110
TCGLabel *over = gen_new_label();
111
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
112
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
113
114
tcg_gen_gvec_2_ptr(vreg_ofs(s, a->rd), vreg_ofs(s, a->rs1),
115
@@ -XXX,XX +XXX,XX @@ static bool trans_vmv_v_x(DisasContext *s, arg_vmv_v_x *a)
116
vext_check_ss(s, a->rd, 0, 1)) {
117
TCGv s1;
118
TCGLabel *over = gen_new_label();
119
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
120
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
121
122
s1 = get_gpr(s, a->rs1, EXT_SIGN);
123
@@ -XXX,XX +XXX,XX @@ static bool trans_vmv_v_i(DisasContext *s, arg_vmv_v_i *a)
124
gen_helper_vmv_v_x_w, gen_helper_vmv_v_x_d,
125
};
126
TCGLabel *over = gen_new_label();
127
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
128
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
129
130
s1 = tcg_constant_i64(simm);
131
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
132
}; \
133
TCGLabel *over = gen_new_label(); \
134
gen_set_rm(s, RISCV_FRM_DYN); \
135
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
136
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
137
\
138
data = FIELD_DP32(data, VDATA, VM, a->vm); \
139
@@ -XXX,XX +XXX,XX @@ static bool opfvf_trans(uint32_t vd, uint32_t rs1, uint32_t vs2,
140
TCGv_i64 t1;
141
142
TCGLabel *over = gen_new_label();
143
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
144
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
145
146
dest = tcg_temp_new_ptr();
147
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
148
}; \
149
TCGLabel *over = gen_new_label(); \
150
gen_set_rm(s, RISCV_FRM_DYN); \
151
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
152
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);\
153
\
154
data = FIELD_DP32(data, VDATA, VM, a->vm); \
155
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
156
}; \
157
TCGLabel *over = gen_new_label(); \
158
gen_set_rm(s, RISCV_FRM_DYN); \
159
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
160
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
161
\
162
data = FIELD_DP32(data, VDATA, VM, a->vm); \
163
@@ -XXX,XX +XXX,XX @@ static bool do_opfv(DisasContext *s, arg_rmr *a,
164
uint32_t data = 0;
165
TCGLabel *over = gen_new_label();
166
gen_set_rm_chkfrm(s, rm);
167
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
168
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
169
170
data = FIELD_DP32(data, VDATA, VM, a->vm);
171
@@ -XXX,XX +XXX,XX @@ static bool trans_vfmv_v_f(DisasContext *s, arg_vfmv_v_f *a)
172
gen_helper_vmv_v_x_d,
173
};
174
TCGLabel *over = gen_new_label();
175
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
176
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
177
178
t1 = tcg_temp_new_i64();
179
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmr *a) \
180
}; \
181
TCGLabel *over = gen_new_label(); \
182
gen_set_rm_chkfrm(s, FRM); \
183
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
184
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
185
\
186
data = FIELD_DP32(data, VDATA, VM, a->vm); \
187
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmr *a) \
188
}; \
189
TCGLabel *over = gen_new_label(); \
190
gen_set_rm(s, RISCV_FRM_DYN); \
191
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
192
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
193
\
194
data = FIELD_DP32(data, VDATA, VM, a->vm); \
195
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmr *a) \
196
}; \
197
TCGLabel *over = gen_new_label(); \
198
gen_set_rm_chkfrm(s, FRM); \
199
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
200
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
201
\
202
data = FIELD_DP32(data, VDATA, VM, a->vm); \
203
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmr *a) \
204
}; \
205
TCGLabel *over = gen_new_label(); \
206
gen_set_rm_chkfrm(s, FRM); \
207
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
208
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
209
\
210
data = FIELD_DP32(data, VDATA, VM, a->vm); \
211
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_r *a) \
212
uint32_t data = 0; \
213
gen_helper_gvec_4_ptr *fn = gen_helper_##NAME; \
214
TCGLabel *over = gen_new_label(); \
215
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over); \
216
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
217
\
218
data = FIELD_DP32(data, VDATA, LMUL, s->lmul); \
219
@@ -XXX,XX +XXX,XX @@ static bool trans_vid_v(DisasContext *s, arg_vid_v *a)
220
require_vm(a->vm, a->rd)) {
221
uint32_t data = 0;
222
TCGLabel *over = gen_new_label();
223
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
224
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
225
226
data = FIELD_DP32(data, VDATA, VM, a->vm);
227
@@ -XXX,XX +XXX,XX @@ static bool trans_vmv_s_x(DisasContext *s, arg_vmv_s_x *a)
228
TCGv s1;
229
TCGLabel *over = gen_new_label();
230
231
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
232
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
233
234
t1 = tcg_temp_new_i64();
235
@@ -XXX,XX +XXX,XX @@ static bool trans_vfmv_s_f(DisasContext *s, arg_vfmv_s_f *a)
236
TCGv_i64 t1;
237
TCGLabel *over = gen_new_label();
238
239
- /* if vl == 0 or vstart >= vl, skip vector register write back */
240
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
241
+ /* if vstart >= vl, skip vector register write back */
242
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
243
244
/* NaN-box f[rs1] */
245
@@ -XXX,XX +XXX,XX @@ static bool int_ext_op(DisasContext *s, arg_rmr *a, uint8_t seq)
246
uint32_t data = 0;
247
gen_helper_gvec_3_ptr *fn;
248
TCGLabel *over = gen_new_label();
249
- tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_vl, 0, over);
250
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
251
252
static gen_helper_gvec_3_ptr * const fns[6][4] = {
253
--
254
2.41.0
diff view generated by jsdifflib
1
From: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
2
3
This commit adds support for the Zvbc vector-crypto extension, which
4
consists of the following instructions:
5
6
* vclmulh.[vx,vv]
7
* vclmul.[vx,vv]
8
9
Translation functions are defined in
10
`target/riscv/insn_trans/trans_rvvk.c.inc` and helpers are defined in
11
`target/riscv/vcrypto_helper.c`.
12
13
Co-authored-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
14
Co-authored-by: Max Chou <max.chou@sifive.com>
15
Signed-off-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
16
Signed-off-by: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
17
Signed-off-by: Max Chou <max.chou@sifive.com>
18
[max.chou@sifive.com: Exposed x-zvbc property]
19
Message-ID: <20230711165917.2629866-5-max.chou@sifive.com>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
20
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: e7e4e801234f2934306e734f65860f601a5745bd.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <e7e4e801234f2934306e734f65860f601a5745bd.1597259519.git.alistair.francis@wdc.com>
4
---
21
---
5
target/riscv/cpu_bits.h | 1 +
22
target/riscv/cpu_cfg.h | 1 +
6
target/riscv/cpu_helper.c | 16 ++++++----------
23
target/riscv/helper.h | 6 +++
7
target/riscv/op_helper.c | 8 ++------
24
target/riscv/insn32.decode | 6 +++
8
target/riscv/translate.c | 10 ----------
25
target/riscv/cpu.c | 9 ++++
9
4 files changed, 9 insertions(+), 26 deletions(-)
26
target/riscv/translate.c | 1 +
10
27
target/riscv/vcrypto_helper.c | 59 ++++++++++++++++++++++
11
diff --git a/target/riscv/cpu_bits.h b/target/riscv/cpu_bits.h
28
target/riscv/insn_trans/trans_rvvk.c.inc | 62 ++++++++++++++++++++++++
12
index XXXXXXX..XXXXXXX 100644
29
target/riscv/meson.build | 3 +-
13
--- a/target/riscv/cpu_bits.h
30
8 files changed, 146 insertions(+), 1 deletion(-)
14
+++ b/target/riscv/cpu_bits.h
31
create mode 100644 target/riscv/vcrypto_helper.c
15
@@ -XXX,XX +XXX,XX @@
32
create mode 100644 target/riscv/insn_trans/trans_rvvk.c.inc
16
#define HSTATUS_VTSR 0x00400000
33
17
#define HSTATUS_HU 0x00000200
34
diff --git a/target/riscv/cpu_cfg.h b/target/riscv/cpu_cfg.h
18
#define HSTATUS_GVA 0x00000040
35
index XXXXXXX..XXXXXXX 100644
19
+#define HSTATUS_SPVP 0x00000100
36
--- a/target/riscv/cpu_cfg.h
20
37
+++ b/target/riscv/cpu_cfg.h
21
#define HSTATUS32_WPRI 0xFF8FF87E
38
@@ -XXX,XX +XXX,XX @@ struct RISCVCPUConfig {
22
#define HSTATUS64_WPRI 0xFFFFFFFFFF8FF87EULL
39
bool ext_zve32f;
23
diff --git a/target/riscv/cpu_helper.c b/target/riscv/cpu_helper.c
40
bool ext_zve64f;
24
index XXXXXXX..XXXXXXX 100644
41
bool ext_zve64d;
25
--- a/target/riscv/cpu_helper.c
42
+ bool ext_zvbc;
26
+++ b/target/riscv/cpu_helper.c
43
bool ext_zmmul;
27
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_do_interrupt(CPUState *cs)
44
bool ext_zvfbfmin;
28
} else if (riscv_cpu_virt_enabled(env)) {
45
bool ext_zvfbfwma;
29
/* Trap into HS mode, from virt */
46
diff --git a/target/riscv/helper.h b/target/riscv/helper.h
30
riscv_cpu_swap_hypervisor_regs(env);
47
index XXXXXXX..XXXXXXX 100644
31
- env->hstatus = set_field(env->hstatus, HSTATUS_SP2V,
48
--- a/target/riscv/helper.h
32
- get_field(env->hstatus, HSTATUS_SPV));
49
+++ b/target/riscv/helper.h
33
- env->hstatus = set_field(env->hstatus, HSTATUS_SP2P,
50
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_5(vfwcvtbf16_f_f_v, void, ptr, ptr, ptr, env, i32)
34
+ env->hstatus = set_field(env->hstatus, HSTATUS_SPVP,
51
35
get_field(env->mstatus, SSTATUS_SPP));
52
DEF_HELPER_6(vfwmaccbf16_vv, void, ptr, ptr, ptr, ptr, env, i32)
36
env->hstatus = set_field(env->hstatus, HSTATUS_SPV,
53
DEF_HELPER_6(vfwmaccbf16_vf, void, ptr, ptr, i64, ptr, env, i32)
37
riscv_cpu_virt_enabled(env));
54
+
38
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_do_interrupt(CPUState *cs)
55
+/* Vector crypto functions */
39
riscv_cpu_set_force_hs_excep(env, 0);
56
+DEF_HELPER_6(vclmul_vv, void, ptr, ptr, ptr, ptr, env, i32)
40
} else {
57
+DEF_HELPER_6(vclmul_vx, void, ptr, ptr, tl, ptr, env, i32)
41
/* Trap into HS mode */
58
+DEF_HELPER_6(vclmulh_vv, void, ptr, ptr, ptr, ptr, env, i32)
42
- env->hstatus = set_field(env->hstatus, HSTATUS_SP2V,
59
+DEF_HELPER_6(vclmulh_vx, void, ptr, ptr, tl, ptr, env, i32)
43
- get_field(env->hstatus, HSTATUS_SPV));
60
diff --git a/target/riscv/insn32.decode b/target/riscv/insn32.decode
44
- env->hstatus = set_field(env->hstatus, HSTATUS_SP2P,
61
index XXXXXXX..XXXXXXX 100644
45
- get_field(env->mstatus, SSTATUS_SPP));
62
--- a/target/riscv/insn32.decode
46
- env->hstatus = set_field(env->hstatus, HSTATUS_SPV,
63
+++ b/target/riscv/insn32.decode
47
- riscv_cpu_virt_enabled(env));
64
@@ -XXX,XX +XXX,XX @@ vfwcvtbf16_f_f_v 010010 . ..... 01101 001 ..... 1010111 @r2_vm
48
-
65
# *** Zvfbfwma Standard Extension ***
49
+ if (!riscv_cpu_two_stage_lookup(env)) {
66
vfwmaccbf16_vv 111011 . ..... ..... 001 ..... 1010111 @r_vm
50
+ env->hstatus = set_field(env->hstatus, HSTATUS_SPV,
67
vfwmaccbf16_vf 111011 . ..... ..... 101 ..... 1010111 @r_vm
51
+ riscv_cpu_virt_enabled(env));
68
+
52
+ }
69
+# *** Zvbc vector crypto extension ***
53
+ riscv_cpu_set_two_stage_lookup(env, false);
70
+vclmul_vv 001100 . ..... ..... 010 ..... 1010111 @r_vm
54
htval = env->guest_phys_fault_addr;
71
+vclmul_vx 001100 . ..... ..... 110 ..... 1010111 @r_vm
55
}
72
+vclmulh_vv 001101 . ..... ..... 010 ..... 1010111 @r_vm
56
}
73
+vclmulh_vx 001101 . ..... ..... 110 ..... 1010111 @r_vm
57
diff --git a/target/riscv/op_helper.c b/target/riscv/op_helper.c
74
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
58
index XXXXXXX..XXXXXXX 100644
75
index XXXXXXX..XXXXXXX 100644
59
--- a/target/riscv/op_helper.c
76
--- a/target/riscv/cpu.c
60
+++ b/target/riscv/op_helper.c
77
+++ b/target/riscv/cpu.c
61
@@ -XXX,XX +XXX,XX @@ target_ulong helper_sret(CPURISCVState *env, target_ulong cpu_pc_deb)
78
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
62
prev_priv = get_field(mstatus, MSTATUS_SPP);
79
ISA_EXT_DATA_ENTRY(zksed, PRIV_VERSION_1_12_0, ext_zksed),
63
prev_virt = get_field(hstatus, HSTATUS_SPV);
80
ISA_EXT_DATA_ENTRY(zksh, PRIV_VERSION_1_12_0, ext_zksh),
64
81
ISA_EXT_DATA_ENTRY(zkt, PRIV_VERSION_1_12_0, ext_zkt),
65
- hstatus = set_field(hstatus, HSTATUS_SPV,
82
+ ISA_EXT_DATA_ENTRY(zvbc, PRIV_VERSION_1_12_0, ext_zvbc),
66
- get_field(hstatus, HSTATUS_SP2V));
83
ISA_EXT_DATA_ENTRY(zve32f, PRIV_VERSION_1_10_0, ext_zve32f),
67
- mstatus = set_field(mstatus, MSTATUS_SPP,
84
ISA_EXT_DATA_ENTRY(zve64f, PRIV_VERSION_1_10_0, ext_zve64f),
68
- get_field(hstatus, HSTATUS_SP2P));
85
ISA_EXT_DATA_ENTRY(zve64d, PRIV_VERSION_1_10_0, ext_zve64d),
69
- hstatus = set_field(hstatus, HSTATUS_SP2V, 0);
86
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_validate_set_extensions(RISCVCPU *cpu, Error **errp)
70
- hstatus = set_field(hstatus, HSTATUS_SP2P, 0);
87
return;
71
+ hstatus = set_field(hstatus, HSTATUS_SPV, 0);
88
}
72
+ mstatus = set_field(mstatus, MSTATUS_SPP, 0);
89
73
mstatus = set_field(mstatus, SSTATUS_SIE,
90
+ if (cpu->cfg.ext_zvbc && !cpu->cfg.ext_zve64f) {
74
get_field(mstatus, SSTATUS_SPIE));
91
+ error_setg(errp, "Zvbc extension requires V or Zve64{f,d} extensions");
75
mstatus = set_field(mstatus, SSTATUS_SPIE, 1);
92
+ return;
93
+ }
94
+
95
if (cpu->cfg.ext_zk) {
96
cpu->cfg.ext_zkn = true;
97
cpu->cfg.ext_zkr = true;
98
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
99
DEFINE_PROP_BOOL("x-zvfbfmin", RISCVCPU, cfg.ext_zvfbfmin, false),
100
DEFINE_PROP_BOOL("x-zvfbfwma", RISCVCPU, cfg.ext_zvfbfwma, false),
101
102
+ /* Vector cryptography extensions */
103
+ DEFINE_PROP_BOOL("x-zvbc", RISCVCPU, cfg.ext_zvbc, false),
104
+
105
DEFINE_PROP_END_OF_LIST(),
106
};
107
76
diff --git a/target/riscv/translate.c b/target/riscv/translate.c
108
diff --git a/target/riscv/translate.c b/target/riscv/translate.c
77
index XXXXXXX..XXXXXXX 100644
109
index XXXXXXX..XXXXXXX 100644
78
--- a/target/riscv/translate.c
110
--- a/target/riscv/translate.c
79
+++ b/target/riscv/translate.c
111
+++ b/target/riscv/translate.c
80
@@ -XXX,XX +XXX,XX @@ static void riscv_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs)
112
@@ -XXX,XX +XXX,XX @@ static uint32_t opcode_at(DisasContextBase *dcbase, target_ulong pc)
81
#if !defined(CONFIG_USER_ONLY)
113
#include "insn_trans/trans_rvzfa.c.inc"
82
if (riscv_has_ext(env, RVH)) {
114
#include "insn_trans/trans_rvzfh.c.inc"
83
ctx->virt_enabled = riscv_cpu_virt_enabled(env);
115
#include "insn_trans/trans_rvk.c.inc"
84
- if (env->priv_ver == PRV_M &&
116
+#include "insn_trans/trans_rvvk.c.inc"
85
- get_field(env->mstatus, MSTATUS_MPRV) &&
117
#include "insn_trans/trans_privileged.c.inc"
86
- MSTATUS_MPV_ISSET(env)) {
118
#include "insn_trans/trans_svinval.c.inc"
87
- ctx->virt_enabled = true;
119
#include "insn_trans/trans_rvbf16.c.inc"
88
- } else if (env->priv == PRV_S &&
120
diff --git a/target/riscv/vcrypto_helper.c b/target/riscv/vcrypto_helper.c
89
- !riscv_cpu_virt_enabled(env) &&
121
new file mode 100644
90
- get_field(env->hstatus, HSTATUS_SPRV) &&
122
index XXXXXXX..XXXXXXX
91
- get_field(env->hstatus, HSTATUS_SPV)) {
123
--- /dev/null
92
- ctx->virt_enabled = true;
124
+++ b/target/riscv/vcrypto_helper.c
93
- }
125
@@ -XXX,XX +XXX,XX @@
94
} else {
126
+/*
95
ctx->virt_enabled = false;
127
+ * RISC-V Vector Crypto Extension Helpers for QEMU.
96
}
128
+ *
129
+ * Copyright (C) 2023 SiFive, Inc.
130
+ * Written by Codethink Ltd and SiFive.
131
+ *
132
+ * This program is free software; you can redistribute it and/or modify it
133
+ * under the terms and conditions of the GNU General Public License,
134
+ * version 2 or later, as published by the Free Software Foundation.
135
+ *
136
+ * This program is distributed in the hope it will be useful, but WITHOUT
137
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
138
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
139
+ * more details.
140
+ *
141
+ * You should have received a copy of the GNU General Public License along with
142
+ * this program. If not, see <http://www.gnu.org/licenses/>.
143
+ */
144
+
145
+#include "qemu/osdep.h"
146
+#include "qemu/host-utils.h"
147
+#include "qemu/bitops.h"
148
+#include "cpu.h"
149
+#include "exec/memop.h"
150
+#include "exec/exec-all.h"
151
+#include "exec/helper-proto.h"
152
+#include "internals.h"
153
+#include "vector_internals.h"
154
+
155
+static uint64_t clmul64(uint64_t y, uint64_t x)
156
+{
157
+ uint64_t result = 0;
158
+ for (int j = 63; j >= 0; j--) {
159
+ if ((y >> j) & 1) {
160
+ result ^= (x << j);
161
+ }
162
+ }
163
+ return result;
164
+}
165
+
166
+static uint64_t clmulh64(uint64_t y, uint64_t x)
167
+{
168
+ uint64_t result = 0;
169
+ for (int j = 63; j >= 1; j--) {
170
+ if ((y >> j) & 1) {
171
+ result ^= (x >> (64 - j));
172
+ }
173
+ }
174
+ return result;
175
+}
176
+
177
+RVVCALL(OPIVV2, vclmul_vv, OP_UUU_D, H8, H8, H8, clmul64)
178
+GEN_VEXT_VV(vclmul_vv, 8)
179
+RVVCALL(OPIVX2, vclmul_vx, OP_UUU_D, H8, H8, clmul64)
180
+GEN_VEXT_VX(vclmul_vx, 8)
181
+RVVCALL(OPIVV2, vclmulh_vv, OP_UUU_D, H8, H8, H8, clmulh64)
182
+GEN_VEXT_VV(vclmulh_vv, 8)
183
+RVVCALL(OPIVX2, vclmulh_vx, OP_UUU_D, H8, H8, clmulh64)
184
+GEN_VEXT_VX(vclmulh_vx, 8)
185
diff --git a/target/riscv/insn_trans/trans_rvvk.c.inc b/target/riscv/insn_trans/trans_rvvk.c.inc
186
new file mode 100644
187
index XXXXXXX..XXXXXXX
188
--- /dev/null
189
+++ b/target/riscv/insn_trans/trans_rvvk.c.inc
190
@@ -XXX,XX +XXX,XX @@
191
+/*
192
+ * RISC-V translation routines for the vector crypto extension.
193
+ *
194
+ * Copyright (C) 2023 SiFive, Inc.
195
+ * Written by Codethink Ltd and SiFive.
196
+ *
197
+ * This program is free software; you can redistribute it and/or modify it
198
+ * under the terms and conditions of the GNU General Public License,
199
+ * version 2 or later, as published by the Free Software Foundation.
200
+ *
201
+ * This program is distributed in the hope it will be useful, but WITHOUT
202
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
203
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
204
+ * more details.
205
+ *
206
+ * You should have received a copy of the GNU General Public License along with
207
+ * this program. If not, see <http://www.gnu.org/licenses/>.
208
+ */
209
+
210
+/*
211
+ * Zvbc
212
+ */
213
+
214
+#define GEN_VV_MASKED_TRANS(NAME, CHECK) \
215
+ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
216
+ { \
217
+ if (CHECK(s, a)) { \
218
+ return opivv_trans(a->rd, a->rs1, a->rs2, a->vm, \
219
+ gen_helper_##NAME, s); \
220
+ } \
221
+ return false; \
222
+ }
223
+
224
+static bool vclmul_vv_check(DisasContext *s, arg_rmrr *a)
225
+{
226
+ return opivv_check(s, a) &&
227
+ s->cfg_ptr->ext_zvbc == true &&
228
+ s->sew == MO_64;
229
+}
230
+
231
+GEN_VV_MASKED_TRANS(vclmul_vv, vclmul_vv_check)
232
+GEN_VV_MASKED_TRANS(vclmulh_vv, vclmul_vv_check)
233
+
234
+#define GEN_VX_MASKED_TRANS(NAME, CHECK) \
235
+ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
236
+ { \
237
+ if (CHECK(s, a)) { \
238
+ return opivx_trans(a->rd, a->rs1, a->rs2, a->vm, \
239
+ gen_helper_##NAME, s); \
240
+ } \
241
+ return false; \
242
+ }
243
+
244
+static bool vclmul_vx_check(DisasContext *s, arg_rmrr *a)
245
+{
246
+ return opivx_check(s, a) &&
247
+ s->cfg_ptr->ext_zvbc == true &&
248
+ s->sew == MO_64;
249
+}
250
+
251
+GEN_VX_MASKED_TRANS(vclmul_vx, vclmul_vx_check)
252
+GEN_VX_MASKED_TRANS(vclmulh_vx, vclmul_vx_check)
253
diff --git a/target/riscv/meson.build b/target/riscv/meson.build
254
index XXXXXXX..XXXXXXX 100644
255
--- a/target/riscv/meson.build
256
+++ b/target/riscv/meson.build
257
@@ -XXX,XX +XXX,XX @@ riscv_ss.add(files(
258
'translate.c',
259
'm128_helper.c',
260
'crypto_helper.c',
261
- 'zce_helper.c'
262
+ 'zce_helper.c',
263
+ 'vcrypto_helper.c'
264
))
265
riscv_ss.add(when: 'CONFIG_KVM', if_true: files('kvm.c'), if_false: files('kvm-stub.c'))
266
97
--
267
--
98
2.28.0
268
2.41.0
99
100
diff view generated by jsdifflib
New patch
1
From: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
1
2
3
Move the checks out of `do_opiv{v,x,i}_gvec{,_shift}` functions
4
and into the corresponding macros. This enables the functions to be
5
reused in proceeding commits without check duplication.
6
7
Signed-off-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
8
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
9
Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn>
10
Signed-off-by: Max Chou <max.chou@sifive.com>
11
Message-ID: <20230711165917.2629866-6-max.chou@sifive.com>
12
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
13
---
14
target/riscv/insn_trans/trans_rvv.c.inc | 28 +++++++++++--------------
15
1 file changed, 12 insertions(+), 16 deletions(-)
16
17
diff --git a/target/riscv/insn_trans/trans_rvv.c.inc b/target/riscv/insn_trans/trans_rvv.c.inc
18
index XXXXXXX..XXXXXXX 100644
19
--- a/target/riscv/insn_trans/trans_rvv.c.inc
20
+++ b/target/riscv/insn_trans/trans_rvv.c.inc
21
@@ -XXX,XX +XXX,XX @@ do_opivv_gvec(DisasContext *s, arg_rmrr *a, GVecGen3Fn *gvec_fn,
22
gen_helper_gvec_4_ptr *fn)
23
{
24
TCGLabel *over = gen_new_label();
25
- if (!opivv_check(s, a)) {
26
- return false;
27
- }
28
29
tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
30
31
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
32
gen_helper_##NAME##_b, gen_helper_##NAME##_h, \
33
gen_helper_##NAME##_w, gen_helper_##NAME##_d, \
34
}; \
35
+ if (!opivv_check(s, a)) { \
36
+ return false; \
37
+ } \
38
return do_opivv_gvec(s, a, tcg_gen_gvec_##SUF, fns[s->sew]); \
39
}
40
41
@@ -XXX,XX +XXX,XX @@ static inline bool
42
do_opivx_gvec(DisasContext *s, arg_rmrr *a, GVecGen2sFn *gvec_fn,
43
gen_helper_opivx *fn)
44
{
45
- if (!opivx_check(s, a)) {
46
- return false;
47
- }
48
-
49
if (a->vm && s->vl_eq_vlmax && !(s->vta && s->lmul < 0)) {
50
TCGv_i64 src1 = tcg_temp_new_i64();
51
52
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
53
gen_helper_##NAME##_b, gen_helper_##NAME##_h, \
54
gen_helper_##NAME##_w, gen_helper_##NAME##_d, \
55
}; \
56
+ if (!opivx_check(s, a)) { \
57
+ return false; \
58
+ } \
59
return do_opivx_gvec(s, a, tcg_gen_gvec_##SUF, fns[s->sew]); \
60
}
61
62
@@ -XXX,XX +XXX,XX @@ static inline bool
63
do_opivi_gvec(DisasContext *s, arg_rmrr *a, GVecGen2iFn *gvec_fn,
64
gen_helper_opivx *fn, imm_mode_t imm_mode)
65
{
66
- if (!opivx_check(s, a)) {
67
- return false;
68
- }
69
-
70
if (a->vm && s->vl_eq_vlmax && !(s->vta && s->lmul < 0)) {
71
gvec_fn(s->sew, vreg_ofs(s, a->rd), vreg_ofs(s, a->rs2),
72
extract_imm(s, a->rs1, imm_mode), MAXSZ(s), MAXSZ(s));
73
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
74
gen_helper_##OPIVX##_b, gen_helper_##OPIVX##_h, \
75
gen_helper_##OPIVX##_w, gen_helper_##OPIVX##_d, \
76
}; \
77
+ if (!opivx_check(s, a)) { \
78
+ return false; \
79
+ } \
80
return do_opivi_gvec(s, a, tcg_gen_gvec_##SUF, \
81
fns[s->sew], IMM_MODE); \
82
}
83
@@ -XXX,XX +XXX,XX @@ static inline bool
84
do_opivx_gvec_shift(DisasContext *s, arg_rmrr *a, GVecGen2sFn32 *gvec_fn,
85
gen_helper_opivx *fn)
86
{
87
- if (!opivx_check(s, a)) {
88
- return false;
89
- }
90
-
91
if (a->vm && s->vl_eq_vlmax && !(s->vta && s->lmul < 0)) {
92
TCGv_i32 src1 = tcg_temp_new_i32();
93
94
@@ -XXX,XX +XXX,XX @@ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
95
gen_helper_##NAME##_b, gen_helper_##NAME##_h, \
96
gen_helper_##NAME##_w, gen_helper_##NAME##_d, \
97
}; \
98
- \
99
+ if (!opivx_check(s, a)) { \
100
+ return false; \
101
+ } \
102
return do_opivx_gvec_shift(s, a, tcg_gen_gvec_##SUF, fns[s->sew]); \
103
}
104
105
--
106
2.41.0
diff view generated by jsdifflib
New patch
1
From: Dickon Hood <dickon.hood@codethink.co.uk>
1
2
3
Zvbb (implemented in later commit) has a widening instruction, which
4
requires an extra check on the enabled extensions. Refactor
5
GEN_OPIVX_WIDEN_TRANS() to take a check function to avoid reimplementing
6
it.
7
8
Signed-off-by: Dickon Hood <dickon.hood@codethink.co.uk>
9
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
10
Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn>
11
Signed-off-by: Max Chou <max.chou@sifive.com>
12
Message-ID: <20230711165917.2629866-7-max.chou@sifive.com>
13
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
14
---
15
target/riscv/insn_trans/trans_rvv.c.inc | 52 +++++++++++--------------
16
1 file changed, 23 insertions(+), 29 deletions(-)
17
18
diff --git a/target/riscv/insn_trans/trans_rvv.c.inc b/target/riscv/insn_trans/trans_rvv.c.inc
19
index XXXXXXX..XXXXXXX 100644
20
--- a/target/riscv/insn_trans/trans_rvv.c.inc
21
+++ b/target/riscv/insn_trans/trans_rvv.c.inc
22
@@ -XXX,XX +XXX,XX @@ static bool opivx_widen_check(DisasContext *s, arg_rmrr *a)
23
vext_check_ds(s, a->rd, a->rs2, a->vm);
24
}
25
26
-static bool do_opivx_widen(DisasContext *s, arg_rmrr *a,
27
- gen_helper_opivx *fn)
28
-{
29
- if (opivx_widen_check(s, a)) {
30
- return opivx_trans(a->rd, a->rs1, a->rs2, a->vm, fn, s);
31
- }
32
- return false;
33
-}
34
-
35
-#define GEN_OPIVX_WIDEN_TRANS(NAME) \
36
-static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
37
-{ \
38
- static gen_helper_opivx * const fns[3] = { \
39
- gen_helper_##NAME##_b, \
40
- gen_helper_##NAME##_h, \
41
- gen_helper_##NAME##_w \
42
- }; \
43
- return do_opivx_widen(s, a, fns[s->sew]); \
44
+#define GEN_OPIVX_WIDEN_TRANS(NAME, CHECK) \
45
+static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
46
+{ \
47
+ if (CHECK(s, a)) { \
48
+ static gen_helper_opivx * const fns[3] = { \
49
+ gen_helper_##NAME##_b, \
50
+ gen_helper_##NAME##_h, \
51
+ gen_helper_##NAME##_w \
52
+ }; \
53
+ return opivx_trans(a->rd, a->rs1, a->rs2, a->vm, fns[s->sew], s); \
54
+ } \
55
+ return false; \
56
}
57
58
-GEN_OPIVX_WIDEN_TRANS(vwaddu_vx)
59
-GEN_OPIVX_WIDEN_TRANS(vwadd_vx)
60
-GEN_OPIVX_WIDEN_TRANS(vwsubu_vx)
61
-GEN_OPIVX_WIDEN_TRANS(vwsub_vx)
62
+GEN_OPIVX_WIDEN_TRANS(vwaddu_vx, opivx_widen_check)
63
+GEN_OPIVX_WIDEN_TRANS(vwadd_vx, opivx_widen_check)
64
+GEN_OPIVX_WIDEN_TRANS(vwsubu_vx, opivx_widen_check)
65
+GEN_OPIVX_WIDEN_TRANS(vwsub_vx, opivx_widen_check)
66
67
/* WIDEN OPIVV with WIDEN */
68
static bool opiwv_widen_check(DisasContext *s, arg_rmrr *a)
69
@@ -XXX,XX +XXX,XX @@ GEN_OPIVX_TRANS(vrem_vx, opivx_check)
70
GEN_OPIVV_WIDEN_TRANS(vwmul_vv, opivv_widen_check)
71
GEN_OPIVV_WIDEN_TRANS(vwmulu_vv, opivv_widen_check)
72
GEN_OPIVV_WIDEN_TRANS(vwmulsu_vv, opivv_widen_check)
73
-GEN_OPIVX_WIDEN_TRANS(vwmul_vx)
74
-GEN_OPIVX_WIDEN_TRANS(vwmulu_vx)
75
-GEN_OPIVX_WIDEN_TRANS(vwmulsu_vx)
76
+GEN_OPIVX_WIDEN_TRANS(vwmul_vx, opivx_widen_check)
77
+GEN_OPIVX_WIDEN_TRANS(vwmulu_vx, opivx_widen_check)
78
+GEN_OPIVX_WIDEN_TRANS(vwmulsu_vx, opivx_widen_check)
79
80
/* Vector Single-Width Integer Multiply-Add Instructions */
81
GEN_OPIVV_TRANS(vmacc_vv, opivv_check)
82
@@ -XXX,XX +XXX,XX @@ GEN_OPIVX_TRANS(vnmsub_vx, opivx_check)
83
GEN_OPIVV_WIDEN_TRANS(vwmaccu_vv, opivv_widen_check)
84
GEN_OPIVV_WIDEN_TRANS(vwmacc_vv, opivv_widen_check)
85
GEN_OPIVV_WIDEN_TRANS(vwmaccsu_vv, opivv_widen_check)
86
-GEN_OPIVX_WIDEN_TRANS(vwmaccu_vx)
87
-GEN_OPIVX_WIDEN_TRANS(vwmacc_vx)
88
-GEN_OPIVX_WIDEN_TRANS(vwmaccsu_vx)
89
-GEN_OPIVX_WIDEN_TRANS(vwmaccus_vx)
90
+GEN_OPIVX_WIDEN_TRANS(vwmaccu_vx, opivx_widen_check)
91
+GEN_OPIVX_WIDEN_TRANS(vwmacc_vx, opivx_widen_check)
92
+GEN_OPIVX_WIDEN_TRANS(vwmaccsu_vx, opivx_widen_check)
93
+GEN_OPIVX_WIDEN_TRANS(vwmaccus_vx, opivx_widen_check)
94
95
/* Vector Integer Merge and Move Instructions */
96
static bool trans_vmv_v_v(DisasContext *s, arg_vmv_v_v *a)
97
--
98
2.41.0
diff view generated by jsdifflib
New patch
1
From: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
1
2
3
Move some macros out of `vector_helper` and into `vector_internals`.
4
This ensures they can be used by both vector and vector-crypto helpers
5
(latter implemented in proceeding commits).
6
7
Signed-off-by: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
8
Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn>
9
Signed-off-by: Max Chou <max.chou@sifive.com>
10
Message-ID: <20230711165917.2629866-8-max.chou@sifive.com>
11
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
12
---
13
target/riscv/vector_internals.h | 46 +++++++++++++++++++++++++++++++++
14
target/riscv/vector_helper.c | 42 ------------------------------
15
2 files changed, 46 insertions(+), 42 deletions(-)
16
17
diff --git a/target/riscv/vector_internals.h b/target/riscv/vector_internals.h
18
index XXXXXXX..XXXXXXX 100644
19
--- a/target/riscv/vector_internals.h
20
+++ b/target/riscv/vector_internals.h
21
@@ -XXX,XX +XXX,XX @@ void vext_set_elems_1s(void *base, uint32_t is_agnostic, uint32_t cnt,
22
/* expand macro args before macro */
23
#define RVVCALL(macro, ...) macro(__VA_ARGS__)
24
25
+/* (TD, T2, TX2) */
26
+#define OP_UU_B uint8_t, uint8_t, uint8_t
27
+#define OP_UU_H uint16_t, uint16_t, uint16_t
28
+#define OP_UU_W uint32_t, uint32_t, uint32_t
29
+#define OP_UU_D uint64_t, uint64_t, uint64_t
30
+
31
/* (TD, T1, T2, TX1, TX2) */
32
#define OP_UUU_B uint8_t, uint8_t, uint8_t, uint8_t, uint8_t
33
#define OP_UUU_H uint16_t, uint16_t, uint16_t, uint16_t, uint16_t
34
#define OP_UUU_W uint32_t, uint32_t, uint32_t, uint32_t, uint32_t
35
#define OP_UUU_D uint64_t, uint64_t, uint64_t, uint64_t, uint64_t
36
37
+#define OPIVV1(NAME, TD, T2, TX2, HD, HS2, OP) \
38
+static void do_##NAME(void *vd, void *vs2, int i) \
39
+{ \
40
+ TX2 s2 = *((T2 *)vs2 + HS2(i)); \
41
+ *((TD *)vd + HD(i)) = OP(s2); \
42
+}
43
+
44
+#define GEN_VEXT_V(NAME, ESZ) \
45
+void HELPER(NAME)(void *vd, void *v0, void *vs2, \
46
+ CPURISCVState *env, uint32_t desc) \
47
+{ \
48
+ uint32_t vm = vext_vm(desc); \
49
+ uint32_t vl = env->vl; \
50
+ uint32_t total_elems = \
51
+ vext_get_total_elems(env, desc, ESZ); \
52
+ uint32_t vta = vext_vta(desc); \
53
+ uint32_t vma = vext_vma(desc); \
54
+ uint32_t i; \
55
+ \
56
+ for (i = env->vstart; i < vl; i++) { \
57
+ if (!vm && !vext_elem_mask(v0, i)) { \
58
+ /* set masked-off elements to 1s */ \
59
+ vext_set_elems_1s(vd, vma, i * ESZ, \
60
+ (i + 1) * ESZ); \
61
+ continue; \
62
+ } \
63
+ do_##NAME(vd, vs2, i); \
64
+ } \
65
+ env->vstart = 0; \
66
+ /* set tail elements to 1s */ \
67
+ vext_set_elems_1s(vd, vta, vl * ESZ, \
68
+ total_elems * ESZ); \
69
+}
70
+
71
/* operation of two vector elements */
72
typedef void opivv2_fn(void *vd, void *vs1, void *vs2, int i);
73
74
@@ -XXX,XX +XXX,XX @@ void HELPER(NAME)(void *vd, void *v0, target_ulong s1, \
75
do_##NAME, ESZ); \
76
}
77
78
+/* Three of the widening shortening macros: */
79
+/* (TD, T1, T2, TX1, TX2) */
80
+#define WOP_UUU_B uint16_t, uint8_t, uint8_t, uint16_t, uint16_t
81
+#define WOP_UUU_H uint32_t, uint16_t, uint16_t, uint32_t, uint32_t
82
+#define WOP_UUU_W uint64_t, uint32_t, uint32_t, uint64_t, uint64_t
83
+
84
#endif /* TARGET_RISCV_VECTOR_INTERNALS_H */
85
diff --git a/target/riscv/vector_helper.c b/target/riscv/vector_helper.c
86
index XXXXXXX..XXXXXXX 100644
87
--- a/target/riscv/vector_helper.c
88
+++ b/target/riscv/vector_helper.c
89
@@ -XXX,XX +XXX,XX @@ GEN_VEXT_ST_WHOLE(vs8r_v, int8_t, ste_b)
90
#define OP_SUS_H int16_t, uint16_t, int16_t, uint16_t, int16_t
91
#define OP_SUS_W int32_t, uint32_t, int32_t, uint32_t, int32_t
92
#define OP_SUS_D int64_t, uint64_t, int64_t, uint64_t, int64_t
93
-#define WOP_UUU_B uint16_t, uint8_t, uint8_t, uint16_t, uint16_t
94
-#define WOP_UUU_H uint32_t, uint16_t, uint16_t, uint32_t, uint32_t
95
-#define WOP_UUU_W uint64_t, uint32_t, uint32_t, uint64_t, uint64_t
96
#define WOP_SSS_B int16_t, int8_t, int8_t, int16_t, int16_t
97
#define WOP_SSS_H int32_t, int16_t, int16_t, int32_t, int32_t
98
#define WOP_SSS_W int64_t, int32_t, int32_t, int64_t, int64_t
99
@@ -XXX,XX +XXX,XX @@ GEN_VEXT_VF(vfwnmsac_vf_h, 4)
100
GEN_VEXT_VF(vfwnmsac_vf_w, 8)
101
102
/* Vector Floating-Point Square-Root Instruction */
103
-/* (TD, T2, TX2) */
104
-#define OP_UU_H uint16_t, uint16_t, uint16_t
105
-#define OP_UU_W uint32_t, uint32_t, uint32_t
106
-#define OP_UU_D uint64_t, uint64_t, uint64_t
107
-
108
#define OPFVV1(NAME, TD, T2, TX2, HD, HS2, OP) \
109
static void do_##NAME(void *vd, void *vs2, int i, \
110
CPURISCVState *env) \
111
@@ -XXX,XX +XXX,XX @@ GEN_VEXT_CMP_VF(vmfge_vf_w, uint32_t, H4, vmfge32)
112
GEN_VEXT_CMP_VF(vmfge_vf_d, uint64_t, H8, vmfge64)
113
114
/* Vector Floating-Point Classify Instruction */
115
-#define OPIVV1(NAME, TD, T2, TX2, HD, HS2, OP) \
116
-static void do_##NAME(void *vd, void *vs2, int i) \
117
-{ \
118
- TX2 s2 = *((T2 *)vs2 + HS2(i)); \
119
- *((TD *)vd + HD(i)) = OP(s2); \
120
-}
121
-
122
-#define GEN_VEXT_V(NAME, ESZ) \
123
-void HELPER(NAME)(void *vd, void *v0, void *vs2, \
124
- CPURISCVState *env, uint32_t desc) \
125
-{ \
126
- uint32_t vm = vext_vm(desc); \
127
- uint32_t vl = env->vl; \
128
- uint32_t total_elems = \
129
- vext_get_total_elems(env, desc, ESZ); \
130
- uint32_t vta = vext_vta(desc); \
131
- uint32_t vma = vext_vma(desc); \
132
- uint32_t i; \
133
- \
134
- for (i = env->vstart; i < vl; i++) { \
135
- if (!vm && !vext_elem_mask(v0, i)) { \
136
- /* set masked-off elements to 1s */ \
137
- vext_set_elems_1s(vd, vma, i * ESZ, \
138
- (i + 1) * ESZ); \
139
- continue; \
140
- } \
141
- do_##NAME(vd, vs2, i); \
142
- } \
143
- env->vstart = 0; \
144
- /* set tail elements to 1s */ \
145
- vext_set_elems_1s(vd, vta, vl * ESZ, \
146
- total_elems * ESZ); \
147
-}
148
-
149
target_ulong fclass_h(uint64_t frs1)
150
{
151
float16 f = frs1;
152
--
153
2.41.0
diff view generated by jsdifflib
1
From: Dickon Hood <dickon.hood@codethink.co.uk>
2
3
This commit adds support for the Zvbb vector-crypto extension, which
4
consists of the following instructions:
5
6
* vrol.[vv,vx]
7
* vror.[vv,vx,vi]
8
* vbrev8.v
9
* vrev8.v
10
* vandn.[vv,vx]
11
* vbrev.v
12
* vclz.v
13
* vctz.v
14
* vcpop.v
15
* vwsll.[vv,vx,vi]
16
17
Translation functions are defined in
18
`target/riscv/insn_trans/trans_rvvk.c.inc` and helpers are defined in
19
`target/riscv/vcrypto_helper.c`.
20
21
Co-authored-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
22
Co-authored-by: William Salmon <will.salmon@codethink.co.uk>
23
Co-authored-by: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
24
[max.chou@sifive.com: Fix imm mode of vror.vi]
25
Signed-off-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
26
Signed-off-by: William Salmon <will.salmon@codethink.co.uk>
27
Signed-off-by: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
28
Signed-off-by: Dickon Hood <dickon.hood@codethink.co.uk>
29
Signed-off-by: Max Chou <max.chou@sifive.com>
30
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
31
[max.chou@sifive.com: Exposed x-zvbb property]
32
Message-ID: <20230711165917.2629866-9-max.chou@sifive.com>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
33
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: 477c864312280ea55a98dc84cb01d826751b6c14.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <477c864312280ea55a98dc84cb01d826751b6c14.1597259519.git.alistair.francis@wdc.com>
4
---
34
---
5
target/riscv/cpu_bits.h | 1 +
35
target/riscv/cpu_cfg.h | 1 +
6
target/riscv/helper.h | 3 +
36
target/riscv/helper.h | 62 +++++++++
7
target/riscv/insn32-64.decode | 5 +
37
target/riscv/insn32.decode | 20 +++
8
target/riscv/insn32.decode | 11 +
38
target/riscv/cpu.c | 12 ++
9
target/riscv/op_helper.c | 114 ++++++++
39
target/riscv/vcrypto_helper.c | 138 +++++++++++++++++++
10
target/riscv/insn_trans/trans_rvh.c.inc | 340 ++++++++++++++++++++++++
40
target/riscv/insn_trans/trans_rvvk.c.inc | 164 +++++++++++++++++++++++
11
6 files changed, 474 insertions(+)
41
6 files changed, 397 insertions(+)
12
42
13
diff --git a/target/riscv/cpu_bits.h b/target/riscv/cpu_bits.h
43
diff --git a/target/riscv/cpu_cfg.h b/target/riscv/cpu_cfg.h
14
index XXXXXXX..XXXXXXX 100644
44
index XXXXXXX..XXXXXXX 100644
15
--- a/target/riscv/cpu_bits.h
45
--- a/target/riscv/cpu_cfg.h
16
+++ b/target/riscv/cpu_bits.h
46
+++ b/target/riscv/cpu_cfg.h
17
@@ -XXX,XX +XXX,XX @@
47
@@ -XXX,XX +XXX,XX @@ struct RISCVCPUConfig {
18
#define HSTATUS_SP2V 0x00000200
48
bool ext_zve32f;
19
#define HSTATUS_VTVM 0x00100000
49
bool ext_zve64f;
20
#define HSTATUS_VTSR 0x00400000
50
bool ext_zve64d;
21
+#define HSTATUS_HU 0x00000200
51
+ bool ext_zvbb;
22
52
bool ext_zvbc;
23
#define HSTATUS32_WPRI 0xFF8FF87E
53
bool ext_zmmul;
24
#define HSTATUS64_WPRI 0xFFFFFFFFFF8FF87EULL
54
bool ext_zvfbfmin;
25
diff --git a/target/riscv/helper.h b/target/riscv/helper.h
55
diff --git a/target/riscv/helper.h b/target/riscv/helper.h
26
index XXXXXXX..XXXXXXX 100644
56
index XXXXXXX..XXXXXXX 100644
27
--- a/target/riscv/helper.h
57
--- a/target/riscv/helper.h
28
+++ b/target/riscv/helper.h
58
+++ b/target/riscv/helper.h
29
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_1(tlb_flush, void, env)
59
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_6(vclmul_vv, void, ptr, ptr, ptr, ptr, env, i32)
30
/* Hypervisor functions */
60
DEF_HELPER_6(vclmul_vx, void, ptr, ptr, tl, ptr, env, i32)
31
#ifndef CONFIG_USER_ONLY
61
DEF_HELPER_6(vclmulh_vv, void, ptr, ptr, ptr, ptr, env, i32)
32
DEF_HELPER_1(hyp_tlb_flush, void, env)
62
DEF_HELPER_6(vclmulh_vx, void, ptr, ptr, tl, ptr, env, i32)
33
+DEF_HELPER_4(hyp_load, tl, env, tl, tl, tl)
63
+
34
+DEF_HELPER_5(hyp_store, void, env, tl, tl, tl, tl)
64
+DEF_HELPER_6(vror_vv_b, void, ptr, ptr, ptr, ptr, env, i32)
35
+DEF_HELPER_4(hyp_x_load, tl, env, tl, tl, tl)
65
+DEF_HELPER_6(vror_vv_h, void, ptr, ptr, ptr, ptr, env, i32)
36
#endif
66
+DEF_HELPER_6(vror_vv_w, void, ptr, ptr, ptr, ptr, env, i32)
37
67
+DEF_HELPER_6(vror_vv_d, void, ptr, ptr, ptr, ptr, env, i32)
38
/* Vector functions */
68
+
39
diff --git a/target/riscv/insn32-64.decode b/target/riscv/insn32-64.decode
69
+DEF_HELPER_6(vror_vx_b, void, ptr, ptr, tl, ptr, env, i32)
40
index XXXXXXX..XXXXXXX 100644
70
+DEF_HELPER_6(vror_vx_h, void, ptr, ptr, tl, ptr, env, i32)
41
--- a/target/riscv/insn32-64.decode
71
+DEF_HELPER_6(vror_vx_w, void, ptr, ptr, tl, ptr, env, i32)
42
+++ b/target/riscv/insn32-64.decode
72
+DEF_HELPER_6(vror_vx_d, void, ptr, ptr, tl, ptr, env, i32)
43
@@ -XXX,XX +XXX,XX @@ fmv_x_d 1110001 00000 ..... 000 ..... 1010011 @r2
73
+
44
fcvt_d_l 1101001 00010 ..... ... ..... 1010011 @r2_rm
74
+DEF_HELPER_6(vrol_vv_b, void, ptr, ptr, ptr, ptr, env, i32)
45
fcvt_d_lu 1101001 00011 ..... ... ..... 1010011 @r2_rm
75
+DEF_HELPER_6(vrol_vv_h, void, ptr, ptr, ptr, ptr, env, i32)
46
fmv_d_x 1111001 00000 ..... 000 ..... 1010011 @r2
76
+DEF_HELPER_6(vrol_vv_w, void, ptr, ptr, ptr, ptr, env, i32)
47
+
77
+DEF_HELPER_6(vrol_vv_d, void, ptr, ptr, ptr, ptr, env, i32)
48
+# *** RV32H Base Instruction Set ***
78
+
49
+hlv_wu 0110100 00001 ..... 100 ..... 1110011 @r2
79
+DEF_HELPER_6(vrol_vx_b, void, ptr, ptr, tl, ptr, env, i32)
50
+hlv_d 0110110 00000 ..... 100 ..... 1110011 @r2
80
+DEF_HELPER_6(vrol_vx_h, void, ptr, ptr, tl, ptr, env, i32)
51
+hsv_d 0110111 ..... ..... 100 00000 1110011 @r2_s
81
+DEF_HELPER_6(vrol_vx_w, void, ptr, ptr, tl, ptr, env, i32)
82
+DEF_HELPER_6(vrol_vx_d, void, ptr, ptr, tl, ptr, env, i32)
83
+
84
+DEF_HELPER_5(vrev8_v_b, void, ptr, ptr, ptr, env, i32)
85
+DEF_HELPER_5(vrev8_v_h, void, ptr, ptr, ptr, env, i32)
86
+DEF_HELPER_5(vrev8_v_w, void, ptr, ptr, ptr, env, i32)
87
+DEF_HELPER_5(vrev8_v_d, void, ptr, ptr, ptr, env, i32)
88
+DEF_HELPER_5(vbrev8_v_b, void, ptr, ptr, ptr, env, i32)
89
+DEF_HELPER_5(vbrev8_v_h, void, ptr, ptr, ptr, env, i32)
90
+DEF_HELPER_5(vbrev8_v_w, void, ptr, ptr, ptr, env, i32)
91
+DEF_HELPER_5(vbrev8_v_d, void, ptr, ptr, ptr, env, i32)
92
+DEF_HELPER_5(vbrev_v_b, void, ptr, ptr, ptr, env, i32)
93
+DEF_HELPER_5(vbrev_v_h, void, ptr, ptr, ptr, env, i32)
94
+DEF_HELPER_5(vbrev_v_w, void, ptr, ptr, ptr, env, i32)
95
+DEF_HELPER_5(vbrev_v_d, void, ptr, ptr, ptr, env, i32)
96
+
97
+DEF_HELPER_5(vclz_v_b, void, ptr, ptr, ptr, env, i32)
98
+DEF_HELPER_5(vclz_v_h, void, ptr, ptr, ptr, env, i32)
99
+DEF_HELPER_5(vclz_v_w, void, ptr, ptr, ptr, env, i32)
100
+DEF_HELPER_5(vclz_v_d, void, ptr, ptr, ptr, env, i32)
101
+DEF_HELPER_5(vctz_v_b, void, ptr, ptr, ptr, env, i32)
102
+DEF_HELPER_5(vctz_v_h, void, ptr, ptr, ptr, env, i32)
103
+DEF_HELPER_5(vctz_v_w, void, ptr, ptr, ptr, env, i32)
104
+DEF_HELPER_5(vctz_v_d, void, ptr, ptr, ptr, env, i32)
105
+DEF_HELPER_5(vcpop_v_b, void, ptr, ptr, ptr, env, i32)
106
+DEF_HELPER_5(vcpop_v_h, void, ptr, ptr, ptr, env, i32)
107
+DEF_HELPER_5(vcpop_v_w, void, ptr, ptr, ptr, env, i32)
108
+DEF_HELPER_5(vcpop_v_d, void, ptr, ptr, ptr, env, i32)
109
+
110
+DEF_HELPER_6(vwsll_vv_b, void, ptr, ptr, ptr, ptr, env, i32)
111
+DEF_HELPER_6(vwsll_vv_h, void, ptr, ptr, ptr, ptr, env, i32)
112
+DEF_HELPER_6(vwsll_vv_w, void, ptr, ptr, ptr, ptr, env, i32)
113
+DEF_HELPER_6(vwsll_vx_b, void, ptr, ptr, tl, ptr, env, i32)
114
+DEF_HELPER_6(vwsll_vx_h, void, ptr, ptr, tl, ptr, env, i32)
115
+DEF_HELPER_6(vwsll_vx_w, void, ptr, ptr, tl, ptr, env, i32)
116
+
117
+DEF_HELPER_6(vandn_vv_b, void, ptr, ptr, ptr, ptr, env, i32)
118
+DEF_HELPER_6(vandn_vv_h, void, ptr, ptr, ptr, ptr, env, i32)
119
+DEF_HELPER_6(vandn_vv_w, void, ptr, ptr, ptr, ptr, env, i32)
120
+DEF_HELPER_6(vandn_vv_d, void, ptr, ptr, ptr, ptr, env, i32)
121
+DEF_HELPER_6(vandn_vx_b, void, ptr, ptr, tl, ptr, env, i32)
122
+DEF_HELPER_6(vandn_vx_h, void, ptr, ptr, tl, ptr, env, i32)
123
+DEF_HELPER_6(vandn_vx_w, void, ptr, ptr, tl, ptr, env, i32)
124
+DEF_HELPER_6(vandn_vx_d, void, ptr, ptr, tl, ptr, env, i32)
52
diff --git a/target/riscv/insn32.decode b/target/riscv/insn32.decode
125
diff --git a/target/riscv/insn32.decode b/target/riscv/insn32.decode
53
index XXXXXXX..XXXXXXX 100644
126
index XXXXXXX..XXXXXXX 100644
54
--- a/target/riscv/insn32.decode
127
--- a/target/riscv/insn32.decode
55
+++ b/target/riscv/insn32.decode
128
+++ b/target/riscv/insn32.decode
56
@@ -XXX,XX +XXX,XX @@
129
@@ -XXX,XX +XXX,XX @@
130
%imm_u 12:s20 !function=ex_shift_12
131
%imm_bs 30:2 !function=ex_shift_3
132
%imm_rnum 20:4
133
+%imm_z6 26:1 15:5
134
135
# Argument sets:
136
&empty
137
@@ -XXX,XX +XXX,XX @@
138
@r_vm ...... vm:1 ..... ..... ... ..... ....... &rmrr %rs2 %rs1 %rd
139
@r_vm_1 ...... . ..... ..... ... ..... ....... &rmrr vm=1 %rs2 %rs1 %rd
57
@r_vm_0 ...... . ..... ..... ... ..... ....... &rmrr vm=0 %rs2 %rs1 %rd
140
@r_vm_0 ...... . ..... ..... ... ..... ....... &rmrr vm=0 %rs2 %rs1 %rd
58
@r_wdvm ..... wd:1 vm:1 ..... ..... ... ..... ....... &rwdvm %rs2 %rs1 %rd
141
+@r2_zimm6 ..... . vm:1 ..... ..... ... ..... ....... &rmrr %rs2 rs1=%imm_z6 %rd
59
@r2_zimm . zimm:11 ..... ... ..... ....... %rs1 %rd
142
@r2_zimm11 . zimm:11 ..... ... ..... ....... %rs1 %rd
60
+@r2_s ....... ..... ..... ... ..... ....... %rs2 %rs1
143
@r2_zimm10 .. zimm:10 ..... ... ..... ....... %rs1 %rd
61
144
@r2_s ....... ..... ..... ... ..... ....... %rs2 %rs1
62
@hfence_gvma ....... ..... ..... ... ..... ....... %rs2 %rs1
145
@@ -XXX,XX +XXX,XX @@ vclmul_vv 001100 . ..... ..... 010 ..... 1010111 @r_vm
63
@hfence_vvma ....... ..... ..... ... ..... ....... %rs2 %rs1
146
vclmul_vx 001100 . ..... ..... 110 ..... 1010111 @r_vm
64
@@ -XXX,XX +XXX,XX @@ fcvt_d_w 1101001 00000 ..... ... ..... 1010011 @r2_rm
147
vclmulh_vv 001101 . ..... ..... 010 ..... 1010111 @r_vm
65
fcvt_d_wu 1101001 00001 ..... ... ..... 1010011 @r2_rm
148
vclmulh_vx 001101 . ..... ..... 110 ..... 1010111 @r_vm
66
149
+
67
# *** RV32H Base Instruction Set ***
150
+# *** Zvbb vector crypto extension ***
68
+hlv_b 0110000 00000 ..... 100 ..... 1110011 @r2
151
+vrol_vv 010101 . ..... ..... 000 ..... 1010111 @r_vm
69
+hlv_bu 0110000 00001 ..... 100 ..... 1110011 @r2
152
+vrol_vx 010101 . ..... ..... 100 ..... 1010111 @r_vm
70
+hlv_h 0110010 00000 ..... 100 ..... 1110011 @r2
153
+vror_vv 010100 . ..... ..... 000 ..... 1010111 @r_vm
71
+hlv_hu 0110010 00001 ..... 100 ..... 1110011 @r2
154
+vror_vx 010100 . ..... ..... 100 ..... 1010111 @r_vm
72
+hlvx_hu 0110010 00011 ..... 100 ..... 1110011 @r2
155
+vror_vi 01010. . ..... ..... 011 ..... 1010111 @r2_zimm6
73
+hlv_w 0110100 00000 ..... 100 ..... 1110011 @r2
156
+vbrev8_v 010010 . ..... 01000 010 ..... 1010111 @r2_vm
74
+hlvx_wu 0110100 00011 ..... 100 ..... 1110011 @r2
157
+vrev8_v 010010 . ..... 01001 010 ..... 1010111 @r2_vm
75
+hsv_b 0110001 ..... ..... 100 00000 1110011 @r2_s
158
+vandn_vv 000001 . ..... ..... 000 ..... 1010111 @r_vm
76
+hsv_h 0110011 ..... ..... 100 00000 1110011 @r2_s
159
+vandn_vx 000001 . ..... ..... 100 ..... 1010111 @r_vm
77
+hsv_w 0110101 ..... ..... 100 00000 1110011 @r2_s
160
+vbrev_v 010010 . ..... 01010 010 ..... 1010111 @r2_vm
78
hfence_gvma 0110001 ..... ..... 000 00000 1110011 @hfence_gvma
161
+vclz_v 010010 . ..... 01100 010 ..... 1010111 @r2_vm
79
hfence_vvma 0010001 ..... ..... 000 00000 1110011 @hfence_vvma
162
+vctz_v 010010 . ..... 01101 010 ..... 1010111 @r2_vm
80
163
+vcpop_v 010010 . ..... 01110 010 ..... 1010111 @r2_vm
81
diff --git a/target/riscv/op_helper.c b/target/riscv/op_helper.c
164
+vwsll_vv 110101 . ..... ..... 000 ..... 1010111 @r_vm
165
+vwsll_vx 110101 . ..... ..... 100 ..... 1010111 @r_vm
166
+vwsll_vi 110101 . ..... ..... 011 ..... 1010111 @r_vm
167
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
82
index XXXXXXX..XXXXXXX 100644
168
index XXXXXXX..XXXXXXX 100644
83
--- a/target/riscv/op_helper.c
169
--- a/target/riscv/cpu.c
84
+++ b/target/riscv/op_helper.c
170
+++ b/target/riscv/cpu.c
85
@@ -XXX,XX +XXX,XX @@ void helper_hyp_tlb_flush(CPURISCVState *env)
171
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
86
riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
172
ISA_EXT_DATA_ENTRY(zksed, PRIV_VERSION_1_12_0, ext_zksed),
87
}
173
ISA_EXT_DATA_ENTRY(zksh, PRIV_VERSION_1_12_0, ext_zksh),
88
174
ISA_EXT_DATA_ENTRY(zkt, PRIV_VERSION_1_12_0, ext_zkt),
89
+target_ulong helper_hyp_load(CPURISCVState *env, target_ulong address,
175
+ ISA_EXT_DATA_ENTRY(zvbb, PRIV_VERSION_1_12_0, ext_zvbb),
90
+ target_ulong attrs, target_ulong memop)
176
ISA_EXT_DATA_ENTRY(zvbc, PRIV_VERSION_1_12_0, ext_zvbc),
177
ISA_EXT_DATA_ENTRY(zve32f, PRIV_VERSION_1_10_0, ext_zve32f),
178
ISA_EXT_DATA_ENTRY(zve64f, PRIV_VERSION_1_10_0, ext_zve64f),
179
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_validate_set_extensions(RISCVCPU *cpu, Error **errp)
180
return;
181
}
182
183
+ /*
184
+ * In principle Zve*x would also suffice here, were they supported
185
+ * in qemu
186
+ */
187
+ if (cpu->cfg.ext_zvbb && !cpu->cfg.ext_zve32f) {
188
+ error_setg(errp,
189
+ "Vector crypto extensions require V or Zve* extensions");
190
+ return;
191
+ }
192
+
193
if (cpu->cfg.ext_zvbc && !cpu->cfg.ext_zve64f) {
194
error_setg(errp, "Zvbc extension requires V or Zve64{f,d} extensions");
195
return;
196
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
197
DEFINE_PROP_BOOL("x-zvfbfwma", RISCVCPU, cfg.ext_zvfbfwma, false),
198
199
/* Vector cryptography extensions */
200
+ DEFINE_PROP_BOOL("x-zvbb", RISCVCPU, cfg.ext_zvbb, false),
201
DEFINE_PROP_BOOL("x-zvbc", RISCVCPU, cfg.ext_zvbc, false),
202
203
DEFINE_PROP_END_OF_LIST(),
204
diff --git a/target/riscv/vcrypto_helper.c b/target/riscv/vcrypto_helper.c
205
index XXXXXXX..XXXXXXX 100644
206
--- a/target/riscv/vcrypto_helper.c
207
+++ b/target/riscv/vcrypto_helper.c
208
@@ -XXX,XX +XXX,XX @@
209
#include "qemu/osdep.h"
210
#include "qemu/host-utils.h"
211
#include "qemu/bitops.h"
212
+#include "qemu/bswap.h"
213
#include "cpu.h"
214
#include "exec/memop.h"
215
#include "exec/exec-all.h"
216
@@ -XXX,XX +XXX,XX @@ RVVCALL(OPIVV2, vclmulh_vv, OP_UUU_D, H8, H8, H8, clmulh64)
217
GEN_VEXT_VV(vclmulh_vv, 8)
218
RVVCALL(OPIVX2, vclmulh_vx, OP_UUU_D, H8, H8, clmulh64)
219
GEN_VEXT_VX(vclmulh_vx, 8)
220
+
221
+RVVCALL(OPIVV2, vror_vv_b, OP_UUU_B, H1, H1, H1, ror8)
222
+RVVCALL(OPIVV2, vror_vv_h, OP_UUU_H, H2, H2, H2, ror16)
223
+RVVCALL(OPIVV2, vror_vv_w, OP_UUU_W, H4, H4, H4, ror32)
224
+RVVCALL(OPIVV2, vror_vv_d, OP_UUU_D, H8, H8, H8, ror64)
225
+GEN_VEXT_VV(vror_vv_b, 1)
226
+GEN_VEXT_VV(vror_vv_h, 2)
227
+GEN_VEXT_VV(vror_vv_w, 4)
228
+GEN_VEXT_VV(vror_vv_d, 8)
229
+
230
+RVVCALL(OPIVX2, vror_vx_b, OP_UUU_B, H1, H1, ror8)
231
+RVVCALL(OPIVX2, vror_vx_h, OP_UUU_H, H2, H2, ror16)
232
+RVVCALL(OPIVX2, vror_vx_w, OP_UUU_W, H4, H4, ror32)
233
+RVVCALL(OPIVX2, vror_vx_d, OP_UUU_D, H8, H8, ror64)
234
+GEN_VEXT_VX(vror_vx_b, 1)
235
+GEN_VEXT_VX(vror_vx_h, 2)
236
+GEN_VEXT_VX(vror_vx_w, 4)
237
+GEN_VEXT_VX(vror_vx_d, 8)
238
+
239
+RVVCALL(OPIVV2, vrol_vv_b, OP_UUU_B, H1, H1, H1, rol8)
240
+RVVCALL(OPIVV2, vrol_vv_h, OP_UUU_H, H2, H2, H2, rol16)
241
+RVVCALL(OPIVV2, vrol_vv_w, OP_UUU_W, H4, H4, H4, rol32)
242
+RVVCALL(OPIVV2, vrol_vv_d, OP_UUU_D, H8, H8, H8, rol64)
243
+GEN_VEXT_VV(vrol_vv_b, 1)
244
+GEN_VEXT_VV(vrol_vv_h, 2)
245
+GEN_VEXT_VV(vrol_vv_w, 4)
246
+GEN_VEXT_VV(vrol_vv_d, 8)
247
+
248
+RVVCALL(OPIVX2, vrol_vx_b, OP_UUU_B, H1, H1, rol8)
249
+RVVCALL(OPIVX2, vrol_vx_h, OP_UUU_H, H2, H2, rol16)
250
+RVVCALL(OPIVX2, vrol_vx_w, OP_UUU_W, H4, H4, rol32)
251
+RVVCALL(OPIVX2, vrol_vx_d, OP_UUU_D, H8, H8, rol64)
252
+GEN_VEXT_VX(vrol_vx_b, 1)
253
+GEN_VEXT_VX(vrol_vx_h, 2)
254
+GEN_VEXT_VX(vrol_vx_w, 4)
255
+GEN_VEXT_VX(vrol_vx_d, 8)
256
+
257
+static uint64_t brev8(uint64_t val)
91
+{
258
+{
92
+ if (env->priv == PRV_M ||
259
+ val = ((val & 0x5555555555555555ull) << 1) |
93
+ (env->priv == PRV_S && !riscv_cpu_virt_enabled(env)) ||
260
+ ((val & 0xAAAAAAAAAAAAAAAAull) >> 1);
94
+ (env->priv == PRV_U && !riscv_cpu_virt_enabled(env) &&
261
+ val = ((val & 0x3333333333333333ull) << 2) |
95
+ get_field(env->hstatus, HSTATUS_HU))) {
262
+ ((val & 0xCCCCCCCCCCCCCCCCull) >> 2);
96
+ target_ulong pte;
263
+ val = ((val & 0x0F0F0F0F0F0F0F0Full) << 4) |
97
+
264
+ ((val & 0xF0F0F0F0F0F0F0F0ull) >> 4);
98
+ riscv_cpu_set_two_stage_lookup(env, true);
265
+
99
+
266
+ return val;
100
+ switch (memop) {
101
+ case MO_SB:
102
+ pte = cpu_ldsb_data_ra(env, address, GETPC());
103
+ break;
104
+ case MO_UB:
105
+ pte = cpu_ldub_data_ra(env, address, GETPC());
106
+ break;
107
+ case MO_TESW:
108
+ pte = cpu_ldsw_data_ra(env, address, GETPC());
109
+ break;
110
+ case MO_TEUW:
111
+ pte = cpu_lduw_data_ra(env, address, GETPC());
112
+ break;
113
+ case MO_TESL:
114
+ pte = cpu_ldl_data_ra(env, address, GETPC());
115
+ break;
116
+ case MO_TEUL:
117
+ pte = cpu_ldl_data_ra(env, address, GETPC());
118
+ break;
119
+ case MO_TEQ:
120
+ pte = cpu_ldq_data_ra(env, address, GETPC());
121
+ break;
122
+ default:
123
+ g_assert_not_reached();
124
+ }
125
+
126
+ riscv_cpu_set_two_stage_lookup(env, false);
127
+
128
+ return pte;
129
+ }
130
+
131
+ riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
132
+ return 0;
133
+}
267
+}
134
+
268
+
135
+void helper_hyp_store(CPURISCVState *env, target_ulong address,
269
+RVVCALL(OPIVV1, vbrev8_v_b, OP_UU_B, H1, H1, brev8)
136
+ target_ulong val, target_ulong attrs, target_ulong memop)
270
+RVVCALL(OPIVV1, vbrev8_v_h, OP_UU_H, H2, H2, brev8)
271
+RVVCALL(OPIVV1, vbrev8_v_w, OP_UU_W, H4, H4, brev8)
272
+RVVCALL(OPIVV1, vbrev8_v_d, OP_UU_D, H8, H8, brev8)
273
+GEN_VEXT_V(vbrev8_v_b, 1)
274
+GEN_VEXT_V(vbrev8_v_h, 2)
275
+GEN_VEXT_V(vbrev8_v_w, 4)
276
+GEN_VEXT_V(vbrev8_v_d, 8)
277
+
278
+#define DO_IDENTITY(a) (a)
279
+RVVCALL(OPIVV1, vrev8_v_b, OP_UU_B, H1, H1, DO_IDENTITY)
280
+RVVCALL(OPIVV1, vrev8_v_h, OP_UU_H, H2, H2, bswap16)
281
+RVVCALL(OPIVV1, vrev8_v_w, OP_UU_W, H4, H4, bswap32)
282
+RVVCALL(OPIVV1, vrev8_v_d, OP_UU_D, H8, H8, bswap64)
283
+GEN_VEXT_V(vrev8_v_b, 1)
284
+GEN_VEXT_V(vrev8_v_h, 2)
285
+GEN_VEXT_V(vrev8_v_w, 4)
286
+GEN_VEXT_V(vrev8_v_d, 8)
287
+
288
+#define DO_ANDN(a, b) ((a) & ~(b))
289
+RVVCALL(OPIVV2, vandn_vv_b, OP_UUU_B, H1, H1, H1, DO_ANDN)
290
+RVVCALL(OPIVV2, vandn_vv_h, OP_UUU_H, H2, H2, H2, DO_ANDN)
291
+RVVCALL(OPIVV2, vandn_vv_w, OP_UUU_W, H4, H4, H4, DO_ANDN)
292
+RVVCALL(OPIVV2, vandn_vv_d, OP_UUU_D, H8, H8, H8, DO_ANDN)
293
+GEN_VEXT_VV(vandn_vv_b, 1)
294
+GEN_VEXT_VV(vandn_vv_h, 2)
295
+GEN_VEXT_VV(vandn_vv_w, 4)
296
+GEN_VEXT_VV(vandn_vv_d, 8)
297
+
298
+RVVCALL(OPIVX2, vandn_vx_b, OP_UUU_B, H1, H1, DO_ANDN)
299
+RVVCALL(OPIVX2, vandn_vx_h, OP_UUU_H, H2, H2, DO_ANDN)
300
+RVVCALL(OPIVX2, vandn_vx_w, OP_UUU_W, H4, H4, DO_ANDN)
301
+RVVCALL(OPIVX2, vandn_vx_d, OP_UUU_D, H8, H8, DO_ANDN)
302
+GEN_VEXT_VX(vandn_vx_b, 1)
303
+GEN_VEXT_VX(vandn_vx_h, 2)
304
+GEN_VEXT_VX(vandn_vx_w, 4)
305
+GEN_VEXT_VX(vandn_vx_d, 8)
306
+
307
+RVVCALL(OPIVV1, vbrev_v_b, OP_UU_B, H1, H1, revbit8)
308
+RVVCALL(OPIVV1, vbrev_v_h, OP_UU_H, H2, H2, revbit16)
309
+RVVCALL(OPIVV1, vbrev_v_w, OP_UU_W, H4, H4, revbit32)
310
+RVVCALL(OPIVV1, vbrev_v_d, OP_UU_D, H8, H8, revbit64)
311
+GEN_VEXT_V(vbrev_v_b, 1)
312
+GEN_VEXT_V(vbrev_v_h, 2)
313
+GEN_VEXT_V(vbrev_v_w, 4)
314
+GEN_VEXT_V(vbrev_v_d, 8)
315
+
316
+RVVCALL(OPIVV1, vclz_v_b, OP_UU_B, H1, H1, clz8)
317
+RVVCALL(OPIVV1, vclz_v_h, OP_UU_H, H2, H2, clz16)
318
+RVVCALL(OPIVV1, vclz_v_w, OP_UU_W, H4, H4, clz32)
319
+RVVCALL(OPIVV1, vclz_v_d, OP_UU_D, H8, H8, clz64)
320
+GEN_VEXT_V(vclz_v_b, 1)
321
+GEN_VEXT_V(vclz_v_h, 2)
322
+GEN_VEXT_V(vclz_v_w, 4)
323
+GEN_VEXT_V(vclz_v_d, 8)
324
+
325
+RVVCALL(OPIVV1, vctz_v_b, OP_UU_B, H1, H1, ctz8)
326
+RVVCALL(OPIVV1, vctz_v_h, OP_UU_H, H2, H2, ctz16)
327
+RVVCALL(OPIVV1, vctz_v_w, OP_UU_W, H4, H4, ctz32)
328
+RVVCALL(OPIVV1, vctz_v_d, OP_UU_D, H8, H8, ctz64)
329
+GEN_VEXT_V(vctz_v_b, 1)
330
+GEN_VEXT_V(vctz_v_h, 2)
331
+GEN_VEXT_V(vctz_v_w, 4)
332
+GEN_VEXT_V(vctz_v_d, 8)
333
+
334
+RVVCALL(OPIVV1, vcpop_v_b, OP_UU_B, H1, H1, ctpop8)
335
+RVVCALL(OPIVV1, vcpop_v_h, OP_UU_H, H2, H2, ctpop16)
336
+RVVCALL(OPIVV1, vcpop_v_w, OP_UU_W, H4, H4, ctpop32)
337
+RVVCALL(OPIVV1, vcpop_v_d, OP_UU_D, H8, H8, ctpop64)
338
+GEN_VEXT_V(vcpop_v_b, 1)
339
+GEN_VEXT_V(vcpop_v_h, 2)
340
+GEN_VEXT_V(vcpop_v_w, 4)
341
+GEN_VEXT_V(vcpop_v_d, 8)
342
+
343
+#define DO_SLL(N, M) (N << (M & (sizeof(N) * 8 - 1)))
344
+RVVCALL(OPIVV2, vwsll_vv_b, WOP_UUU_B, H2, H1, H1, DO_SLL)
345
+RVVCALL(OPIVV2, vwsll_vv_h, WOP_UUU_H, H4, H2, H2, DO_SLL)
346
+RVVCALL(OPIVV2, vwsll_vv_w, WOP_UUU_W, H8, H4, H4, DO_SLL)
347
+GEN_VEXT_VV(vwsll_vv_b, 2)
348
+GEN_VEXT_VV(vwsll_vv_h, 4)
349
+GEN_VEXT_VV(vwsll_vv_w, 8)
350
+
351
+RVVCALL(OPIVX2, vwsll_vx_b, WOP_UUU_B, H2, H1, DO_SLL)
352
+RVVCALL(OPIVX2, vwsll_vx_h, WOP_UUU_H, H4, H2, DO_SLL)
353
+RVVCALL(OPIVX2, vwsll_vx_w, WOP_UUU_W, H8, H4, DO_SLL)
354
+GEN_VEXT_VX(vwsll_vx_b, 2)
355
+GEN_VEXT_VX(vwsll_vx_h, 4)
356
+GEN_VEXT_VX(vwsll_vx_w, 8)
357
diff --git a/target/riscv/insn_trans/trans_rvvk.c.inc b/target/riscv/insn_trans/trans_rvvk.c.inc
358
index XXXXXXX..XXXXXXX 100644
359
--- a/target/riscv/insn_trans/trans_rvvk.c.inc
360
+++ b/target/riscv/insn_trans/trans_rvvk.c.inc
361
@@ -XXX,XX +XXX,XX @@ static bool vclmul_vx_check(DisasContext *s, arg_rmrr *a)
362
363
GEN_VX_MASKED_TRANS(vclmul_vx, vclmul_vx_check)
364
GEN_VX_MASKED_TRANS(vclmulh_vx, vclmul_vx_check)
365
+
366
+/*
367
+ * Zvbb
368
+ */
369
+
370
+#define GEN_OPIVI_GVEC_TRANS_CHECK(NAME, IMM_MODE, OPIVX, SUF, CHECK) \
371
+ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
372
+ { \
373
+ if (CHECK(s, a)) { \
374
+ static gen_helper_opivx *const fns[4] = { \
375
+ gen_helper_##OPIVX##_b, \
376
+ gen_helper_##OPIVX##_h, \
377
+ gen_helper_##OPIVX##_w, \
378
+ gen_helper_##OPIVX##_d, \
379
+ }; \
380
+ return do_opivi_gvec(s, a, tcg_gen_gvec_##SUF, fns[s->sew], \
381
+ IMM_MODE); \
382
+ } \
383
+ return false; \
384
+ }
385
+
386
+#define GEN_OPIVV_GVEC_TRANS_CHECK(NAME, SUF, CHECK) \
387
+ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
388
+ { \
389
+ if (CHECK(s, a)) { \
390
+ static gen_helper_gvec_4_ptr *const fns[4] = { \
391
+ gen_helper_##NAME##_b, \
392
+ gen_helper_##NAME##_h, \
393
+ gen_helper_##NAME##_w, \
394
+ gen_helper_##NAME##_d, \
395
+ }; \
396
+ return do_opivv_gvec(s, a, tcg_gen_gvec_##SUF, fns[s->sew]); \
397
+ } \
398
+ return false; \
399
+ }
400
+
401
+#define GEN_OPIVX_GVEC_SHIFT_TRANS_CHECK(NAME, SUF, CHECK) \
402
+ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
403
+ { \
404
+ if (CHECK(s, a)) { \
405
+ static gen_helper_opivx *const fns[4] = { \
406
+ gen_helper_##NAME##_b, \
407
+ gen_helper_##NAME##_h, \
408
+ gen_helper_##NAME##_w, \
409
+ gen_helper_##NAME##_d, \
410
+ }; \
411
+ return do_opivx_gvec_shift(s, a, tcg_gen_gvec_##SUF, \
412
+ fns[s->sew]); \
413
+ } \
414
+ return false; \
415
+ }
416
+
417
+static bool zvbb_vv_check(DisasContext *s, arg_rmrr *a)
137
+{
418
+{
138
+ if (env->priv == PRV_M ||
419
+ return opivv_check(s, a) && s->cfg_ptr->ext_zvbb == true;
139
+ (env->priv == PRV_S && !riscv_cpu_virt_enabled(env)) ||
140
+ (env->priv == PRV_U && !riscv_cpu_virt_enabled(env) &&
141
+ get_field(env->hstatus, HSTATUS_HU))) {
142
+ riscv_cpu_set_two_stage_lookup(env, true);
143
+
144
+ switch (memop) {
145
+ case MO_SB:
146
+ case MO_UB:
147
+ cpu_stb_data_ra(env, address, val, GETPC());
148
+ break;
149
+ case MO_TESW:
150
+ case MO_TEUW:
151
+ cpu_stw_data_ra(env, address, val, GETPC());
152
+ break;
153
+ case MO_TESL:
154
+ case MO_TEUL:
155
+ cpu_stl_data_ra(env, address, val, GETPC());
156
+ break;
157
+ case MO_TEQ:
158
+ cpu_stq_data_ra(env, address, val, GETPC());
159
+ break;
160
+ default:
161
+ g_assert_not_reached();
162
+ }
163
+
164
+ riscv_cpu_set_two_stage_lookup(env, false);
165
+
166
+ return;
167
+ }
168
+
169
+ riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
170
+}
420
+}
171
+
421
+
172
+target_ulong helper_hyp_x_load(CPURISCVState *env, target_ulong address,
422
+static bool zvbb_vx_check(DisasContext *s, arg_rmrr *a)
173
+ target_ulong attrs, target_ulong memop)
174
+{
423
+{
175
+ if (env->priv == PRV_M ||
424
+ return opivx_check(s, a) && s->cfg_ptr->ext_zvbb == true;
176
+ (env->priv == PRV_S && !riscv_cpu_virt_enabled(env)) ||
177
+ (env->priv == PRV_U && !riscv_cpu_virt_enabled(env) &&
178
+ get_field(env->hstatus, HSTATUS_HU))) {
179
+ target_ulong pte;
180
+
181
+ riscv_cpu_set_two_stage_lookup(env, true);
182
+
183
+ switch (memop) {
184
+ case MO_TEUL:
185
+ pte = cpu_ldub_data_ra(env, address, GETPC());
186
+ break;
187
+ case MO_TEUW:
188
+ pte = cpu_lduw_data_ra(env, address, GETPC());
189
+ break;
190
+ default:
191
+ g_assert_not_reached();
192
+ }
193
+
194
+ riscv_cpu_set_two_stage_lookup(env, false);
195
+
196
+ return pte;
197
+ }
198
+
199
+ riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
200
+ return 0;
201
+}
425
+}
202
+
426
+
203
#endif /* !CONFIG_USER_ONLY */
427
+/* vrol.v[vx] */
204
diff --git a/target/riscv/insn_trans/trans_rvh.c.inc b/target/riscv/insn_trans/trans_rvh.c.inc
428
+GEN_OPIVV_GVEC_TRANS_CHECK(vrol_vv, rotlv, zvbb_vv_check)
205
index XXXXXXX..XXXXXXX 100644
429
+GEN_OPIVX_GVEC_SHIFT_TRANS_CHECK(vrol_vx, rotls, zvbb_vx_check)
206
--- a/target/riscv/insn_trans/trans_rvh.c.inc
430
+
207
+++ b/target/riscv/insn_trans/trans_rvh.c.inc
431
+/* vror.v[vxi] */
208
@@ -XXX,XX +XXX,XX @@
432
+GEN_OPIVV_GVEC_TRANS_CHECK(vror_vv, rotrv, zvbb_vv_check)
209
* this program. If not, see <http://www.gnu.org/licenses/>.
433
+GEN_OPIVX_GVEC_SHIFT_TRANS_CHECK(vror_vx, rotrs, zvbb_vx_check)
210
*/
434
+GEN_OPIVI_GVEC_TRANS_CHECK(vror_vi, IMM_TRUNC_SEW, vror_vx, rotri, zvbb_vx_check)
211
435
+
212
+static bool trans_hlv_b(DisasContext *ctx, arg_hlv_b *a)
436
+#define GEN_OPIVX_GVEC_TRANS_CHECK(NAME, SUF, CHECK) \
437
+ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
438
+ { \
439
+ if (CHECK(s, a)) { \
440
+ static gen_helper_opivx *const fns[4] = { \
441
+ gen_helper_##NAME##_b, \
442
+ gen_helper_##NAME##_h, \
443
+ gen_helper_##NAME##_w, \
444
+ gen_helper_##NAME##_d, \
445
+ }; \
446
+ return do_opivx_gvec(s, a, tcg_gen_gvec_##SUF, fns[s->sew]); \
447
+ } \
448
+ return false; \
449
+ }
450
+
451
+/* vandn.v[vx] */
452
+GEN_OPIVV_GVEC_TRANS_CHECK(vandn_vv, andc, zvbb_vv_check)
453
+GEN_OPIVX_GVEC_TRANS_CHECK(vandn_vx, andcs, zvbb_vx_check)
454
+
455
+#define GEN_OPIV_TRANS(NAME, CHECK) \
456
+ static bool trans_##NAME(DisasContext *s, arg_rmr *a) \
457
+ { \
458
+ if (CHECK(s, a)) { \
459
+ uint32_t data = 0; \
460
+ static gen_helper_gvec_3_ptr *const fns[4] = { \
461
+ gen_helper_##NAME##_b, \
462
+ gen_helper_##NAME##_h, \
463
+ gen_helper_##NAME##_w, \
464
+ gen_helper_##NAME##_d, \
465
+ }; \
466
+ TCGLabel *over = gen_new_label(); \
467
+ tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
468
+ \
469
+ data = FIELD_DP32(data, VDATA, VM, a->vm); \
470
+ data = FIELD_DP32(data, VDATA, LMUL, s->lmul); \
471
+ data = FIELD_DP32(data, VDATA, VTA, s->vta); \
472
+ data = FIELD_DP32(data, VDATA, VTA_ALL_1S, s->cfg_vta_all_1s); \
473
+ data = FIELD_DP32(data, VDATA, VMA, s->vma); \
474
+ tcg_gen_gvec_3_ptr(vreg_ofs(s, a->rd), vreg_ofs(s, 0), \
475
+ vreg_ofs(s, a->rs2), cpu_env, \
476
+ s->cfg_ptr->vlen / 8, s->cfg_ptr->vlen / 8, \
477
+ data, fns[s->sew]); \
478
+ mark_vs_dirty(s); \
479
+ gen_set_label(over); \
480
+ return true; \
481
+ } \
482
+ return false; \
483
+ }
484
+
485
+static bool zvbb_opiv_check(DisasContext *s, arg_rmr *a)
213
+{
486
+{
214
+ REQUIRE_EXT(ctx, RVH);
487
+ return s->cfg_ptr->ext_zvbb == true &&
215
+#ifndef CONFIG_USER_ONLY
488
+ require_rvv(s) &&
216
+ TCGv t0 = tcg_temp_new();
489
+ vext_check_isa_ill(s) &&
217
+ TCGv t1 = tcg_temp_new();
490
+ vext_check_ss(s, a->rd, a->rs2, a->vm);
218
+ TCGv mem_idx = tcg_temp_new();
219
+ TCGv memop = tcg_temp_new();
220
+
221
+ gen_get_gpr(t0, a->rs1);
222
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
223
+ tcg_gen_movi_tl(memop, MO_SB);
224
+
225
+ gen_helper_hyp_load(t1, cpu_env, t0, mem_idx, memop);
226
+ gen_set_gpr(a->rd, t1);
227
+
228
+ tcg_temp_free(t0);
229
+ tcg_temp_free(t1);
230
+ tcg_temp_free(mem_idx);
231
+ tcg_temp_free(memop);
232
+ return true;
233
+#else
234
+ return false;
235
+#endif
236
+}
491
+}
237
+
492
+
238
+static bool trans_hlv_h(DisasContext *ctx, arg_hlv_h *a)
493
+GEN_OPIV_TRANS(vbrev8_v, zvbb_opiv_check)
494
+GEN_OPIV_TRANS(vrev8_v, zvbb_opiv_check)
495
+GEN_OPIV_TRANS(vbrev_v, zvbb_opiv_check)
496
+GEN_OPIV_TRANS(vclz_v, zvbb_opiv_check)
497
+GEN_OPIV_TRANS(vctz_v, zvbb_opiv_check)
498
+GEN_OPIV_TRANS(vcpop_v, zvbb_opiv_check)
499
+
500
+static bool vwsll_vv_check(DisasContext *s, arg_rmrr *a)
239
+{
501
+{
240
+ REQUIRE_EXT(ctx, RVH);
502
+ return s->cfg_ptr->ext_zvbb && opivv_widen_check(s, a);
241
+#ifndef CONFIG_USER_ONLY
242
+ TCGv t0 = tcg_temp_new();
243
+ TCGv t1 = tcg_temp_new();
244
+ TCGv mem_idx = tcg_temp_new();
245
+ TCGv memop = tcg_temp_new();
246
+
247
+ gen_get_gpr(t0, a->rs1);
248
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
249
+ tcg_gen_movi_tl(memop, MO_TESW);
250
+
251
+ gen_helper_hyp_load(t1, cpu_env, t0, mem_idx, memop);
252
+ gen_set_gpr(a->rd, t1);
253
+
254
+ tcg_temp_free(t0);
255
+ tcg_temp_free(t1);
256
+ tcg_temp_free(mem_idx);
257
+ tcg_temp_free(memop);
258
+ return true;
259
+#else
260
+ return false;
261
+#endif
262
+}
503
+}
263
+
504
+
264
+static bool trans_hlv_w(DisasContext *ctx, arg_hlv_w *a)
505
+static bool vwsll_vx_check(DisasContext *s, arg_rmrr *a)
265
+{
506
+{
266
+ REQUIRE_EXT(ctx, RVH);
507
+ return s->cfg_ptr->ext_zvbb && opivx_widen_check(s, a);
267
+#ifndef CONFIG_USER_ONLY
268
+ TCGv t0 = tcg_temp_new();
269
+ TCGv t1 = tcg_temp_new();
270
+ TCGv mem_idx = tcg_temp_new();
271
+ TCGv memop = tcg_temp_new();
272
+
273
+ gen_get_gpr(t0, a->rs1);
274
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
275
+ tcg_gen_movi_tl(memop, MO_TESL);
276
+
277
+ gen_helper_hyp_load(t1, cpu_env, t0, mem_idx, memop);
278
+ gen_set_gpr(a->rd, t1);
279
+
280
+ tcg_temp_free(t0);
281
+ tcg_temp_free(t1);
282
+ tcg_temp_free(mem_idx);
283
+ tcg_temp_free(memop);
284
+ return true;
285
+#else
286
+ return false;
287
+#endif
288
+}
508
+}
289
+
509
+
290
+static bool trans_hlv_bu(DisasContext *ctx, arg_hlv_bu *a)
510
+/* OPIVI without GVEC IR */
291
+{
511
+#define GEN_OPIVI_WIDEN_TRANS(NAME, IMM_MODE, OPIVX, CHECK) \
292
+ REQUIRE_EXT(ctx, RVH);
512
+ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
293
+#ifndef CONFIG_USER_ONLY
513
+ { \
294
+ TCGv t0 = tcg_temp_new();
514
+ if (CHECK(s, a)) { \
295
+ TCGv t1 = tcg_temp_new();
515
+ static gen_helper_opivx *const fns[3] = { \
296
+ TCGv mem_idx = tcg_temp_new();
516
+ gen_helper_##OPIVX##_b, \
297
+ TCGv memop = tcg_temp_new();
517
+ gen_helper_##OPIVX##_h, \
298
+
518
+ gen_helper_##OPIVX##_w, \
299
+ gen_get_gpr(t0, a->rs1);
519
+ }; \
300
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
520
+ return opivi_trans(a->rd, a->rs1, a->rs2, a->vm, fns[s->sew], s, \
301
+ tcg_gen_movi_tl(memop, MO_UB);
521
+ IMM_MODE); \
302
+
522
+ } \
303
+ gen_helper_hyp_load(t1, cpu_env, t0, mem_idx, memop);
523
+ return false; \
304
+ gen_set_gpr(a->rd, t1);
524
+ }
305
+
525
+
306
+ tcg_temp_free(t0);
526
+GEN_OPIVV_WIDEN_TRANS(vwsll_vv, vwsll_vv_check)
307
+ tcg_temp_free(t1);
527
+GEN_OPIVX_WIDEN_TRANS(vwsll_vx, vwsll_vx_check)
308
+ tcg_temp_free(mem_idx);
528
+GEN_OPIVI_WIDEN_TRANS(vwsll_vi, IMM_ZX, vwsll_vx, vwsll_vx_check)
309
+ tcg_temp_free(memop);
310
+ return true;
311
+#else
312
+ return false;
313
+#endif
314
+}
315
+
316
+static bool trans_hlv_hu(DisasContext *ctx, arg_hlv_hu *a)
317
+{
318
+ REQUIRE_EXT(ctx, RVH);
319
+#ifndef CONFIG_USER_ONLY
320
+ TCGv t0 = tcg_temp_new();
321
+ TCGv t1 = tcg_temp_new();
322
+ TCGv mem_idx = tcg_temp_new();
323
+ TCGv memop = tcg_temp_new();
324
+
325
+ gen_get_gpr(t0, a->rs1);
326
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
327
+ tcg_gen_movi_tl(memop, MO_TEUW);
328
+
329
+ gen_helper_hyp_load(t1, cpu_env, t0, mem_idx, memop);
330
+ gen_set_gpr(a->rd, t1);
331
+
332
+ tcg_temp_free(t0);
333
+ tcg_temp_free(t1);
334
+ tcg_temp_free(mem_idx);
335
+ tcg_temp_free(memop);
336
+ return true;
337
+#else
338
+ return false;
339
+#endif
340
+}
341
+
342
+static bool trans_hsv_b(DisasContext *ctx, arg_hsv_b *a)
343
+{
344
+ REQUIRE_EXT(ctx, RVH);
345
+#ifndef CONFIG_USER_ONLY
346
+ TCGv t0 = tcg_temp_new();
347
+ TCGv dat = tcg_temp_new();
348
+ TCGv mem_idx = tcg_temp_new();
349
+ TCGv memop = tcg_temp_new();
350
+
351
+ gen_get_gpr(t0, a->rs1);
352
+ gen_get_gpr(dat, a->rs2);
353
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
354
+ tcg_gen_movi_tl(memop, MO_SB);
355
+
356
+ gen_helper_hyp_store(cpu_env, t0, dat, mem_idx, memop);
357
+
358
+ tcg_temp_free(t0);
359
+ tcg_temp_free(dat);
360
+ tcg_temp_free(mem_idx);
361
+ tcg_temp_free(memop);
362
+ return true;
363
+#else
364
+ return false;
365
+#endif
366
+}
367
+
368
+static bool trans_hsv_h(DisasContext *ctx, arg_hsv_h *a)
369
+{
370
+ REQUIRE_EXT(ctx, RVH);
371
+#ifndef CONFIG_USER_ONLY
372
+ TCGv t0 = tcg_temp_new();
373
+ TCGv dat = tcg_temp_new();
374
+ TCGv mem_idx = tcg_temp_new();
375
+ TCGv memop = tcg_temp_new();
376
+
377
+ gen_get_gpr(t0, a->rs1);
378
+ gen_get_gpr(dat, a->rs2);
379
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
380
+ tcg_gen_movi_tl(memop, MO_TESW);
381
+
382
+ gen_helper_hyp_store(cpu_env, t0, dat, mem_idx, memop);
383
+
384
+ tcg_temp_free(t0);
385
+ tcg_temp_free(dat);
386
+ tcg_temp_free(mem_idx);
387
+ tcg_temp_free(memop);
388
+ return true;
389
+#else
390
+ return false;
391
+#endif
392
+}
393
+
394
+static bool trans_hsv_w(DisasContext *ctx, arg_hsv_w *a)
395
+{
396
+ REQUIRE_EXT(ctx, RVH);
397
+#ifndef CONFIG_USER_ONLY
398
+ TCGv t0 = tcg_temp_new();
399
+ TCGv dat = tcg_temp_new();
400
+ TCGv mem_idx = tcg_temp_new();
401
+ TCGv memop = tcg_temp_new();
402
+
403
+ gen_get_gpr(t0, a->rs1);
404
+ gen_get_gpr(dat, a->rs2);
405
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
406
+ tcg_gen_movi_tl(memop, MO_TESL);
407
+
408
+ gen_helper_hyp_store(cpu_env, t0, dat, mem_idx, memop);
409
+
410
+ tcg_temp_free(t0);
411
+ tcg_temp_free(dat);
412
+ tcg_temp_free(mem_idx);
413
+ tcg_temp_free(memop);
414
+ return true;
415
+#else
416
+ return false;
417
+#endif
418
+}
419
+
420
+#ifdef TARGET_RISCV64
421
+static bool trans_hlv_wu(DisasContext *ctx, arg_hlv_wu *a)
422
+{
423
+ REQUIRE_EXT(ctx, RVH);
424
+#ifndef CONFIG_USER_ONLY
425
+ TCGv t0 = tcg_temp_new();
426
+ TCGv t1 = tcg_temp_new();
427
+ TCGv mem_idx = tcg_temp_new();
428
+ TCGv memop = tcg_temp_new();
429
+
430
+ gen_get_gpr(t0, a->rs1);
431
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
432
+ tcg_gen_movi_tl(memop, MO_TEUL);
433
+
434
+ gen_helper_hyp_load(t1, cpu_env, t0, mem_idx, memop);
435
+ gen_set_gpr(a->rd, t1);
436
+
437
+ tcg_temp_free(t0);
438
+ tcg_temp_free(t1);
439
+ tcg_temp_free(mem_idx);
440
+ tcg_temp_free(memop);
441
+ return true;
442
+#else
443
+ return false;
444
+#endif
445
+}
446
+
447
+static bool trans_hlv_d(DisasContext *ctx, arg_hlv_d *a)
448
+{
449
+ REQUIRE_EXT(ctx, RVH);
450
+#ifndef CONFIG_USER_ONLY
451
+ TCGv t0 = tcg_temp_new();
452
+ TCGv t1 = tcg_temp_new();
453
+ TCGv mem_idx = tcg_temp_new();
454
+ TCGv memop = tcg_temp_new();
455
+
456
+ gen_get_gpr(t0, a->rs1);
457
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
458
+ tcg_gen_movi_tl(memop, MO_TEQ);
459
+
460
+ gen_helper_hyp_load(t1, cpu_env, t0, mem_idx, memop);
461
+ gen_set_gpr(a->rd, t1);
462
+
463
+ tcg_temp_free(t0);
464
+ tcg_temp_free(t1);
465
+ tcg_temp_free(mem_idx);
466
+ tcg_temp_free(memop);
467
+ return true;
468
+#else
469
+ return false;
470
+#endif
471
+}
472
+
473
+static bool trans_hsv_d(DisasContext *ctx, arg_hsv_d *a)
474
+{
475
+ REQUIRE_EXT(ctx, RVH);
476
+#ifndef CONFIG_USER_ONLY
477
+ TCGv t0 = tcg_temp_new();
478
+ TCGv dat = tcg_temp_new();
479
+ TCGv mem_idx = tcg_temp_new();
480
+ TCGv memop = tcg_temp_new();
481
+
482
+ gen_get_gpr(t0, a->rs1);
483
+ gen_get_gpr(dat, a->rs2);
484
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
485
+ tcg_gen_movi_tl(memop, MO_TEQ);
486
+
487
+ gen_helper_hyp_store(cpu_env, t0, dat, mem_idx, memop);
488
+
489
+ tcg_temp_free(t0);
490
+ tcg_temp_free(dat);
491
+ tcg_temp_free(mem_idx);
492
+ tcg_temp_free(memop);
493
+ return true;
494
+#else
495
+ return false;
496
+#endif
497
+}
498
+#endif
499
+
500
+static bool trans_hlvx_hu(DisasContext *ctx, arg_hlvx_hu *a)
501
+{
502
+ REQUIRE_EXT(ctx, RVH);
503
+#ifndef CONFIG_USER_ONLY
504
+ TCGv t0 = tcg_temp_new();
505
+ TCGv t1 = tcg_temp_new();
506
+ TCGv mem_idx = tcg_temp_new();
507
+ TCGv memop = tcg_temp_new();
508
+
509
+ gen_get_gpr(t0, a->rs1);
510
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
511
+ tcg_gen_movi_tl(memop, MO_TEUW);
512
+
513
+ gen_helper_hyp_x_load(t1, cpu_env, t0, mem_idx, memop);
514
+ gen_set_gpr(a->rd, t1);
515
+
516
+ tcg_temp_free(t0);
517
+ tcg_temp_free(t1);
518
+ tcg_temp_free(mem_idx);
519
+ tcg_temp_free(memop);
520
+ return true;
521
+#else
522
+ return false;
523
+#endif
524
+}
525
+
526
+static bool trans_hlvx_wu(DisasContext *ctx, arg_hlvx_wu *a)
527
+{
528
+ REQUIRE_EXT(ctx, RVH);
529
+#ifndef CONFIG_USER_ONLY
530
+ TCGv t0 = tcg_temp_new();
531
+ TCGv t1 = tcg_temp_new();
532
+ TCGv mem_idx = tcg_temp_new();
533
+ TCGv memop = tcg_temp_new();
534
+
535
+ gen_get_gpr(t0, a->rs1);
536
+ tcg_gen_movi_tl(mem_idx, ctx->mem_idx);
537
+ tcg_gen_movi_tl(memop, MO_TEUL);
538
+
539
+ gen_helper_hyp_x_load(t1, cpu_env, t0, mem_idx, memop);
540
+ gen_set_gpr(a->rd, t1);
541
+
542
+ tcg_temp_free(t0);
543
+ tcg_temp_free(t1);
544
+ tcg_temp_free(mem_idx);
545
+ tcg_temp_free(memop);
546
+ return true;
547
+#else
548
+ return false;
549
+#endif
550
+}
551
+
552
static bool trans_hfence_gvma(DisasContext *ctx, arg_sfence_vma *a)
553
{
554
REQUIRE_EXT(ctx, RVH);
555
--
529
--
556
2.28.0
530
2.41.0
557
558
diff view generated by jsdifflib
New patch
1
From: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
1
2
3
This commit adds support for the Zvkned vector-crypto extension, which
4
consists of the following instructions:
5
6
* vaesef.[vv,vs]
7
* vaesdf.[vv,vs]
8
* vaesdm.[vv,vs]
9
* vaesz.vs
10
* vaesem.[vv,vs]
11
* vaeskf1.vi
12
* vaeskf2.vi
13
14
Translation functions are defined in
15
`target/riscv/insn_trans/trans_rvvk.c.inc` and helpers are defined in
16
`target/riscv/vcrypto_helper.c`.
17
18
Co-authored-by: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
19
Co-authored-by: William Salmon <will.salmon@codethink.co.uk>
20
[max.chou@sifive.com: Replaced vstart checking by TCG op]
21
Signed-off-by: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
22
Signed-off-by: William Salmon <will.salmon@codethink.co.uk>
23
Signed-off-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
24
Signed-off-by: Max Chou <max.chou@sifive.com>
25
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
26
[max.chou@sifive.com: Imported aes-round.h and exposed x-zvkned
27
property]
28
[max.chou@sifive.com: Fixed endian issues and replaced the vstart & vl
29
egs checking by helper function]
30
[max.chou@sifive.com: Replaced bswap32 calls in aes key expanding]
31
Message-ID: <20230711165917.2629866-10-max.chou@sifive.com>
32
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
33
---
34
target/riscv/cpu_cfg.h | 1 +
35
target/riscv/helper.h | 14 ++
36
target/riscv/insn32.decode | 14 ++
37
target/riscv/cpu.c | 4 +-
38
target/riscv/vcrypto_helper.c | 202 +++++++++++++++++++++++
39
target/riscv/insn_trans/trans_rvvk.c.inc | 147 +++++++++++++++++
40
6 files changed, 381 insertions(+), 1 deletion(-)
41
42
diff --git a/target/riscv/cpu_cfg.h b/target/riscv/cpu_cfg.h
43
index XXXXXXX..XXXXXXX 100644
44
--- a/target/riscv/cpu_cfg.h
45
+++ b/target/riscv/cpu_cfg.h
46
@@ -XXX,XX +XXX,XX @@ struct RISCVCPUConfig {
47
bool ext_zve64d;
48
bool ext_zvbb;
49
bool ext_zvbc;
50
+ bool ext_zvkned;
51
bool ext_zmmul;
52
bool ext_zvfbfmin;
53
bool ext_zvfbfwma;
54
diff --git a/target/riscv/helper.h b/target/riscv/helper.h
55
index XXXXXXX..XXXXXXX 100644
56
--- a/target/riscv/helper.h
57
+++ b/target/riscv/helper.h
58
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_6(vandn_vx_b, void, ptr, ptr, tl, ptr, env, i32)
59
DEF_HELPER_6(vandn_vx_h, void, ptr, ptr, tl, ptr, env, i32)
60
DEF_HELPER_6(vandn_vx_w, void, ptr, ptr, tl, ptr, env, i32)
61
DEF_HELPER_6(vandn_vx_d, void, ptr, ptr, tl, ptr, env, i32)
62
+
63
+DEF_HELPER_2(egs_check, void, i32, env)
64
+
65
+DEF_HELPER_4(vaesef_vv, void, ptr, ptr, env, i32)
66
+DEF_HELPER_4(vaesef_vs, void, ptr, ptr, env, i32)
67
+DEF_HELPER_4(vaesdf_vv, void, ptr, ptr, env, i32)
68
+DEF_HELPER_4(vaesdf_vs, void, ptr, ptr, env, i32)
69
+DEF_HELPER_4(vaesem_vv, void, ptr, ptr, env, i32)
70
+DEF_HELPER_4(vaesem_vs, void, ptr, ptr, env, i32)
71
+DEF_HELPER_4(vaesdm_vv, void, ptr, ptr, env, i32)
72
+DEF_HELPER_4(vaesdm_vs, void, ptr, ptr, env, i32)
73
+DEF_HELPER_4(vaesz_vs, void, ptr, ptr, env, i32)
74
+DEF_HELPER_5(vaeskf1_vi, void, ptr, ptr, i32, env, i32)
75
+DEF_HELPER_5(vaeskf2_vi, void, ptr, ptr, i32, env, i32)
76
diff --git a/target/riscv/insn32.decode b/target/riscv/insn32.decode
77
index XXXXXXX..XXXXXXX 100644
78
--- a/target/riscv/insn32.decode
79
+++ b/target/riscv/insn32.decode
80
@@ -XXX,XX +XXX,XX @@
81
@r_rm ....... ..... ..... ... ..... ....... %rs2 %rs1 %rm %rd
82
@r2_rm ....... ..... ..... ... ..... ....... %rs1 %rm %rd
83
@r2 ....... ..... ..... ... ..... ....... &r2 %rs1 %rd
84
+@r2_vm_1 ...... . ..... ..... ... ..... ....... &rmr vm=1 %rs2 %rd
85
@r2_nfvm ... ... vm:1 ..... ..... ... ..... ....... &r2nfvm %nf %rs1 %rd
86
@r2_vm ...... vm:1 ..... ..... ... ..... ....... &rmr %rs2 %rd
87
@r1_vm ...... vm:1 ..... ..... ... ..... ....... %rd
88
@@ -XXX,XX +XXX,XX @@ vcpop_v 010010 . ..... 01110 010 ..... 1010111 @r2_vm
89
vwsll_vv 110101 . ..... ..... 000 ..... 1010111 @r_vm
90
vwsll_vx 110101 . ..... ..... 100 ..... 1010111 @r_vm
91
vwsll_vi 110101 . ..... ..... 011 ..... 1010111 @r_vm
92
+
93
+# *** Zvkned vector crypto extension ***
94
+vaesef_vv 101000 1 ..... 00011 010 ..... 1110111 @r2_vm_1
95
+vaesef_vs 101001 1 ..... 00011 010 ..... 1110111 @r2_vm_1
96
+vaesdf_vv 101000 1 ..... 00001 010 ..... 1110111 @r2_vm_1
97
+vaesdf_vs 101001 1 ..... 00001 010 ..... 1110111 @r2_vm_1
98
+vaesem_vv 101000 1 ..... 00010 010 ..... 1110111 @r2_vm_1
99
+vaesem_vs 101001 1 ..... 00010 010 ..... 1110111 @r2_vm_1
100
+vaesdm_vv 101000 1 ..... 00000 010 ..... 1110111 @r2_vm_1
101
+vaesdm_vs 101001 1 ..... 00000 010 ..... 1110111 @r2_vm_1
102
+vaesz_vs 101001 1 ..... 00111 010 ..... 1110111 @r2_vm_1
103
+vaeskf1_vi 100010 1 ..... ..... 010 ..... 1110111 @r_vm_1
104
+vaeskf2_vi 101010 1 ..... ..... 010 ..... 1110111 @r_vm_1
105
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
106
index XXXXXXX..XXXXXXX 100644
107
--- a/target/riscv/cpu.c
108
+++ b/target/riscv/cpu.c
109
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
110
ISA_EXT_DATA_ENTRY(zvfbfwma, PRIV_VERSION_1_12_0, ext_zvfbfwma),
111
ISA_EXT_DATA_ENTRY(zvfh, PRIV_VERSION_1_12_0, ext_zvfh),
112
ISA_EXT_DATA_ENTRY(zvfhmin, PRIV_VERSION_1_12_0, ext_zvfhmin),
113
+ ISA_EXT_DATA_ENTRY(zvkned, PRIV_VERSION_1_12_0, ext_zvkned),
114
ISA_EXT_DATA_ENTRY(zhinx, PRIV_VERSION_1_12_0, ext_zhinx),
115
ISA_EXT_DATA_ENTRY(zhinxmin, PRIV_VERSION_1_12_0, ext_zhinxmin),
116
ISA_EXT_DATA_ENTRY(smaia, PRIV_VERSION_1_12_0, ext_smaia),
117
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_validate_set_extensions(RISCVCPU *cpu, Error **errp)
118
* In principle Zve*x would also suffice here, were they supported
119
* in qemu
120
*/
121
- if (cpu->cfg.ext_zvbb && !cpu->cfg.ext_zve32f) {
122
+ if ((cpu->cfg.ext_zvbb || cpu->cfg.ext_zvkned) && !cpu->cfg.ext_zve32f) {
123
error_setg(errp,
124
"Vector crypto extensions require V or Zve* extensions");
125
return;
126
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
127
/* Vector cryptography extensions */
128
DEFINE_PROP_BOOL("x-zvbb", RISCVCPU, cfg.ext_zvbb, false),
129
DEFINE_PROP_BOOL("x-zvbc", RISCVCPU, cfg.ext_zvbc, false),
130
+ DEFINE_PROP_BOOL("x-zvkned", RISCVCPU, cfg.ext_zvkned, false),
131
132
DEFINE_PROP_END_OF_LIST(),
133
};
134
diff --git a/target/riscv/vcrypto_helper.c b/target/riscv/vcrypto_helper.c
135
index XXXXXXX..XXXXXXX 100644
136
--- a/target/riscv/vcrypto_helper.c
137
+++ b/target/riscv/vcrypto_helper.c
138
@@ -XXX,XX +XXX,XX @@
139
#include "qemu/bitops.h"
140
#include "qemu/bswap.h"
141
#include "cpu.h"
142
+#include "crypto/aes.h"
143
+#include "crypto/aes-round.h"
144
#include "exec/memop.h"
145
#include "exec/exec-all.h"
146
#include "exec/helper-proto.h"
147
@@ -XXX,XX +XXX,XX @@ RVVCALL(OPIVX2, vwsll_vx_w, WOP_UUU_W, H8, H4, DO_SLL)
148
GEN_VEXT_VX(vwsll_vx_b, 2)
149
GEN_VEXT_VX(vwsll_vx_h, 4)
150
GEN_VEXT_VX(vwsll_vx_w, 8)
151
+
152
+void HELPER(egs_check)(uint32_t egs, CPURISCVState *env)
153
+{
154
+ uint32_t vl = env->vl;
155
+ uint32_t vstart = env->vstart;
156
+
157
+ if (vl % egs != 0 || vstart % egs != 0) {
158
+ riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
159
+ }
160
+}
161
+
162
+static inline void xor_round_key(AESState *round_state, AESState *round_key)
163
+{
164
+ round_state->v = round_state->v ^ round_key->v;
165
+}
166
+
167
+#define GEN_ZVKNED_HELPER_VV(NAME, ...) \
168
+ void HELPER(NAME)(void *vd, void *vs2, CPURISCVState *env, \
169
+ uint32_t desc) \
170
+ { \
171
+ uint32_t vl = env->vl; \
172
+ uint32_t total_elems = vext_get_total_elems(env, desc, 4); \
173
+ uint32_t vta = vext_vta(desc); \
174
+ \
175
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) { \
176
+ AESState round_key; \
177
+ round_key.d[0] = *((uint64_t *)vs2 + H8(i * 2 + 0)); \
178
+ round_key.d[1] = *((uint64_t *)vs2 + H8(i * 2 + 1)); \
179
+ AESState round_state; \
180
+ round_state.d[0] = *((uint64_t *)vd + H8(i * 2 + 0)); \
181
+ round_state.d[1] = *((uint64_t *)vd + H8(i * 2 + 1)); \
182
+ __VA_ARGS__; \
183
+ *((uint64_t *)vd + H8(i * 2 + 0)) = round_state.d[0]; \
184
+ *((uint64_t *)vd + H8(i * 2 + 1)) = round_state.d[1]; \
185
+ } \
186
+ env->vstart = 0; \
187
+ /* set tail elements to 1s */ \
188
+ vext_set_elems_1s(vd, vta, vl * 4, total_elems * 4); \
189
+ }
190
+
191
+#define GEN_ZVKNED_HELPER_VS(NAME, ...) \
192
+ void HELPER(NAME)(void *vd, void *vs2, CPURISCVState *env, \
193
+ uint32_t desc) \
194
+ { \
195
+ uint32_t vl = env->vl; \
196
+ uint32_t total_elems = vext_get_total_elems(env, desc, 4); \
197
+ uint32_t vta = vext_vta(desc); \
198
+ \
199
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) { \
200
+ AESState round_key; \
201
+ round_key.d[0] = *((uint64_t *)vs2 + H8(0)); \
202
+ round_key.d[1] = *((uint64_t *)vs2 + H8(1)); \
203
+ AESState round_state; \
204
+ round_state.d[0] = *((uint64_t *)vd + H8(i * 2 + 0)); \
205
+ round_state.d[1] = *((uint64_t *)vd + H8(i * 2 + 1)); \
206
+ __VA_ARGS__; \
207
+ *((uint64_t *)vd + H8(i * 2 + 0)) = round_state.d[0]; \
208
+ *((uint64_t *)vd + H8(i * 2 + 1)) = round_state.d[1]; \
209
+ } \
210
+ env->vstart = 0; \
211
+ /* set tail elements to 1s */ \
212
+ vext_set_elems_1s(vd, vta, vl * 4, total_elems * 4); \
213
+ }
214
+
215
+GEN_ZVKNED_HELPER_VV(vaesef_vv, aesenc_SB_SR_AK(&round_state,
216
+ &round_state,
217
+ &round_key,
218
+ false);)
219
+GEN_ZVKNED_HELPER_VS(vaesef_vs, aesenc_SB_SR_AK(&round_state,
220
+ &round_state,
221
+ &round_key,
222
+ false);)
223
+GEN_ZVKNED_HELPER_VV(vaesdf_vv, aesdec_ISB_ISR_AK(&round_state,
224
+ &round_state,
225
+ &round_key,
226
+ false);)
227
+GEN_ZVKNED_HELPER_VS(vaesdf_vs, aesdec_ISB_ISR_AK(&round_state,
228
+ &round_state,
229
+ &round_key,
230
+ false);)
231
+GEN_ZVKNED_HELPER_VV(vaesem_vv, aesenc_SB_SR_MC_AK(&round_state,
232
+ &round_state,
233
+ &round_key,
234
+ false);)
235
+GEN_ZVKNED_HELPER_VS(vaesem_vs, aesenc_SB_SR_MC_AK(&round_state,
236
+ &round_state,
237
+ &round_key,
238
+ false);)
239
+GEN_ZVKNED_HELPER_VV(vaesdm_vv, aesdec_ISB_ISR_AK_IMC(&round_state,
240
+ &round_state,
241
+ &round_key,
242
+ false);)
243
+GEN_ZVKNED_HELPER_VS(vaesdm_vs, aesdec_ISB_ISR_AK_IMC(&round_state,
244
+ &round_state,
245
+ &round_key,
246
+ false);)
247
+GEN_ZVKNED_HELPER_VS(vaesz_vs, xor_round_key(&round_state, &round_key);)
248
+
249
+void HELPER(vaeskf1_vi)(void *vd_vptr, void *vs2_vptr, uint32_t uimm,
250
+ CPURISCVState *env, uint32_t desc)
251
+{
252
+ uint32_t *vd = vd_vptr;
253
+ uint32_t *vs2 = vs2_vptr;
254
+ uint32_t vl = env->vl;
255
+ uint32_t total_elems = vext_get_total_elems(env, desc, 4);
256
+ uint32_t vta = vext_vta(desc);
257
+
258
+ uimm &= 0b1111;
259
+ if (uimm > 10 || uimm == 0) {
260
+ uimm ^= 0b1000;
261
+ }
262
+
263
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) {
264
+ uint32_t rk[8], tmp;
265
+ static const uint32_t rcon[] = {
266
+ 0x00000001, 0x00000002, 0x00000004, 0x00000008, 0x00000010,
267
+ 0x00000020, 0x00000040, 0x00000080, 0x0000001B, 0x00000036,
268
+ };
269
+
270
+ rk[0] = vs2[i * 4 + H4(0)];
271
+ rk[1] = vs2[i * 4 + H4(1)];
272
+ rk[2] = vs2[i * 4 + H4(2)];
273
+ rk[3] = vs2[i * 4 + H4(3)];
274
+ tmp = ror32(rk[3], 8);
275
+
276
+ rk[4] = rk[0] ^ (((uint32_t)AES_sbox[(tmp >> 24) & 0xff] << 24) |
277
+ ((uint32_t)AES_sbox[(tmp >> 16) & 0xff] << 16) |
278
+ ((uint32_t)AES_sbox[(tmp >> 8) & 0xff] << 8) |
279
+ ((uint32_t)AES_sbox[(tmp >> 0) & 0xff] << 0))
280
+ ^ rcon[uimm - 1];
281
+ rk[5] = rk[1] ^ rk[4];
282
+ rk[6] = rk[2] ^ rk[5];
283
+ rk[7] = rk[3] ^ rk[6];
284
+
285
+ vd[i * 4 + H4(0)] = rk[4];
286
+ vd[i * 4 + H4(1)] = rk[5];
287
+ vd[i * 4 + H4(2)] = rk[6];
288
+ vd[i * 4 + H4(3)] = rk[7];
289
+ }
290
+ env->vstart = 0;
291
+ /* set tail elements to 1s */
292
+ vext_set_elems_1s(vd, vta, vl * 4, total_elems * 4);
293
+}
294
+
295
+void HELPER(vaeskf2_vi)(void *vd_vptr, void *vs2_vptr, uint32_t uimm,
296
+ CPURISCVState *env, uint32_t desc)
297
+{
298
+ uint32_t *vd = vd_vptr;
299
+ uint32_t *vs2 = vs2_vptr;
300
+ uint32_t vl = env->vl;
301
+ uint32_t total_elems = vext_get_total_elems(env, desc, 4);
302
+ uint32_t vta = vext_vta(desc);
303
+
304
+ uimm &= 0b1111;
305
+ if (uimm > 14 || uimm < 2) {
306
+ uimm ^= 0b1000;
307
+ }
308
+
309
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) {
310
+ uint32_t rk[12], tmp;
311
+ static const uint32_t rcon[] = {
312
+ 0x00000001, 0x00000002, 0x00000004, 0x00000008, 0x00000010,
313
+ 0x00000020, 0x00000040, 0x00000080, 0x0000001B, 0x00000036,
314
+ };
315
+
316
+ rk[0] = vd[i * 4 + H4(0)];
317
+ rk[1] = vd[i * 4 + H4(1)];
318
+ rk[2] = vd[i * 4 + H4(2)];
319
+ rk[3] = vd[i * 4 + H4(3)];
320
+ rk[4] = vs2[i * 4 + H4(0)];
321
+ rk[5] = vs2[i * 4 + H4(1)];
322
+ rk[6] = vs2[i * 4 + H4(2)];
323
+ rk[7] = vs2[i * 4 + H4(3)];
324
+
325
+ if (uimm % 2 == 0) {
326
+ tmp = ror32(rk[7], 8);
327
+ rk[8] = rk[0] ^ (((uint32_t)AES_sbox[(tmp >> 24) & 0xff] << 24) |
328
+ ((uint32_t)AES_sbox[(tmp >> 16) & 0xff] << 16) |
329
+ ((uint32_t)AES_sbox[(tmp >> 8) & 0xff] << 8) |
330
+ ((uint32_t)AES_sbox[(tmp >> 0) & 0xff] << 0))
331
+ ^ rcon[(uimm - 1) / 2];
332
+ } else {
333
+ rk[8] = rk[0] ^ (((uint32_t)AES_sbox[(rk[7] >> 24) & 0xff] << 24) |
334
+ ((uint32_t)AES_sbox[(rk[7] >> 16) & 0xff] << 16) |
335
+ ((uint32_t)AES_sbox[(rk[7] >> 8) & 0xff] << 8) |
336
+ ((uint32_t)AES_sbox[(rk[7] >> 0) & 0xff] << 0));
337
+ }
338
+ rk[9] = rk[1] ^ rk[8];
339
+ rk[10] = rk[2] ^ rk[9];
340
+ rk[11] = rk[3] ^ rk[10];
341
+
342
+ vd[i * 4 + H4(0)] = rk[8];
343
+ vd[i * 4 + H4(1)] = rk[9];
344
+ vd[i * 4 + H4(2)] = rk[10];
345
+ vd[i * 4 + H4(3)] = rk[11];
346
+ }
347
+ env->vstart = 0;
348
+ /* set tail elements to 1s */
349
+ vext_set_elems_1s(vd, vta, vl * 4, total_elems * 4);
350
+}
351
diff --git a/target/riscv/insn_trans/trans_rvvk.c.inc b/target/riscv/insn_trans/trans_rvvk.c.inc
352
index XXXXXXX..XXXXXXX 100644
353
--- a/target/riscv/insn_trans/trans_rvvk.c.inc
354
+++ b/target/riscv/insn_trans/trans_rvvk.c.inc
355
@@ -XXX,XX +XXX,XX @@ static bool vwsll_vx_check(DisasContext *s, arg_rmrr *a)
356
GEN_OPIVV_WIDEN_TRANS(vwsll_vv, vwsll_vv_check)
357
GEN_OPIVX_WIDEN_TRANS(vwsll_vx, vwsll_vx_check)
358
GEN_OPIVI_WIDEN_TRANS(vwsll_vi, IMM_ZX, vwsll_vx, vwsll_vx_check)
359
+
360
+/*
361
+ * Zvkned
362
+ */
363
+
364
+#define ZVKNED_EGS 4
365
+
366
+#define GEN_V_UNMASKED_TRANS(NAME, CHECK, EGS) \
367
+ static bool trans_##NAME(DisasContext *s, arg_##NAME *a) \
368
+ { \
369
+ if (CHECK(s, a)) { \
370
+ TCGv_ptr rd_v, rs2_v; \
371
+ TCGv_i32 desc, egs; \
372
+ uint32_t data = 0; \
373
+ TCGLabel *over = gen_new_label(); \
374
+ \
375
+ if (!s->vstart_eq_zero || !s->vl_eq_vlmax) { \
376
+ /* save opcode for unwinding in case we throw an exception */ \
377
+ decode_save_opc(s); \
378
+ egs = tcg_constant_i32(EGS); \
379
+ gen_helper_egs_check(egs, cpu_env); \
380
+ tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
381
+ } \
382
+ \
383
+ data = FIELD_DP32(data, VDATA, VM, a->vm); \
384
+ data = FIELD_DP32(data, VDATA, LMUL, s->lmul); \
385
+ data = FIELD_DP32(data, VDATA, VTA, s->vta); \
386
+ data = FIELD_DP32(data, VDATA, VTA_ALL_1S, s->cfg_vta_all_1s); \
387
+ data = FIELD_DP32(data, VDATA, VMA, s->vma); \
388
+ rd_v = tcg_temp_new_ptr(); \
389
+ rs2_v = tcg_temp_new_ptr(); \
390
+ desc = tcg_constant_i32( \
391
+ simd_desc(s->cfg_ptr->vlen / 8, s->cfg_ptr->vlen / 8, data)); \
392
+ tcg_gen_addi_ptr(rd_v, cpu_env, vreg_ofs(s, a->rd)); \
393
+ tcg_gen_addi_ptr(rs2_v, cpu_env, vreg_ofs(s, a->rs2)); \
394
+ gen_helper_##NAME(rd_v, rs2_v, cpu_env, desc); \
395
+ mark_vs_dirty(s); \
396
+ gen_set_label(over); \
397
+ return true; \
398
+ } \
399
+ return false; \
400
+ }
401
+
402
+static bool vaes_check_vv(DisasContext *s, arg_rmr *a)
403
+{
404
+ int egw_bytes = ZVKNED_EGS << s->sew;
405
+ return s->cfg_ptr->ext_zvkned == true &&
406
+ require_rvv(s) &&
407
+ vext_check_isa_ill(s) &&
408
+ MAXSZ(s) >= egw_bytes &&
409
+ require_align(a->rd, s->lmul) &&
410
+ require_align(a->rs2, s->lmul) &&
411
+ s->sew == MO_32;
412
+}
413
+
414
+static bool vaes_check_overlap(DisasContext *s, int vd, int vs2)
415
+{
416
+ int8_t op_size = s->lmul <= 0 ? 1 : 1 << s->lmul;
417
+ return !is_overlapped(vd, op_size, vs2, 1);
418
+}
419
+
420
+static bool vaes_check_vs(DisasContext *s, arg_rmr *a)
421
+{
422
+ int egw_bytes = ZVKNED_EGS << s->sew;
423
+ return vaes_check_overlap(s, a->rd, a->rs2) &&
424
+ MAXSZ(s) >= egw_bytes &&
425
+ s->cfg_ptr->ext_zvkned == true &&
426
+ require_rvv(s) &&
427
+ vext_check_isa_ill(s) &&
428
+ require_align(a->rd, s->lmul) &&
429
+ s->sew == MO_32;
430
+}
431
+
432
+GEN_V_UNMASKED_TRANS(vaesef_vv, vaes_check_vv, ZVKNED_EGS)
433
+GEN_V_UNMASKED_TRANS(vaesef_vs, vaes_check_vs, ZVKNED_EGS)
434
+GEN_V_UNMASKED_TRANS(vaesdf_vv, vaes_check_vv, ZVKNED_EGS)
435
+GEN_V_UNMASKED_TRANS(vaesdf_vs, vaes_check_vs, ZVKNED_EGS)
436
+GEN_V_UNMASKED_TRANS(vaesdm_vv, vaes_check_vv, ZVKNED_EGS)
437
+GEN_V_UNMASKED_TRANS(vaesdm_vs, vaes_check_vs, ZVKNED_EGS)
438
+GEN_V_UNMASKED_TRANS(vaesz_vs, vaes_check_vs, ZVKNED_EGS)
439
+GEN_V_UNMASKED_TRANS(vaesem_vv, vaes_check_vv, ZVKNED_EGS)
440
+GEN_V_UNMASKED_TRANS(vaesem_vs, vaes_check_vs, ZVKNED_EGS)
441
+
442
+#define GEN_VI_UNMASKED_TRANS(NAME, CHECK, EGS) \
443
+ static bool trans_##NAME(DisasContext *s, arg_##NAME *a) \
444
+ { \
445
+ if (CHECK(s, a)) { \
446
+ TCGv_ptr rd_v, rs2_v; \
447
+ TCGv_i32 uimm_v, desc, egs; \
448
+ uint32_t data = 0; \
449
+ TCGLabel *over = gen_new_label(); \
450
+ \
451
+ if (!s->vstart_eq_zero || !s->vl_eq_vlmax) { \
452
+ /* save opcode for unwinding in case we throw an exception */ \
453
+ decode_save_opc(s); \
454
+ egs = tcg_constant_i32(EGS); \
455
+ gen_helper_egs_check(egs, cpu_env); \
456
+ tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
457
+ } \
458
+ \
459
+ data = FIELD_DP32(data, VDATA, VM, a->vm); \
460
+ data = FIELD_DP32(data, VDATA, LMUL, s->lmul); \
461
+ data = FIELD_DP32(data, VDATA, VTA, s->vta); \
462
+ data = FIELD_DP32(data, VDATA, VTA_ALL_1S, s->cfg_vta_all_1s); \
463
+ data = FIELD_DP32(data, VDATA, VMA, s->vma); \
464
+ \
465
+ rd_v = tcg_temp_new_ptr(); \
466
+ rs2_v = tcg_temp_new_ptr(); \
467
+ uimm_v = tcg_constant_i32(a->rs1); \
468
+ desc = tcg_constant_i32( \
469
+ simd_desc(s->cfg_ptr->vlen / 8, s->cfg_ptr->vlen / 8, data)); \
470
+ tcg_gen_addi_ptr(rd_v, cpu_env, vreg_ofs(s, a->rd)); \
471
+ tcg_gen_addi_ptr(rs2_v, cpu_env, vreg_ofs(s, a->rs2)); \
472
+ gen_helper_##NAME(rd_v, rs2_v, uimm_v, cpu_env, desc); \
473
+ mark_vs_dirty(s); \
474
+ gen_set_label(over); \
475
+ return true; \
476
+ } \
477
+ return false; \
478
+ }
479
+
480
+static bool vaeskf1_check(DisasContext *s, arg_vaeskf1_vi *a)
481
+{
482
+ int egw_bytes = ZVKNED_EGS << s->sew;
483
+ return s->cfg_ptr->ext_zvkned == true &&
484
+ require_rvv(s) &&
485
+ vext_check_isa_ill(s) &&
486
+ MAXSZ(s) >= egw_bytes &&
487
+ s->sew == MO_32 &&
488
+ require_align(a->rd, s->lmul) &&
489
+ require_align(a->rs2, s->lmul);
490
+}
491
+
492
+static bool vaeskf2_check(DisasContext *s, arg_vaeskf2_vi *a)
493
+{
494
+ int egw_bytes = ZVKNED_EGS << s->sew;
495
+ return s->cfg_ptr->ext_zvkned == true &&
496
+ require_rvv(s) &&
497
+ vext_check_isa_ill(s) &&
498
+ MAXSZ(s) >= egw_bytes &&
499
+ s->sew == MO_32 &&
500
+ require_align(a->rd, s->lmul) &&
501
+ require_align(a->rs2, s->lmul);
502
+}
503
+
504
+GEN_VI_UNMASKED_TRANS(vaeskf1_vi, vaeskf1_check, ZVKNED_EGS)
505
+GEN_VI_UNMASKED_TRANS(vaeskf2_vi, vaeskf2_check, ZVKNED_EGS)
506
--
507
2.41.0
diff view generated by jsdifflib
1
From: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
2
3
This commit adds support for the Zvknh vector-crypto extension, which
4
consists of the following instructions:
5
6
* vsha2ms.vv
7
* vsha2c[hl].vv
8
9
Translation functions are defined in
10
`target/riscv/insn_trans/trans_rvvk.c.inc` and helpers are defined in
11
`target/riscv/vcrypto_helper.c`.
12
13
Co-authored-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
14
Co-authored-by: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
15
[max.chou@sifive.com: Replaced vstart checking by TCG op]
16
Signed-off-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
17
Signed-off-by: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
18
Signed-off-by: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
19
Signed-off-by: Max Chou <max.chou@sifive.com>
20
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
21
[max.chou@sifive.com: Exposed x-zvknha & x-zvknhb properties]
22
[max.chou@sifive.com: Replaced SEW selection to happened during
23
translation]
24
Message-ID: <20230711165917.2629866-11-max.chou@sifive.com>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
25
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: 4c744dce9b0b057cbb5cc0f4d4ac75cda682a8af.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <4c744dce9b0b057cbb5cc0f4d4ac75cda682a8af.1597259519.git.alistair.francis@wdc.com>
4
---
26
---
5
target/riscv/cpu_bits.h | 6 +++
27
target/riscv/cpu_cfg.h | 2 +
6
target/riscv/helper.h | 1 +
28
target/riscv/helper.h | 6 +
7
target/riscv/csr.c | 64 ++++++++++++++++++++++++-
29
target/riscv/insn32.decode | 5 +
8
target/riscv/op_helper.c | 42 ++++++++++++++--
30
target/riscv/cpu.c | 13 +-
9
target/riscv/insn_trans/trans_rvh.c.inc | 2 +-
31
target/riscv/vcrypto_helper.c | 238 +++++++++++++++++++++++
10
5 files changed, 109 insertions(+), 6 deletions(-)
32
target/riscv/insn_trans/trans_rvvk.c.inc | 129 ++++++++++++
33
6 files changed, 390 insertions(+), 3 deletions(-)
11
34
12
diff --git a/target/riscv/cpu_bits.h b/target/riscv/cpu_bits.h
35
diff --git a/target/riscv/cpu_cfg.h b/target/riscv/cpu_cfg.h
13
index XXXXXXX..XXXXXXX 100644
36
index XXXXXXX..XXXXXXX 100644
14
--- a/target/riscv/cpu_bits.h
37
--- a/target/riscv/cpu_cfg.h
15
+++ b/target/riscv/cpu_bits.h
38
+++ b/target/riscv/cpu_cfg.h
16
@@ -XXX,XX +XXX,XX @@
39
@@ -XXX,XX +XXX,XX @@ struct RISCVCPUConfig {
17
#define HSTATUS_WPRI HSTATUS64_WPRI
40
bool ext_zvbb;
18
#endif
41
bool ext_zvbc;
19
42
bool ext_zvkned;
20
+#define HCOUNTEREN_CY (1 << 0)
43
+ bool ext_zvknha;
21
+#define HCOUNTEREN_TM (1 << 1)
44
+ bool ext_zvknhb;
22
+#define HCOUNTEREN_IR (1 << 2)
45
bool ext_zmmul;
23
+#define HCOUNTEREN_HPM3 (1 << 3)
46
bool ext_zvfbfmin;
24
+
47
bool ext_zvfbfwma;
25
/* Privilege modes */
26
#define PRV_U 0
27
#define PRV_S 1
28
@@ -XXX,XX +XXX,XX @@
29
#define RISCV_EXCP_STORE_PAGE_FAULT 0xf /* since: priv-1.10.0 */
30
#define RISCV_EXCP_INST_GUEST_PAGE_FAULT 0x14
31
#define RISCV_EXCP_LOAD_GUEST_ACCESS_FAULT 0x15
32
+#define RISCV_EXCP_VIRT_INSTRUCTION_FAULT 0x16
33
#define RISCV_EXCP_STORE_GUEST_AMO_ACCESS_FAULT 0x17
34
35
#define RISCV_EXCP_INT_FLAG 0x80000000
36
diff --git a/target/riscv/helper.h b/target/riscv/helper.h
48
diff --git a/target/riscv/helper.h b/target/riscv/helper.h
37
index XXXXXXX..XXXXXXX 100644
49
index XXXXXXX..XXXXXXX 100644
38
--- a/target/riscv/helper.h
50
--- a/target/riscv/helper.h
39
+++ b/target/riscv/helper.h
51
+++ b/target/riscv/helper.h
40
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_1(tlb_flush, void, env)
52
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_4(vaesdm_vs, void, ptr, ptr, env, i32)
41
/* Hypervisor functions */
53
DEF_HELPER_4(vaesz_vs, void, ptr, ptr, env, i32)
42
#ifndef CONFIG_USER_ONLY
54
DEF_HELPER_5(vaeskf1_vi, void, ptr, ptr, i32, env, i32)
43
DEF_HELPER_1(hyp_tlb_flush, void, env)
55
DEF_HELPER_5(vaeskf2_vi, void, ptr, ptr, i32, env, i32)
44
+DEF_HELPER_1(hyp_gvma_tlb_flush, void, env)
56
+
45
DEF_HELPER_4(hyp_load, tl, env, tl, tl, tl)
57
+DEF_HELPER_5(vsha2ms_vv, void, ptr, ptr, ptr, env, i32)
46
DEF_HELPER_5(hyp_store, void, env, tl, tl, tl, tl)
58
+DEF_HELPER_5(vsha2ch32_vv, void, ptr, ptr, ptr, env, i32)
47
DEF_HELPER_4(hyp_x_load, tl, env, tl, tl, tl)
59
+DEF_HELPER_5(vsha2ch64_vv, void, ptr, ptr, ptr, env, i32)
48
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
60
+DEF_HELPER_5(vsha2cl32_vv, void, ptr, ptr, ptr, env, i32)
61
+DEF_HELPER_5(vsha2cl64_vv, void, ptr, ptr, ptr, env, i32)
62
diff --git a/target/riscv/insn32.decode b/target/riscv/insn32.decode
49
index XXXXXXX..XXXXXXX 100644
63
index XXXXXXX..XXXXXXX 100644
50
--- a/target/riscv/csr.c
64
--- a/target/riscv/insn32.decode
51
+++ b/target/riscv/csr.c
65
+++ b/target/riscv/insn32.decode
52
@@ -XXX,XX +XXX,XX @@ static int ctr(CPURISCVState *env, int csrno)
66
@@ -XXX,XX +XXX,XX @@ vaesdm_vs 101001 1 ..... 00000 010 ..... 1110111 @r2_vm_1
53
/* The Counters extensions is not enabled */
67
vaesz_vs 101001 1 ..... 00111 010 ..... 1110111 @r2_vm_1
54
return -RISCV_EXCP_ILLEGAL_INST;
68
vaeskf1_vi 100010 1 ..... ..... 010 ..... 1110111 @r_vm_1
55
}
69
vaeskf2_vi 101010 1 ..... ..... 010 ..... 1110111 @r_vm_1
56
+
70
+
57
+ if (riscv_cpu_virt_enabled(env)) {
71
+# *** Zvknh vector crypto extension ***
58
+ switch (csrno) {
72
+vsha2ms_vv 101101 1 ..... ..... 010 ..... 1110111 @r_vm_1
59
+ case CSR_CYCLE:
73
+vsha2ch_vv 101110 1 ..... ..... 010 ..... 1110111 @r_vm_1
60
+ if (!get_field(env->hcounteren, HCOUNTEREN_CY) &&
74
+vsha2cl_vv 101111 1 ..... ..... 010 ..... 1110111 @r_vm_1
61
+ get_field(env->mcounteren, HCOUNTEREN_CY)) {
75
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
62
+ return -RISCV_EXCP_VIRT_INSTRUCTION_FAULT;
63
+ }
64
+ break;
65
+ case CSR_TIME:
66
+ if (!get_field(env->hcounteren, HCOUNTEREN_TM) &&
67
+ get_field(env->mcounteren, HCOUNTEREN_TM)) {
68
+ return -RISCV_EXCP_VIRT_INSTRUCTION_FAULT;
69
+ }
70
+ break;
71
+ case CSR_INSTRET:
72
+ if (!get_field(env->hcounteren, HCOUNTEREN_IR) &&
73
+ get_field(env->mcounteren, HCOUNTEREN_IR)) {
74
+ return -RISCV_EXCP_VIRT_INSTRUCTION_FAULT;
75
+ }
76
+ break;
77
+ case CSR_HPMCOUNTER3...CSR_HPMCOUNTER31:
78
+ if (!get_field(env->hcounteren, 1 << (csrno - CSR_HPMCOUNTER3)) &&
79
+ get_field(env->mcounteren, 1 << (csrno - CSR_HPMCOUNTER3))) {
80
+ return -RISCV_EXCP_VIRT_INSTRUCTION_FAULT;
81
+ }
82
+ break;
83
+#if defined(TARGET_RISCV32)
84
+ case CSR_CYCLEH:
85
+ if (!get_field(env->hcounteren, HCOUNTEREN_CY) &&
86
+ get_field(env->mcounteren, HCOUNTEREN_CY)) {
87
+ return -RISCV_EXCP_VIRT_INSTRUCTION_FAULT;
88
+ }
89
+ break;
90
+ case CSR_TIMEH:
91
+ if (!get_field(env->hcounteren, HCOUNTEREN_TM) &&
92
+ get_field(env->mcounteren, HCOUNTEREN_TM)) {
93
+ return -RISCV_EXCP_VIRT_INSTRUCTION_FAULT;
94
+ }
95
+ break;
96
+ case CSR_INSTRETH:
97
+ if (!get_field(env->hcounteren, HCOUNTEREN_IR) &&
98
+ get_field(env->mcounteren, HCOUNTEREN_IR)) {
99
+ return -RISCV_EXCP_VIRT_INSTRUCTION_FAULT;
100
+ }
101
+ break;
102
+ case CSR_HPMCOUNTER3H...CSR_HPMCOUNTER31H:
103
+ if (!get_field(env->hcounteren, 1 << (csrno - CSR_HPMCOUNTER3H)) &&
104
+ get_field(env->mcounteren, 1 << (csrno - CSR_HPMCOUNTER3H))) {
105
+ return -RISCV_EXCP_VIRT_INSTRUCTION_FAULT;
106
+ }
107
+ break;
108
+#endif
109
+ }
110
+ }
111
#endif
112
return 0;
113
}
114
@@ -XXX,XX +XXX,XX @@ static int hmode(CPURISCVState *env, int csrno)
115
if ((env->priv == PRV_S && !riscv_cpu_virt_enabled(env)) ||
116
env->priv == PRV_M) {
117
return 0;
118
+ } else {
119
+ return -RISCV_EXCP_VIRT_INSTRUCTION_FAULT;
120
}
121
}
122
123
@@ -XXX,XX +XXX,XX @@ static const target_ulong delegable_excps =
124
(1ULL << (RISCV_EXCP_STORE_PAGE_FAULT)) |
125
(1ULL << (RISCV_EXCP_INST_GUEST_PAGE_FAULT)) |
126
(1ULL << (RISCV_EXCP_LOAD_GUEST_ACCESS_FAULT)) |
127
+ (1ULL << (RISCV_EXCP_VIRT_INSTRUCTION_FAULT)) |
128
(1ULL << (RISCV_EXCP_STORE_GUEST_AMO_ACCESS_FAULT));
129
static const target_ulong sstatus_v1_10_mask = SSTATUS_SIE | SSTATUS_SPIE |
130
SSTATUS_UIE | SSTATUS_UPIE | SSTATUS_SPP | SSTATUS_FS | SSTATUS_XS |
131
@@ -XXX,XX +XXX,XX @@ int riscv_csrrw(CPURISCVState *env, int csrno, target_ulong *ret_value,
132
}
133
134
/* check predicate */
135
- if (!csr_ops[csrno].predicate || csr_ops[csrno].predicate(env, csrno) < 0) {
136
+ if (!csr_ops[csrno].predicate) {
137
return -RISCV_EXCP_ILLEGAL_INST;
138
}
139
+ ret = csr_ops[csrno].predicate(env, csrno);
140
+ if (ret < 0) {
141
+ return ret;
142
+ }
143
144
/* execute combined read/write operation if it exists */
145
if (csr_ops[csrno].op) {
146
diff --git a/target/riscv/op_helper.c b/target/riscv/op_helper.c
147
index XXXXXXX..XXXXXXX 100644
76
index XXXXXXX..XXXXXXX 100644
148
--- a/target/riscv/op_helper.c
77
--- a/target/riscv/cpu.c
149
+++ b/target/riscv/op_helper.c
78
+++ b/target/riscv/cpu.c
150
@@ -XXX,XX +XXX,XX @@ target_ulong helper_sret(CPURISCVState *env, target_ulong cpu_pc_deb)
79
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
151
riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
80
ISA_EXT_DATA_ENTRY(zvfh, PRIV_VERSION_1_12_0, ext_zvfh),
152
}
81
ISA_EXT_DATA_ENTRY(zvfhmin, PRIV_VERSION_1_12_0, ext_zvfhmin),
153
82
ISA_EXT_DATA_ENTRY(zvkned, PRIV_VERSION_1_12_0, ext_zvkned),
154
+ if (riscv_has_ext(env, RVH) && riscv_cpu_virt_enabled(env) &&
83
+ ISA_EXT_DATA_ENTRY(zvknha, PRIV_VERSION_1_12_0, ext_zvknha),
155
+ get_field(env->hstatus, HSTATUS_VTSR)) {
84
+ ISA_EXT_DATA_ENTRY(zvknhb, PRIV_VERSION_1_12_0, ext_zvknhb),
156
+ riscv_raise_exception(env, RISCV_EXCP_VIRT_INSTRUCTION_FAULT, GETPC());
85
ISA_EXT_DATA_ENTRY(zhinx, PRIV_VERSION_1_12_0, ext_zhinx),
157
+ }
86
ISA_EXT_DATA_ENTRY(zhinxmin, PRIV_VERSION_1_12_0, ext_zhinxmin),
158
+
87
ISA_EXT_DATA_ENTRY(smaia, PRIV_VERSION_1_12_0, ext_smaia),
159
mstatus = env->mstatus;
88
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_validate_set_extensions(RISCVCPU *cpu, Error **errp)
160
89
* In principle Zve*x would also suffice here, were they supported
161
if (riscv_has_ext(env, RVH) && !riscv_cpu_virt_enabled(env)) {
90
* in qemu
162
@@ -XXX,XX +XXX,XX @@ void helper_wfi(CPURISCVState *env)
91
*/
163
if ((env->priv == PRV_S &&
92
- if ((cpu->cfg.ext_zvbb || cpu->cfg.ext_zvkned) && !cpu->cfg.ext_zve32f) {
164
get_field(env->mstatus, MSTATUS_TW)) ||
93
+ if ((cpu->cfg.ext_zvbb || cpu->cfg.ext_zvkned || cpu->cfg.ext_zvknha) &&
165
riscv_cpu_virt_enabled(env)) {
94
+ !cpu->cfg.ext_zve32f) {
166
- riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
95
error_setg(errp,
167
+ riscv_raise_exception(env, RISCV_EXCP_VIRT_INSTRUCTION_FAULT, GETPC());
96
"Vector crypto extensions require V or Zve* extensions");
168
} else {
169
cs->halted = 1;
170
cs->exception_index = EXCP_HLT;
171
@@ -XXX,XX +XXX,XX @@ void helper_tlb_flush(CPURISCVState *env)
172
(env->priv == PRV_S &&
173
get_field(env->mstatus, MSTATUS_TVM))) {
174
riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
175
+ } else if (riscv_has_ext(env, RVH) && riscv_cpu_virt_enabled(env) &&
176
+ get_field(env->hstatus, HSTATUS_VTVM)) {
177
+ riscv_raise_exception(env, RISCV_EXCP_VIRT_INSTRUCTION_FAULT, GETPC());
178
} else {
179
tlb_flush(cs);
180
}
181
@@ -XXX,XX +XXX,XX @@ void helper_hyp_tlb_flush(CPURISCVState *env)
182
{
183
CPUState *cs = env_cpu(env);
184
185
+ if (env->priv == PRV_S && riscv_cpu_virt_enabled(env)) {
186
+ riscv_raise_exception(env, RISCV_EXCP_VIRT_INSTRUCTION_FAULT, GETPC());
187
+ }
188
+
189
if (env->priv == PRV_M ||
190
(env->priv == PRV_S && !riscv_cpu_virt_enabled(env))) {
191
tlb_flush(cs);
192
@@ -XXX,XX +XXX,XX @@ void helper_hyp_tlb_flush(CPURISCVState *env)
193
riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
194
}
195
196
+void helper_hyp_gvma_tlb_flush(CPURISCVState *env)
197
+{
198
+ if (env->priv == PRV_S && !riscv_cpu_virt_enabled(env) &&
199
+ get_field(env->mstatus, MSTATUS_TVM)) {
200
+ riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
201
+ }
202
+
203
+ helper_hyp_tlb_flush(env);
204
+}
205
+
206
target_ulong helper_hyp_load(CPURISCVState *env, target_ulong address,
207
target_ulong attrs, target_ulong memop)
208
{
209
@@ -XXX,XX +XXX,XX @@ target_ulong helper_hyp_load(CPURISCVState *env, target_ulong address,
210
return pte;
211
}
212
213
- riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
214
+ if (riscv_cpu_virt_enabled(env)) {
215
+ riscv_raise_exception(env, RISCV_EXCP_VIRT_INSTRUCTION_FAULT, GETPC());
216
+ } else {
217
+ riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
218
+ }
219
return 0;
220
}
221
222
@@ -XXX,XX +XXX,XX @@ void helper_hyp_store(CPURISCVState *env, target_ulong address,
223
return;
97
return;
224
}
98
}
225
99
226
- riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
100
- if (cpu->cfg.ext_zvbc && !cpu->cfg.ext_zve64f) {
227
+ if (riscv_cpu_virt_enabled(env)) {
101
- error_setg(errp, "Zvbc extension requires V or Zve64{f,d} extensions");
228
+ riscv_raise_exception(env, RISCV_EXCP_VIRT_INSTRUCTION_FAULT, GETPC());
102
+ if ((cpu->cfg.ext_zvbc || cpu->cfg.ext_zvknhb) && !cpu->cfg.ext_zve64f) {
229
+ } else {
103
+ error_setg(
230
+ riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
104
+ errp,
231
+ }
105
+ "Zvbc and Zvknhb extensions require V or Zve64{f,d} extensions");
106
return;
107
}
108
109
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
110
DEFINE_PROP_BOOL("x-zvbb", RISCVCPU, cfg.ext_zvbb, false),
111
DEFINE_PROP_BOOL("x-zvbc", RISCVCPU, cfg.ext_zvbc, false),
112
DEFINE_PROP_BOOL("x-zvkned", RISCVCPU, cfg.ext_zvkned, false),
113
+ DEFINE_PROP_BOOL("x-zvknha", RISCVCPU, cfg.ext_zvknha, false),
114
+ DEFINE_PROP_BOOL("x-zvknhb", RISCVCPU, cfg.ext_zvknhb, false),
115
116
DEFINE_PROP_END_OF_LIST(),
117
};
118
diff --git a/target/riscv/vcrypto_helper.c b/target/riscv/vcrypto_helper.c
119
index XXXXXXX..XXXXXXX 100644
120
--- a/target/riscv/vcrypto_helper.c
121
+++ b/target/riscv/vcrypto_helper.c
122
@@ -XXX,XX +XXX,XX @@ void HELPER(vaeskf2_vi)(void *vd_vptr, void *vs2_vptr, uint32_t uimm,
123
/* set tail elements to 1s */
124
vext_set_elems_1s(vd, vta, vl * 4, total_elems * 4);
232
}
125
}
233
126
+
234
target_ulong helper_hyp_x_load(CPURISCVState *env, target_ulong address,
127
+static inline uint32_t sig0_sha256(uint32_t x)
235
@@ -XXX,XX +XXX,XX @@ target_ulong helper_hyp_x_load(CPURISCVState *env, target_ulong address,
128
+{
236
return pte;
129
+ return ror32(x, 7) ^ ror32(x, 18) ^ (x >> 3);
237
}
130
+}
238
131
+
239
- riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
132
+static inline uint32_t sig1_sha256(uint32_t x)
240
+ if (riscv_cpu_virt_enabled(env)) {
133
+{
241
+ riscv_raise_exception(env, RISCV_EXCP_VIRT_INSTRUCTION_FAULT, GETPC());
134
+ return ror32(x, 17) ^ ror32(x, 19) ^ (x >> 10);
242
+ } else {
135
+}
243
+ riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
136
+
244
+ }
137
+static inline uint64_t sig0_sha512(uint64_t x)
245
return 0;
138
+{
246
}
139
+ return ror64(x, 1) ^ ror64(x, 8) ^ (x >> 7);
247
140
+}
248
diff --git a/target/riscv/insn_trans/trans_rvh.c.inc b/target/riscv/insn_trans/trans_rvh.c.inc
141
+
142
+static inline uint64_t sig1_sha512(uint64_t x)
143
+{
144
+ return ror64(x, 19) ^ ror64(x, 61) ^ (x >> 6);
145
+}
146
+
147
+static inline void vsha2ms_e32(uint32_t *vd, uint32_t *vs1, uint32_t *vs2)
148
+{
149
+ uint32_t res[4];
150
+ res[0] = sig1_sha256(vs1[H4(2)]) + vs2[H4(1)] + sig0_sha256(vd[H4(1)]) +
151
+ vd[H4(0)];
152
+ res[1] = sig1_sha256(vs1[H4(3)]) + vs2[H4(2)] + sig0_sha256(vd[H4(2)]) +
153
+ vd[H4(1)];
154
+ res[2] =
155
+ sig1_sha256(res[0]) + vs2[H4(3)] + sig0_sha256(vd[H4(3)]) + vd[H4(2)];
156
+ res[3] =
157
+ sig1_sha256(res[1]) + vs1[H4(0)] + sig0_sha256(vs2[H4(0)]) + vd[H4(3)];
158
+ vd[H4(3)] = res[3];
159
+ vd[H4(2)] = res[2];
160
+ vd[H4(1)] = res[1];
161
+ vd[H4(0)] = res[0];
162
+}
163
+
164
+static inline void vsha2ms_e64(uint64_t *vd, uint64_t *vs1, uint64_t *vs2)
165
+{
166
+ uint64_t res[4];
167
+ res[0] = sig1_sha512(vs1[2]) + vs2[1] + sig0_sha512(vd[1]) + vd[0];
168
+ res[1] = sig1_sha512(vs1[3]) + vs2[2] + sig0_sha512(vd[2]) + vd[1];
169
+ res[2] = sig1_sha512(res[0]) + vs2[3] + sig0_sha512(vd[3]) + vd[2];
170
+ res[3] = sig1_sha512(res[1]) + vs1[0] + sig0_sha512(vs2[0]) + vd[3];
171
+ vd[3] = res[3];
172
+ vd[2] = res[2];
173
+ vd[1] = res[1];
174
+ vd[0] = res[0];
175
+}
176
+
177
+void HELPER(vsha2ms_vv)(void *vd, void *vs1, void *vs2, CPURISCVState *env,
178
+ uint32_t desc)
179
+{
180
+ uint32_t sew = FIELD_EX64(env->vtype, VTYPE, VSEW);
181
+ uint32_t esz = sew == MO_32 ? 4 : 8;
182
+ uint32_t total_elems;
183
+ uint32_t vta = vext_vta(desc);
184
+
185
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) {
186
+ if (sew == MO_32) {
187
+ vsha2ms_e32(((uint32_t *)vd) + i * 4, ((uint32_t *)vs1) + i * 4,
188
+ ((uint32_t *)vs2) + i * 4);
189
+ } else {
190
+ /* If not 32 then SEW should be 64 */
191
+ vsha2ms_e64(((uint64_t *)vd) + i * 4, ((uint64_t *)vs1) + i * 4,
192
+ ((uint64_t *)vs2) + i * 4);
193
+ }
194
+ }
195
+ /* set tail elements to 1s */
196
+ total_elems = vext_get_total_elems(env, desc, esz);
197
+ vext_set_elems_1s(vd, vta, env->vl * esz, total_elems * esz);
198
+ env->vstart = 0;
199
+}
200
+
201
+static inline uint64_t sum0_64(uint64_t x)
202
+{
203
+ return ror64(x, 28) ^ ror64(x, 34) ^ ror64(x, 39);
204
+}
205
+
206
+static inline uint32_t sum0_32(uint32_t x)
207
+{
208
+ return ror32(x, 2) ^ ror32(x, 13) ^ ror32(x, 22);
209
+}
210
+
211
+static inline uint64_t sum1_64(uint64_t x)
212
+{
213
+ return ror64(x, 14) ^ ror64(x, 18) ^ ror64(x, 41);
214
+}
215
+
216
+static inline uint32_t sum1_32(uint32_t x)
217
+{
218
+ return ror32(x, 6) ^ ror32(x, 11) ^ ror32(x, 25);
219
+}
220
+
221
+#define ch(x, y, z) ((x & y) ^ ((~x) & z))
222
+
223
+#define maj(x, y, z) ((x & y) ^ (x & z) ^ (y & z))
224
+
225
+static void vsha2c_64(uint64_t *vs2, uint64_t *vd, uint64_t *vs1)
226
+{
227
+ uint64_t a = vs2[3], b = vs2[2], e = vs2[1], f = vs2[0];
228
+ uint64_t c = vd[3], d = vd[2], g = vd[1], h = vd[0];
229
+ uint64_t W0 = vs1[0], W1 = vs1[1];
230
+ uint64_t T1 = h + sum1_64(e) + ch(e, f, g) + W0;
231
+ uint64_t T2 = sum0_64(a) + maj(a, b, c);
232
+
233
+ h = g;
234
+ g = f;
235
+ f = e;
236
+ e = d + T1;
237
+ d = c;
238
+ c = b;
239
+ b = a;
240
+ a = T1 + T2;
241
+
242
+ T1 = h + sum1_64(e) + ch(e, f, g) + W1;
243
+ T2 = sum0_64(a) + maj(a, b, c);
244
+ h = g;
245
+ g = f;
246
+ f = e;
247
+ e = d + T1;
248
+ d = c;
249
+ c = b;
250
+ b = a;
251
+ a = T1 + T2;
252
+
253
+ vd[0] = f;
254
+ vd[1] = e;
255
+ vd[2] = b;
256
+ vd[3] = a;
257
+}
258
+
259
+static void vsha2c_32(uint32_t *vs2, uint32_t *vd, uint32_t *vs1)
260
+{
261
+ uint32_t a = vs2[H4(3)], b = vs2[H4(2)], e = vs2[H4(1)], f = vs2[H4(0)];
262
+ uint32_t c = vd[H4(3)], d = vd[H4(2)], g = vd[H4(1)], h = vd[H4(0)];
263
+ uint32_t W0 = vs1[H4(0)], W1 = vs1[H4(1)];
264
+ uint32_t T1 = h + sum1_32(e) + ch(e, f, g) + W0;
265
+ uint32_t T2 = sum0_32(a) + maj(a, b, c);
266
+
267
+ h = g;
268
+ g = f;
269
+ f = e;
270
+ e = d + T1;
271
+ d = c;
272
+ c = b;
273
+ b = a;
274
+ a = T1 + T2;
275
+
276
+ T1 = h + sum1_32(e) + ch(e, f, g) + W1;
277
+ T2 = sum0_32(a) + maj(a, b, c);
278
+ h = g;
279
+ g = f;
280
+ f = e;
281
+ e = d + T1;
282
+ d = c;
283
+ c = b;
284
+ b = a;
285
+ a = T1 + T2;
286
+
287
+ vd[H4(0)] = f;
288
+ vd[H4(1)] = e;
289
+ vd[H4(2)] = b;
290
+ vd[H4(3)] = a;
291
+}
292
+
293
+void HELPER(vsha2ch32_vv)(void *vd, void *vs1, void *vs2, CPURISCVState *env,
294
+ uint32_t desc)
295
+{
296
+ const uint32_t esz = 4;
297
+ uint32_t total_elems;
298
+ uint32_t vta = vext_vta(desc);
299
+
300
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) {
301
+ vsha2c_32(((uint32_t *)vs2) + 4 * i, ((uint32_t *)vd) + 4 * i,
302
+ ((uint32_t *)vs1) + 4 * i + 2);
303
+ }
304
+
305
+ /* set tail elements to 1s */
306
+ total_elems = vext_get_total_elems(env, desc, esz);
307
+ vext_set_elems_1s(vd, vta, env->vl * esz, total_elems * esz);
308
+ env->vstart = 0;
309
+}
310
+
311
+void HELPER(vsha2ch64_vv)(void *vd, void *vs1, void *vs2, CPURISCVState *env,
312
+ uint32_t desc)
313
+{
314
+ const uint32_t esz = 8;
315
+ uint32_t total_elems;
316
+ uint32_t vta = vext_vta(desc);
317
+
318
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) {
319
+ vsha2c_64(((uint64_t *)vs2) + 4 * i, ((uint64_t *)vd) + 4 * i,
320
+ ((uint64_t *)vs1) + 4 * i + 2);
321
+ }
322
+
323
+ /* set tail elements to 1s */
324
+ total_elems = vext_get_total_elems(env, desc, esz);
325
+ vext_set_elems_1s(vd, vta, env->vl * esz, total_elems * esz);
326
+ env->vstart = 0;
327
+}
328
+
329
+void HELPER(vsha2cl32_vv)(void *vd, void *vs1, void *vs2, CPURISCVState *env,
330
+ uint32_t desc)
331
+{
332
+ const uint32_t esz = 4;
333
+ uint32_t total_elems;
334
+ uint32_t vta = vext_vta(desc);
335
+
336
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) {
337
+ vsha2c_32(((uint32_t *)vs2) + 4 * i, ((uint32_t *)vd) + 4 * i,
338
+ (((uint32_t *)vs1) + 4 * i));
339
+ }
340
+
341
+ /* set tail elements to 1s */
342
+ total_elems = vext_get_total_elems(env, desc, esz);
343
+ vext_set_elems_1s(vd, vta, env->vl * esz, total_elems * esz);
344
+ env->vstart = 0;
345
+}
346
+
347
+void HELPER(vsha2cl64_vv)(void *vd, void *vs1, void *vs2, CPURISCVState *env,
348
+ uint32_t desc)
349
+{
350
+ uint32_t esz = 8;
351
+ uint32_t total_elems;
352
+ uint32_t vta = vext_vta(desc);
353
+
354
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) {
355
+ vsha2c_64(((uint64_t *)vs2) + 4 * i, ((uint64_t *)vd) + 4 * i,
356
+ (((uint64_t *)vs1) + 4 * i));
357
+ }
358
+
359
+ /* set tail elements to 1s */
360
+ total_elems = vext_get_total_elems(env, desc, esz);
361
+ vext_set_elems_1s(vd, vta, env->vl * esz, total_elems * esz);
362
+ env->vstart = 0;
363
+}
364
diff --git a/target/riscv/insn_trans/trans_rvvk.c.inc b/target/riscv/insn_trans/trans_rvvk.c.inc
249
index XXXXXXX..XXXXXXX 100644
365
index XXXXXXX..XXXXXXX 100644
250
--- a/target/riscv/insn_trans/trans_rvh.c.inc
366
--- a/target/riscv/insn_trans/trans_rvvk.c.inc
251
+++ b/target/riscv/insn_trans/trans_rvh.c.inc
367
+++ b/target/riscv/insn_trans/trans_rvvk.c.inc
252
@@ -XXX,XX +XXX,XX @@ static bool trans_hfence_gvma(DisasContext *ctx, arg_sfence_vma *a)
368
@@ -XXX,XX +XXX,XX @@ static bool vaeskf2_check(DisasContext *s, arg_vaeskf2_vi *a)
253
{
369
254
REQUIRE_EXT(ctx, RVH);
370
GEN_VI_UNMASKED_TRANS(vaeskf1_vi, vaeskf1_check, ZVKNED_EGS)
255
#ifndef CONFIG_USER_ONLY
371
GEN_VI_UNMASKED_TRANS(vaeskf2_vi, vaeskf2_check, ZVKNED_EGS)
256
- gen_helper_hyp_tlb_flush(cpu_env);
372
+
257
+ gen_helper_hyp_gvma_tlb_flush(cpu_env);
373
+/*
258
return true;
374
+ * Zvknh
259
#endif
375
+ */
260
return false;
376
+
377
+#define ZVKNH_EGS 4
378
+
379
+#define GEN_VV_UNMASKED_TRANS(NAME, CHECK, EGS) \
380
+ static bool trans_##NAME(DisasContext *s, arg_rmrr *a) \
381
+ { \
382
+ if (CHECK(s, a)) { \
383
+ uint32_t data = 0; \
384
+ TCGLabel *over = gen_new_label(); \
385
+ TCGv_i32 egs; \
386
+ \
387
+ if (!s->vstart_eq_zero || !s->vl_eq_vlmax) { \
388
+ /* save opcode for unwinding in case we throw an exception */ \
389
+ decode_save_opc(s); \
390
+ egs = tcg_constant_i32(EGS); \
391
+ gen_helper_egs_check(egs, cpu_env); \
392
+ tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); \
393
+ } \
394
+ \
395
+ data = FIELD_DP32(data, VDATA, VM, a->vm); \
396
+ data = FIELD_DP32(data, VDATA, LMUL, s->lmul); \
397
+ data = FIELD_DP32(data, VDATA, VTA, s->vta); \
398
+ data = FIELD_DP32(data, VDATA, VTA_ALL_1S, s->cfg_vta_all_1s); \
399
+ data = FIELD_DP32(data, VDATA, VMA, s->vma); \
400
+ \
401
+ tcg_gen_gvec_3_ptr(vreg_ofs(s, a->rd), vreg_ofs(s, a->rs1), \
402
+ vreg_ofs(s, a->rs2), cpu_env, \
403
+ s->cfg_ptr->vlen / 8, s->cfg_ptr->vlen / 8, \
404
+ data, gen_helper_##NAME); \
405
+ \
406
+ mark_vs_dirty(s); \
407
+ gen_set_label(over); \
408
+ return true; \
409
+ } \
410
+ return false; \
411
+ }
412
+
413
+static bool vsha_check_sew(DisasContext *s)
414
+{
415
+ return (s->cfg_ptr->ext_zvknha == true && s->sew == MO_32) ||
416
+ (s->cfg_ptr->ext_zvknhb == true &&
417
+ (s->sew == MO_32 || s->sew == MO_64));
418
+}
419
+
420
+static bool vsha_check(DisasContext *s, arg_rmrr *a)
421
+{
422
+ int egw_bytes = ZVKNH_EGS << s->sew;
423
+ int mult = 1 << MAX(s->lmul, 0);
424
+ return opivv_check(s, a) &&
425
+ vsha_check_sew(s) &&
426
+ MAXSZ(s) >= egw_bytes &&
427
+ !is_overlapped(a->rd, mult, a->rs1, mult) &&
428
+ !is_overlapped(a->rd, mult, a->rs2, mult) &&
429
+ s->lmul >= 0;
430
+}
431
+
432
+GEN_VV_UNMASKED_TRANS(vsha2ms_vv, vsha_check, ZVKNH_EGS)
433
+
434
+static bool trans_vsha2cl_vv(DisasContext *s, arg_rmrr *a)
435
+{
436
+ if (vsha_check(s, a)) {
437
+ uint32_t data = 0;
438
+ TCGLabel *over = gen_new_label();
439
+ TCGv_i32 egs;
440
+
441
+ if (!s->vstart_eq_zero || !s->vl_eq_vlmax) {
442
+ /* save opcode for unwinding in case we throw an exception */
443
+ decode_save_opc(s);
444
+ egs = tcg_constant_i32(ZVKNH_EGS);
445
+ gen_helper_egs_check(egs, cpu_env);
446
+ tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
447
+ }
448
+
449
+ data = FIELD_DP32(data, VDATA, VM, a->vm);
450
+ data = FIELD_DP32(data, VDATA, LMUL, s->lmul);
451
+ data = FIELD_DP32(data, VDATA, VTA, s->vta);
452
+ data = FIELD_DP32(data, VDATA, VTA_ALL_1S, s->cfg_vta_all_1s);
453
+ data = FIELD_DP32(data, VDATA, VMA, s->vma);
454
+
455
+ tcg_gen_gvec_3_ptr(vreg_ofs(s, a->rd), vreg_ofs(s, a->rs1),
456
+ vreg_ofs(s, a->rs2), cpu_env, s->cfg_ptr->vlen / 8,
457
+ s->cfg_ptr->vlen / 8, data,
458
+ s->sew == MO_32 ?
459
+ gen_helper_vsha2cl32_vv : gen_helper_vsha2cl64_vv);
460
+
461
+ mark_vs_dirty(s);
462
+ gen_set_label(over);
463
+ return true;
464
+ }
465
+ return false;
466
+}
467
+
468
+static bool trans_vsha2ch_vv(DisasContext *s, arg_rmrr *a)
469
+{
470
+ if (vsha_check(s, a)) {
471
+ uint32_t data = 0;
472
+ TCGLabel *over = gen_new_label();
473
+ TCGv_i32 egs;
474
+
475
+ if (!s->vstart_eq_zero || !s->vl_eq_vlmax) {
476
+ /* save opcode for unwinding in case we throw an exception */
477
+ decode_save_opc(s);
478
+ egs = tcg_constant_i32(ZVKNH_EGS);
479
+ gen_helper_egs_check(egs, cpu_env);
480
+ tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over);
481
+ }
482
+
483
+ data = FIELD_DP32(data, VDATA, VM, a->vm);
484
+ data = FIELD_DP32(data, VDATA, LMUL, s->lmul);
485
+ data = FIELD_DP32(data, VDATA, VTA, s->vta);
486
+ data = FIELD_DP32(data, VDATA, VTA_ALL_1S, s->cfg_vta_all_1s);
487
+ data = FIELD_DP32(data, VDATA, VMA, s->vma);
488
+
489
+ tcg_gen_gvec_3_ptr(vreg_ofs(s, a->rd), vreg_ofs(s, a->rs1),
490
+ vreg_ofs(s, a->rs2), cpu_env, s->cfg_ptr->vlen / 8,
491
+ s->cfg_ptr->vlen / 8, data,
492
+ s->sew == MO_32 ?
493
+ gen_helper_vsha2ch32_vv : gen_helper_vsha2ch64_vv);
494
+
495
+ mark_vs_dirty(s);
496
+ gen_set_label(over);
497
+ return true;
498
+ }
499
+ return false;
500
+}
261
--
501
--
262
2.28.0
502
2.41.0
263
264
diff view generated by jsdifflib
New patch
1
1
From: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
2
3
This commit adds support for the Zvksh vector-crypto extension, which
4
consists of the following instructions:
5
6
* vsm3me.vv
7
* vsm3c.vi
8
9
Translation functions are defined in
10
`target/riscv/insn_trans/trans_rvvk.c.inc` and helpers are defined in
11
`target/riscv/vcrypto_helper.c`.
12
13
Co-authored-by: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
14
[max.chou@sifive.com: Replaced vstart checking by TCG op]
15
Signed-off-by: Kiran Ostrolenk <kiran.ostrolenk@codethink.co.uk>
16
Signed-off-by: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
17
Signed-off-by: Max Chou <max.chou@sifive.com>
18
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
19
[max.chou@sifive.com: Exposed x-zvksh property]
20
Message-ID: <20230711165917.2629866-12-max.chou@sifive.com>
21
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
22
---
23
target/riscv/cpu_cfg.h | 1 +
24
target/riscv/helper.h | 3 +
25
target/riscv/insn32.decode | 4 +
26
target/riscv/cpu.c | 6 +-
27
target/riscv/vcrypto_helper.c | 134 +++++++++++++++++++++++
28
target/riscv/insn_trans/trans_rvvk.c.inc | 31 ++++++
29
6 files changed, 177 insertions(+), 2 deletions(-)
30
31
diff --git a/target/riscv/cpu_cfg.h b/target/riscv/cpu_cfg.h
32
index XXXXXXX..XXXXXXX 100644
33
--- a/target/riscv/cpu_cfg.h
34
+++ b/target/riscv/cpu_cfg.h
35
@@ -XXX,XX +XXX,XX @@ struct RISCVCPUConfig {
36
bool ext_zvkned;
37
bool ext_zvknha;
38
bool ext_zvknhb;
39
+ bool ext_zvksh;
40
bool ext_zmmul;
41
bool ext_zvfbfmin;
42
bool ext_zvfbfwma;
43
diff --git a/target/riscv/helper.h b/target/riscv/helper.h
44
index XXXXXXX..XXXXXXX 100644
45
--- a/target/riscv/helper.h
46
+++ b/target/riscv/helper.h
47
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_5(vsha2ch32_vv, void, ptr, ptr, ptr, env, i32)
48
DEF_HELPER_5(vsha2ch64_vv, void, ptr, ptr, ptr, env, i32)
49
DEF_HELPER_5(vsha2cl32_vv, void, ptr, ptr, ptr, env, i32)
50
DEF_HELPER_5(vsha2cl64_vv, void, ptr, ptr, ptr, env, i32)
51
+
52
+DEF_HELPER_5(vsm3me_vv, void, ptr, ptr, ptr, env, i32)
53
+DEF_HELPER_5(vsm3c_vi, void, ptr, ptr, i32, env, i32)
54
diff --git a/target/riscv/insn32.decode b/target/riscv/insn32.decode
55
index XXXXXXX..XXXXXXX 100644
56
--- a/target/riscv/insn32.decode
57
+++ b/target/riscv/insn32.decode
58
@@ -XXX,XX +XXX,XX @@ vaeskf2_vi 101010 1 ..... ..... 010 ..... 1110111 @r_vm_1
59
vsha2ms_vv 101101 1 ..... ..... 010 ..... 1110111 @r_vm_1
60
vsha2ch_vv 101110 1 ..... ..... 010 ..... 1110111 @r_vm_1
61
vsha2cl_vv 101111 1 ..... ..... 010 ..... 1110111 @r_vm_1
62
+
63
+# *** Zvksh vector crypto extension ***
64
+vsm3me_vv 100000 1 ..... ..... 010 ..... 1110111 @r_vm_1
65
+vsm3c_vi 101011 1 ..... ..... 010 ..... 1110111 @r_vm_1
66
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
67
index XXXXXXX..XXXXXXX 100644
68
--- a/target/riscv/cpu.c
69
+++ b/target/riscv/cpu.c
70
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
71
ISA_EXT_DATA_ENTRY(zvkned, PRIV_VERSION_1_12_0, ext_zvkned),
72
ISA_EXT_DATA_ENTRY(zvknha, PRIV_VERSION_1_12_0, ext_zvknha),
73
ISA_EXT_DATA_ENTRY(zvknhb, PRIV_VERSION_1_12_0, ext_zvknhb),
74
+ ISA_EXT_DATA_ENTRY(zvksh, PRIV_VERSION_1_12_0, ext_zvksh),
75
ISA_EXT_DATA_ENTRY(zhinx, PRIV_VERSION_1_12_0, ext_zhinx),
76
ISA_EXT_DATA_ENTRY(zhinxmin, PRIV_VERSION_1_12_0, ext_zhinxmin),
77
ISA_EXT_DATA_ENTRY(smaia, PRIV_VERSION_1_12_0, ext_smaia),
78
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_validate_set_extensions(RISCVCPU *cpu, Error **errp)
79
* In principle Zve*x would also suffice here, were they supported
80
* in qemu
81
*/
82
- if ((cpu->cfg.ext_zvbb || cpu->cfg.ext_zvkned || cpu->cfg.ext_zvknha) &&
83
- !cpu->cfg.ext_zve32f) {
84
+ if ((cpu->cfg.ext_zvbb || cpu->cfg.ext_zvkned || cpu->cfg.ext_zvknha ||
85
+ cpu->cfg.ext_zvksh) && !cpu->cfg.ext_zve32f) {
86
error_setg(errp,
87
"Vector crypto extensions require V or Zve* extensions");
88
return;
89
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
90
DEFINE_PROP_BOOL("x-zvkned", RISCVCPU, cfg.ext_zvkned, false),
91
DEFINE_PROP_BOOL("x-zvknha", RISCVCPU, cfg.ext_zvknha, false),
92
DEFINE_PROP_BOOL("x-zvknhb", RISCVCPU, cfg.ext_zvknhb, false),
93
+ DEFINE_PROP_BOOL("x-zvksh", RISCVCPU, cfg.ext_zvksh, false),
94
95
DEFINE_PROP_END_OF_LIST(),
96
};
97
diff --git a/target/riscv/vcrypto_helper.c b/target/riscv/vcrypto_helper.c
98
index XXXXXXX..XXXXXXX 100644
99
--- a/target/riscv/vcrypto_helper.c
100
+++ b/target/riscv/vcrypto_helper.c
101
@@ -XXX,XX +XXX,XX @@ void HELPER(vsha2cl64_vv)(void *vd, void *vs1, void *vs2, CPURISCVState *env,
102
vext_set_elems_1s(vd, vta, env->vl * esz, total_elems * esz);
103
env->vstart = 0;
104
}
105
+
106
+static inline uint32_t p1(uint32_t x)
107
+{
108
+ return x ^ rol32(x, 15) ^ rol32(x, 23);
109
+}
110
+
111
+static inline uint32_t zvksh_w(uint32_t m16, uint32_t m9, uint32_t m3,
112
+ uint32_t m13, uint32_t m6)
113
+{
114
+ return p1(m16 ^ m9 ^ rol32(m3, 15)) ^ rol32(m13, 7) ^ m6;
115
+}
116
+
117
+void HELPER(vsm3me_vv)(void *vd_vptr, void *vs1_vptr, void *vs2_vptr,
118
+ CPURISCVState *env, uint32_t desc)
119
+{
120
+ uint32_t esz = memop_size(FIELD_EX64(env->vtype, VTYPE, VSEW));
121
+ uint32_t total_elems = vext_get_total_elems(env, desc, esz);
122
+ uint32_t vta = vext_vta(desc);
123
+ uint32_t *vd = vd_vptr;
124
+ uint32_t *vs1 = vs1_vptr;
125
+ uint32_t *vs2 = vs2_vptr;
126
+
127
+ for (int i = env->vstart / 8; i < env->vl / 8; i++) {
128
+ uint32_t w[24];
129
+ for (int j = 0; j < 8; j++) {
130
+ w[j] = bswap32(vs1[H4((i * 8) + j)]);
131
+ w[j + 8] = bswap32(vs2[H4((i * 8) + j)]);
132
+ }
133
+ for (int j = 0; j < 8; j++) {
134
+ w[j + 16] =
135
+ zvksh_w(w[j], w[j + 7], w[j + 13], w[j + 3], w[j + 10]);
136
+ }
137
+ for (int j = 0; j < 8; j++) {
138
+ vd[(i * 8) + j] = bswap32(w[H4(j + 16)]);
139
+ }
140
+ }
141
+ vext_set_elems_1s(vd_vptr, vta, env->vl * esz, total_elems * esz);
142
+ env->vstart = 0;
143
+}
144
+
145
+static inline uint32_t ff1(uint32_t x, uint32_t y, uint32_t z)
146
+{
147
+ return x ^ y ^ z;
148
+}
149
+
150
+static inline uint32_t ff2(uint32_t x, uint32_t y, uint32_t z)
151
+{
152
+ return (x & y) | (x & z) | (y & z);
153
+}
154
+
155
+static inline uint32_t ff_j(uint32_t x, uint32_t y, uint32_t z, uint32_t j)
156
+{
157
+ return (j <= 15) ? ff1(x, y, z) : ff2(x, y, z);
158
+}
159
+
160
+static inline uint32_t gg1(uint32_t x, uint32_t y, uint32_t z)
161
+{
162
+ return x ^ y ^ z;
163
+}
164
+
165
+static inline uint32_t gg2(uint32_t x, uint32_t y, uint32_t z)
166
+{
167
+ return (x & y) | (~x & z);
168
+}
169
+
170
+static inline uint32_t gg_j(uint32_t x, uint32_t y, uint32_t z, uint32_t j)
171
+{
172
+ return (j <= 15) ? gg1(x, y, z) : gg2(x, y, z);
173
+}
174
+
175
+static inline uint32_t t_j(uint32_t j)
176
+{
177
+ return (j <= 15) ? 0x79cc4519 : 0x7a879d8a;
178
+}
179
+
180
+static inline uint32_t p_0(uint32_t x)
181
+{
182
+ return x ^ rol32(x, 9) ^ rol32(x, 17);
183
+}
184
+
185
+static void sm3c(uint32_t *vd, uint32_t *vs1, uint32_t *vs2, uint32_t uimm)
186
+{
187
+ uint32_t x0, x1;
188
+ uint32_t j;
189
+ uint32_t ss1, ss2, tt1, tt2;
190
+ x0 = vs2[0] ^ vs2[4];
191
+ x1 = vs2[1] ^ vs2[5];
192
+ j = 2 * uimm;
193
+ ss1 = rol32(rol32(vs1[0], 12) + vs1[4] + rol32(t_j(j), j % 32), 7);
194
+ ss2 = ss1 ^ rol32(vs1[0], 12);
195
+ tt1 = ff_j(vs1[0], vs1[1], vs1[2], j) + vs1[3] + ss2 + x0;
196
+ tt2 = gg_j(vs1[4], vs1[5], vs1[6], j) + vs1[7] + ss1 + vs2[0];
197
+ vs1[3] = vs1[2];
198
+ vd[3] = rol32(vs1[1], 9);
199
+ vs1[1] = vs1[0];
200
+ vd[1] = tt1;
201
+ vs1[7] = vs1[6];
202
+ vd[7] = rol32(vs1[5], 19);
203
+ vs1[5] = vs1[4];
204
+ vd[5] = p_0(tt2);
205
+ j = 2 * uimm + 1;
206
+ ss1 = rol32(rol32(vd[1], 12) + vd[5] + rol32(t_j(j), j % 32), 7);
207
+ ss2 = ss1 ^ rol32(vd[1], 12);
208
+ tt1 = ff_j(vd[1], vs1[1], vd[3], j) + vs1[3] + ss2 + x1;
209
+ tt2 = gg_j(vd[5], vs1[5], vd[7], j) + vs1[7] + ss1 + vs2[1];
210
+ vd[2] = rol32(vs1[1], 9);
211
+ vd[0] = tt1;
212
+ vd[6] = rol32(vs1[5], 19);
213
+ vd[4] = p_0(tt2);
214
+}
215
+
216
+void HELPER(vsm3c_vi)(void *vd_vptr, void *vs2_vptr, uint32_t uimm,
217
+ CPURISCVState *env, uint32_t desc)
218
+{
219
+ uint32_t esz = memop_size(FIELD_EX64(env->vtype, VTYPE, VSEW));
220
+ uint32_t total_elems = vext_get_total_elems(env, desc, esz);
221
+ uint32_t vta = vext_vta(desc);
222
+ uint32_t *vd = vd_vptr;
223
+ uint32_t *vs2 = vs2_vptr;
224
+ uint32_t v1[8], v2[8], v3[8];
225
+
226
+ for (int i = env->vstart / 8; i < env->vl / 8; i++) {
227
+ for (int k = 0; k < 8; k++) {
228
+ v2[k] = bswap32(vd[H4(i * 8 + k)]);
229
+ v3[k] = bswap32(vs2[H4(i * 8 + k)]);
230
+ }
231
+ sm3c(v1, v2, v3, uimm);
232
+ for (int k = 0; k < 8; k++) {
233
+ vd[i * 8 + k] = bswap32(v1[H4(k)]);
234
+ }
235
+ }
236
+ vext_set_elems_1s(vd_vptr, vta, env->vl * esz, total_elems * esz);
237
+ env->vstart = 0;
238
+}
239
diff --git a/target/riscv/insn_trans/trans_rvvk.c.inc b/target/riscv/insn_trans/trans_rvvk.c.inc
240
index XXXXXXX..XXXXXXX 100644
241
--- a/target/riscv/insn_trans/trans_rvvk.c.inc
242
+++ b/target/riscv/insn_trans/trans_rvvk.c.inc
243
@@ -XXX,XX +XXX,XX @@ static bool trans_vsha2ch_vv(DisasContext *s, arg_rmrr *a)
244
}
245
return false;
246
}
247
+
248
+/*
249
+ * Zvksh
250
+ */
251
+
252
+#define ZVKSH_EGS 8
253
+
254
+static inline bool vsm3_check(DisasContext *s, arg_rmrr *a)
255
+{
256
+ int egw_bytes = ZVKSH_EGS << s->sew;
257
+ int mult = 1 << MAX(s->lmul, 0);
258
+ return s->cfg_ptr->ext_zvksh == true &&
259
+ require_rvv(s) &&
260
+ vext_check_isa_ill(s) &&
261
+ !is_overlapped(a->rd, mult, a->rs2, mult) &&
262
+ MAXSZ(s) >= egw_bytes &&
263
+ s->sew == MO_32;
264
+}
265
+
266
+static inline bool vsm3me_check(DisasContext *s, arg_rmrr *a)
267
+{
268
+ return vsm3_check(s, a) && vext_check_sss(s, a->rd, a->rs1, a->rs2, a->vm);
269
+}
270
+
271
+static inline bool vsm3c_check(DisasContext *s, arg_rmrr *a)
272
+{
273
+ return vsm3_check(s, a) && vext_check_ss(s, a->rd, a->rs2, a->vm);
274
+}
275
+
276
+GEN_VV_UNMASKED_TRANS(vsm3me_vv, vsm3me_check, ZVKSH_EGS)
277
+GEN_VI_UNMASKED_TRANS(vsm3c_vi, vsm3c_check, ZVKSH_EGS)
278
--
279
2.41.0
diff view generated by jsdifflib
New patch
1
1
From: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
2
3
This commit adds support for the Zvkg vector-crypto extension, which
4
consists of the following instructions:
5
6
* vgmul.vv
7
* vghsh.vv
8
9
Translation functions are defined in
10
`target/riscv/insn_trans/trans_rvvk.c.inc` and helpers are defined in
11
`target/riscv/vcrypto_helper.c`.
12
13
Co-authored-by: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
14
[max.chou@sifive.com: Replaced vstart checking by TCG op]
15
Signed-off-by: Lawrence Hunter <lawrence.hunter@codethink.co.uk>
16
Signed-off-by: Nazar Kazakov <nazar.kazakov@codethink.co.uk>
17
Signed-off-by: Max Chou <max.chou@sifive.com>
18
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
19
[max.chou@sifive.com: Exposed x-zvkg property]
20
[max.chou@sifive.com: Replaced uint by int for cross win32 build]
21
Message-ID: <20230711165917.2629866-13-max.chou@sifive.com>
22
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
23
---
24
target/riscv/cpu_cfg.h | 1 +
25
target/riscv/helper.h | 3 +
26
target/riscv/insn32.decode | 4 ++
27
target/riscv/cpu.c | 6 +-
28
target/riscv/vcrypto_helper.c | 72 ++++++++++++++++++++++++
29
target/riscv/insn_trans/trans_rvvk.c.inc | 30 ++++++++++
30
6 files changed, 114 insertions(+), 2 deletions(-)
31
32
diff --git a/target/riscv/cpu_cfg.h b/target/riscv/cpu_cfg.h
33
index XXXXXXX..XXXXXXX 100644
34
--- a/target/riscv/cpu_cfg.h
35
+++ b/target/riscv/cpu_cfg.h
36
@@ -XXX,XX +XXX,XX @@ struct RISCVCPUConfig {
37
bool ext_zve64d;
38
bool ext_zvbb;
39
bool ext_zvbc;
40
+ bool ext_zvkg;
41
bool ext_zvkned;
42
bool ext_zvknha;
43
bool ext_zvknhb;
44
diff --git a/target/riscv/helper.h b/target/riscv/helper.h
45
index XXXXXXX..XXXXXXX 100644
46
--- a/target/riscv/helper.h
47
+++ b/target/riscv/helper.h
48
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_5(vsha2cl64_vv, void, ptr, ptr, ptr, env, i32)
49
50
DEF_HELPER_5(vsm3me_vv, void, ptr, ptr, ptr, env, i32)
51
DEF_HELPER_5(vsm3c_vi, void, ptr, ptr, i32, env, i32)
52
+
53
+DEF_HELPER_5(vghsh_vv, void, ptr, ptr, ptr, env, i32)
54
+DEF_HELPER_4(vgmul_vv, void, ptr, ptr, env, i32)
55
diff --git a/target/riscv/insn32.decode b/target/riscv/insn32.decode
56
index XXXXXXX..XXXXXXX 100644
57
--- a/target/riscv/insn32.decode
58
+++ b/target/riscv/insn32.decode
59
@@ -XXX,XX +XXX,XX @@ vsha2cl_vv 101111 1 ..... ..... 010 ..... 1110111 @r_vm_1
60
# *** Zvksh vector crypto extension ***
61
vsm3me_vv 100000 1 ..... ..... 010 ..... 1110111 @r_vm_1
62
vsm3c_vi 101011 1 ..... ..... 010 ..... 1110111 @r_vm_1
63
+
64
+# *** Zvkg vector crypto extension ***
65
+vghsh_vv 101100 1 ..... ..... 010 ..... 1110111 @r_vm_1
66
+vgmul_vv 101000 1 ..... 10001 010 ..... 1110111 @r2_vm_1
67
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
68
index XXXXXXX..XXXXXXX 100644
69
--- a/target/riscv/cpu.c
70
+++ b/target/riscv/cpu.c
71
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
72
ISA_EXT_DATA_ENTRY(zvfbfwma, PRIV_VERSION_1_12_0, ext_zvfbfwma),
73
ISA_EXT_DATA_ENTRY(zvfh, PRIV_VERSION_1_12_0, ext_zvfh),
74
ISA_EXT_DATA_ENTRY(zvfhmin, PRIV_VERSION_1_12_0, ext_zvfhmin),
75
+ ISA_EXT_DATA_ENTRY(zvkg, PRIV_VERSION_1_12_0, ext_zvkg),
76
ISA_EXT_DATA_ENTRY(zvkned, PRIV_VERSION_1_12_0, ext_zvkned),
77
ISA_EXT_DATA_ENTRY(zvknha, PRIV_VERSION_1_12_0, ext_zvknha),
78
ISA_EXT_DATA_ENTRY(zvknhb, PRIV_VERSION_1_12_0, ext_zvknhb),
79
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_validate_set_extensions(RISCVCPU *cpu, Error **errp)
80
* In principle Zve*x would also suffice here, were they supported
81
* in qemu
82
*/
83
- if ((cpu->cfg.ext_zvbb || cpu->cfg.ext_zvkned || cpu->cfg.ext_zvknha ||
84
- cpu->cfg.ext_zvksh) && !cpu->cfg.ext_zve32f) {
85
+ if ((cpu->cfg.ext_zvbb || cpu->cfg.ext_zvkg || cpu->cfg.ext_zvkned ||
86
+ cpu->cfg.ext_zvknha || cpu->cfg.ext_zvksh) && !cpu->cfg.ext_zve32f) {
87
error_setg(errp,
88
"Vector crypto extensions require V or Zve* extensions");
89
return;
90
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
91
/* Vector cryptography extensions */
92
DEFINE_PROP_BOOL("x-zvbb", RISCVCPU, cfg.ext_zvbb, false),
93
DEFINE_PROP_BOOL("x-zvbc", RISCVCPU, cfg.ext_zvbc, false),
94
+ DEFINE_PROP_BOOL("x-zvkg", RISCVCPU, cfg.ext_zvkg, false),
95
DEFINE_PROP_BOOL("x-zvkned", RISCVCPU, cfg.ext_zvkned, false),
96
DEFINE_PROP_BOOL("x-zvknha", RISCVCPU, cfg.ext_zvknha, false),
97
DEFINE_PROP_BOOL("x-zvknhb", RISCVCPU, cfg.ext_zvknhb, false),
98
diff --git a/target/riscv/vcrypto_helper.c b/target/riscv/vcrypto_helper.c
99
index XXXXXXX..XXXXXXX 100644
100
--- a/target/riscv/vcrypto_helper.c
101
+++ b/target/riscv/vcrypto_helper.c
102
@@ -XXX,XX +XXX,XX @@ void HELPER(vsm3c_vi)(void *vd_vptr, void *vs2_vptr, uint32_t uimm,
103
vext_set_elems_1s(vd_vptr, vta, env->vl * esz, total_elems * esz);
104
env->vstart = 0;
105
}
106
+
107
+void HELPER(vghsh_vv)(void *vd_vptr, void *vs1_vptr, void *vs2_vptr,
108
+ CPURISCVState *env, uint32_t desc)
109
+{
110
+ uint64_t *vd = vd_vptr;
111
+ uint64_t *vs1 = vs1_vptr;
112
+ uint64_t *vs2 = vs2_vptr;
113
+ uint32_t vta = vext_vta(desc);
114
+ uint32_t total_elems = vext_get_total_elems(env, desc, 4);
115
+
116
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) {
117
+ uint64_t Y[2] = {vd[i * 2 + 0], vd[i * 2 + 1]};
118
+ uint64_t H[2] = {brev8(vs2[i * 2 + 0]), brev8(vs2[i * 2 + 1])};
119
+ uint64_t X[2] = {vs1[i * 2 + 0], vs1[i * 2 + 1]};
120
+ uint64_t Z[2] = {0, 0};
121
+
122
+ uint64_t S[2] = {brev8(Y[0] ^ X[0]), brev8(Y[1] ^ X[1])};
123
+
124
+ for (int j = 0; j < 128; j++) {
125
+ if ((S[j / 64] >> (j % 64)) & 1) {
126
+ Z[0] ^= H[0];
127
+ Z[1] ^= H[1];
128
+ }
129
+ bool reduce = ((H[1] >> 63) & 1);
130
+ H[1] = H[1] << 1 | H[0] >> 63;
131
+ H[0] = H[0] << 1;
132
+ if (reduce) {
133
+ H[0] ^= 0x87;
134
+ }
135
+ }
136
+
137
+ vd[i * 2 + 0] = brev8(Z[0]);
138
+ vd[i * 2 + 1] = brev8(Z[1]);
139
+ }
140
+ /* set tail elements to 1s */
141
+ vext_set_elems_1s(vd, vta, env->vl * 4, total_elems * 4);
142
+ env->vstart = 0;
143
+}
144
+
145
+void HELPER(vgmul_vv)(void *vd_vptr, void *vs2_vptr, CPURISCVState *env,
146
+ uint32_t desc)
147
+{
148
+ uint64_t *vd = vd_vptr;
149
+ uint64_t *vs2 = vs2_vptr;
150
+ uint32_t vta = vext_vta(desc);
151
+ uint32_t total_elems = vext_get_total_elems(env, desc, 4);
152
+
153
+ for (uint32_t i = env->vstart / 4; i < env->vl / 4; i++) {
154
+ uint64_t Y[2] = {brev8(vd[i * 2 + 0]), brev8(vd[i * 2 + 1])};
155
+ uint64_t H[2] = {brev8(vs2[i * 2 + 0]), brev8(vs2[i * 2 + 1])};
156
+ uint64_t Z[2] = {0, 0};
157
+
158
+ for (int j = 0; j < 128; j++) {
159
+ if ((Y[j / 64] >> (j % 64)) & 1) {
160
+ Z[0] ^= H[0];
161
+ Z[1] ^= H[1];
162
+ }
163
+ bool reduce = ((H[1] >> 63) & 1);
164
+ H[1] = H[1] << 1 | H[0] >> 63;
165
+ H[0] = H[0] << 1;
166
+ if (reduce) {
167
+ H[0] ^= 0x87;
168
+ }
169
+ }
170
+
171
+ vd[i * 2 + 0] = brev8(Z[0]);
172
+ vd[i * 2 + 1] = brev8(Z[1]);
173
+ }
174
+ /* set tail elements to 1s */
175
+ vext_set_elems_1s(vd, vta, env->vl * 4, total_elems * 4);
176
+ env->vstart = 0;
177
+}
178
diff --git a/target/riscv/insn_trans/trans_rvvk.c.inc b/target/riscv/insn_trans/trans_rvvk.c.inc
179
index XXXXXXX..XXXXXXX 100644
180
--- a/target/riscv/insn_trans/trans_rvvk.c.inc
181
+++ b/target/riscv/insn_trans/trans_rvvk.c.inc
182
@@ -XXX,XX +XXX,XX @@ static inline bool vsm3c_check(DisasContext *s, arg_rmrr *a)
183
184
GEN_VV_UNMASKED_TRANS(vsm3me_vv, vsm3me_check, ZVKSH_EGS)
185
GEN_VI_UNMASKED_TRANS(vsm3c_vi, vsm3c_check, ZVKSH_EGS)
186
+
187
+/*
188
+ * Zvkg
189
+ */
190
+
191
+#define ZVKG_EGS 4
192
+
193
+static bool vgmul_check(DisasContext *s, arg_rmr *a)
194
+{
195
+ int egw_bytes = ZVKG_EGS << s->sew;
196
+ return s->cfg_ptr->ext_zvkg == true &&
197
+ vext_check_isa_ill(s) &&
198
+ require_rvv(s) &&
199
+ MAXSZ(s) >= egw_bytes &&
200
+ vext_check_ss(s, a->rd, a->rs2, a->vm) &&
201
+ s->sew == MO_32;
202
+}
203
+
204
+GEN_V_UNMASKED_TRANS(vgmul_vv, vgmul_check, ZVKG_EGS)
205
+
206
+static bool vghsh_check(DisasContext *s, arg_rmrr *a)
207
+{
208
+ int egw_bytes = ZVKG_EGS << s->sew;
209
+ return s->cfg_ptr->ext_zvkg == true &&
210
+ opivv_check(s, a) &&
211
+ MAXSZ(s) >= egw_bytes &&
212
+ s->sew == MO_32;
213
+}
214
+
215
+GEN_VV_UNMASKED_TRANS(vghsh_vv, vghsh_check, ZVKG_EGS)
216
--
217
2.41.0
diff view generated by jsdifflib
New patch
1
From: Max Chou <max.chou@sifive.com>
1
2
3
Allows sharing of sm4_subword between different targets.
4
5
Signed-off-by: Max Chou <max.chou@sifive.com>
6
Reviewed-by: Frank Chang <frank.chang@sifive.com>
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Signed-off-by: Max Chou <max.chou@sifive.com>
9
Message-ID: <20230711165917.2629866-14-max.chou@sifive.com>
10
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
11
---
12
include/crypto/sm4.h | 8 ++++++++
13
target/arm/tcg/crypto_helper.c | 10 ++--------
14
2 files changed, 10 insertions(+), 8 deletions(-)
15
16
diff --git a/include/crypto/sm4.h b/include/crypto/sm4.h
17
index XXXXXXX..XXXXXXX 100644
18
--- a/include/crypto/sm4.h
19
+++ b/include/crypto/sm4.h
20
@@ -XXX,XX +XXX,XX @@
21
22
extern const uint8_t sm4_sbox[256];
23
24
+static inline uint32_t sm4_subword(uint32_t word)
25
+{
26
+ return sm4_sbox[word & 0xff] |
27
+ sm4_sbox[(word >> 8) & 0xff] << 8 |
28
+ sm4_sbox[(word >> 16) & 0xff] << 16 |
29
+ sm4_sbox[(word >> 24) & 0xff] << 24;
30
+}
31
+
32
#endif
33
diff --git a/target/arm/tcg/crypto_helper.c b/target/arm/tcg/crypto_helper.c
34
index XXXXXXX..XXXXXXX 100644
35
--- a/target/arm/tcg/crypto_helper.c
36
+++ b/target/arm/tcg/crypto_helper.c
37
@@ -XXX,XX +XXX,XX @@ static void do_crypto_sm4e(uint64_t *rd, uint64_t *rn, uint64_t *rm)
38
CR_ST_WORD(d, (i + 3) % 4) ^
39
CR_ST_WORD(n, i);
40
41
- t = sm4_sbox[t & 0xff] |
42
- sm4_sbox[(t >> 8) & 0xff] << 8 |
43
- sm4_sbox[(t >> 16) & 0xff] << 16 |
44
- sm4_sbox[(t >> 24) & 0xff] << 24;
45
+ t = sm4_subword(t);
46
47
CR_ST_WORD(d, i) ^= t ^ rol32(t, 2) ^ rol32(t, 10) ^ rol32(t, 18) ^
48
rol32(t, 24);
49
@@ -XXX,XX +XXX,XX @@ static void do_crypto_sm4ekey(uint64_t *rd, uint64_t *rn, uint64_t *rm)
50
CR_ST_WORD(d, (i + 3) % 4) ^
51
CR_ST_WORD(m, i);
52
53
- t = sm4_sbox[t & 0xff] |
54
- sm4_sbox[(t >> 8) & 0xff] << 8 |
55
- sm4_sbox[(t >> 16) & 0xff] << 16 |
56
- sm4_sbox[(t >> 24) & 0xff] << 24;
57
+ t = sm4_subword(t);
58
59
CR_ST_WORD(d, i) ^= t ^ rol32(t, 13) ^ rol32(t, 23);
60
}
61
--
62
2.41.0
diff view generated by jsdifflib
New patch
1
From: Max Chou <max.chou@sifive.com>
1
2
3
Adds sm4_ck constant for use in sm4 cryptography across different targets.
4
5
Signed-off-by: Max Chou <max.chou@sifive.com>
6
Reviewed-by: Frank Chang <frank.chang@sifive.com>
7
Signed-off-by: Max Chou <max.chou@sifive.com>
8
Message-ID: <20230711165917.2629866-15-max.chou@sifive.com>
9
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
10
---
11
include/crypto/sm4.h | 1 +
12
crypto/sm4.c | 10 ++++++++++
13
2 files changed, 11 insertions(+)
14
15
diff --git a/include/crypto/sm4.h b/include/crypto/sm4.h
16
index XXXXXXX..XXXXXXX 100644
17
--- a/include/crypto/sm4.h
18
+++ b/include/crypto/sm4.h
19
@@ -XXX,XX +XXX,XX @@
20
#define QEMU_SM4_H
21
22
extern const uint8_t sm4_sbox[256];
23
+extern const uint32_t sm4_ck[32];
24
25
static inline uint32_t sm4_subword(uint32_t word)
26
{
27
diff --git a/crypto/sm4.c b/crypto/sm4.c
28
index XXXXXXX..XXXXXXX 100644
29
--- a/crypto/sm4.c
30
+++ b/crypto/sm4.c
31
@@ -XXX,XX +XXX,XX @@ uint8_t const sm4_sbox[] = {
32
0x79, 0xee, 0x5f, 0x3e, 0xd7, 0xcb, 0x39, 0x48,
33
};
34
35
+uint32_t const sm4_ck[] = {
36
+ 0x00070e15, 0x1c232a31, 0x383f464d, 0x545b6269,
37
+ 0x70777e85, 0x8c939aa1, 0xa8afb6bd, 0xc4cbd2d9,
38
+ 0xe0e7eef5, 0xfc030a11, 0x181f262d, 0x343b4249,
39
+ 0x50575e65, 0x6c737a81, 0x888f969d, 0xa4abb2b9,
40
+ 0xc0c7ced5, 0xdce3eaf1, 0xf8ff060d, 0x141b2229,
41
+ 0x30373e45, 0x4c535a61, 0x686f767d, 0x848b9299,
42
+ 0xa0a7aeb5, 0xbcc3cad1, 0xd8dfe6ed, 0xf4fb0209,
43
+ 0x10171e25, 0x2c333a41, 0x484f565d, 0x646b7279
44
+};
45
--
46
2.41.0
diff view generated by jsdifflib
New patch
1
1
From: Max Chou <max.chou@sifive.com>
2
3
This commit adds support for the Zvksed vector-crypto extension, which
4
consists of the following instructions:
5
6
* vsm4k.vi
7
* vsm4r.[vv,vs]
8
9
Translation functions are defined in
10
`target/riscv/insn_trans/trans_rvvk.c.inc` and helpers are defined in
11
`target/riscv/vcrypto_helper.c`.
12
13
Signed-off-by: Max Chou <max.chou@sifive.com>
14
Reviewed-by: Frank Chang <frank.chang@sifive.com>
15
[lawrence.hunter@codethink.co.uk: Moved SM4 functions from
16
crypto_helper.c to vcrypto_helper.c]
17
[nazar.kazakov@codethink.co.uk: Added alignment checks, refactored code to
18
use macros, and minor style changes]
19
Signed-off-by: Max Chou <max.chou@sifive.com>
20
Message-ID: <20230711165917.2629866-16-max.chou@sifive.com>
21
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
22
---
23
target/riscv/cpu_cfg.h | 1 +
24
target/riscv/helper.h | 4 +
25
target/riscv/insn32.decode | 5 +
26
target/riscv/cpu.c | 5 +-
27
target/riscv/vcrypto_helper.c | 127 +++++++++++++++++++++++
28
target/riscv/insn_trans/trans_rvvk.c.inc | 43 ++++++++
29
6 files changed, 184 insertions(+), 1 deletion(-)
30
31
diff --git a/target/riscv/cpu_cfg.h b/target/riscv/cpu_cfg.h
32
index XXXXXXX..XXXXXXX 100644
33
--- a/target/riscv/cpu_cfg.h
34
+++ b/target/riscv/cpu_cfg.h
35
@@ -XXX,XX +XXX,XX @@ struct RISCVCPUConfig {
36
bool ext_zvkned;
37
bool ext_zvknha;
38
bool ext_zvknhb;
39
+ bool ext_zvksed;
40
bool ext_zvksh;
41
bool ext_zmmul;
42
bool ext_zvfbfmin;
43
diff --git a/target/riscv/helper.h b/target/riscv/helper.h
44
index XXXXXXX..XXXXXXX 100644
45
--- a/target/riscv/helper.h
46
+++ b/target/riscv/helper.h
47
@@ -XXX,XX +XXX,XX @@ DEF_HELPER_5(vsm3c_vi, void, ptr, ptr, i32, env, i32)
48
49
DEF_HELPER_5(vghsh_vv, void, ptr, ptr, ptr, env, i32)
50
DEF_HELPER_4(vgmul_vv, void, ptr, ptr, env, i32)
51
+
52
+DEF_HELPER_5(vsm4k_vi, void, ptr, ptr, i32, env, i32)
53
+DEF_HELPER_4(vsm4r_vv, void, ptr, ptr, env, i32)
54
+DEF_HELPER_4(vsm4r_vs, void, ptr, ptr, env, i32)
55
diff --git a/target/riscv/insn32.decode b/target/riscv/insn32.decode
56
index XXXXXXX..XXXXXXX 100644
57
--- a/target/riscv/insn32.decode
58
+++ b/target/riscv/insn32.decode
59
@@ -XXX,XX +XXX,XX @@ vsm3c_vi 101011 1 ..... ..... 010 ..... 1110111 @r_vm_1
60
# *** Zvkg vector crypto extension ***
61
vghsh_vv 101100 1 ..... ..... 010 ..... 1110111 @r_vm_1
62
vgmul_vv 101000 1 ..... 10001 010 ..... 1110111 @r2_vm_1
63
+
64
+# *** Zvksed vector crypto extension ***
65
+vsm4k_vi 100001 1 ..... ..... 010 ..... 1110111 @r_vm_1
66
+vsm4r_vv 101000 1 ..... 10000 010 ..... 1110111 @r2_vm_1
67
+vsm4r_vs 101001 1 ..... 10000 010 ..... 1110111 @r2_vm_1
68
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
69
index XXXXXXX..XXXXXXX 100644
70
--- a/target/riscv/cpu.c
71
+++ b/target/riscv/cpu.c
72
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
73
ISA_EXT_DATA_ENTRY(zvkned, PRIV_VERSION_1_12_0, ext_zvkned),
74
ISA_EXT_DATA_ENTRY(zvknha, PRIV_VERSION_1_12_0, ext_zvknha),
75
ISA_EXT_DATA_ENTRY(zvknhb, PRIV_VERSION_1_12_0, ext_zvknhb),
76
+ ISA_EXT_DATA_ENTRY(zvksed, PRIV_VERSION_1_12_0, ext_zvksed),
77
ISA_EXT_DATA_ENTRY(zvksh, PRIV_VERSION_1_12_0, ext_zvksh),
78
ISA_EXT_DATA_ENTRY(zhinx, PRIV_VERSION_1_12_0, ext_zhinx),
79
ISA_EXT_DATA_ENTRY(zhinxmin, PRIV_VERSION_1_12_0, ext_zhinxmin),
80
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_validate_set_extensions(RISCVCPU *cpu, Error **errp)
81
* in qemu
82
*/
83
if ((cpu->cfg.ext_zvbb || cpu->cfg.ext_zvkg || cpu->cfg.ext_zvkned ||
84
- cpu->cfg.ext_zvknha || cpu->cfg.ext_zvksh) && !cpu->cfg.ext_zve32f) {
85
+ cpu->cfg.ext_zvknha || cpu->cfg.ext_zvksed || cpu->cfg.ext_zvksh) &&
86
+ !cpu->cfg.ext_zve32f) {
87
error_setg(errp,
88
"Vector crypto extensions require V or Zve* extensions");
89
return;
90
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
91
DEFINE_PROP_BOOL("x-zvkned", RISCVCPU, cfg.ext_zvkned, false),
92
DEFINE_PROP_BOOL("x-zvknha", RISCVCPU, cfg.ext_zvknha, false),
93
DEFINE_PROP_BOOL("x-zvknhb", RISCVCPU, cfg.ext_zvknhb, false),
94
+ DEFINE_PROP_BOOL("x-zvksed", RISCVCPU, cfg.ext_zvksed, false),
95
DEFINE_PROP_BOOL("x-zvksh", RISCVCPU, cfg.ext_zvksh, false),
96
97
DEFINE_PROP_END_OF_LIST(),
98
diff --git a/target/riscv/vcrypto_helper.c b/target/riscv/vcrypto_helper.c
99
index XXXXXXX..XXXXXXX 100644
100
--- a/target/riscv/vcrypto_helper.c
101
+++ b/target/riscv/vcrypto_helper.c
102
@@ -XXX,XX +XXX,XX @@
103
#include "cpu.h"
104
#include "crypto/aes.h"
105
#include "crypto/aes-round.h"
106
+#include "crypto/sm4.h"
107
#include "exec/memop.h"
108
#include "exec/exec-all.h"
109
#include "exec/helper-proto.h"
110
@@ -XXX,XX +XXX,XX @@ void HELPER(vgmul_vv)(void *vd_vptr, void *vs2_vptr, CPURISCVState *env,
111
vext_set_elems_1s(vd, vta, env->vl * 4, total_elems * 4);
112
env->vstart = 0;
113
}
114
+
115
+void HELPER(vsm4k_vi)(void *vd, void *vs2, uint32_t uimm5, CPURISCVState *env,
116
+ uint32_t desc)
117
+{
118
+ const uint32_t egs = 4;
119
+ uint32_t rnd = uimm5 & 0x7;
120
+ uint32_t group_start = env->vstart / egs;
121
+ uint32_t group_end = env->vl / egs;
122
+ uint32_t esz = sizeof(uint32_t);
123
+ uint32_t total_elems = vext_get_total_elems(env, desc, esz);
124
+
125
+ for (uint32_t i = group_start; i < group_end; ++i) {
126
+ uint32_t vstart = i * egs;
127
+ uint32_t vend = (i + 1) * egs;
128
+ uint32_t rk[4] = {0};
129
+ uint32_t tmp[8] = {0};
130
+
131
+ for (uint32_t j = vstart; j < vend; ++j) {
132
+ rk[j - vstart] = *((uint32_t *)vs2 + H4(j));
133
+ }
134
+
135
+ for (uint32_t j = 0; j < egs; ++j) {
136
+ tmp[j] = rk[j];
137
+ }
138
+
139
+ for (uint32_t j = 0; j < egs; ++j) {
140
+ uint32_t b, s;
141
+ b = tmp[j + 1] ^ tmp[j + 2] ^ tmp[j + 3] ^ sm4_ck[rnd * 4 + j];
142
+
143
+ s = sm4_subword(b);
144
+
145
+ tmp[j + 4] = tmp[j] ^ (s ^ rol32(s, 13) ^ rol32(s, 23));
146
+ }
147
+
148
+ for (uint32_t j = vstart; j < vend; ++j) {
149
+ *((uint32_t *)vd + H4(j)) = tmp[egs + (j - vstart)];
150
+ }
151
+ }
152
+
153
+ env->vstart = 0;
154
+ /* set tail elements to 1s */
155
+ vext_set_elems_1s(vd, vext_vta(desc), env->vl * esz, total_elems * esz);
156
+}
157
+
158
+static void do_sm4_round(uint32_t *rk, uint32_t *buf)
159
+{
160
+ const uint32_t egs = 4;
161
+ uint32_t s, b;
162
+
163
+ for (uint32_t j = egs; j < egs * 2; ++j) {
164
+ b = buf[j - 3] ^ buf[j - 2] ^ buf[j - 1] ^ rk[j - 4];
165
+
166
+ s = sm4_subword(b);
167
+
168
+ buf[j] = buf[j - 4] ^ (s ^ rol32(s, 2) ^ rol32(s, 10) ^ rol32(s, 18) ^
169
+ rol32(s, 24));
170
+ }
171
+}
172
+
173
+void HELPER(vsm4r_vv)(void *vd, void *vs2, CPURISCVState *env, uint32_t desc)
174
+{
175
+ const uint32_t egs = 4;
176
+ uint32_t group_start = env->vstart / egs;
177
+ uint32_t group_end = env->vl / egs;
178
+ uint32_t esz = sizeof(uint32_t);
179
+ uint32_t total_elems = vext_get_total_elems(env, desc, esz);
180
+
181
+ for (uint32_t i = group_start; i < group_end; ++i) {
182
+ uint32_t vstart = i * egs;
183
+ uint32_t vend = (i + 1) * egs;
184
+ uint32_t rk[4] = {0};
185
+ uint32_t tmp[8] = {0};
186
+
187
+ for (uint32_t j = vstart; j < vend; ++j) {
188
+ rk[j - vstart] = *((uint32_t *)vs2 + H4(j));
189
+ }
190
+
191
+ for (uint32_t j = vstart; j < vend; ++j) {
192
+ tmp[j - vstart] = *((uint32_t *)vd + H4(j));
193
+ }
194
+
195
+ do_sm4_round(rk, tmp);
196
+
197
+ for (uint32_t j = vstart; j < vend; ++j) {
198
+ *((uint32_t *)vd + H4(j)) = tmp[egs + (j - vstart)];
199
+ }
200
+ }
201
+
202
+ env->vstart = 0;
203
+ /* set tail elements to 1s */
204
+ vext_set_elems_1s(vd, vext_vta(desc), env->vl * esz, total_elems * esz);
205
+}
206
+
207
+void HELPER(vsm4r_vs)(void *vd, void *vs2, CPURISCVState *env, uint32_t desc)
208
+{
209
+ const uint32_t egs = 4;
210
+ uint32_t group_start = env->vstart / egs;
211
+ uint32_t group_end = env->vl / egs;
212
+ uint32_t esz = sizeof(uint32_t);
213
+ uint32_t total_elems = vext_get_total_elems(env, desc, esz);
214
+
215
+ for (uint32_t i = group_start; i < group_end; ++i) {
216
+ uint32_t vstart = i * egs;
217
+ uint32_t vend = (i + 1) * egs;
218
+ uint32_t rk[4] = {0};
219
+ uint32_t tmp[8] = {0};
220
+
221
+ for (uint32_t j = 0; j < egs; ++j) {
222
+ rk[j] = *((uint32_t *)vs2 + H4(j));
223
+ }
224
+
225
+ for (uint32_t j = vstart; j < vend; ++j) {
226
+ tmp[j - vstart] = *((uint32_t *)vd + H4(j));
227
+ }
228
+
229
+ do_sm4_round(rk, tmp);
230
+
231
+ for (uint32_t j = vstart; j < vend; ++j) {
232
+ *((uint32_t *)vd + H4(j)) = tmp[egs + (j - vstart)];
233
+ }
234
+ }
235
+
236
+ env->vstart = 0;
237
+ /* set tail elements to 1s */
238
+ vext_set_elems_1s(vd, vext_vta(desc), env->vl * esz, total_elems * esz);
239
+}
240
diff --git a/target/riscv/insn_trans/trans_rvvk.c.inc b/target/riscv/insn_trans/trans_rvvk.c.inc
241
index XXXXXXX..XXXXXXX 100644
242
--- a/target/riscv/insn_trans/trans_rvvk.c.inc
243
+++ b/target/riscv/insn_trans/trans_rvvk.c.inc
244
@@ -XXX,XX +XXX,XX @@ static bool vghsh_check(DisasContext *s, arg_rmrr *a)
245
}
246
247
GEN_VV_UNMASKED_TRANS(vghsh_vv, vghsh_check, ZVKG_EGS)
248
+
249
+/*
250
+ * Zvksed
251
+ */
252
+
253
+#define ZVKSED_EGS 4
254
+
255
+static bool zvksed_check(DisasContext *s)
256
+{
257
+ int egw_bytes = ZVKSED_EGS << s->sew;
258
+ return s->cfg_ptr->ext_zvksed == true &&
259
+ require_rvv(s) &&
260
+ vext_check_isa_ill(s) &&
261
+ MAXSZ(s) >= egw_bytes &&
262
+ s->sew == MO_32;
263
+}
264
+
265
+static bool vsm4k_vi_check(DisasContext *s, arg_rmrr *a)
266
+{
267
+ return zvksed_check(s) &&
268
+ require_align(a->rd, s->lmul) &&
269
+ require_align(a->rs2, s->lmul);
270
+}
271
+
272
+GEN_VI_UNMASKED_TRANS(vsm4k_vi, vsm4k_vi_check, ZVKSED_EGS)
273
+
274
+static bool vsm4r_vv_check(DisasContext *s, arg_rmr *a)
275
+{
276
+ return zvksed_check(s) &&
277
+ require_align(a->rd, s->lmul) &&
278
+ require_align(a->rs2, s->lmul);
279
+}
280
+
281
+GEN_V_UNMASKED_TRANS(vsm4r_vv, vsm4r_vv_check, ZVKSED_EGS)
282
+
283
+static bool vsm4r_vs_check(DisasContext *s, arg_rmr *a)
284
+{
285
+ return zvksed_check(s) &&
286
+ !is_overlapped(a->rd, 1 << MAX(s->lmul, 0), a->rs2, 1) &&
287
+ require_align(a->rd, s->lmul);
288
+}
289
+
290
+GEN_V_UNMASKED_TRANS(vsm4r_vs, vsm4r_vs_check, ZVKSED_EGS)
291
--
292
2.41.0
diff view generated by jsdifflib
1
From: Rob Bradford <rbradford@rivosinc.com>
2
3
These are WARL fields - zero out the bits for unavailable counters and
4
special case the TM bit in mcountinhibit which is hardwired to zero.
5
This patch achieves this by modifying the value written so that any use
6
of the field will see the correctly masked bits.
7
8
Tested by modifying OpenSBI to write max value to these CSRs and upon
9
subsequent read the appropriate number of bits for number of PMUs is
10
enabled and the TM bit is zero in mcountinhibit.
11
12
Signed-off-by: Rob Bradford <rbradford@rivosinc.com>
13
Acked-by: Alistair Francis <alistair.francis@wdc.com>
14
Reviewed-by: Atish Patra <atishp@rivosinc.com>
15
Message-ID: <20230802124906.24197-1-rbradford@rivosinc.com>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
16
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: ca5359fec6b2aff851eef3b3bc4b53cb5d4ad194.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <ca5359fec6b2aff851eef3b3bc4b53cb5d4ad194.1597259519.git.alistair.francis@wdc.com>
4
---
17
---
5
target/riscv/csr.c | 1 -
18
target/riscv/csr.c | 11 +++++++++--
6
1 file changed, 1 deletion(-)
19
1 file changed, 9 insertions(+), 2 deletions(-)
7
20
8
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
21
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
9
index XXXXXXX..XXXXXXX 100644
22
index XXXXXXX..XXXXXXX 100644
10
--- a/target/riscv/csr.c
23
--- a/target/riscv/csr.c
11
+++ b/target/riscv/csr.c
24
+++ b/target/riscv/csr.c
12
@@ -XXX,XX +XXX,XX @@ static int read_htinst(CPURISCVState *env, int csrno, target_ulong *val)
25
@@ -XXX,XX +XXX,XX @@ static RISCVException write_mcountinhibit(CPURISCVState *env, int csrno,
13
14
static int write_htinst(CPURISCVState *env, int csrno, target_ulong val)
15
{
26
{
16
- env->htinst = val;
27
int cidx;
17
return 0;
28
PMUCTRState *counter;
29
+ RISCVCPU *cpu = env_archcpu(env);
30
31
- env->mcountinhibit = val;
32
+ /* WARL register - disable unavailable counters; TM bit is always 0 */
33
+ env->mcountinhibit =
34
+ val & (cpu->pmu_avail_ctrs | COUNTEREN_CY | COUNTEREN_IR);
35
36
/* Check if any other counter is also monitoring cycles/instructions */
37
for (cidx = 0; cidx < RV_MAX_MHPMCOUNTERS; cidx++) {
38
@@ -XXX,XX +XXX,XX @@ static RISCVException read_mcounteren(CPURISCVState *env, int csrno,
39
static RISCVException write_mcounteren(CPURISCVState *env, int csrno,
40
target_ulong val)
41
{
42
- env->mcounteren = val;
43
+ RISCVCPU *cpu = env_archcpu(env);
44
+
45
+ /* WARL register - disable unavailable counters */
46
+ env->mcounteren = val & (cpu->pmu_avail_ctrs | COUNTEREN_CY | COUNTEREN_TM |
47
+ COUNTEREN_IR);
48
return RISCV_EXCP_NONE;
18
}
49
}
19
50
20
--
51
--
21
2.28.0
52
2.41.0
22
23
diff view generated by jsdifflib
New patch
1
From: Jason Chien <jason.chien@sifive.com>
1
2
3
RVA23 Profiles states:
4
The RVA23 profiles are intended to be used for 64-bit application
5
processors that will run rich OS stacks from standard binary OS
6
distributions and with a substantial number of third-party binary user
7
applications that will be supported over a considerable length of time
8
in the field.
9
10
The chapter 4 of the unprivileged spec introduces the Zihintntl extension
11
and Zihintntl is a mandatory extension presented in RVA23 Profiles, whose
12
purpose is to enable application and operating system portability across
13
different implementations. Thus the DTS should contain the Zihintntl ISA
14
string in order to pass to software.
15
16
The unprivileged spec states:
17
Like any HINTs, these instructions may be freely ignored. Hence, although
18
they are described in terms of cache-based memory hierarchies, they do not
19
mandate the provision of caches.
20
21
These instructions are encoded with non-used opcode, e.g. ADD x0, x0, x2,
22
which QEMU already supports, and QEMU does not emulate cache. Therefore
23
these instructions can be considered as a no-op, and we only need to add
24
a new property for the Zihintntl extension.
25
26
Reviewed-by: Frank Chang <frank.chang@sifive.com>
27
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
28
Signed-off-by: Jason Chien <jason.chien@sifive.com>
29
Message-ID: <20230726074049.19505-2-jason.chien@sifive.com>
30
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
31
---
32
target/riscv/cpu_cfg.h | 1 +
33
target/riscv/cpu.c | 2 ++
34
2 files changed, 3 insertions(+)
35
36
diff --git a/target/riscv/cpu_cfg.h b/target/riscv/cpu_cfg.h
37
index XXXXXXX..XXXXXXX 100644
38
--- a/target/riscv/cpu_cfg.h
39
+++ b/target/riscv/cpu_cfg.h
40
@@ -XXX,XX +XXX,XX @@ struct RISCVCPUConfig {
41
bool ext_icbom;
42
bool ext_icboz;
43
bool ext_zicond;
44
+ bool ext_zihintntl;
45
bool ext_zihintpause;
46
bool ext_smstateen;
47
bool ext_sstc;
48
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
49
index XXXXXXX..XXXXXXX 100644
50
--- a/target/riscv/cpu.c
51
+++ b/target/riscv/cpu.c
52
@@ -XXX,XX +XXX,XX @@ static const struct isa_ext_data isa_edata_arr[] = {
53
ISA_EXT_DATA_ENTRY(zicond, PRIV_VERSION_1_12_0, ext_zicond),
54
ISA_EXT_DATA_ENTRY(zicsr, PRIV_VERSION_1_10_0, ext_icsr),
55
ISA_EXT_DATA_ENTRY(zifencei, PRIV_VERSION_1_10_0, ext_ifencei),
56
+ ISA_EXT_DATA_ENTRY(zihintntl, PRIV_VERSION_1_10_0, ext_zihintntl),
57
ISA_EXT_DATA_ENTRY(zihintpause, PRIV_VERSION_1_10_0, ext_zihintpause),
58
ISA_EXT_DATA_ENTRY(zmmul, PRIV_VERSION_1_12_0, ext_zmmul),
59
ISA_EXT_DATA_ENTRY(zawrs, PRIV_VERSION_1_12_0, ext_zawrs),
60
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
61
DEFINE_PROP_BOOL("sscofpmf", RISCVCPU, cfg.ext_sscofpmf, false),
62
DEFINE_PROP_BOOL("Zifencei", RISCVCPU, cfg.ext_ifencei, true),
63
DEFINE_PROP_BOOL("Zicsr", RISCVCPU, cfg.ext_icsr, true),
64
+ DEFINE_PROP_BOOL("Zihintntl", RISCVCPU, cfg.ext_zihintntl, true),
65
DEFINE_PROP_BOOL("Zihintpause", RISCVCPU, cfg.ext_zihintpause, true),
66
DEFINE_PROP_BOOL("Zawrs", RISCVCPU, cfg.ext_zawrs, true),
67
DEFINE_PROP_BOOL("Zfa", RISCVCPU, cfg.ext_zfa, true),
68
--
69
2.41.0
diff view generated by jsdifflib
New patch
1
From: LIU Zhiwei <zhiwei_liu@linux.alibaba.com>
1
2
3
Commit a47842d ("riscv: Add support for the Zfa extension") implemented the zfa extension.
4
However, it has some typos for fleq.d and fltq.d. Both of them misused the fltq.s
5
helper function.
6
7
Fixes: a47842d ("riscv: Add support for the Zfa extension")
8
Signed-off-by: LIU Zhiwei <zhiwei_liu@linux.alibaba.com>
9
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
10
Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn>
11
Message-ID: <20230728003906.768-1-zhiwei_liu@linux.alibaba.com>
12
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
13
---
14
target/riscv/insn_trans/trans_rvzfa.c.inc | 4 ++--
15
1 file changed, 2 insertions(+), 2 deletions(-)
16
17
diff --git a/target/riscv/insn_trans/trans_rvzfa.c.inc b/target/riscv/insn_trans/trans_rvzfa.c.inc
18
index XXXXXXX..XXXXXXX 100644
19
--- a/target/riscv/insn_trans/trans_rvzfa.c.inc
20
+++ b/target/riscv/insn_trans/trans_rvzfa.c.inc
21
@@ -XXX,XX +XXX,XX @@ bool trans_fleq_d(DisasContext *ctx, arg_fleq_d *a)
22
TCGv_i64 src1 = get_fpr_hs(ctx, a->rs1);
23
TCGv_i64 src2 = get_fpr_hs(ctx, a->rs2);
24
25
- gen_helper_fltq_s(dest, cpu_env, src1, src2);
26
+ gen_helper_fleq_d(dest, cpu_env, src1, src2);
27
gen_set_gpr(ctx, a->rd, dest);
28
return true;
29
}
30
@@ -XXX,XX +XXX,XX @@ bool trans_fltq_d(DisasContext *ctx, arg_fltq_d *a)
31
TCGv_i64 src1 = get_fpr_hs(ctx, a->rs1);
32
TCGv_i64 src2 = get_fpr_hs(ctx, a->rs2);
33
34
- gen_helper_fltq_s(dest, cpu_env, src1, src2);
35
+ gen_helper_fltq_d(dest, cpu_env, src1, src2);
36
gen_set_gpr(ctx, a->rd, dest);
37
return true;
38
}
39
--
40
2.41.0
diff view generated by jsdifflib
New patch
1
From: Jason Chien <jason.chien@sifive.com>
1
2
3
When writing the upper mtime, we should keep the original lower mtime
4
whose value is given by cpu_riscv_read_rtc() instead of
5
cpu_riscv_read_rtc_raw(). The same logic applies to writes to lower mtime.
6
7
Signed-off-by: Jason Chien <jason.chien@sifive.com>
8
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
9
Message-ID: <20230728082502.26439-1-jason.chien@sifive.com>
10
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
11
---
12
hw/intc/riscv_aclint.c | 5 +++--
13
1 file changed, 3 insertions(+), 2 deletions(-)
14
15
diff --git a/hw/intc/riscv_aclint.c b/hw/intc/riscv_aclint.c
16
index XXXXXXX..XXXXXXX 100644
17
--- a/hw/intc/riscv_aclint.c
18
+++ b/hw/intc/riscv_aclint.c
19
@@ -XXX,XX +XXX,XX @@ static void riscv_aclint_mtimer_write(void *opaque, hwaddr addr,
20
return;
21
} else if (addr == mtimer->time_base || addr == mtimer->time_base + 4) {
22
uint64_t rtc_r = cpu_riscv_read_rtc_raw(mtimer->timebase_freq);
23
+ uint64_t rtc = cpu_riscv_read_rtc(mtimer);
24
25
if (addr == mtimer->time_base) {
26
if (size == 4) {
27
/* time_lo for RV32/RV64 */
28
- mtimer->time_delta = ((rtc_r & ~0xFFFFFFFFULL) | value) - rtc_r;
29
+ mtimer->time_delta = ((rtc & ~0xFFFFFFFFULL) | value) - rtc_r;
30
} else {
31
/* time for RV64 */
32
mtimer->time_delta = value - rtc_r;
33
@@ -XXX,XX +XXX,XX @@ static void riscv_aclint_mtimer_write(void *opaque, hwaddr addr,
34
} else {
35
if (size == 4) {
36
/* time_hi for RV32/RV64 */
37
- mtimer->time_delta = (value << 32 | (rtc_r & 0xFFFFFFFF)) - rtc_r;
38
+ mtimer->time_delta = (value << 32 | (rtc & 0xFFFFFFFF)) - rtc_r;
39
} else {
40
qemu_log_mask(LOG_GUEST_ERROR,
41
"aclint-mtimer: invalid time_hi write: %08x",
42
--
43
2.41.0
diff view generated by jsdifflib
New patch
1
From: Jason Chien <jason.chien@sifive.com>
1
2
3
The variables whose values are given by cpu_riscv_read_rtc() should be named
4
"rtc". The variables whose value are given by cpu_riscv_read_rtc_raw()
5
should be named "rtc_r".
6
7
Signed-off-by: Jason Chien <jason.chien@sifive.com>
8
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
9
Message-ID: <20230728082502.26439-2-jason.chien@sifive.com>
10
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
11
---
12
hw/intc/riscv_aclint.c | 6 +++---
13
1 file changed, 3 insertions(+), 3 deletions(-)
14
15
diff --git a/hw/intc/riscv_aclint.c b/hw/intc/riscv_aclint.c
16
index XXXXXXX..XXXXXXX 100644
17
--- a/hw/intc/riscv_aclint.c
18
+++ b/hw/intc/riscv_aclint.c
19
@@ -XXX,XX +XXX,XX @@ static void riscv_aclint_mtimer_write_timecmp(RISCVAclintMTimerState *mtimer,
20
uint64_t next;
21
uint64_t diff;
22
23
- uint64_t rtc_r = cpu_riscv_read_rtc(mtimer);
24
+ uint64_t rtc = cpu_riscv_read_rtc(mtimer);
25
26
/* Compute the relative hartid w.r.t the socket */
27
hartid = hartid - mtimer->hartid_base;
28
29
mtimer->timecmp[hartid] = value;
30
- if (mtimer->timecmp[hartid] <= rtc_r) {
31
+ if (mtimer->timecmp[hartid] <= rtc) {
32
/*
33
* If we're setting an MTIMECMP value in the "past",
34
* immediately raise the timer interrupt
35
@@ -XXX,XX +XXX,XX @@ static void riscv_aclint_mtimer_write_timecmp(RISCVAclintMTimerState *mtimer,
36
37
/* otherwise, set up the future timer interrupt */
38
qemu_irq_lower(mtimer->timer_irqs[hartid]);
39
- diff = mtimer->timecmp[hartid] - rtc_r;
40
+ diff = mtimer->timecmp[hartid] - rtc;
41
/* back to ns (note args switched in muldiv64) */
42
uint64_t ns_diff = muldiv64(diff, NANOSECONDS_PER_SECOND, timebase_freq);
43
44
--
45
2.41.0
diff view generated by jsdifflib
1
From: LIU Zhiwei <zhiwei_liu@linux.alibaba.com>
2
3
We should not use types dependend on host arch for target_ucontext.
4
This bug is found when run rv32 applications.
5
6
Signed-off-by: LIU Zhiwei <zhiwei_liu@linux.alibaba.com>
7
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
8
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
9
Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org>
10
Message-ID: <20230811055438.1945-1-zhiwei_liu@linux.alibaba.com>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
11
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: 4f227b30cb1816795296c0994f1123fab143666a.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <4f227b30cb1816795296c0994f1123fab143666a.1597259519.git.alistair.francis@wdc.com>
4
---
12
---
5
target/riscv/cpu_bits.h | 14 ++++++++------
13
linux-user/riscv/signal.c | 4 ++--
6
1 file changed, 8 insertions(+), 6 deletions(-)
14
1 file changed, 2 insertions(+), 2 deletions(-)
7
15
8
diff --git a/target/riscv/cpu_bits.h b/target/riscv/cpu_bits.h
16
diff --git a/linux-user/riscv/signal.c b/linux-user/riscv/signal.c
9
index XXXXXXX..XXXXXXX 100644
17
index XXXXXXX..XXXXXXX 100644
10
--- a/target/riscv/cpu_bits.h
18
--- a/linux-user/riscv/signal.c
11
+++ b/target/riscv/cpu_bits.h
19
+++ b/linux-user/riscv/signal.c
12
@@ -XXX,XX +XXX,XX @@
20
@@ -XXX,XX +XXX,XX @@ struct target_sigcontext {
13
#endif
21
}; /* cf. riscv-linux:arch/riscv/include/uapi/asm/ptrace.h */
14
22
15
/* hstatus CSR bits */
23
struct target_ucontext {
16
-#define HSTATUS_SPRV 0x00000001
24
- unsigned long uc_flags;
17
+#define HSTATUS_VSBE 0x00000020
25
- struct target_ucontext *uc_link;
18
+#define HSTATUS_GVA 0x00000040
26
+ abi_ulong uc_flags;
19
#define HSTATUS_SPV 0x00000080
27
+ abi_ptr uc_link;
20
-#define HSTATUS_SP2P 0x00000100
28
target_stack_t uc_stack;
21
-#define HSTATUS_SP2V 0x00000200
29
target_sigset_t uc_sigmask;
22
+#define HSTATUS_SPVP 0x00000100
30
uint8_t __unused[1024 / 8 - sizeof(target_sigset_t)];
23
+#define HSTATUS_HU 0x00000200
24
+#define HSTATUS_VGEIN 0x0003F000
25
#define HSTATUS_VTVM 0x00100000
26
#define HSTATUS_VTSR 0x00400000
27
-#define HSTATUS_HU 0x00000200
28
-#define HSTATUS_GVA 0x00000040
29
-#define HSTATUS_SPVP 0x00000100
30
+#if defined(TARGET_RISCV64)
31
+#define HSTATUS_VSXL 0x300000000
32
+#endif
33
34
#define HSTATUS32_WPRI 0xFF8FF87E
35
#define HSTATUS64_WPRI 0xFFFFFFFFFF8FF87EULL
36
--
31
--
37
2.28.0
32
2.41.0
38
33
39
34
diff view generated by jsdifflib
1
From: Yong-Xuan Wang <yongxuan.wang@sifive.com>
2
3
In this patch, we create the APLIC and IMSIC FDT helper functions and
4
remove M mode AIA devices when using KVM acceleration.
5
6
Signed-off-by: Yong-Xuan Wang <yongxuan.wang@sifive.com>
7
Reviewed-by: Jim Shu <jim.shu@sifive.com>
8
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
9
Reviewed-by: Andrew Jones <ajones@ventanamicro.com>
10
Message-ID: <20230727102439.22554-2-yongxuan.wang@sifive.com>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
11
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: 644b6c114b1a81adbee0ab8c9c66a8672059ec96.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <644b6c114b1a81adbee0ab8c9c66a8672059ec96.1597259519.git.alistair.francis@wdc.com>
4
---
12
---
5
target/riscv/cpu_bits.h | 3 +++
13
hw/riscv/virt.c | 290 +++++++++++++++++++++++-------------------------
6
target/riscv/csr.c | 40 ++++++++++++++++++++++++++++++++++++++++
14
1 file changed, 137 insertions(+), 153 deletions(-)
7
2 files changed, 43 insertions(+)
8
15
9
diff --git a/target/riscv/cpu_bits.h b/target/riscv/cpu_bits.h
16
diff --git a/hw/riscv/virt.c b/hw/riscv/virt.c
10
index XXXXXXX..XXXXXXX 100644
17
index XXXXXXX..XXXXXXX 100644
11
--- a/target/riscv/cpu_bits.h
18
--- a/hw/riscv/virt.c
12
+++ b/target/riscv/cpu_bits.h
19
+++ b/hw/riscv/virt.c
13
@@ -XXX,XX +XXX,XX @@
20
@@ -XXX,XX +XXX,XX @@ static uint32_t imsic_num_bits(uint32_t count)
14
#define CSR_HIDELEG 0x603
15
#define CSR_HIE 0x604
16
#define CSR_HCOUNTEREN 0x606
17
+#define CSR_HGEIE 0x607
18
#define CSR_HTVAL 0x643
19
+#define CSR_HVIP 0x645
20
#define CSR_HIP 0x644
21
#define CSR_HTINST 0x64A
22
+#define CSR_HGEIP 0xE12
23
#define CSR_HGATP 0x680
24
#define CSR_HTIMEDELTA 0x605
25
#define CSR_HTIMEDELTAH 0x615
26
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
27
index XXXXXXX..XXXXXXX 100644
28
--- a/target/riscv/csr.c
29
+++ b/target/riscv/csr.c
30
@@ -XXX,XX +XXX,XX @@ static int write_hideleg(CPURISCVState *env, int csrno, target_ulong val)
31
return 0;
32
}
33
34
+static int rmw_hvip(CPURISCVState *env, int csrno, target_ulong *ret_value,
35
+ target_ulong new_value, target_ulong write_mask)
36
+{
37
+ int ret = rmw_mip(env, 0, ret_value, new_value,
38
+ write_mask & hip_writable_mask);
39
+
40
+ *ret_value &= hip_writable_mask;
41
+
42
+ return ret;
43
+}
44
+
45
static int rmw_hip(CPURISCVState *env, int csrno, target_ulong *ret_value,
46
target_ulong new_value, target_ulong write_mask)
47
{
48
int ret = rmw_mip(env, 0, ret_value, new_value,
49
write_mask & hip_writable_mask);
50
51
+ *ret_value &= hip_writable_mask;
52
+
53
return ret;
21
return ret;
54
}
22
}
55
23
56
@@ -XXX,XX +XXX,XX @@ static int write_hcounteren(CPURISCVState *env, int csrno, target_ulong val)
24
-static void create_fdt_imsic(RISCVVirtState *s, const MemMapEntry *memmap,
57
return 0;
25
- uint32_t *phandle, uint32_t *intc_phandles,
26
- uint32_t *msi_m_phandle, uint32_t *msi_s_phandle)
27
+static void create_fdt_one_imsic(RISCVVirtState *s, hwaddr base_addr,
28
+ uint32_t *intc_phandles, uint32_t msi_phandle,
29
+ bool m_mode, uint32_t imsic_guest_bits)
30
{
31
int cpu, socket;
32
char *imsic_name;
33
MachineState *ms = MACHINE(s);
34
int socket_count = riscv_socket_count(ms);
35
- uint32_t imsic_max_hart_per_socket, imsic_guest_bits;
36
+ uint32_t imsic_max_hart_per_socket;
37
uint32_t *imsic_cells, *imsic_regs, imsic_addr, imsic_size;
38
39
- *msi_m_phandle = (*phandle)++;
40
- *msi_s_phandle = (*phandle)++;
41
imsic_cells = g_new0(uint32_t, ms->smp.cpus * 2);
42
imsic_regs = g_new0(uint32_t, socket_count * 4);
43
44
- /* M-level IMSIC node */
45
for (cpu = 0; cpu < ms->smp.cpus; cpu++) {
46
imsic_cells[cpu * 2 + 0] = cpu_to_be32(intc_phandles[cpu]);
47
- imsic_cells[cpu * 2 + 1] = cpu_to_be32(IRQ_M_EXT);
48
+ imsic_cells[cpu * 2 + 1] = cpu_to_be32(m_mode ? IRQ_M_EXT : IRQ_S_EXT);
49
}
50
- imsic_max_hart_per_socket = 0;
51
- for (socket = 0; socket < socket_count; socket++) {
52
- imsic_addr = memmap[VIRT_IMSIC_M].base +
53
- socket * VIRT_IMSIC_GROUP_MAX_SIZE;
54
- imsic_size = IMSIC_HART_SIZE(0) * s->soc[socket].num_harts;
55
- imsic_regs[socket * 4 + 0] = 0;
56
- imsic_regs[socket * 4 + 1] = cpu_to_be32(imsic_addr);
57
- imsic_regs[socket * 4 + 2] = 0;
58
- imsic_regs[socket * 4 + 3] = cpu_to_be32(imsic_size);
59
- if (imsic_max_hart_per_socket < s->soc[socket].num_harts) {
60
- imsic_max_hart_per_socket = s->soc[socket].num_harts;
61
- }
62
- }
63
- imsic_name = g_strdup_printf("/soc/imsics@%lx",
64
- (unsigned long)memmap[VIRT_IMSIC_M].base);
65
- qemu_fdt_add_subnode(ms->fdt, imsic_name);
66
- qemu_fdt_setprop_string(ms->fdt, imsic_name, "compatible",
67
- "riscv,imsics");
68
- qemu_fdt_setprop_cell(ms->fdt, imsic_name, "#interrupt-cells",
69
- FDT_IMSIC_INT_CELLS);
70
- qemu_fdt_setprop(ms->fdt, imsic_name, "interrupt-controller",
71
- NULL, 0);
72
- qemu_fdt_setprop(ms->fdt, imsic_name, "msi-controller",
73
- NULL, 0);
74
- qemu_fdt_setprop(ms->fdt, imsic_name, "interrupts-extended",
75
- imsic_cells, ms->smp.cpus * sizeof(uint32_t) * 2);
76
- qemu_fdt_setprop(ms->fdt, imsic_name, "reg", imsic_regs,
77
- socket_count * sizeof(uint32_t) * 4);
78
- qemu_fdt_setprop_cell(ms->fdt, imsic_name, "riscv,num-ids",
79
- VIRT_IRQCHIP_NUM_MSIS);
80
- if (socket_count > 1) {
81
- qemu_fdt_setprop_cell(ms->fdt, imsic_name, "riscv,hart-index-bits",
82
- imsic_num_bits(imsic_max_hart_per_socket));
83
- qemu_fdt_setprop_cell(ms->fdt, imsic_name, "riscv,group-index-bits",
84
- imsic_num_bits(socket_count));
85
- qemu_fdt_setprop_cell(ms->fdt, imsic_name, "riscv,group-index-shift",
86
- IMSIC_MMIO_GROUP_MIN_SHIFT);
87
- }
88
- qemu_fdt_setprop_cell(ms->fdt, imsic_name, "phandle", *msi_m_phandle);
89
-
90
- g_free(imsic_name);
91
92
- /* S-level IMSIC node */
93
- for (cpu = 0; cpu < ms->smp.cpus; cpu++) {
94
- imsic_cells[cpu * 2 + 0] = cpu_to_be32(intc_phandles[cpu]);
95
- imsic_cells[cpu * 2 + 1] = cpu_to_be32(IRQ_S_EXT);
96
- }
97
- imsic_guest_bits = imsic_num_bits(s->aia_guests + 1);
98
imsic_max_hart_per_socket = 0;
99
for (socket = 0; socket < socket_count; socket++) {
100
- imsic_addr = memmap[VIRT_IMSIC_S].base +
101
- socket * VIRT_IMSIC_GROUP_MAX_SIZE;
102
+ imsic_addr = base_addr + socket * VIRT_IMSIC_GROUP_MAX_SIZE;
103
imsic_size = IMSIC_HART_SIZE(imsic_guest_bits) *
104
s->soc[socket].num_harts;
105
imsic_regs[socket * 4 + 0] = 0;
106
@@ -XXX,XX +XXX,XX @@ static void create_fdt_imsic(RISCVVirtState *s, const MemMapEntry *memmap,
107
imsic_max_hart_per_socket = s->soc[socket].num_harts;
108
}
109
}
110
- imsic_name = g_strdup_printf("/soc/imsics@%lx",
111
- (unsigned long)memmap[VIRT_IMSIC_S].base);
112
+
113
+ imsic_name = g_strdup_printf("/soc/imsics@%lx", (unsigned long)base_addr);
114
qemu_fdt_add_subnode(ms->fdt, imsic_name);
115
- qemu_fdt_setprop_string(ms->fdt, imsic_name, "compatible",
116
- "riscv,imsics");
117
+ qemu_fdt_setprop_string(ms->fdt, imsic_name, "compatible", "riscv,imsics");
118
qemu_fdt_setprop_cell(ms->fdt, imsic_name, "#interrupt-cells",
119
- FDT_IMSIC_INT_CELLS);
120
- qemu_fdt_setprop(ms->fdt, imsic_name, "interrupt-controller",
121
- NULL, 0);
122
- qemu_fdt_setprop(ms->fdt, imsic_name, "msi-controller",
123
- NULL, 0);
124
+ FDT_IMSIC_INT_CELLS);
125
+ qemu_fdt_setprop(ms->fdt, imsic_name, "interrupt-controller", NULL, 0);
126
+ qemu_fdt_setprop(ms->fdt, imsic_name, "msi-controller", NULL, 0);
127
qemu_fdt_setprop(ms->fdt, imsic_name, "interrupts-extended",
128
- imsic_cells, ms->smp.cpus * sizeof(uint32_t) * 2);
129
+ imsic_cells, ms->smp.cpus * sizeof(uint32_t) * 2);
130
qemu_fdt_setprop(ms->fdt, imsic_name, "reg", imsic_regs,
131
- socket_count * sizeof(uint32_t) * 4);
132
+ socket_count * sizeof(uint32_t) * 4);
133
qemu_fdt_setprop_cell(ms->fdt, imsic_name, "riscv,num-ids",
134
- VIRT_IRQCHIP_NUM_MSIS);
135
+ VIRT_IRQCHIP_NUM_MSIS);
136
+
137
if (imsic_guest_bits) {
138
qemu_fdt_setprop_cell(ms->fdt, imsic_name, "riscv,guest-index-bits",
139
- imsic_guest_bits);
140
+ imsic_guest_bits);
141
}
142
+
143
if (socket_count > 1) {
144
qemu_fdt_setprop_cell(ms->fdt, imsic_name, "riscv,hart-index-bits",
145
- imsic_num_bits(imsic_max_hart_per_socket));
146
+ imsic_num_bits(imsic_max_hart_per_socket));
147
qemu_fdt_setprop_cell(ms->fdt, imsic_name, "riscv,group-index-bits",
148
- imsic_num_bits(socket_count));
149
+ imsic_num_bits(socket_count));
150
qemu_fdt_setprop_cell(ms->fdt, imsic_name, "riscv,group-index-shift",
151
- IMSIC_MMIO_GROUP_MIN_SHIFT);
152
+ IMSIC_MMIO_GROUP_MIN_SHIFT);
153
}
154
- qemu_fdt_setprop_cell(ms->fdt, imsic_name, "phandle", *msi_s_phandle);
155
- g_free(imsic_name);
156
+ qemu_fdt_setprop_cell(ms->fdt, imsic_name, "phandle", msi_phandle);
157
158
+ g_free(imsic_name);
159
g_free(imsic_regs);
160
g_free(imsic_cells);
58
}
161
}
59
162
60
+static int read_hgeie(CPURISCVState *env, int csrno, target_ulong *val)
163
-static void create_fdt_socket_aplic(RISCVVirtState *s,
164
- const MemMapEntry *memmap, int socket,
165
- uint32_t msi_m_phandle,
166
- uint32_t msi_s_phandle,
167
- uint32_t *phandle,
168
- uint32_t *intc_phandles,
169
- uint32_t *aplic_phandles)
170
+static void create_fdt_imsic(RISCVVirtState *s, const MemMapEntry *memmap,
171
+ uint32_t *phandle, uint32_t *intc_phandles,
172
+ uint32_t *msi_m_phandle, uint32_t *msi_s_phandle)
61
+{
173
+{
62
+ qemu_log_mask(LOG_UNIMP, "No support for a non-zero GEILEN.");
174
+ *msi_m_phandle = (*phandle)++;
63
+ return 0;
175
+ *msi_s_phandle = (*phandle)++;
176
+
177
+ if (!kvm_enabled()) {
178
+ /* M-level IMSIC node */
179
+ create_fdt_one_imsic(s, memmap[VIRT_IMSIC_M].base, intc_phandles,
180
+ *msi_m_phandle, true, 0);
181
+ }
182
+
183
+ /* S-level IMSIC node */
184
+ create_fdt_one_imsic(s, memmap[VIRT_IMSIC_S].base, intc_phandles,
185
+ *msi_s_phandle, false,
186
+ imsic_num_bits(s->aia_guests + 1));
187
+
64
+}
188
+}
65
+
189
+
66
+static int write_hgeie(CPURISCVState *env, int csrno, target_ulong val)
190
+static void create_fdt_one_aplic(RISCVVirtState *s, int socket,
191
+ unsigned long aplic_addr, uint32_t aplic_size,
192
+ uint32_t msi_phandle,
193
+ uint32_t *intc_phandles,
194
+ uint32_t aplic_phandle,
195
+ uint32_t aplic_child_phandle,
196
+ bool m_mode)
197
{
198
int cpu;
199
char *aplic_name;
200
uint32_t *aplic_cells;
201
- unsigned long aplic_addr;
202
MachineState *ms = MACHINE(s);
203
- uint32_t aplic_m_phandle, aplic_s_phandle;
204
205
- aplic_m_phandle = (*phandle)++;
206
- aplic_s_phandle = (*phandle)++;
207
aplic_cells = g_new0(uint32_t, s->soc[socket].num_harts * 2);
208
209
- /* M-level APLIC node */
210
for (cpu = 0; cpu < s->soc[socket].num_harts; cpu++) {
211
aplic_cells[cpu * 2 + 0] = cpu_to_be32(intc_phandles[cpu]);
212
- aplic_cells[cpu * 2 + 1] = cpu_to_be32(IRQ_M_EXT);
213
+ aplic_cells[cpu * 2 + 1] = cpu_to_be32(m_mode ? IRQ_M_EXT : IRQ_S_EXT);
214
}
215
- aplic_addr = memmap[VIRT_APLIC_M].base +
216
- (memmap[VIRT_APLIC_M].size * socket);
217
+
218
aplic_name = g_strdup_printf("/soc/aplic@%lx", aplic_addr);
219
qemu_fdt_add_subnode(ms->fdt, aplic_name);
220
qemu_fdt_setprop_string(ms->fdt, aplic_name, "compatible", "riscv,aplic");
221
qemu_fdt_setprop_cell(ms->fdt, aplic_name,
222
- "#interrupt-cells", FDT_APLIC_INT_CELLS);
223
+ "#interrupt-cells", FDT_APLIC_INT_CELLS);
224
qemu_fdt_setprop(ms->fdt, aplic_name, "interrupt-controller", NULL, 0);
225
+
226
if (s->aia_type == VIRT_AIA_TYPE_APLIC) {
227
qemu_fdt_setprop(ms->fdt, aplic_name, "interrupts-extended",
228
- aplic_cells, s->soc[socket].num_harts * sizeof(uint32_t) * 2);
229
+ aplic_cells,
230
+ s->soc[socket].num_harts * sizeof(uint32_t) * 2);
231
} else {
232
- qemu_fdt_setprop_cell(ms->fdt, aplic_name, "msi-parent",
233
- msi_m_phandle);
234
+ qemu_fdt_setprop_cell(ms->fdt, aplic_name, "msi-parent", msi_phandle);
235
}
236
+
237
qemu_fdt_setprop_cells(ms->fdt, aplic_name, "reg",
238
- 0x0, aplic_addr, 0x0, memmap[VIRT_APLIC_M].size);
239
+ 0x0, aplic_addr, 0x0, aplic_size);
240
qemu_fdt_setprop_cell(ms->fdt, aplic_name, "riscv,num-sources",
241
- VIRT_IRQCHIP_NUM_SOURCES);
242
- qemu_fdt_setprop_cell(ms->fdt, aplic_name, "riscv,children",
243
- aplic_s_phandle);
244
- qemu_fdt_setprop_cells(ms->fdt, aplic_name, "riscv,delegate",
245
- aplic_s_phandle, 0x1, VIRT_IRQCHIP_NUM_SOURCES);
246
+ VIRT_IRQCHIP_NUM_SOURCES);
247
+
248
+ if (aplic_child_phandle) {
249
+ qemu_fdt_setprop_cell(ms->fdt, aplic_name, "riscv,children",
250
+ aplic_child_phandle);
251
+ qemu_fdt_setprop_cells(ms->fdt, aplic_name, "riscv,delegate",
252
+ aplic_child_phandle, 0x1,
253
+ VIRT_IRQCHIP_NUM_SOURCES);
254
+ }
255
+
256
riscv_socket_fdt_write_id(ms, aplic_name, socket);
257
- qemu_fdt_setprop_cell(ms->fdt, aplic_name, "phandle", aplic_m_phandle);
258
+ qemu_fdt_setprop_cell(ms->fdt, aplic_name, "phandle", aplic_phandle);
259
+
260
g_free(aplic_name);
261
+ g_free(aplic_cells);
262
+}
263
264
- /* S-level APLIC node */
265
- for (cpu = 0; cpu < s->soc[socket].num_harts; cpu++) {
266
- aplic_cells[cpu * 2 + 0] = cpu_to_be32(intc_phandles[cpu]);
267
- aplic_cells[cpu * 2 + 1] = cpu_to_be32(IRQ_S_EXT);
268
+static void create_fdt_socket_aplic(RISCVVirtState *s,
269
+ const MemMapEntry *memmap, int socket,
270
+ uint32_t msi_m_phandle,
271
+ uint32_t msi_s_phandle,
272
+ uint32_t *phandle,
273
+ uint32_t *intc_phandles,
274
+ uint32_t *aplic_phandles)
67
+{
275
+{
68
+ qemu_log_mask(LOG_UNIMP, "No support for a non-zero GEILEN.");
276
+ char *aplic_name;
69
+ return 0;
277
+ unsigned long aplic_addr;
70
+}
278
+ MachineState *ms = MACHINE(s);
71
+
279
+ uint32_t aplic_m_phandle, aplic_s_phandle;
72
static int read_htval(CPURISCVState *env, int csrno, target_ulong *val)
280
+
73
{
281
+ aplic_m_phandle = (*phandle)++;
74
*val = env->htval;
282
+ aplic_s_phandle = (*phandle)++;
75
@@ -XXX,XX +XXX,XX @@ static int write_htinst(CPURISCVState *env, int csrno, target_ulong val)
283
+
76
return 0;
284
+ if (!kvm_enabled()) {
285
+ /* M-level APLIC node */
286
+ aplic_addr = memmap[VIRT_APLIC_M].base +
287
+ (memmap[VIRT_APLIC_M].size * socket);
288
+ create_fdt_one_aplic(s, socket, aplic_addr, memmap[VIRT_APLIC_M].size,
289
+ msi_m_phandle, intc_phandles,
290
+ aplic_m_phandle, aplic_s_phandle,
291
+ true);
292
}
293
+
294
+ /* S-level APLIC node */
295
aplic_addr = memmap[VIRT_APLIC_S].base +
296
(memmap[VIRT_APLIC_S].size * socket);
297
+ create_fdt_one_aplic(s, socket, aplic_addr, memmap[VIRT_APLIC_S].size,
298
+ msi_s_phandle, intc_phandles,
299
+ aplic_s_phandle, 0,
300
+ false);
301
+
302
aplic_name = g_strdup_printf("/soc/aplic@%lx", aplic_addr);
303
- qemu_fdt_add_subnode(ms->fdt, aplic_name);
304
- qemu_fdt_setprop_string(ms->fdt, aplic_name, "compatible", "riscv,aplic");
305
- qemu_fdt_setprop_cell(ms->fdt, aplic_name,
306
- "#interrupt-cells", FDT_APLIC_INT_CELLS);
307
- qemu_fdt_setprop(ms->fdt, aplic_name, "interrupt-controller", NULL, 0);
308
- if (s->aia_type == VIRT_AIA_TYPE_APLIC) {
309
- qemu_fdt_setprop(ms->fdt, aplic_name, "interrupts-extended",
310
- aplic_cells, s->soc[socket].num_harts * sizeof(uint32_t) * 2);
311
- } else {
312
- qemu_fdt_setprop_cell(ms->fdt, aplic_name, "msi-parent",
313
- msi_s_phandle);
314
- }
315
- qemu_fdt_setprop_cells(ms->fdt, aplic_name, "reg",
316
- 0x0, aplic_addr, 0x0, memmap[VIRT_APLIC_S].size);
317
- qemu_fdt_setprop_cell(ms->fdt, aplic_name, "riscv,num-sources",
318
- VIRT_IRQCHIP_NUM_SOURCES);
319
- riscv_socket_fdt_write_id(ms, aplic_name, socket);
320
- qemu_fdt_setprop_cell(ms->fdt, aplic_name, "phandle", aplic_s_phandle);
321
322
if (!socket) {
323
platform_bus_add_all_fdt_nodes(ms->fdt, aplic_name,
324
@@ -XXX,XX +XXX,XX @@ static void create_fdt_socket_aplic(RISCVVirtState *s,
325
326
g_free(aplic_name);
327
328
- g_free(aplic_cells);
329
aplic_phandles[socket] = aplic_s_phandle;
77
}
330
}
78
331
79
+static int read_hgeip(CPURISCVState *env, int csrno, target_ulong *val)
332
@@ -XXX,XX +XXX,XX @@ static DeviceState *virt_create_aia(RISCVVirtAIAType aia_type, int aia_guests,
80
+{
333
int i;
81
+ qemu_log_mask(LOG_UNIMP, "No support for a non-zero GEILEN.");
334
hwaddr addr;
82
+ return 0;
335
uint32_t guest_bits;
83
+}
336
- DeviceState *aplic_m;
84
+
337
- bool msimode = (aia_type == VIRT_AIA_TYPE_APLIC_IMSIC) ? true : false;
85
+static int write_hgeip(CPURISCVState *env, int csrno, target_ulong val)
338
+ DeviceState *aplic_s = NULL;
86
+{
339
+ DeviceState *aplic_m = NULL;
87
+ qemu_log_mask(LOG_UNIMP, "No support for a non-zero GEILEN.");
340
+ bool msimode = aia_type == VIRT_AIA_TYPE_APLIC_IMSIC;
88
+ return 0;
341
89
+}
342
if (msimode) {
90
+
343
- /* Per-socket M-level IMSICs */
91
static int read_hgatp(CPURISCVState *env, int csrno, target_ulong *val)
344
- addr = memmap[VIRT_IMSIC_M].base + socket * VIRT_IMSIC_GROUP_MAX_SIZE;
92
{
345
- for (i = 0; i < hart_count; i++) {
93
*val = env->hgatp;
346
- riscv_imsic_create(addr + i * IMSIC_HART_SIZE(0),
94
@@ -XXX,XX +XXX,XX @@ static riscv_csr_operations csr_ops[CSR_TABLE_SIZE] = {
347
- base_hartid + i, true, 1,
95
[CSR_HSTATUS] = { hmode, read_hstatus, write_hstatus },
348
- VIRT_IRQCHIP_NUM_MSIS);
96
[CSR_HEDELEG] = { hmode, read_hedeleg, write_hedeleg },
349
+ if (!kvm_enabled()) {
97
[CSR_HIDELEG] = { hmode, read_hideleg, write_hideleg },
350
+ /* Per-socket M-level IMSICs */
98
+ [CSR_HVIP] = { hmode, NULL, NULL, rmw_hvip },
351
+ addr = memmap[VIRT_IMSIC_M].base +
99
[CSR_HIP] = { hmode, NULL, NULL, rmw_hip },
352
+ socket * VIRT_IMSIC_GROUP_MAX_SIZE;
100
[CSR_HIE] = { hmode, read_hie, write_hie },
353
+ for (i = 0; i < hart_count; i++) {
101
[CSR_HCOUNTEREN] = { hmode, read_hcounteren, write_hcounteren },
354
+ riscv_imsic_create(addr + i * IMSIC_HART_SIZE(0),
102
+ [CSR_HGEIE] = { hmode, read_hgeie, write_hgeie },
355
+ base_hartid + i, true, 1,
103
[CSR_HTVAL] = { hmode, read_htval, write_htval },
356
+ VIRT_IRQCHIP_NUM_MSIS);
104
[CSR_HTINST] = { hmode, read_htinst, write_htinst },
357
+ }
105
+ [CSR_HGEIP] = { hmode, read_hgeip, write_hgeip },
358
}
106
[CSR_HGATP] = { hmode, read_hgatp, write_hgatp },
359
107
[CSR_HTIMEDELTA] = { hmode, read_htimedelta, write_htimedelta },
360
/* Per-socket S-level IMSICs */
108
#if defined(TARGET_RISCV32)
361
@@ -XXX,XX +XXX,XX @@ static DeviceState *virt_create_aia(RISCVVirtAIAType aia_type, int aia_guests,
362
}
363
}
364
365
- /* Per-socket M-level APLIC */
366
- aplic_m = riscv_aplic_create(
367
- memmap[VIRT_APLIC_M].base + socket * memmap[VIRT_APLIC_M].size,
368
- memmap[VIRT_APLIC_M].size,
369
- (msimode) ? 0 : base_hartid,
370
- (msimode) ? 0 : hart_count,
371
- VIRT_IRQCHIP_NUM_SOURCES,
372
- VIRT_IRQCHIP_NUM_PRIO_BITS,
373
- msimode, true, NULL);
374
-
375
- if (aplic_m) {
376
- /* Per-socket S-level APLIC */
377
- riscv_aplic_create(
378
- memmap[VIRT_APLIC_S].base + socket * memmap[VIRT_APLIC_S].size,
379
- memmap[VIRT_APLIC_S].size,
380
- (msimode) ? 0 : base_hartid,
381
- (msimode) ? 0 : hart_count,
382
- VIRT_IRQCHIP_NUM_SOURCES,
383
- VIRT_IRQCHIP_NUM_PRIO_BITS,
384
- msimode, false, aplic_m);
385
+ if (!kvm_enabled()) {
386
+ /* Per-socket M-level APLIC */
387
+ aplic_m = riscv_aplic_create(memmap[VIRT_APLIC_M].base +
388
+ socket * memmap[VIRT_APLIC_M].size,
389
+ memmap[VIRT_APLIC_M].size,
390
+ (msimode) ? 0 : base_hartid,
391
+ (msimode) ? 0 : hart_count,
392
+ VIRT_IRQCHIP_NUM_SOURCES,
393
+ VIRT_IRQCHIP_NUM_PRIO_BITS,
394
+ msimode, true, NULL);
395
}
396
397
- return aplic_m;
398
+ /* Per-socket S-level APLIC */
399
+ aplic_s = riscv_aplic_create(memmap[VIRT_APLIC_S].base +
400
+ socket * memmap[VIRT_APLIC_S].size,
401
+ memmap[VIRT_APLIC_S].size,
402
+ (msimode) ? 0 : base_hartid,
403
+ (msimode) ? 0 : hart_count,
404
+ VIRT_IRQCHIP_NUM_SOURCES,
405
+ VIRT_IRQCHIP_NUM_PRIO_BITS,
406
+ msimode, false, aplic_m);
407
+
408
+ return kvm_enabled() ? aplic_s : aplic_m;
409
}
410
411
static void create_platform_bus(RISCVVirtState *s, DeviceState *irqchip)
109
--
412
--
110
2.28.0
413
2.41.0
111
112
diff view generated by jsdifflib
1
From: Anup Patel <anup.patel@wdc.com>
1
From: Yong-Xuan Wang <yongxuan.wang@sifive.com>
2
2
3
We extend RISC-V spike machine to allow creating a multi-socket
3
We check the in-kernel irqchip support when using KVM acceleration.
4
machine. Each RISC-V spike machine socket is a NUMA node having
5
a set of HARTs, a memory instance, and a CLINT instance. Other
6
devices are shared between all sockets. We also update the
7
generated device tree accordingly.
8
4
9
By default, NUMA multi-socket support is disabled for RISC-V spike
5
Signed-off-by: Yong-Xuan Wang <yongxuan.wang@sifive.com>
10
machine. To enable it, users can use "-numa" command-line options
6
Reviewed-by: Jim Shu <jim.shu@sifive.com>
11
of QEMU.
7
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
12
8
Reviewed-by: Andrew Jones <ajones@ventanamicro.com>
13
Example1: For two NUMA nodes with 2 CPUs each, append following
9
Message-ID: <20230727102439.22554-3-yongxuan.wang@sifive.com>
14
to command-line options: "-smp 4 -numa node -numa node"
15
16
Example2: For two NUMA nodes with 1 and 3 CPUs, append following
17
to command-line options:
18
"-smp 4 -numa node -numa node -numa cpu,node-id=0,core-id=0 \
19
-numa cpu,node-id=1,core-id=1 -numa cpu,node-id=1,core-id=2 \
20
-numa cpu,node-id=1,core-id=3"
21
22
The maximum number of sockets in a RISC-V spike machine is 8
23
but this limit can be changed in future.
24
25
Signed-off-by: Anup Patel <anup.patel@wdc.com>
26
Reviewed-by: Atish Patra <atish.patra@wdc.com>
27
Message-Id: <20200616032229.766089-5-anup.patel@wdc.com>
28
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
10
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
29
---
11
---
30
include/hw/riscv/spike.h | 11 +-
12
target/riscv/kvm.c | 10 +++++++++-
31
hw/riscv/spike.c | 232 ++++++++++++++++++++++++++-------------
13
1 file changed, 9 insertions(+), 1 deletion(-)
32
2 files changed, 167 insertions(+), 76 deletions(-)
33
14
34
diff --git a/include/hw/riscv/spike.h b/include/hw/riscv/spike.h
15
diff --git a/target/riscv/kvm.c b/target/riscv/kvm.c
35
index XXXXXXX..XXXXXXX 100644
16
index XXXXXXX..XXXXXXX 100644
36
--- a/include/hw/riscv/spike.h
17
--- a/target/riscv/kvm.c
37
+++ b/include/hw/riscv/spike.h
18
+++ b/target/riscv/kvm.c
38
@@ -XXX,XX +XXX,XX @@
19
@@ -XXX,XX +XXX,XX @@ int kvm_arch_init(MachineState *ms, KVMState *s)
39
#include "hw/riscv/riscv_hart.h"
20
40
#include "hw/sysbus.h"
21
int kvm_arch_irqchip_create(KVMState *s)
41
42
+#define SPIKE_CPUS_MAX 8
43
+#define SPIKE_SOCKETS_MAX 8
44
+
45
+#define TYPE_SPIKE_MACHINE MACHINE_TYPE_NAME("spike")
46
+#define SPIKE_MACHINE(obj) \
47
+ OBJECT_CHECK(SpikeState, (obj), TYPE_SPIKE_MACHINE)
48
+
49
typedef struct {
50
/*< private >*/
51
- SysBusDevice parent_obj;
52
+ MachineState parent;
53
54
/*< public >*/
55
- RISCVHartArrayState soc;
56
+ RISCVHartArrayState soc[SPIKE_SOCKETS_MAX];
57
void *fdt;
58
int fdt_size;
59
} SpikeState;
60
diff --git a/hw/riscv/spike.c b/hw/riscv/spike.c
61
index XXXXXXX..XXXXXXX 100644
62
--- a/hw/riscv/spike.c
63
+++ b/hw/riscv/spike.c
64
@@ -XXX,XX +XXX,XX @@
65
#include "hw/riscv/sifive_clint.h"
66
#include "hw/riscv/spike.h"
67
#include "hw/riscv/boot.h"
68
+#include "hw/riscv/numa.h"
69
#include "chardev/char.h"
70
#include "sysemu/arch_init.h"
71
#include "sysemu/device_tree.h"
72
@@ -XXX,XX +XXX,XX @@ static void create_fdt(SpikeState *s, const struct MemmapEntry *memmap,
73
uint64_t mem_size, const char *cmdline)
74
{
22
{
75
void *fdt;
23
- return 0;
76
- int cpu;
24
+ if (kvm_kernel_irqchip_split()) {
77
- uint32_t *cells;
25
+ error_report("-machine kernel_irqchip=split is not supported on RISC-V.");
78
- char *nodename;
79
+ uint64_t addr, size;
80
+ unsigned long clint_addr;
81
+ int cpu, socket;
82
+ MachineState *mc = MACHINE(s);
83
+ uint32_t *clint_cells;
84
+ uint32_t cpu_phandle, intc_phandle, phandle = 1;
85
+ char *name, *mem_name, *clint_name, *clust_name;
86
+ char *core_name, *cpu_name, *intc_name;
87
88
fdt = s->fdt = create_device_tree(&s->fdt_size);
89
if (!fdt) {
90
@@ -XXX,XX +XXX,XX @@ static void create_fdt(SpikeState *s, const struct MemmapEntry *memmap,
91
qemu_fdt_setprop_cell(fdt, "/soc", "#size-cells", 0x2);
92
qemu_fdt_setprop_cell(fdt, "/soc", "#address-cells", 0x2);
93
94
- nodename = g_strdup_printf("/memory@%lx",
95
- (long)memmap[SPIKE_DRAM].base);
96
- qemu_fdt_add_subnode(fdt, nodename);
97
- qemu_fdt_setprop_cells(fdt, nodename, "reg",
98
- memmap[SPIKE_DRAM].base >> 32, memmap[SPIKE_DRAM].base,
99
- mem_size >> 32, mem_size);
100
- qemu_fdt_setprop_string(fdt, nodename, "device_type", "memory");
101
- g_free(nodename);
102
-
103
qemu_fdt_add_subnode(fdt, "/cpus");
104
qemu_fdt_setprop_cell(fdt, "/cpus", "timebase-frequency",
105
SIFIVE_CLINT_TIMEBASE_FREQ);
106
qemu_fdt_setprop_cell(fdt, "/cpus", "#size-cells", 0x0);
107
qemu_fdt_setprop_cell(fdt, "/cpus", "#address-cells", 0x1);
108
+ qemu_fdt_add_subnode(fdt, "/cpus/cpu-map");
109
+
110
+ for (socket = (riscv_socket_count(mc) - 1); socket >= 0; socket--) {
111
+ clust_name = g_strdup_printf("/cpus/cpu-map/cluster%d", socket);
112
+ qemu_fdt_add_subnode(fdt, clust_name);
113
+
114
+ clint_cells = g_new0(uint32_t, s->soc[socket].num_harts * 4);
115
116
- for (cpu = s->soc.num_harts - 1; cpu >= 0; cpu--) {
117
- nodename = g_strdup_printf("/cpus/cpu@%d", cpu);
118
- char *intc = g_strdup_printf("/cpus/cpu@%d/interrupt-controller", cpu);
119
- char *isa = riscv_isa_string(&s->soc.harts[cpu]);
120
- qemu_fdt_add_subnode(fdt, nodename);
121
+ for (cpu = s->soc[socket].num_harts - 1; cpu >= 0; cpu--) {
122
+ cpu_phandle = phandle++;
123
+
124
+ cpu_name = g_strdup_printf("/cpus/cpu@%d",
125
+ s->soc[socket].hartid_base + cpu);
126
+ qemu_fdt_add_subnode(fdt, cpu_name);
127
#if defined(TARGET_RISCV32)
128
- qemu_fdt_setprop_string(fdt, nodename, "mmu-type", "riscv,sv32");
129
+ qemu_fdt_setprop_string(fdt, cpu_name, "mmu-type", "riscv,sv32");
130
#else
131
- qemu_fdt_setprop_string(fdt, nodename, "mmu-type", "riscv,sv48");
132
+ qemu_fdt_setprop_string(fdt, cpu_name, "mmu-type", "riscv,sv48");
133
#endif
134
- qemu_fdt_setprop_string(fdt, nodename, "riscv,isa", isa);
135
- qemu_fdt_setprop_string(fdt, nodename, "compatible", "riscv");
136
- qemu_fdt_setprop_string(fdt, nodename, "status", "okay");
137
- qemu_fdt_setprop_cell(fdt, nodename, "reg", cpu);
138
- qemu_fdt_setprop_string(fdt, nodename, "device_type", "cpu");
139
- qemu_fdt_add_subnode(fdt, intc);
140
- qemu_fdt_setprop_cell(fdt, intc, "phandle", 1);
141
- qemu_fdt_setprop_string(fdt, intc, "compatible", "riscv,cpu-intc");
142
- qemu_fdt_setprop(fdt, intc, "interrupt-controller", NULL, 0);
143
- qemu_fdt_setprop_cell(fdt, intc, "#interrupt-cells", 1);
144
- g_free(isa);
145
- g_free(intc);
146
- g_free(nodename);
147
- }
148
+ name = riscv_isa_string(&s->soc[socket].harts[cpu]);
149
+ qemu_fdt_setprop_string(fdt, cpu_name, "riscv,isa", name);
150
+ g_free(name);
151
+ qemu_fdt_setprop_string(fdt, cpu_name, "compatible", "riscv");
152
+ qemu_fdt_setprop_string(fdt, cpu_name, "status", "okay");
153
+ qemu_fdt_setprop_cell(fdt, cpu_name, "reg",
154
+ s->soc[socket].hartid_base + cpu);
155
+ qemu_fdt_setprop_string(fdt, cpu_name, "device_type", "cpu");
156
+ riscv_socket_fdt_write_id(mc, fdt, cpu_name, socket);
157
+ qemu_fdt_setprop_cell(fdt, cpu_name, "phandle", cpu_phandle);
158
159
- cells = g_new0(uint32_t, s->soc.num_harts * 4);
160
- for (cpu = 0; cpu < s->soc.num_harts; cpu++) {
161
- nodename =
162
- g_strdup_printf("/cpus/cpu@%d/interrupt-controller", cpu);
163
- uint32_t intc_phandle = qemu_fdt_get_phandle(fdt, nodename);
164
- cells[cpu * 4 + 0] = cpu_to_be32(intc_phandle);
165
- cells[cpu * 4 + 1] = cpu_to_be32(IRQ_M_SOFT);
166
- cells[cpu * 4 + 2] = cpu_to_be32(intc_phandle);
167
- cells[cpu * 4 + 3] = cpu_to_be32(IRQ_M_TIMER);
168
- g_free(nodename);
169
+ intc_name = g_strdup_printf("%s/interrupt-controller", cpu_name);
170
+ qemu_fdt_add_subnode(fdt, intc_name);
171
+ intc_phandle = phandle++;
172
+ qemu_fdt_setprop_cell(fdt, intc_name, "phandle", intc_phandle);
173
+ qemu_fdt_setprop_string(fdt, intc_name, "compatible",
174
+ "riscv,cpu-intc");
175
+ qemu_fdt_setprop(fdt, intc_name, "interrupt-controller", NULL, 0);
176
+ qemu_fdt_setprop_cell(fdt, intc_name, "#interrupt-cells", 1);
177
+
178
+ clint_cells[cpu * 4 + 0] = cpu_to_be32(intc_phandle);
179
+ clint_cells[cpu * 4 + 1] = cpu_to_be32(IRQ_M_SOFT);
180
+ clint_cells[cpu * 4 + 2] = cpu_to_be32(intc_phandle);
181
+ clint_cells[cpu * 4 + 3] = cpu_to_be32(IRQ_M_TIMER);
182
+
183
+ core_name = g_strdup_printf("%s/core%d", clust_name, cpu);
184
+ qemu_fdt_add_subnode(fdt, core_name);
185
+ qemu_fdt_setprop_cell(fdt, core_name, "cpu", cpu_phandle);
186
+
187
+ g_free(core_name);
188
+ g_free(intc_name);
189
+ g_free(cpu_name);
190
+ }
191
+
192
+ addr = memmap[SPIKE_DRAM].base + riscv_socket_mem_offset(mc, socket);
193
+ size = riscv_socket_mem_size(mc, socket);
194
+ mem_name = g_strdup_printf("/memory@%lx", (long)addr);
195
+ qemu_fdt_add_subnode(fdt, mem_name);
196
+ qemu_fdt_setprop_cells(fdt, mem_name, "reg",
197
+ addr >> 32, addr, size >> 32, size);
198
+ qemu_fdt_setprop_string(fdt, mem_name, "device_type", "memory");
199
+ riscv_socket_fdt_write_id(mc, fdt, mem_name, socket);
200
+ g_free(mem_name);
201
+
202
+ clint_addr = memmap[SPIKE_CLINT].base +
203
+ (memmap[SPIKE_CLINT].size * socket);
204
+ clint_name = g_strdup_printf("/soc/clint@%lx", clint_addr);
205
+ qemu_fdt_add_subnode(fdt, clint_name);
206
+ qemu_fdt_setprop_string(fdt, clint_name, "compatible", "riscv,clint0");
207
+ qemu_fdt_setprop_cells(fdt, clint_name, "reg",
208
+ 0x0, clint_addr, 0x0, memmap[SPIKE_CLINT].size);
209
+ qemu_fdt_setprop(fdt, clint_name, "interrupts-extended",
210
+ clint_cells, s->soc[socket].num_harts * sizeof(uint32_t) * 4);
211
+ riscv_socket_fdt_write_id(mc, fdt, clint_name, socket);
212
+
213
+ g_free(clint_name);
214
+ g_free(clint_cells);
215
+ g_free(clust_name);
216
}
217
- nodename = g_strdup_printf("/soc/clint@%lx",
218
- (long)memmap[SPIKE_CLINT].base);
219
- qemu_fdt_add_subnode(fdt, nodename);
220
- qemu_fdt_setprop_string(fdt, nodename, "compatible", "riscv,clint0");
221
- qemu_fdt_setprop_cells(fdt, nodename, "reg",
222
- 0x0, memmap[SPIKE_CLINT].base,
223
- 0x0, memmap[SPIKE_CLINT].size);
224
- qemu_fdt_setprop(fdt, nodename, "interrupts-extended",
225
- cells, s->soc.num_harts * sizeof(uint32_t) * 4);
226
- g_free(cells);
227
- g_free(nodename);
228
+
229
+ riscv_socket_fdt_write_distance_matrix(mc, fdt);
230
231
if (cmdline) {
232
qemu_fdt_add_subnode(fdt, "/chosen");
233
@@ -XXX,XX +XXX,XX @@ static void create_fdt(SpikeState *s, const struct MemmapEntry *memmap,
234
static void spike_board_init(MachineState *machine)
235
{
236
const struct MemmapEntry *memmap = spike_memmap;
237
-
238
- SpikeState *s = g_new0(SpikeState, 1);
239
+ SpikeState *s = SPIKE_MACHINE(machine);
240
MemoryRegion *system_memory = get_system_memory();
241
MemoryRegion *main_mem = g_new(MemoryRegion, 1);
242
MemoryRegion *mask_rom = g_new(MemoryRegion, 1);
243
- unsigned int smp_cpus = machine->smp.cpus;
244
uint32_t fdt_load_addr;
245
uint64_t kernel_entry;
246
+ char *soc_name;
247
+ int i, base_hartid, hart_count;
248
249
- /* Initialize SOC */
250
- object_initialize_child(OBJECT(machine), "soc", &s->soc,
251
- TYPE_RISCV_HART_ARRAY);
252
- object_property_set_str(OBJECT(&s->soc), "cpu-type", machine->cpu_type,
253
- &error_abort);
254
- object_property_set_int(OBJECT(&s->soc), "num-harts", smp_cpus,
255
- &error_abort);
256
- sysbus_realize(SYS_BUS_DEVICE(&s->soc), &error_abort);
257
+ /* Check socket count limit */
258
+ if (SPIKE_SOCKETS_MAX < riscv_socket_count(machine)) {
259
+ error_report("number of sockets/nodes should be less than %d",
260
+ SPIKE_SOCKETS_MAX);
261
+ exit(1);
26
+ exit(1);
262
+ }
27
+ }
263
+
28
+
264
+ /* Initialize sockets */
29
+ /*
265
+ for (i = 0; i < riscv_socket_count(machine); i++) {
30
+ * We can create the VAIA using the newer device control API.
266
+ if (!riscv_socket_check_hartids(machine, i)) {
31
+ */
267
+ error_report("discontinuous hartids in socket%d", i);
32
+ return kvm_check_extension(s, KVM_CAP_DEVICE_CTRL);
268
+ exit(1);
269
+ }
270
+
271
+ base_hartid = riscv_socket_first_hartid(machine, i);
272
+ if (base_hartid < 0) {
273
+ error_report("can't find hartid base for socket%d", i);
274
+ exit(1);
275
+ }
276
+
277
+ hart_count = riscv_socket_hart_count(machine, i);
278
+ if (hart_count < 0) {
279
+ error_report("can't find hart count for socket%d", i);
280
+ exit(1);
281
+ }
282
+
283
+ soc_name = g_strdup_printf("soc%d", i);
284
+ object_initialize_child(OBJECT(machine), soc_name, &s->soc[i],
285
+ TYPE_RISCV_HART_ARRAY);
286
+ g_free(soc_name);
287
+ object_property_set_str(OBJECT(&s->soc[i]), "cpu-type",
288
+ machine->cpu_type, &error_abort);
289
+ object_property_set_int(OBJECT(&s->soc[i]), "hartid-base",
290
+ base_hartid, &error_abort);
291
+ object_property_set_int(OBJECT(&s->soc[i]), "num-harts",
292
+ hart_count, &error_abort);
293
+ sysbus_realize(SYS_BUS_DEVICE(&s->soc[i]), &error_abort);
294
+
295
+ /* Core Local Interruptor (timer and IPI) for each socket */
296
+ sifive_clint_create(
297
+ memmap[SPIKE_CLINT].base + i * memmap[SPIKE_CLINT].size,
298
+ memmap[SPIKE_CLINT].size, base_hartid, hart_count,
299
+ SIFIVE_SIP_BASE, SIFIVE_TIMECMP_BASE, SIFIVE_TIME_BASE, false);
300
+ }
301
302
/* register system main memory (actual RAM) */
303
memory_region_init_ram(main_mem, NULL, "riscv.spike.ram",
304
@@ -XXX,XX +XXX,XX @@ static void spike_board_init(MachineState *machine)
305
fdt_load_addr, s->fdt);
306
307
/* initialize HTIF using symbols found in load_kernel */
308
- htif_mm_init(system_memory, mask_rom, &s->soc.harts[0].env, serial_hd(0));
309
+ htif_mm_init(system_memory, mask_rom,
310
+ &s->soc[0].harts[0].env, serial_hd(0));
311
+}
312
313
- /* Core Local Interruptor (timer and IPI) */
314
- sifive_clint_create(memmap[SPIKE_CLINT].base, memmap[SPIKE_CLINT].size,
315
- 0, smp_cpus, SIFIVE_SIP_BASE, SIFIVE_TIMECMP_BASE, SIFIVE_TIME_BASE,
316
- false);
317
+static void spike_machine_instance_init(Object *obj)
318
+{
319
}
33
}
320
34
321
-static void spike_machine_init(MachineClass *mc)
35
int kvm_arch_process_async_events(CPUState *cs)
322
+static void spike_machine_class_init(ObjectClass *oc, void *data)
323
{
324
- mc->desc = "RISC-V Spike Board";
325
+ MachineClass *mc = MACHINE_CLASS(oc);
326
+
327
+ mc->desc = "RISC-V Spike board";
328
mc->init = spike_board_init;
329
- mc->max_cpus = 8;
330
+ mc->max_cpus = SPIKE_CPUS_MAX;
331
mc->is_default = true;
332
mc->default_cpu_type = SPIKE_V1_10_0_CPU;
333
+ mc->possible_cpu_arch_ids = riscv_numa_possible_cpu_arch_ids;
334
+ mc->cpu_index_to_instance_props = riscv_numa_cpu_index_to_props;
335
+ mc->get_default_cpu_node_id = riscv_numa_get_default_cpu_node_id;
336
+ mc->numa_mem_supported = true;
337
+}
338
+
339
+static const TypeInfo spike_machine_typeinfo = {
340
+ .name = MACHINE_TYPE_NAME("spike"),
341
+ .parent = TYPE_MACHINE,
342
+ .class_init = spike_machine_class_init,
343
+ .instance_init = spike_machine_instance_init,
344
+ .instance_size = sizeof(SpikeState),
345
+};
346
+
347
+static void spike_machine_init_register_types(void)
348
+{
349
+ type_register_static(&spike_machine_typeinfo);
350
}
351
352
-DEFINE_MACHINE("spike", spike_machine_init)
353
+type_init(spike_machine_init_register_types)
354
--
36
--
355
2.28.0
37
2.41.0
356
357
diff view generated by jsdifflib
New patch
1
From: Yong-Xuan Wang <yongxuan.wang@sifive.com>
1
2
3
We create a vAIA chip by using the KVM_DEV_TYPE_RISCV_AIA and then set up
4
the chip with the KVM_DEV_RISCV_AIA_GRP_* APIs.
5
We also extend KVM accelerator to specify the KVM AIA mode. The "riscv-aia"
6
parameter is passed along with --accel in QEMU command-line.
7
1) "riscv-aia=emul": IMSIC is emulated by hypervisor
8
2) "riscv-aia=hwaccel": use hardware guest IMSIC
9
3) "riscv-aia=auto": use the hardware guest IMSICs whenever available
10
otherwise we fallback to software emulation.
11
12
Signed-off-by: Yong-Xuan Wang <yongxuan.wang@sifive.com>
13
Reviewed-by: Jim Shu <jim.shu@sifive.com>
14
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
15
Reviewed-by: Andrew Jones <ajones@ventanamicro.com>
16
Message-ID: <20230727102439.22554-4-yongxuan.wang@sifive.com>
17
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
18
---
19
target/riscv/kvm_riscv.h | 4 +
20
target/riscv/kvm.c | 186 +++++++++++++++++++++++++++++++++++++++
21
2 files changed, 190 insertions(+)
22
23
diff --git a/target/riscv/kvm_riscv.h b/target/riscv/kvm_riscv.h
24
index XXXXXXX..XXXXXXX 100644
25
--- a/target/riscv/kvm_riscv.h
26
+++ b/target/riscv/kvm_riscv.h
27
@@ -XXX,XX +XXX,XX @@
28
void kvm_riscv_init_user_properties(Object *cpu_obj);
29
void kvm_riscv_reset_vcpu(RISCVCPU *cpu);
30
void kvm_riscv_set_irq(RISCVCPU *cpu, int irq, int level);
31
+void kvm_riscv_aia_create(MachineState *machine, uint64_t group_shift,
32
+ uint64_t aia_irq_num, uint64_t aia_msi_num,
33
+ uint64_t aplic_base, uint64_t imsic_base,
34
+ uint64_t guest_num);
35
36
#endif
37
diff --git a/target/riscv/kvm.c b/target/riscv/kvm.c
38
index XXXXXXX..XXXXXXX 100644
39
--- a/target/riscv/kvm.c
40
+++ b/target/riscv/kvm.c
41
@@ -XXX,XX +XXX,XX @@
42
#include "exec/address-spaces.h"
43
#include "hw/boards.h"
44
#include "hw/irq.h"
45
+#include "hw/intc/riscv_imsic.h"
46
#include "qemu/log.h"
47
#include "hw/loader.h"
48
#include "kvm_riscv.h"
49
@@ -XXX,XX +XXX,XX @@
50
#include "chardev/char-fe.h"
51
#include "migration/migration.h"
52
#include "sysemu/runstate.h"
53
+#include "hw/riscv/numa.h"
54
55
static uint64_t kvm_riscv_reg_id(CPURISCVState *env, uint64_t type,
56
uint64_t idx)
57
@@ -XXX,XX +XXX,XX @@ bool kvm_arch_cpu_check_are_resettable(void)
58
return true;
59
}
60
61
+static int aia_mode;
62
+
63
+static const char *kvm_aia_mode_str(uint64_t mode)
64
+{
65
+ switch (mode) {
66
+ case KVM_DEV_RISCV_AIA_MODE_EMUL:
67
+ return "emul";
68
+ case KVM_DEV_RISCV_AIA_MODE_HWACCEL:
69
+ return "hwaccel";
70
+ case KVM_DEV_RISCV_AIA_MODE_AUTO:
71
+ default:
72
+ return "auto";
73
+ };
74
+}
75
+
76
+static char *riscv_get_kvm_aia(Object *obj, Error **errp)
77
+{
78
+ return g_strdup(kvm_aia_mode_str(aia_mode));
79
+}
80
+
81
+static void riscv_set_kvm_aia(Object *obj, const char *val, Error **errp)
82
+{
83
+ if (!strcmp(val, "emul")) {
84
+ aia_mode = KVM_DEV_RISCV_AIA_MODE_EMUL;
85
+ } else if (!strcmp(val, "hwaccel")) {
86
+ aia_mode = KVM_DEV_RISCV_AIA_MODE_HWACCEL;
87
+ } else if (!strcmp(val, "auto")) {
88
+ aia_mode = KVM_DEV_RISCV_AIA_MODE_AUTO;
89
+ } else {
90
+ error_setg(errp, "Invalid KVM AIA mode");
91
+ error_append_hint(errp, "Valid values are emul, hwaccel, and auto.\n");
92
+ }
93
+}
94
+
95
void kvm_arch_accel_class_init(ObjectClass *oc)
96
{
97
+ object_class_property_add_str(oc, "riscv-aia", riscv_get_kvm_aia,
98
+ riscv_set_kvm_aia);
99
+ object_class_property_set_description(oc, "riscv-aia",
100
+ "Set KVM AIA mode. Valid values are "
101
+ "emul, hwaccel, and auto. Default "
102
+ "is auto.");
103
+ object_property_set_default_str(object_class_property_find(oc, "riscv-aia"),
104
+ "auto");
105
+}
106
+
107
+void kvm_riscv_aia_create(MachineState *machine, uint64_t group_shift,
108
+ uint64_t aia_irq_num, uint64_t aia_msi_num,
109
+ uint64_t aplic_base, uint64_t imsic_base,
110
+ uint64_t guest_num)
111
+{
112
+ int ret, i;
113
+ int aia_fd = -1;
114
+ uint64_t default_aia_mode;
115
+ uint64_t socket_count = riscv_socket_count(machine);
116
+ uint64_t max_hart_per_socket = 0;
117
+ uint64_t socket, base_hart, hart_count, socket_imsic_base, imsic_addr;
118
+ uint64_t socket_bits, hart_bits, guest_bits;
119
+
120
+ aia_fd = kvm_create_device(kvm_state, KVM_DEV_TYPE_RISCV_AIA, false);
121
+
122
+ if (aia_fd < 0) {
123
+ error_report("Unable to create in-kernel irqchip");
124
+ exit(1);
125
+ }
126
+
127
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
128
+ KVM_DEV_RISCV_AIA_CONFIG_MODE,
129
+ &default_aia_mode, false, NULL);
130
+ if (ret < 0) {
131
+ error_report("KVM AIA: failed to get current KVM AIA mode");
132
+ exit(1);
133
+ }
134
+ qemu_log("KVM AIA: default mode is %s\n",
135
+ kvm_aia_mode_str(default_aia_mode));
136
+
137
+ if (default_aia_mode != aia_mode) {
138
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
139
+ KVM_DEV_RISCV_AIA_CONFIG_MODE,
140
+ &aia_mode, true, NULL);
141
+ if (ret < 0)
142
+ warn_report("KVM AIA: failed to set KVM AIA mode");
143
+ else
144
+ qemu_log("KVM AIA: set current mode to %s\n",
145
+ kvm_aia_mode_str(aia_mode));
146
+ }
147
+
148
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
149
+ KVM_DEV_RISCV_AIA_CONFIG_SRCS,
150
+ &aia_irq_num, true, NULL);
151
+ if (ret < 0) {
152
+ error_report("KVM AIA: failed to set number of input irq lines");
153
+ exit(1);
154
+ }
155
+
156
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
157
+ KVM_DEV_RISCV_AIA_CONFIG_IDS,
158
+ &aia_msi_num, true, NULL);
159
+ if (ret < 0) {
160
+ error_report("KVM AIA: failed to set number of msi");
161
+ exit(1);
162
+ }
163
+
164
+ socket_bits = find_last_bit(&socket_count, BITS_PER_LONG) + 1;
165
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
166
+ KVM_DEV_RISCV_AIA_CONFIG_GROUP_BITS,
167
+ &socket_bits, true, NULL);
168
+ if (ret < 0) {
169
+ error_report("KVM AIA: failed to set group_bits");
170
+ exit(1);
171
+ }
172
+
173
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
174
+ KVM_DEV_RISCV_AIA_CONFIG_GROUP_SHIFT,
175
+ &group_shift, true, NULL);
176
+ if (ret < 0) {
177
+ error_report("KVM AIA: failed to set group_shift");
178
+ exit(1);
179
+ }
180
+
181
+ guest_bits = guest_num == 0 ? 0 :
182
+ find_last_bit(&guest_num, BITS_PER_LONG) + 1;
183
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
184
+ KVM_DEV_RISCV_AIA_CONFIG_GUEST_BITS,
185
+ &guest_bits, true, NULL);
186
+ if (ret < 0) {
187
+ error_report("KVM AIA: failed to set guest_bits");
188
+ exit(1);
189
+ }
190
+
191
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_ADDR,
192
+ KVM_DEV_RISCV_AIA_ADDR_APLIC,
193
+ &aplic_base, true, NULL);
194
+ if (ret < 0) {
195
+ error_report("KVM AIA: failed to set the base address of APLIC");
196
+ exit(1);
197
+ }
198
+
199
+ for (socket = 0; socket < socket_count; socket++) {
200
+ socket_imsic_base = imsic_base + socket * (1U << group_shift);
201
+ hart_count = riscv_socket_hart_count(machine, socket);
202
+ base_hart = riscv_socket_first_hartid(machine, socket);
203
+
204
+ if (max_hart_per_socket < hart_count) {
205
+ max_hart_per_socket = hart_count;
206
+ }
207
+
208
+ for (i = 0; i < hart_count; i++) {
209
+ imsic_addr = socket_imsic_base + i * IMSIC_HART_SIZE(guest_bits);
210
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_ADDR,
211
+ KVM_DEV_RISCV_AIA_ADDR_IMSIC(i + base_hart),
212
+ &imsic_addr, true, NULL);
213
+ if (ret < 0) {
214
+ error_report("KVM AIA: failed to set the IMSIC address for hart %d", i);
215
+ exit(1);
216
+ }
217
+ }
218
+ }
219
+
220
+ hart_bits = find_last_bit(&max_hart_per_socket, BITS_PER_LONG) + 1;
221
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CONFIG,
222
+ KVM_DEV_RISCV_AIA_CONFIG_HART_BITS,
223
+ &hart_bits, true, NULL);
224
+ if (ret < 0) {
225
+ error_report("KVM AIA: failed to set hart_bits");
226
+ exit(1);
227
+ }
228
+
229
+ if (kvm_has_gsi_routing()) {
230
+ for (uint64_t idx = 0; idx < aia_irq_num + 1; ++idx) {
231
+ /* KVM AIA only has one APLIC instance */
232
+ kvm_irqchip_add_irq_route(kvm_state, idx, 0, idx);
233
+ }
234
+ kvm_gsi_routing_allowed = true;
235
+ kvm_irqchip_commit_routes(kvm_state);
236
+ }
237
+
238
+ ret = kvm_device_access(aia_fd, KVM_DEV_RISCV_AIA_GRP_CTRL,
239
+ KVM_DEV_RISCV_AIA_CTRL_INIT,
240
+ NULL, true, NULL);
241
+ if (ret < 0) {
242
+ error_report("KVM AIA: initialized fail");
243
+ exit(1);
244
+ }
245
+
246
+ kvm_msi_via_irqfd_allowed = kvm_irqfds_enabled();
247
}
248
--
249
2.41.0
diff view generated by jsdifflib
New patch
1
From: Yong-Xuan Wang <yongxuan.wang@sifive.com>
1
2
3
KVM AIA can't emulate APLIC only. When "aia=aplic" parameter is passed,
4
APLIC devices is emulated by QEMU. For "aia=aplic-imsic", remove the
5
mmio operations of APLIC when using KVM AIA and send wired interrupt
6
signal via KVM_IRQ_LINE API.
7
After KVM AIA enabled, MSI messages are delivered by KVM_SIGNAL_MSI API
8
when the IMSICs receive mmio write requests.
9
10
Signed-off-by: Yong-Xuan Wang <yongxuan.wang@sifive.com>
11
Reviewed-by: Jim Shu <jim.shu@sifive.com>
12
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
13
Reviewed-by: Andrew Jones <ajones@ventanamicro.com>
14
Message-ID: <20230727102439.22554-5-yongxuan.wang@sifive.com>
15
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
16
---
17
hw/intc/riscv_aplic.c | 56 ++++++++++++++++++++++++++++++-------------
18
hw/intc/riscv_imsic.c | 25 +++++++++++++++----
19
2 files changed, 61 insertions(+), 20 deletions(-)
20
21
diff --git a/hw/intc/riscv_aplic.c b/hw/intc/riscv_aplic.c
22
index XXXXXXX..XXXXXXX 100644
23
--- a/hw/intc/riscv_aplic.c
24
+++ b/hw/intc/riscv_aplic.c
25
@@ -XXX,XX +XXX,XX @@
26
#include "hw/irq.h"
27
#include "target/riscv/cpu.h"
28
#include "sysemu/sysemu.h"
29
+#include "sysemu/kvm.h"
30
#include "migration/vmstate.h"
31
32
#define APLIC_MAX_IDC (1UL << 14)
33
@@ -XXX,XX +XXX,XX @@
34
35
#define APLIC_IDC_CLAIMI 0x1c
36
37
+/*
38
+ * KVM AIA only supports APLIC MSI, fallback to QEMU emulation if we want to use
39
+ * APLIC Wired.
40
+ */
41
+static bool is_kvm_aia(bool msimode)
42
+{
43
+ return kvm_irqchip_in_kernel() && msimode;
44
+}
45
+
46
static uint32_t riscv_aplic_read_input_word(RISCVAPLICState *aplic,
47
uint32_t word)
48
{
49
@@ -XXX,XX +XXX,XX @@ static uint32_t riscv_aplic_idc_claimi(RISCVAPLICState *aplic, uint32_t idc)
50
return topi;
51
}
52
53
+static void riscv_kvm_aplic_request(void *opaque, int irq, int level)
54
+{
55
+ kvm_set_irq(kvm_state, irq, !!level);
56
+}
57
+
58
static void riscv_aplic_request(void *opaque, int irq, int level)
59
{
60
bool update = false;
61
@@ -XXX,XX +XXX,XX @@ static void riscv_aplic_realize(DeviceState *dev, Error **errp)
62
uint32_t i;
63
RISCVAPLICState *aplic = RISCV_APLIC(dev);
64
65
- aplic->bitfield_words = (aplic->num_irqs + 31) >> 5;
66
- aplic->sourcecfg = g_new0(uint32_t, aplic->num_irqs);
67
- aplic->state = g_new0(uint32_t, aplic->num_irqs);
68
- aplic->target = g_new0(uint32_t, aplic->num_irqs);
69
- if (!aplic->msimode) {
70
- for (i = 0; i < aplic->num_irqs; i++) {
71
- aplic->target[i] = 1;
72
+ if (!is_kvm_aia(aplic->msimode)) {
73
+ aplic->bitfield_words = (aplic->num_irqs + 31) >> 5;
74
+ aplic->sourcecfg = g_new0(uint32_t, aplic->num_irqs);
75
+ aplic->state = g_new0(uint32_t, aplic->num_irqs);
76
+ aplic->target = g_new0(uint32_t, aplic->num_irqs);
77
+ if (!aplic->msimode) {
78
+ for (i = 0; i < aplic->num_irqs; i++) {
79
+ aplic->target[i] = 1;
80
+ }
81
}
82
- }
83
- aplic->idelivery = g_new0(uint32_t, aplic->num_harts);
84
- aplic->iforce = g_new0(uint32_t, aplic->num_harts);
85
- aplic->ithreshold = g_new0(uint32_t, aplic->num_harts);
86
+ aplic->idelivery = g_new0(uint32_t, aplic->num_harts);
87
+ aplic->iforce = g_new0(uint32_t, aplic->num_harts);
88
+ aplic->ithreshold = g_new0(uint32_t, aplic->num_harts);
89
90
- memory_region_init_io(&aplic->mmio, OBJECT(dev), &riscv_aplic_ops, aplic,
91
- TYPE_RISCV_APLIC, aplic->aperture_size);
92
- sysbus_init_mmio(SYS_BUS_DEVICE(dev), &aplic->mmio);
93
+ memory_region_init_io(&aplic->mmio, OBJECT(dev), &riscv_aplic_ops,
94
+ aplic, TYPE_RISCV_APLIC, aplic->aperture_size);
95
+ sysbus_init_mmio(SYS_BUS_DEVICE(dev), &aplic->mmio);
96
+ }
97
98
/*
99
* Only root APLICs have hardware IRQ lines. All non-root APLICs
100
* have IRQ lines delegated by their parent APLIC.
101
*/
102
if (!aplic->parent) {
103
- qdev_init_gpio_in(dev, riscv_aplic_request, aplic->num_irqs);
104
+ if (is_kvm_aia(aplic->msimode)) {
105
+ qdev_init_gpio_in(dev, riscv_kvm_aplic_request, aplic->num_irqs);
106
+ } else {
107
+ qdev_init_gpio_in(dev, riscv_aplic_request, aplic->num_irqs);
108
+ }
109
}
110
111
/* Create output IRQ lines for non-MSI mode */
112
@@ -XXX,XX +XXX,XX @@ DeviceState *riscv_aplic_create(hwaddr addr, hwaddr size,
113
qdev_prop_set_bit(dev, "mmode", mmode);
114
115
sysbus_realize_and_unref(SYS_BUS_DEVICE(dev), &error_fatal);
116
- sysbus_mmio_map(SYS_BUS_DEVICE(dev), 0, addr);
117
+
118
+ if (!is_kvm_aia(msimode)) {
119
+ sysbus_mmio_map(SYS_BUS_DEVICE(dev), 0, addr);
120
+ }
121
122
if (parent) {
123
riscv_aplic_add_child(parent, dev);
124
diff --git a/hw/intc/riscv_imsic.c b/hw/intc/riscv_imsic.c
125
index XXXXXXX..XXXXXXX 100644
126
--- a/hw/intc/riscv_imsic.c
127
+++ b/hw/intc/riscv_imsic.c
128
@@ -XXX,XX +XXX,XX @@
129
#include "target/riscv/cpu.h"
130
#include "target/riscv/cpu_bits.h"
131
#include "sysemu/sysemu.h"
132
+#include "sysemu/kvm.h"
133
#include "migration/vmstate.h"
134
135
#define IMSIC_MMIO_PAGE_LE 0x00
136
@@ -XXX,XX +XXX,XX @@ static void riscv_imsic_write(void *opaque, hwaddr addr, uint64_t value,
137
goto err;
138
}
139
140
+#if defined(CONFIG_KVM)
141
+ if (kvm_irqchip_in_kernel()) {
142
+ struct kvm_msi msi;
143
+
144
+ msi.address_lo = extract64(imsic->mmio.addr + addr, 0, 32);
145
+ msi.address_hi = extract64(imsic->mmio.addr + addr, 32, 32);
146
+ msi.data = le32_to_cpu(value);
147
+
148
+ kvm_vm_ioctl(kvm_state, KVM_SIGNAL_MSI, &msi);
149
+
150
+ return;
151
+ }
152
+#endif
153
+
154
/* Writes only supported for MSI little-endian registers */
155
page = addr >> IMSIC_MMIO_PAGE_SHIFT;
156
if ((addr & (IMSIC_MMIO_PAGE_SZ - 1)) == IMSIC_MMIO_PAGE_LE) {
157
@@ -XXX,XX +XXX,XX @@ static void riscv_imsic_realize(DeviceState *dev, Error **errp)
158
CPUState *cpu = cpu_by_arch_id(imsic->hartid);
159
CPURISCVState *env = cpu ? cpu->env_ptr : NULL;
160
161
- imsic->num_eistate = imsic->num_pages * imsic->num_irqs;
162
- imsic->eidelivery = g_new0(uint32_t, imsic->num_pages);
163
- imsic->eithreshold = g_new0(uint32_t, imsic->num_pages);
164
- imsic->eistate = g_new0(uint32_t, imsic->num_eistate);
165
+ if (!kvm_irqchip_in_kernel()) {
166
+ imsic->num_eistate = imsic->num_pages * imsic->num_irqs;
167
+ imsic->eidelivery = g_new0(uint32_t, imsic->num_pages);
168
+ imsic->eithreshold = g_new0(uint32_t, imsic->num_pages);
169
+ imsic->eistate = g_new0(uint32_t, imsic->num_eistate);
170
+ }
171
172
memory_region_init_io(&imsic->mmio, OBJECT(dev), &riscv_imsic_ops,
173
imsic, TYPE_RISCV_IMSIC,
174
--
175
2.41.0
diff view generated by jsdifflib
1
From: Anup Patel <anup.patel@wdc.com>
1
From: Yong-Xuan Wang <yongxuan.wang@sifive.com>
2
2
3
We extend RISC-V virt machine to allow creating a multi-socket
3
Select KVM AIA when the host kernel has in-kernel AIA chip support.
4
machine. Each RISC-V virt machine socket is a NUMA node having
4
Since KVM AIA only has one APLIC instance, we map the QEMU APLIC
5
a set of HARTs, a memory instance, a CLINT instance, and a PLIC
5
devices to KVM APLIC.
6
instance. Other devices are shared between all sockets. We also
7
update the generated device tree accordingly.
8
6
9
By default, NUMA multi-socket support is disabled for RISC-V virt
7
Signed-off-by: Yong-Xuan Wang <yongxuan.wang@sifive.com>
10
machine. To enable it, users can use "-numa" command-line options
8
Reviewed-by: Jim Shu <jim.shu@sifive.com>
11
of QEMU.
9
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
12
10
Reviewed-by: Andrew Jones <ajones@ventanamicro.com>
13
Example1: For two NUMA nodes with 2 CPUs each, append following
11
Message-ID: <20230727102439.22554-6-yongxuan.wang@sifive.com>
14
to command-line options: "-smp 4 -numa node -numa node"
15
16
Example2: For two NUMA nodes with 1 and 3 CPUs, append following
17
to command-line options:
18
"-smp 4 -numa node -numa node -numa cpu,node-id=0,core-id=0 \
19
-numa cpu,node-id=1,core-id=1 -numa cpu,node-id=1,core-id=2 \
20
-numa cpu,node-id=1,core-id=3"
21
22
The maximum number of sockets in a RISC-V virt machine is 8
23
but this limit can be changed in future.
24
25
Signed-off-by: Anup Patel <anup.patel@wdc.com>
26
Reviewed-by: Atish Patra <atish.patra@wdc.com>
27
Message-Id: <20200616032229.766089-6-anup.patel@wdc.com>
28
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
12
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
29
---
13
---
30
include/hw/riscv/virt.h | 9 +-
14
hw/riscv/virt.c | 94 +++++++++++++++++++++++++++++++++----------------
31
hw/riscv/virt.c | 526 +++++++++++++++++++++++-----------------
15
1 file changed, 63 insertions(+), 31 deletions(-)
32
2 files changed, 306 insertions(+), 229 deletions(-)
33
16
34
diff --git a/include/hw/riscv/virt.h b/include/hw/riscv/virt.h
35
index XXXXXXX..XXXXXXX 100644
36
--- a/include/hw/riscv/virt.h
37
+++ b/include/hw/riscv/virt.h
38
@@ -XXX,XX +XXX,XX @@
39
#include "hw/sysbus.h"
40
#include "hw/block/flash.h"
41
42
+#define VIRT_CPUS_MAX 8
43
+#define VIRT_SOCKETS_MAX 8
44
+
45
#define TYPE_RISCV_VIRT_MACHINE MACHINE_TYPE_NAME("virt")
46
#define RISCV_VIRT_MACHINE(obj) \
47
OBJECT_CHECK(RISCVVirtState, (obj), TYPE_RISCV_VIRT_MACHINE)
48
@@ -XXX,XX +XXX,XX @@ typedef struct {
49
MachineState parent;
50
51
/*< public >*/
52
- RISCVHartArrayState soc;
53
- DeviceState *plic;
54
+ RISCVHartArrayState soc[VIRT_SOCKETS_MAX];
55
+ DeviceState *plic[VIRT_SOCKETS_MAX];
56
PFlashCFI01 *flash[2];
57
58
void *fdt;
59
@@ -XXX,XX +XXX,XX @@ enum {
60
#define VIRT_PLIC_ENABLE_STRIDE 0x80
61
#define VIRT_PLIC_CONTEXT_BASE 0x200000
62
#define VIRT_PLIC_CONTEXT_STRIDE 0x1000
63
+#define VIRT_PLIC_SIZE(__num_context) \
64
+ (VIRT_PLIC_CONTEXT_BASE + (__num_context) * VIRT_PLIC_CONTEXT_STRIDE)
65
66
#define FDT_PCI_ADDR_CELLS 3
67
#define FDT_PCI_INT_CELLS 1
68
diff --git a/hw/riscv/virt.c b/hw/riscv/virt.c
17
diff --git a/hw/riscv/virt.c b/hw/riscv/virt.c
69
index XXXXXXX..XXXXXXX 100644
18
index XXXXXXX..XXXXXXX 100644
70
--- a/hw/riscv/virt.c
19
--- a/hw/riscv/virt.c
71
+++ b/hw/riscv/virt.c
20
+++ b/hw/riscv/virt.c
72
@@ -XXX,XX +XXX,XX @@
21
@@ -XXX,XX +XXX,XX @@
73
#include "hw/riscv/sifive_test.h"
74
#include "hw/riscv/virt.h"
22
#include "hw/riscv/virt.h"
75
#include "hw/riscv/boot.h"
23
#include "hw/riscv/boot.h"
76
+#include "hw/riscv/numa.h"
24
#include "hw/riscv/numa.h"
77
#include "chardev/char.h"
25
+#include "kvm_riscv.h"
78
#include "sysemu/arch_init.h"
26
#include "hw/intc/riscv_aclint.h"
79
#include "sysemu/device_tree.h"
27
#include "hw/intc/riscv_aplic.h"
80
@@ -XXX,XX +XXX,XX @@ static const struct MemmapEntry {
28
#include "hw/intc/riscv_imsic.h"
81
[VIRT_RTC] = { 0x101000, 0x1000 },
29
@@ -XXX,XX +XXX,XX @@
82
[VIRT_CLINT] = { 0x2000000, 0x10000 },
30
#error "Can't accommodate all IMSIC groups in address space"
83
[VIRT_PCIE_PIO] = { 0x3000000, 0x10000 },
31
#endif
84
- [VIRT_PLIC] = { 0xc000000, 0x4000000 },
32
85
+ [VIRT_PLIC] = { 0xc000000, VIRT_PLIC_SIZE(VIRT_CPUS_MAX * 2) },
33
+/* KVM AIA only supports APLIC MSI. APLIC Wired is always emulated by QEMU. */
86
[VIRT_UART0] = { 0x10000000, 0x100 },
34
+static bool virt_use_kvm_aia(RISCVVirtState *s)
87
[VIRT_VIRTIO] = { 0x10001000, 0x1000 },
35
+{
88
[VIRT_FLASH] = { 0x20000000, 0x4000000 },
36
+ return kvm_irqchip_in_kernel() && s->aia_type == VIRT_AIA_TYPE_APLIC_IMSIC;
89
@@ -XXX,XX +XXX,XX @@ static void create_fdt(RISCVVirtState *s, const struct MemmapEntry *memmap,
37
+}
90
uint64_t mem_size, const char *cmdline)
38
+
39
static const MemMapEntry virt_memmap[] = {
40
[VIRT_DEBUG] = { 0x0, 0x100 },
41
[VIRT_MROM] = { 0x1000, 0xf000 },
42
@@ -XXX,XX +XXX,XX @@ static void create_fdt_one_aplic(RISCVVirtState *s, int socket,
43
uint32_t *intc_phandles,
44
uint32_t aplic_phandle,
45
uint32_t aplic_child_phandle,
46
- bool m_mode)
47
+ bool m_mode, int num_harts)
91
{
48
{
92
void *fdt;
49
int cpu;
93
- int cpu, i;
50
char *aplic_name;
94
- uint32_t *cells;
51
uint32_t *aplic_cells;
95
- char *nodename;
52
MachineState *ms = MACHINE(s);
96
- uint32_t plic_phandle, test_phandle, phandle = 1;
53
97
+ int i, cpu, socket;
54
- aplic_cells = g_new0(uint32_t, s->soc[socket].num_harts * 2);
98
+ MachineState *mc = MACHINE(s);
55
+ aplic_cells = g_new0(uint32_t, num_harts * 2);
99
+ uint64_t addr, size;
56
100
+ uint32_t *clint_cells, *plic_cells;
57
- for (cpu = 0; cpu < s->soc[socket].num_harts; cpu++) {
101
+ unsigned long clint_addr, plic_addr;
58
+ for (cpu = 0; cpu < num_harts; cpu++) {
102
+ uint32_t plic_phandle[MAX_NODES];
59
aplic_cells[cpu * 2 + 0] = cpu_to_be32(intc_phandles[cpu]);
103
+ uint32_t cpu_phandle, intc_phandle, test_phandle;
60
aplic_cells[cpu * 2 + 1] = cpu_to_be32(m_mode ? IRQ_M_EXT : IRQ_S_EXT);
104
+ uint32_t phandle = 1, plic_mmio_phandle = 1;
61
}
105
+ uint32_t plic_pcie_phandle = 1, plic_virtio_phandle = 1;
62
@@ -XXX,XX +XXX,XX @@ static void create_fdt_one_aplic(RISCVVirtState *s, int socket,
106
+ char *mem_name, *cpu_name, *core_name, *intc_name;
63
107
+ char *name, *clint_name, *plic_name, *clust_name;
64
if (s->aia_type == VIRT_AIA_TYPE_APLIC) {
108
hwaddr flashsize = virt_memmap[VIRT_FLASH].size / 2;
65
qemu_fdt_setprop(ms->fdt, aplic_name, "interrupts-extended",
109
hwaddr flashbase = virt_memmap[VIRT_FLASH].base;
66
- aplic_cells,
110
67
- s->soc[socket].num_harts * sizeof(uint32_t) * 2);
111
@@ -XXX,XX +XXX,XX @@ static void create_fdt(RISCVVirtState *s, const struct MemmapEntry *memmap,
68
+ aplic_cells, num_harts * sizeof(uint32_t) * 2);
112
qemu_fdt_setprop_cell(fdt, "/soc", "#size-cells", 0x2);
69
} else {
113
qemu_fdt_setprop_cell(fdt, "/soc", "#address-cells", 0x2);
70
qemu_fdt_setprop_cell(ms->fdt, aplic_name, "msi-parent", msi_phandle);
114
71
}
115
- nodename = g_strdup_printf("/memory@%lx",
72
@@ -XXX,XX +XXX,XX @@ static void create_fdt_socket_aplic(RISCVVirtState *s,
116
- (long)memmap[VIRT_DRAM].base);
73
uint32_t msi_s_phandle,
117
- qemu_fdt_add_subnode(fdt, nodename);
74
uint32_t *phandle,
118
- qemu_fdt_setprop_cells(fdt, nodename, "reg",
75
uint32_t *intc_phandles,
119
- memmap[VIRT_DRAM].base >> 32, memmap[VIRT_DRAM].base,
76
- uint32_t *aplic_phandles)
120
- mem_size >> 32, mem_size);
77
+ uint32_t *aplic_phandles,
121
- qemu_fdt_setprop_string(fdt, nodename, "device_type", "memory");
78
+ int num_harts)
122
- g_free(nodename);
79
{
80
char *aplic_name;
81
unsigned long aplic_addr;
82
@@ -XXX,XX +XXX,XX @@ static void create_fdt_socket_aplic(RISCVVirtState *s,
83
create_fdt_one_aplic(s, socket, aplic_addr, memmap[VIRT_APLIC_M].size,
84
msi_m_phandle, intc_phandles,
85
aplic_m_phandle, aplic_s_phandle,
86
- true);
87
+ true, num_harts);
88
}
89
90
/* S-level APLIC node */
91
@@ -XXX,XX +XXX,XX @@ static void create_fdt_socket_aplic(RISCVVirtState *s,
92
create_fdt_one_aplic(s, socket, aplic_addr, memmap[VIRT_APLIC_S].size,
93
msi_s_phandle, intc_phandles,
94
aplic_s_phandle, 0,
95
- false);
96
+ false, num_harts);
97
98
aplic_name = g_strdup_printf("/soc/aplic@%lx", aplic_addr);
99
100
@@ -XXX,XX +XXX,XX @@ static void create_fdt_sockets(RISCVVirtState *s, const MemMapEntry *memmap,
101
*msi_pcie_phandle = msi_s_phandle;
102
}
103
104
- phandle_pos = ms->smp.cpus;
105
- for (socket = (socket_count - 1); socket >= 0; socket--) {
106
- phandle_pos -= s->soc[socket].num_harts;
123
-
107
-
124
qemu_fdt_add_subnode(fdt, "/cpus");
108
- if (s->aia_type == VIRT_AIA_TYPE_NONE) {
125
qemu_fdt_setprop_cell(fdt, "/cpus", "timebase-frequency",
109
- create_fdt_socket_plic(s, memmap, socket, phandle,
126
SIFIVE_CLINT_TIMEBASE_FREQ);
110
- &intc_phandles[phandle_pos], xplic_phandles);
127
qemu_fdt_setprop_cell(fdt, "/cpus", "#size-cells", 0x0);
111
- } else {
128
qemu_fdt_setprop_cell(fdt, "/cpus", "#address-cells", 0x1);
112
- create_fdt_socket_aplic(s, memmap, socket,
129
+ qemu_fdt_add_subnode(fdt, "/cpus/cpu-map");
113
- msi_m_phandle, msi_s_phandle, phandle,
114
- &intc_phandles[phandle_pos], xplic_phandles);
115
+ /* KVM AIA only has one APLIC instance */
116
+ if (virt_use_kvm_aia(s)) {
117
+ create_fdt_socket_aplic(s, memmap, 0,
118
+ msi_m_phandle, msi_s_phandle, phandle,
119
+ &intc_phandles[0], xplic_phandles,
120
+ ms->smp.cpus);
121
+ } else {
122
+ phandle_pos = ms->smp.cpus;
123
+ for (socket = (socket_count - 1); socket >= 0; socket--) {
124
+ phandle_pos -= s->soc[socket].num_harts;
130
+
125
+
131
+ for (socket = (riscv_socket_count(mc) - 1); socket >= 0; socket--) {
126
+ if (s->aia_type == VIRT_AIA_TYPE_NONE) {
132
+ clust_name = g_strdup_printf("/cpus/cpu-map/cluster%d", socket);
127
+ create_fdt_socket_plic(s, memmap, socket, phandle,
133
+ qemu_fdt_add_subnode(fdt, clust_name);
128
+ &intc_phandles[phandle_pos],
134
+
129
+ xplic_phandles);
135
+ plic_cells = g_new0(uint32_t, s->soc[socket].num_harts * 4);
130
+ } else {
136
+ clint_cells = g_new0(uint32_t, s->soc[socket].num_harts * 4);
131
+ create_fdt_socket_aplic(s, memmap, socket,
137
+
132
+ msi_m_phandle, msi_s_phandle, phandle,
138
+ for (cpu = s->soc[socket].num_harts - 1; cpu >= 0; cpu--) {
133
+ &intc_phandles[phandle_pos],
139
+ cpu_phandle = phandle++;
134
+ xplic_phandles,
140
135
+ s->soc[socket].num_harts);
141
- for (cpu = s->soc.num_harts - 1; cpu >= 0; cpu--) {
136
+ }
142
- int cpu_phandle = phandle++;
137
}
143
- int intc_phandle;
144
- nodename = g_strdup_printf("/cpus/cpu@%d", cpu);
145
- char *intc = g_strdup_printf("/cpus/cpu@%d/interrupt-controller", cpu);
146
- char *isa = riscv_isa_string(&s->soc.harts[cpu]);
147
- qemu_fdt_add_subnode(fdt, nodename);
148
+ cpu_name = g_strdup_printf("/cpus/cpu@%d",
149
+ s->soc[socket].hartid_base + cpu);
150
+ qemu_fdt_add_subnode(fdt, cpu_name);
151
#if defined(TARGET_RISCV32)
152
- qemu_fdt_setprop_string(fdt, nodename, "mmu-type", "riscv,sv32");
153
+ qemu_fdt_setprop_string(fdt, cpu_name, "mmu-type", "riscv,sv32");
154
#else
155
- qemu_fdt_setprop_string(fdt, nodename, "mmu-type", "riscv,sv48");
156
+ qemu_fdt_setprop_string(fdt, cpu_name, "mmu-type", "riscv,sv48");
157
#endif
158
- qemu_fdt_setprop_string(fdt, nodename, "riscv,isa", isa);
159
- qemu_fdt_setprop_string(fdt, nodename, "compatible", "riscv");
160
- qemu_fdt_setprop_string(fdt, nodename, "status", "okay");
161
- qemu_fdt_setprop_cell(fdt, nodename, "reg", cpu);
162
- qemu_fdt_setprop_string(fdt, nodename, "device_type", "cpu");
163
- qemu_fdt_setprop_cell(fdt, nodename, "phandle", cpu_phandle);
164
- intc_phandle = phandle++;
165
- qemu_fdt_add_subnode(fdt, intc);
166
- qemu_fdt_setprop_cell(fdt, intc, "phandle", intc_phandle);
167
- qemu_fdt_setprop_string(fdt, intc, "compatible", "riscv,cpu-intc");
168
- qemu_fdt_setprop(fdt, intc, "interrupt-controller", NULL, 0);
169
- qemu_fdt_setprop_cell(fdt, intc, "#interrupt-cells", 1);
170
- g_free(isa);
171
- g_free(intc);
172
- g_free(nodename);
173
- }
174
+ name = riscv_isa_string(&s->soc[socket].harts[cpu]);
175
+ qemu_fdt_setprop_string(fdt, cpu_name, "riscv,isa", name);
176
+ g_free(name);
177
+ qemu_fdt_setprop_string(fdt, cpu_name, "compatible", "riscv");
178
+ qemu_fdt_setprop_string(fdt, cpu_name, "status", "okay");
179
+ qemu_fdt_setprop_cell(fdt, cpu_name, "reg",
180
+ s->soc[socket].hartid_base + cpu);
181
+ qemu_fdt_setprop_string(fdt, cpu_name, "device_type", "cpu");
182
+ riscv_socket_fdt_write_id(mc, fdt, cpu_name, socket);
183
+ qemu_fdt_setprop_cell(fdt, cpu_name, "phandle", cpu_phandle);
184
+
185
+ intc_name = g_strdup_printf("%s/interrupt-controller", cpu_name);
186
+ qemu_fdt_add_subnode(fdt, intc_name);
187
+ intc_phandle = phandle++;
188
+ qemu_fdt_setprop_cell(fdt, intc_name, "phandle", intc_phandle);
189
+ qemu_fdt_setprop_string(fdt, intc_name, "compatible",
190
+ "riscv,cpu-intc");
191
+ qemu_fdt_setprop(fdt, intc_name, "interrupt-controller", NULL, 0);
192
+ qemu_fdt_setprop_cell(fdt, intc_name, "#interrupt-cells", 1);
193
+
194
+ clint_cells[cpu * 4 + 0] = cpu_to_be32(intc_phandle);
195
+ clint_cells[cpu * 4 + 1] = cpu_to_be32(IRQ_M_SOFT);
196
+ clint_cells[cpu * 4 + 2] = cpu_to_be32(intc_phandle);
197
+ clint_cells[cpu * 4 + 3] = cpu_to_be32(IRQ_M_TIMER);
198
+
199
+ plic_cells[cpu * 4 + 0] = cpu_to_be32(intc_phandle);
200
+ plic_cells[cpu * 4 + 1] = cpu_to_be32(IRQ_M_EXT);
201
+ plic_cells[cpu * 4 + 2] = cpu_to_be32(intc_phandle);
202
+ plic_cells[cpu * 4 + 3] = cpu_to_be32(IRQ_S_EXT);
203
+
204
+ core_name = g_strdup_printf("%s/core%d", clust_name, cpu);
205
+ qemu_fdt_add_subnode(fdt, core_name);
206
+ qemu_fdt_setprop_cell(fdt, core_name, "cpu", cpu_phandle);
207
+
208
+ g_free(core_name);
209
+ g_free(intc_name);
210
+ g_free(cpu_name);
211
+ }
212
213
- /* Add cpu-topology node */
214
- qemu_fdt_add_subnode(fdt, "/cpus/cpu-map");
215
- qemu_fdt_add_subnode(fdt, "/cpus/cpu-map/cluster0");
216
- for (cpu = s->soc.num_harts - 1; cpu >= 0; cpu--) {
217
- char *core_nodename = g_strdup_printf("/cpus/cpu-map/cluster0/core%d",
218
- cpu);
219
- char *cpu_nodename = g_strdup_printf("/cpus/cpu@%d", cpu);
220
- uint32_t intc_phandle = qemu_fdt_get_phandle(fdt, cpu_nodename);
221
- qemu_fdt_add_subnode(fdt, core_nodename);
222
- qemu_fdt_setprop_cell(fdt, core_nodename, "cpu", intc_phandle);
223
- g_free(core_nodename);
224
- g_free(cpu_nodename);
225
+ addr = memmap[VIRT_DRAM].base + riscv_socket_mem_offset(mc, socket);
226
+ size = riscv_socket_mem_size(mc, socket);
227
+ mem_name = g_strdup_printf("/memory@%lx", (long)addr);
228
+ qemu_fdt_add_subnode(fdt, mem_name);
229
+ qemu_fdt_setprop_cells(fdt, mem_name, "reg",
230
+ addr >> 32, addr, size >> 32, size);
231
+ qemu_fdt_setprop_string(fdt, mem_name, "device_type", "memory");
232
+ riscv_socket_fdt_write_id(mc, fdt, mem_name, socket);
233
+ g_free(mem_name);
234
+
235
+ clint_addr = memmap[VIRT_CLINT].base +
236
+ (memmap[VIRT_CLINT].size * socket);
237
+ clint_name = g_strdup_printf("/soc/clint@%lx", clint_addr);
238
+ qemu_fdt_add_subnode(fdt, clint_name);
239
+ qemu_fdt_setprop_string(fdt, clint_name, "compatible", "riscv,clint0");
240
+ qemu_fdt_setprop_cells(fdt, clint_name, "reg",
241
+ 0x0, clint_addr, 0x0, memmap[VIRT_CLINT].size);
242
+ qemu_fdt_setprop(fdt, clint_name, "interrupts-extended",
243
+ clint_cells, s->soc[socket].num_harts * sizeof(uint32_t) * 4);
244
+ riscv_socket_fdt_write_id(mc, fdt, clint_name, socket);
245
+ g_free(clint_name);
246
+
247
+ plic_phandle[socket] = phandle++;
248
+ plic_addr = memmap[VIRT_PLIC].base + (memmap[VIRT_PLIC].size * socket);
249
+ plic_name = g_strdup_printf("/soc/plic@%lx", plic_addr);
250
+ qemu_fdt_add_subnode(fdt, plic_name);
251
+ qemu_fdt_setprop_cell(fdt, plic_name,
252
+ "#address-cells", FDT_PLIC_ADDR_CELLS);
253
+ qemu_fdt_setprop_cell(fdt, plic_name,
254
+ "#interrupt-cells", FDT_PLIC_INT_CELLS);
255
+ qemu_fdt_setprop_string(fdt, plic_name, "compatible", "riscv,plic0");
256
+ qemu_fdt_setprop(fdt, plic_name, "interrupt-controller", NULL, 0);
257
+ qemu_fdt_setprop(fdt, plic_name, "interrupts-extended",
258
+ plic_cells, s->soc[socket].num_harts * sizeof(uint32_t) * 4);
259
+ qemu_fdt_setprop_cells(fdt, plic_name, "reg",
260
+ 0x0, plic_addr, 0x0, memmap[VIRT_PLIC].size);
261
+ qemu_fdt_setprop_cell(fdt, plic_name, "riscv,ndev", VIRTIO_NDEV);
262
+ riscv_socket_fdt_write_id(mc, fdt, plic_name, socket);
263
+ qemu_fdt_setprop_cell(fdt, plic_name, "phandle", plic_phandle[socket]);
264
+ g_free(plic_name);
265
+
266
+ g_free(clint_cells);
267
+ g_free(plic_cells);
268
+ g_free(clust_name);
269
}
138
}
270
139
271
- cells = g_new0(uint32_t, s->soc.num_harts * 4);
140
g_free(intc_phandles);
272
- for (cpu = 0; cpu < s->soc.num_harts; cpu++) {
141
273
- nodename =
142
- for (socket = 0; socket < socket_count; socket++) {
274
- g_strdup_printf("/cpus/cpu@%d/interrupt-controller", cpu);
143
- if (socket == 0) {
275
- uint32_t intc_phandle = qemu_fdt_get_phandle(fdt, nodename);
144
- *irq_mmio_phandle = xplic_phandles[socket];
276
- cells[cpu * 4 + 0] = cpu_to_be32(intc_phandle);
145
- *irq_virtio_phandle = xplic_phandles[socket];
277
- cells[cpu * 4 + 1] = cpu_to_be32(IRQ_M_SOFT);
146
- *irq_pcie_phandle = xplic_phandles[socket];
278
- cells[cpu * 4 + 2] = cpu_to_be32(intc_phandle);
147
- }
279
- cells[cpu * 4 + 3] = cpu_to_be32(IRQ_M_TIMER);
148
- if (socket == 1) {
280
- g_free(nodename);
149
- *irq_virtio_phandle = xplic_phandles[socket];
281
- }
150
- *irq_pcie_phandle = xplic_phandles[socket];
282
- nodename = g_strdup_printf("/soc/clint@%lx",
151
- }
283
- (long)memmap[VIRT_CLINT].base);
152
- if (socket == 2) {
284
- qemu_fdt_add_subnode(fdt, nodename);
153
- *irq_pcie_phandle = xplic_phandles[socket];
285
- qemu_fdt_setprop_string(fdt, nodename, "compatible", "riscv,clint0");
154
+ if (virt_use_kvm_aia(s)) {
286
- qemu_fdt_setprop_cells(fdt, nodename, "reg",
155
+ *irq_mmio_phandle = xplic_phandles[0];
287
- 0x0, memmap[VIRT_CLINT].base,
156
+ *irq_virtio_phandle = xplic_phandles[0];
288
- 0x0, memmap[VIRT_CLINT].size);
157
+ *irq_pcie_phandle = xplic_phandles[0];
289
- qemu_fdt_setprop(fdt, nodename, "interrupts-extended",
158
+ } else {
290
- cells, s->soc.num_harts * sizeof(uint32_t) * 4);
159
+ for (socket = 0; socket < socket_count; socket++) {
291
- g_free(cells);
160
+ if (socket == 0) {
292
- g_free(nodename);
161
+ *irq_mmio_phandle = xplic_phandles[socket];
293
-
162
+ *irq_virtio_phandle = xplic_phandles[socket];
294
- plic_phandle = phandle++;
163
+ *irq_pcie_phandle = xplic_phandles[socket];
295
- cells = g_new0(uint32_t, s->soc.num_harts * 4);
164
+ }
296
- for (cpu = 0; cpu < s->soc.num_harts; cpu++) {
165
+ if (socket == 1) {
297
- nodename =
166
+ *irq_virtio_phandle = xplic_phandles[socket];
298
- g_strdup_printf("/cpus/cpu@%d/interrupt-controller", cpu);
167
+ *irq_pcie_phandle = xplic_phandles[socket];
299
- uint32_t intc_phandle = qemu_fdt_get_phandle(fdt, nodename);
168
+ }
300
- cells[cpu * 4 + 0] = cpu_to_be32(intc_phandle);
169
+ if (socket == 2) {
301
- cells[cpu * 4 + 1] = cpu_to_be32(IRQ_M_EXT);
170
+ *irq_pcie_phandle = xplic_phandles[socket];
302
- cells[cpu * 4 + 2] = cpu_to_be32(intc_phandle);
171
+ }
303
- cells[cpu * 4 + 3] = cpu_to_be32(IRQ_S_EXT);
172
}
304
- g_free(nodename);
305
+ for (socket = 0; socket < riscv_socket_count(mc); socket++) {
306
+ if (socket == 0) {
307
+ plic_mmio_phandle = plic_phandle[socket];
308
+ plic_virtio_phandle = plic_phandle[socket];
309
+ plic_pcie_phandle = plic_phandle[socket];
310
+ }
311
+ if (socket == 1) {
312
+ plic_virtio_phandle = plic_phandle[socket];
313
+ plic_pcie_phandle = plic_phandle[socket];
314
+ }
315
+ if (socket == 2) {
316
+ plic_pcie_phandle = plic_phandle[socket];
317
+ }
318
}
173
}
319
- nodename = g_strdup_printf("/soc/interrupt-controller@%lx",
174
320
- (long)memmap[VIRT_PLIC].base);
175
@@ -XXX,XX +XXX,XX @@ static void virt_machine_init(MachineState *machine)
321
- qemu_fdt_add_subnode(fdt, nodename);
176
}
322
- qemu_fdt_setprop_cell(fdt, nodename, "#address-cells",
323
- FDT_PLIC_ADDR_CELLS);
324
- qemu_fdt_setprop_cell(fdt, nodename, "#interrupt-cells",
325
- FDT_PLIC_INT_CELLS);
326
- qemu_fdt_setprop_string(fdt, nodename, "compatible", "riscv,plic0");
327
- qemu_fdt_setprop(fdt, nodename, "interrupt-controller", NULL, 0);
328
- qemu_fdt_setprop(fdt, nodename, "interrupts-extended",
329
- cells, s->soc.num_harts * sizeof(uint32_t) * 4);
330
- qemu_fdt_setprop_cells(fdt, nodename, "reg",
331
- 0x0, memmap[VIRT_PLIC].base,
332
- 0x0, memmap[VIRT_PLIC].size);
333
- qemu_fdt_setprop_cell(fdt, nodename, "riscv,ndev", VIRTIO_NDEV);
334
- qemu_fdt_setprop_cell(fdt, nodename, "phandle", plic_phandle);
335
- plic_phandle = qemu_fdt_get_phandle(fdt, nodename);
336
- g_free(cells);
337
- g_free(nodename);
338
+
339
+ riscv_socket_fdt_write_distance_matrix(mc, fdt);
340
341
for (i = 0; i < VIRTIO_COUNT; i++) {
342
- nodename = g_strdup_printf("/virtio_mmio@%lx",
343
+ name = g_strdup_printf("/soc/virtio_mmio@%lx",
344
(long)(memmap[VIRT_VIRTIO].base + i * memmap[VIRT_VIRTIO].size));
345
- qemu_fdt_add_subnode(fdt, nodename);
346
- qemu_fdt_setprop_string(fdt, nodename, "compatible", "virtio,mmio");
347
- qemu_fdt_setprop_cells(fdt, nodename, "reg",
348
+ qemu_fdt_add_subnode(fdt, name);
349
+ qemu_fdt_setprop_string(fdt, name, "compatible", "virtio,mmio");
350
+ qemu_fdt_setprop_cells(fdt, name, "reg",
351
0x0, memmap[VIRT_VIRTIO].base + i * memmap[VIRT_VIRTIO].size,
352
0x0, memmap[VIRT_VIRTIO].size);
353
- qemu_fdt_setprop_cell(fdt, nodename, "interrupt-parent", plic_phandle);
354
- qemu_fdt_setprop_cell(fdt, nodename, "interrupts", VIRTIO_IRQ + i);
355
- g_free(nodename);
356
+ qemu_fdt_setprop_cell(fdt, name, "interrupt-parent",
357
+ plic_virtio_phandle);
358
+ qemu_fdt_setprop_cell(fdt, name, "interrupts", VIRTIO_IRQ + i);
359
+ g_free(name);
360
}
177
}
361
178
362
- nodename = g_strdup_printf("/soc/pci@%lx",
179
+ if (virt_use_kvm_aia(s)) {
363
+ name = g_strdup_printf("/soc/pci@%lx",
180
+ kvm_riscv_aia_create(machine, IMSIC_MMIO_GROUP_MIN_SHIFT,
364
(long) memmap[VIRT_PCIE_ECAM].base);
181
+ VIRT_IRQCHIP_NUM_SOURCES, VIRT_IRQCHIP_NUM_MSIS,
365
- qemu_fdt_add_subnode(fdt, nodename);
182
+ memmap[VIRT_APLIC_S].base,
366
- qemu_fdt_setprop_cell(fdt, nodename, "#address-cells",
183
+ memmap[VIRT_IMSIC_S].base,
367
- FDT_PCI_ADDR_CELLS);
184
+ s->aia_guests);
368
- qemu_fdt_setprop_cell(fdt, nodename, "#interrupt-cells",
369
- FDT_PCI_INT_CELLS);
370
- qemu_fdt_setprop_cell(fdt, nodename, "#size-cells", 0x2);
371
- qemu_fdt_setprop_string(fdt, nodename, "compatible",
372
- "pci-host-ecam-generic");
373
- qemu_fdt_setprop_string(fdt, nodename, "device_type", "pci");
374
- qemu_fdt_setprop_cell(fdt, nodename, "linux,pci-domain", 0);
375
- qemu_fdt_setprop_cells(fdt, nodename, "bus-range", 0,
376
- memmap[VIRT_PCIE_ECAM].size /
377
- PCIE_MMCFG_SIZE_MIN - 1);
378
- qemu_fdt_setprop(fdt, nodename, "dma-coherent", NULL, 0);
379
- qemu_fdt_setprop_cells(fdt, nodename, "reg", 0, memmap[VIRT_PCIE_ECAM].base,
380
- 0, memmap[VIRT_PCIE_ECAM].size);
381
- qemu_fdt_setprop_sized_cells(fdt, nodename, "ranges",
382
+ qemu_fdt_add_subnode(fdt, name);
383
+ qemu_fdt_setprop_cell(fdt, name, "#address-cells", FDT_PCI_ADDR_CELLS);
384
+ qemu_fdt_setprop_cell(fdt, name, "#interrupt-cells", FDT_PCI_INT_CELLS);
385
+ qemu_fdt_setprop_cell(fdt, name, "#size-cells", 0x2);
386
+ qemu_fdt_setprop_string(fdt, name, "compatible", "pci-host-ecam-generic");
387
+ qemu_fdt_setprop_string(fdt, name, "device_type", "pci");
388
+ qemu_fdt_setprop_cell(fdt, name, "linux,pci-domain", 0);
389
+ qemu_fdt_setprop_cells(fdt, name, "bus-range", 0,
390
+ memmap[VIRT_PCIE_ECAM].size / PCIE_MMCFG_SIZE_MIN - 1);
391
+ qemu_fdt_setprop(fdt, name, "dma-coherent", NULL, 0);
392
+ qemu_fdt_setprop_cells(fdt, name, "reg", 0,
393
+ memmap[VIRT_PCIE_ECAM].base, 0, memmap[VIRT_PCIE_ECAM].size);
394
+ qemu_fdt_setprop_sized_cells(fdt, name, "ranges",
395
1, FDT_PCI_RANGE_IOPORT, 2, 0,
396
2, memmap[VIRT_PCIE_PIO].base, 2, memmap[VIRT_PCIE_PIO].size,
397
1, FDT_PCI_RANGE_MMIO,
398
2, memmap[VIRT_PCIE_MMIO].base,
399
2, memmap[VIRT_PCIE_MMIO].base, 2, memmap[VIRT_PCIE_MMIO].size);
400
- create_pcie_irq_map(fdt, nodename, plic_phandle);
401
- g_free(nodename);
402
+ create_pcie_irq_map(fdt, name, plic_pcie_phandle);
403
+ g_free(name);
404
405
test_phandle = phandle++;
406
- nodename = g_strdup_printf("/test@%lx",
407
+ name = g_strdup_printf("/soc/test@%lx",
408
(long)memmap[VIRT_TEST].base);
409
- qemu_fdt_add_subnode(fdt, nodename);
410
+ qemu_fdt_add_subnode(fdt, name);
411
{
412
const char compat[] = "sifive,test1\0sifive,test0\0syscon";
413
- qemu_fdt_setprop(fdt, nodename, "compatible", compat, sizeof(compat));
414
+ qemu_fdt_setprop(fdt, name, "compatible", compat, sizeof(compat));
415
}
416
- qemu_fdt_setprop_cells(fdt, nodename, "reg",
417
+ qemu_fdt_setprop_cells(fdt, name, "reg",
418
0x0, memmap[VIRT_TEST].base,
419
0x0, memmap[VIRT_TEST].size);
420
- qemu_fdt_setprop_cell(fdt, nodename, "phandle", test_phandle);
421
- test_phandle = qemu_fdt_get_phandle(fdt, nodename);
422
- g_free(nodename);
423
-
424
- nodename = g_strdup_printf("/reboot");
425
- qemu_fdt_add_subnode(fdt, nodename);
426
- qemu_fdt_setprop_string(fdt, nodename, "compatible", "syscon-reboot");
427
- qemu_fdt_setprop_cell(fdt, nodename, "regmap", test_phandle);
428
- qemu_fdt_setprop_cell(fdt, nodename, "offset", 0x0);
429
- qemu_fdt_setprop_cell(fdt, nodename, "value", FINISHER_RESET);
430
- g_free(nodename);
431
-
432
- nodename = g_strdup_printf("/poweroff");
433
- qemu_fdt_add_subnode(fdt, nodename);
434
- qemu_fdt_setprop_string(fdt, nodename, "compatible", "syscon-poweroff");
435
- qemu_fdt_setprop_cell(fdt, nodename, "regmap", test_phandle);
436
- qemu_fdt_setprop_cell(fdt, nodename, "offset", 0x0);
437
- qemu_fdt_setprop_cell(fdt, nodename, "value", FINISHER_PASS);
438
- g_free(nodename);
439
-
440
- nodename = g_strdup_printf("/uart@%lx",
441
- (long)memmap[VIRT_UART0].base);
442
- qemu_fdt_add_subnode(fdt, nodename);
443
- qemu_fdt_setprop_string(fdt, nodename, "compatible", "ns16550a");
444
- qemu_fdt_setprop_cells(fdt, nodename, "reg",
445
+ qemu_fdt_setprop_cell(fdt, name, "phandle", test_phandle);
446
+ test_phandle = qemu_fdt_get_phandle(fdt, name);
447
+ g_free(name);
448
+
449
+ name = g_strdup_printf("/soc/reboot");
450
+ qemu_fdt_add_subnode(fdt, name);
451
+ qemu_fdt_setprop_string(fdt, name, "compatible", "syscon-reboot");
452
+ qemu_fdt_setprop_cell(fdt, name, "regmap", test_phandle);
453
+ qemu_fdt_setprop_cell(fdt, name, "offset", 0x0);
454
+ qemu_fdt_setprop_cell(fdt, name, "value", FINISHER_RESET);
455
+ g_free(name);
456
+
457
+ name = g_strdup_printf("/soc/poweroff");
458
+ qemu_fdt_add_subnode(fdt, name);
459
+ qemu_fdt_setprop_string(fdt, name, "compatible", "syscon-poweroff");
460
+ qemu_fdt_setprop_cell(fdt, name, "regmap", test_phandle);
461
+ qemu_fdt_setprop_cell(fdt, name, "offset", 0x0);
462
+ qemu_fdt_setprop_cell(fdt, name, "value", FINISHER_PASS);
463
+ g_free(name);
464
+
465
+ name = g_strdup_printf("/soc/uart@%lx", (long)memmap[VIRT_UART0].base);
466
+ qemu_fdt_add_subnode(fdt, name);
467
+ qemu_fdt_setprop_string(fdt, name, "compatible", "ns16550a");
468
+ qemu_fdt_setprop_cells(fdt, name, "reg",
469
0x0, memmap[VIRT_UART0].base,
470
0x0, memmap[VIRT_UART0].size);
471
- qemu_fdt_setprop_cell(fdt, nodename, "clock-frequency", 3686400);
472
- qemu_fdt_setprop_cell(fdt, nodename, "interrupt-parent", plic_phandle);
473
- qemu_fdt_setprop_cell(fdt, nodename, "interrupts", UART0_IRQ);
474
+ qemu_fdt_setprop_cell(fdt, name, "clock-frequency", 3686400);
475
+ qemu_fdt_setprop_cell(fdt, name, "interrupt-parent", plic_mmio_phandle);
476
+ qemu_fdt_setprop_cell(fdt, name, "interrupts", UART0_IRQ);
477
478
qemu_fdt_add_subnode(fdt, "/chosen");
479
- qemu_fdt_setprop_string(fdt, "/chosen", "stdout-path", nodename);
480
+ qemu_fdt_setprop_string(fdt, "/chosen", "stdout-path", name);
481
if (cmdline) {
482
qemu_fdt_setprop_string(fdt, "/chosen", "bootargs", cmdline);
483
}
484
- g_free(nodename);
485
-
486
- nodename = g_strdup_printf("/rtc@%lx",
487
- (long)memmap[VIRT_RTC].base);
488
- qemu_fdt_add_subnode(fdt, nodename);
489
- qemu_fdt_setprop_string(fdt, nodename, "compatible",
490
- "google,goldfish-rtc");
491
- qemu_fdt_setprop_cells(fdt, nodename, "reg",
492
+ g_free(name);
493
+
494
+ name = g_strdup_printf("/soc/rtc@%lx", (long)memmap[VIRT_RTC].base);
495
+ qemu_fdt_add_subnode(fdt, name);
496
+ qemu_fdt_setprop_string(fdt, name, "compatible", "google,goldfish-rtc");
497
+ qemu_fdt_setprop_cells(fdt, name, "reg",
498
0x0, memmap[VIRT_RTC].base,
499
0x0, memmap[VIRT_RTC].size);
500
- qemu_fdt_setprop_cell(fdt, nodename, "interrupt-parent", plic_phandle);
501
- qemu_fdt_setprop_cell(fdt, nodename, "interrupts", RTC_IRQ);
502
- g_free(nodename);
503
-
504
- nodename = g_strdup_printf("/flash@%" PRIx64, flashbase);
505
- qemu_fdt_add_subnode(s->fdt, nodename);
506
- qemu_fdt_setprop_string(s->fdt, nodename, "compatible", "cfi-flash");
507
- qemu_fdt_setprop_sized_cells(s->fdt, nodename, "reg",
508
+ qemu_fdt_setprop_cell(fdt, name, "interrupt-parent", plic_mmio_phandle);
509
+ qemu_fdt_setprop_cell(fdt, name, "interrupts", RTC_IRQ);
510
+ g_free(name);
511
+
512
+ name = g_strdup_printf("/soc/flash@%" PRIx64, flashbase);
513
+ qemu_fdt_add_subnode(s->fdt, name);
514
+ qemu_fdt_setprop_string(s->fdt, name, "compatible", "cfi-flash");
515
+ qemu_fdt_setprop_sized_cells(s->fdt, name, "reg",
516
2, flashbase, 2, flashsize,
517
2, flashbase + flashsize, 2, flashsize);
518
- qemu_fdt_setprop_cell(s->fdt, nodename, "bank-width", 4);
519
- g_free(nodename);
520
+ qemu_fdt_setprop_cell(s->fdt, name, "bank-width", 4);
521
+ g_free(name);
522
}
523
524
-
525
static inline DeviceState *gpex_pcie_init(MemoryRegion *sys_mem,
526
hwaddr ecam_base, hwaddr ecam_size,
527
hwaddr mmio_base, hwaddr mmio_size,
528
@@ -XXX,XX +XXX,XX @@ static void virt_machine_init(MachineState *machine)
529
MemoryRegion *system_memory = get_system_memory();
530
MemoryRegion *main_mem = g_new(MemoryRegion, 1);
531
MemoryRegion *mask_rom = g_new(MemoryRegion, 1);
532
- char *plic_hart_config;
533
+ char *plic_hart_config, *soc_name;
534
size_t plic_hart_config_len;
535
target_ulong start_addr = memmap[VIRT_DRAM].base;
536
uint32_t fdt_load_addr;
537
uint64_t kernel_entry;
538
- int i;
539
- unsigned int smp_cpus = machine->smp.cpus;
540
+ DeviceState *mmio_plic, *virtio_plic, *pcie_plic;
541
+ int i, j, base_hartid, hart_count;
542
543
- /* Initialize SOC */
544
- object_initialize_child(OBJECT(machine), "soc", &s->soc,
545
- TYPE_RISCV_HART_ARRAY);
546
- object_property_set_str(OBJECT(&s->soc), "cpu-type", machine->cpu_type,
547
- &error_abort);
548
- object_property_set_int(OBJECT(&s->soc), "num-harts", smp_cpus,
549
- &error_abort);
550
- sysbus_realize(SYS_BUS_DEVICE(&s->soc), &error_abort);
551
+ /* Check socket count limit */
552
+ if (VIRT_SOCKETS_MAX < riscv_socket_count(machine)) {
553
+ error_report("number of sockets/nodes should be less than %d",
554
+ VIRT_SOCKETS_MAX);
555
+ exit(1);
556
+ }
185
+ }
557
+
186
+
558
+ /* Initialize sockets */
187
if (riscv_is_32bit(&s->soc[0])) {
559
+ mmio_plic = virtio_plic = pcie_plic = NULL;
188
#if HOST_LONG_BITS == 64
560
+ for (i = 0; i < riscv_socket_count(machine); i++) {
189
/* limit RAM size in a 32-bit system */
561
+ if (!riscv_socket_check_hartids(machine, i)) {
562
+ error_report("discontinuous hartids in socket%d", i);
563
+ exit(1);
564
+ }
565
+
566
+ base_hartid = riscv_socket_first_hartid(machine, i);
567
+ if (base_hartid < 0) {
568
+ error_report("can't find hartid base for socket%d", i);
569
+ exit(1);
570
+ }
571
+
572
+ hart_count = riscv_socket_hart_count(machine, i);
573
+ if (hart_count < 0) {
574
+ error_report("can't find hart count for socket%d", i);
575
+ exit(1);
576
+ }
577
+
578
+ soc_name = g_strdup_printf("soc%d", i);
579
+ object_initialize_child(OBJECT(machine), soc_name, &s->soc[i],
580
+ TYPE_RISCV_HART_ARRAY);
581
+ g_free(soc_name);
582
+ object_property_set_str(OBJECT(&s->soc[i]), "cpu-type",
583
+ machine->cpu_type, &error_abort);
584
+ object_property_set_int(OBJECT(&s->soc[i]), "hartid-base",
585
+ base_hartid, &error_abort);
586
+ object_property_set_int(OBJECT(&s->soc[i]), "num-harts",
587
+ hart_count, &error_abort);
588
+ sysbus_realize(SYS_BUS_DEVICE(&s->soc[i]), &error_abort);
589
+
590
+ /* Per-socket CLINT */
591
+ sifive_clint_create(
592
+ memmap[VIRT_CLINT].base + i * memmap[VIRT_CLINT].size,
593
+ memmap[VIRT_CLINT].size, base_hartid, hart_count,
594
+ SIFIVE_SIP_BASE, SIFIVE_TIMECMP_BASE, SIFIVE_TIME_BASE, true);
595
+
596
+ /* Per-socket PLIC hart topology configuration string */
597
+ plic_hart_config_len =
598
+ (strlen(VIRT_PLIC_HART_CONFIG) + 1) * hart_count;
599
+ plic_hart_config = g_malloc0(plic_hart_config_len);
600
+ for (j = 0; j < hart_count; j++) {
601
+ if (j != 0) {
602
+ strncat(plic_hart_config, ",", plic_hart_config_len);
603
+ }
604
+ strncat(plic_hart_config, VIRT_PLIC_HART_CONFIG,
605
+ plic_hart_config_len);
606
+ plic_hart_config_len -= (strlen(VIRT_PLIC_HART_CONFIG) + 1);
607
+ }
608
+
609
+ /* Per-socket PLIC */
610
+ s->plic[i] = sifive_plic_create(
611
+ memmap[VIRT_PLIC].base + i * memmap[VIRT_PLIC].size,
612
+ plic_hart_config, base_hartid,
613
+ VIRT_PLIC_NUM_SOURCES,
614
+ VIRT_PLIC_NUM_PRIORITIES,
615
+ VIRT_PLIC_PRIORITY_BASE,
616
+ VIRT_PLIC_PENDING_BASE,
617
+ VIRT_PLIC_ENABLE_BASE,
618
+ VIRT_PLIC_ENABLE_STRIDE,
619
+ VIRT_PLIC_CONTEXT_BASE,
620
+ VIRT_PLIC_CONTEXT_STRIDE,
621
+ memmap[VIRT_PLIC].size);
622
+ g_free(plic_hart_config);
623
+
624
+ /* Try to use different PLIC instance based device type */
625
+ if (i == 0) {
626
+ mmio_plic = s->plic[i];
627
+ virtio_plic = s->plic[i];
628
+ pcie_plic = s->plic[i];
629
+ }
630
+ if (i == 1) {
631
+ virtio_plic = s->plic[i];
632
+ pcie_plic = s->plic[i];
633
+ }
634
+ if (i == 2) {
635
+ pcie_plic = s->plic[i];
636
+ }
637
+ }
638
639
/* register system main memory (actual RAM) */
640
memory_region_init_ram(main_mem, NULL, "riscv_virt_board.ram",
641
@@ -XXX,XX +XXX,XX @@ static void virt_machine_init(MachineState *machine)
642
virt_memmap[VIRT_MROM].size, kernel_entry,
643
fdt_load_addr, s->fdt);
644
645
- /* create PLIC hart topology configuration string */
646
- plic_hart_config_len = (strlen(VIRT_PLIC_HART_CONFIG) + 1) * smp_cpus;
647
- plic_hart_config = g_malloc0(plic_hart_config_len);
648
- for (i = 0; i < smp_cpus; i++) {
649
- if (i != 0) {
650
- strncat(plic_hart_config, ",", plic_hart_config_len);
651
- }
652
- strncat(plic_hart_config, VIRT_PLIC_HART_CONFIG, plic_hart_config_len);
653
- plic_hart_config_len -= (strlen(VIRT_PLIC_HART_CONFIG) + 1);
654
- }
655
-
656
- /* MMIO */
657
- s->plic = sifive_plic_create(memmap[VIRT_PLIC].base,
658
- plic_hart_config, 0,
659
- VIRT_PLIC_NUM_SOURCES,
660
- VIRT_PLIC_NUM_PRIORITIES,
661
- VIRT_PLIC_PRIORITY_BASE,
662
- VIRT_PLIC_PENDING_BASE,
663
- VIRT_PLIC_ENABLE_BASE,
664
- VIRT_PLIC_ENABLE_STRIDE,
665
- VIRT_PLIC_CONTEXT_BASE,
666
- VIRT_PLIC_CONTEXT_STRIDE,
667
- memmap[VIRT_PLIC].size);
668
- sifive_clint_create(memmap[VIRT_CLINT].base,
669
- memmap[VIRT_CLINT].size, 0, smp_cpus,
670
- SIFIVE_SIP_BASE, SIFIVE_TIMECMP_BASE, SIFIVE_TIME_BASE, true);
671
+ /* SiFive Test MMIO device */
672
sifive_test_create(memmap[VIRT_TEST].base);
673
674
+ /* VirtIO MMIO devices */
675
for (i = 0; i < VIRTIO_COUNT; i++) {
676
sysbus_create_simple("virtio-mmio",
677
memmap[VIRT_VIRTIO].base + i * memmap[VIRT_VIRTIO].size,
678
- qdev_get_gpio_in(DEVICE(s->plic), VIRTIO_IRQ + i));
679
+ qdev_get_gpio_in(DEVICE(virtio_plic), VIRTIO_IRQ + i));
680
}
681
682
gpex_pcie_init(system_memory,
683
@@ -XXX,XX +XXX,XX @@ static void virt_machine_init(MachineState *machine)
684
memmap[VIRT_PCIE_MMIO].base,
685
memmap[VIRT_PCIE_MMIO].size,
686
memmap[VIRT_PCIE_PIO].base,
687
- DEVICE(s->plic), true);
688
+ DEVICE(pcie_plic), true);
689
690
serial_mm_init(system_memory, memmap[VIRT_UART0].base,
691
- 0, qdev_get_gpio_in(DEVICE(s->plic), UART0_IRQ), 399193,
692
+ 0, qdev_get_gpio_in(DEVICE(mmio_plic), UART0_IRQ), 399193,
693
serial_hd(0), DEVICE_LITTLE_ENDIAN);
694
695
sysbus_create_simple("goldfish_rtc", memmap[VIRT_RTC].base,
696
- qdev_get_gpio_in(DEVICE(s->plic), RTC_IRQ));
697
+ qdev_get_gpio_in(DEVICE(mmio_plic), RTC_IRQ));
698
699
virt_flash_create(s);
700
701
@@ -XXX,XX +XXX,XX @@ static void virt_machine_init(MachineState *machine)
702
drive_get(IF_PFLASH, 0, i));
703
}
704
virt_flash_map(s, system_memory);
705
-
706
- g_free(plic_hart_config);
707
}
708
709
static void virt_machine_instance_init(Object *obj)
710
@@ -XXX,XX +XXX,XX @@ static void virt_machine_class_init(ObjectClass *oc, void *data)
711
712
mc->desc = "RISC-V VirtIO board";
713
mc->init = virt_machine_init;
714
- mc->max_cpus = 8;
715
+ mc->max_cpus = VIRT_CPUS_MAX;
716
mc->default_cpu_type = VIRT_CPU;
717
mc->pci_allow_0_address = true;
718
+ mc->possible_cpu_arch_ids = riscv_numa_possible_cpu_arch_ids;
719
+ mc->cpu_index_to_instance_props = riscv_numa_cpu_index_to_props;
720
+ mc->get_default_cpu_node_id = riscv_numa_get_default_cpu_node_id;
721
+ mc->numa_mem_supported = true;
722
}
723
724
static const TypeInfo virt_machine_typeinfo = {
725
--
190
--
726
2.28.0
191
2.41.0
727
728
diff view generated by jsdifflib
New patch
1
From: Conor Dooley <conor.dooley@microchip.com>
1
2
3
On a dtb dumped from the virt machine, dt-validate complains:
4
soc: pmu: {'riscv,event-to-mhpmcounters': [[1, 1, 524281], [2, 2, 524284], [65561, 65561, 524280], [65563, 65563, 524280], [65569, 65569, 524280]], 'compatible': ['riscv,pmu']} should not be valid under {'type': 'object'}
5
from schema $id: http://devicetree.org/schemas/simple-bus.yaml#
6
That's pretty cryptic, but running the dtb back through dtc produces
7
something a lot more reasonable:
8
Warning (simple_bus_reg): /soc/pmu: missing or empty reg/ranges property
9
10
Moving the riscv,pmu node out of the soc bus solves the problem.
11
12
Signed-off-by: Conor Dooley <conor.dooley@microchip.com>
13
Acked-by: Alistair Francis <alistair.francis@wdc.com>
14
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
15
Message-ID: <20230727-groom-decline-2c57ce42841c@spud>
16
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
17
---
18
hw/riscv/virt.c | 2 +-
19
1 file changed, 1 insertion(+), 1 deletion(-)
20
21
diff --git a/hw/riscv/virt.c b/hw/riscv/virt.c
22
index XXXXXXX..XXXXXXX 100644
23
--- a/hw/riscv/virt.c
24
+++ b/hw/riscv/virt.c
25
@@ -XXX,XX +XXX,XX @@ static void create_fdt_pmu(RISCVVirtState *s)
26
MachineState *ms = MACHINE(s);
27
RISCVCPU hart = s->soc[0].harts[0];
28
29
- pmu_name = g_strdup_printf("/soc/pmu");
30
+ pmu_name = g_strdup_printf("/pmu");
31
qemu_fdt_add_subnode(ms->fdt, pmu_name);
32
qemu_fdt_setprop_string(ms->fdt, pmu_name, "compatible", "riscv,pmu");
33
riscv_pmu_generate_fdt_node(ms->fdt, hart.cfg.pmu_num, pmu_name);
34
--
35
2.41.0
diff view generated by jsdifflib
1
From: Weiwei Li <liweiwei@iscas.ac.cn>
2
3
The Svadu specification updated the name of the *envcfg bit from
4
HADE to ADUE.
5
6
Signed-off-by: Weiwei Li <liweiwei@iscas.ac.cn>
7
Signed-off-by: Junqiang Wang <wangjunqiang@iscas.ac.cn>
8
Reviewed-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
9
Message-ID: <20230816141916.66898-1-liweiwei@iscas.ac.cn>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
10
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: 9308432988946de550a68524ed76e4b8683f10e2.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <9308432988946de550a68524ed76e4b8683f10e2.1597259519.git.alistair.francis@wdc.com>
4
---
11
---
5
target/riscv/cpu_bits.h | 5 +++--
12
target/riscv/cpu_bits.h | 8 ++++----
6
target/riscv/cpu_helper.c | 24 ++++++++++++++++++++----
13
target/riscv/cpu.c | 4 ++--
7
target/riscv/csr.c | 6 +++---
14
target/riscv/cpu_helper.c | 6 +++---
8
3 files changed, 26 insertions(+), 9 deletions(-)
15
target/riscv/csr.c | 12 ++++++------
16
4 files changed, 15 insertions(+), 15 deletions(-)
9
17
10
diff --git a/target/riscv/cpu_bits.h b/target/riscv/cpu_bits.h
18
diff --git a/target/riscv/cpu_bits.h b/target/riscv/cpu_bits.h
11
index XXXXXXX..XXXXXXX 100644
19
index XXXXXXX..XXXXXXX 100644
12
--- a/target/riscv/cpu_bits.h
20
--- a/target/riscv/cpu_bits.h
13
+++ b/target/riscv/cpu_bits.h
21
+++ b/target/riscv/cpu_bits.h
14
@@ -XXX,XX +XXX,XX @@
22
@@ -XXX,XX +XXX,XX @@ typedef enum RISCVException {
15
#define MSTATUS_TW 0x20000000 /* since: priv-1.10 */
23
#define MENVCFG_CBIE (3UL << 4)
16
#define MSTATUS_TSR 0x40000000 /* since: priv-1.10 */
24
#define MENVCFG_CBCFE BIT(6)
17
#if defined(TARGET_RISCV64)
25
#define MENVCFG_CBZE BIT(7)
18
-#define MSTATUS_MTL 0x4000000000ULL
26
-#define MENVCFG_HADE (1ULL << 61)
19
+#define MSTATUS_GVA 0x4000000000ULL
27
+#define MENVCFG_ADUE (1ULL << 61)
20
#define MSTATUS_MPV 0x8000000000ULL
28
#define MENVCFG_PBMTE (1ULL << 62)
21
#elif defined(TARGET_RISCV32)
29
#define MENVCFG_STCE (1ULL << 63)
22
-#define MSTATUS_MTL 0x00000040
30
23
+#define MSTATUS_GVA 0x00000040
31
/* For RV32 */
24
#define MSTATUS_MPV 0x00000080
32
-#define MENVCFGH_HADE BIT(29)
25
#endif
33
+#define MENVCFGH_ADUE BIT(29)
26
34
#define MENVCFGH_PBMTE BIT(30)
27
@@ -XXX,XX +XXX,XX @@
35
#define MENVCFGH_STCE BIT(31)
28
#define HSTATUS_VTVM 0x00100000
36
29
#define HSTATUS_VTSR 0x00400000
37
@@ -XXX,XX +XXX,XX @@ typedef enum RISCVException {
30
#define HSTATUS_HU 0x00000200
38
#define HENVCFG_CBIE MENVCFG_CBIE
31
+#define HSTATUS_GVA 0x00000040
39
#define HENVCFG_CBCFE MENVCFG_CBCFE
32
40
#define HENVCFG_CBZE MENVCFG_CBZE
33
#define HSTATUS32_WPRI 0xFF8FF87E
41
-#define HENVCFG_HADE MENVCFG_HADE
34
#define HSTATUS64_WPRI 0xFFFFFFFFFF8FF87EULL
42
+#define HENVCFG_ADUE MENVCFG_ADUE
43
#define HENVCFG_PBMTE MENVCFG_PBMTE
44
#define HENVCFG_STCE MENVCFG_STCE
45
46
/* For RV32 */
47
-#define HENVCFGH_HADE MENVCFGH_HADE
48
+#define HENVCFGH_ADUE MENVCFGH_ADUE
49
#define HENVCFGH_PBMTE MENVCFGH_PBMTE
50
#define HENVCFGH_STCE MENVCFGH_STCE
51
52
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
53
index XXXXXXX..XXXXXXX 100644
54
--- a/target/riscv/cpu.c
55
+++ b/target/riscv/cpu.c
56
@@ -XXX,XX +XXX,XX @@ static void riscv_cpu_reset_hold(Object *obj)
57
env->two_stage_lookup = false;
58
59
env->menvcfg = (cpu->cfg.ext_svpbmt ? MENVCFG_PBMTE : 0) |
60
- (cpu->cfg.ext_svadu ? MENVCFG_HADE : 0);
61
+ (cpu->cfg.ext_svadu ? MENVCFG_ADUE : 0);
62
env->henvcfg = (cpu->cfg.ext_svpbmt ? HENVCFG_PBMTE : 0) |
63
- (cpu->cfg.ext_svadu ? HENVCFG_HADE : 0);
64
+ (cpu->cfg.ext_svadu ? HENVCFG_ADUE : 0);
65
66
/* Initialized default priorities of local interrupts. */
67
for (i = 0; i < ARRAY_SIZE(env->miprio); i++) {
35
diff --git a/target/riscv/cpu_helper.c b/target/riscv/cpu_helper.c
68
diff --git a/target/riscv/cpu_helper.c b/target/riscv/cpu_helper.c
36
index XXXXXXX..XXXXXXX 100644
69
index XXXXXXX..XXXXXXX 100644
37
--- a/target/riscv/cpu_helper.c
70
--- a/target/riscv/cpu_helper.c
38
+++ b/target/riscv/cpu_helper.c
71
+++ b/target/riscv/cpu_helper.c
39
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_do_interrupt(CPUState *cs)
72
@@ -XXX,XX +XXX,XX @@ static int get_physical_address(CPURISCVState *env, hwaddr *physical,
40
if (riscv_has_ext(env, RVH)) {
73
}
41
target_ulong hdeleg = async ? env->hideleg : env->hedeleg;
74
42
75
bool pbmte = env->menvcfg & MENVCFG_PBMTE;
43
+ if ((riscv_cpu_virt_enabled(env) ||
76
- bool hade = env->menvcfg & MENVCFG_HADE;
44
+ riscv_cpu_two_stage_lookup(env)) && tval) {
77
+ bool adue = env->menvcfg & MENVCFG_ADUE;
45
+ /*
78
46
+ * If we are writing a guest virtual address to stval, set
79
if (first_stage && two_stage && env->virt_enabled) {
47
+ * this to 1. If we are trapping to VS we will set this to 0
80
pbmte = pbmte && (env->henvcfg & HENVCFG_PBMTE);
48
+ * later.
81
- hade = hade && (env->henvcfg & HENVCFG_HADE);
49
+ */
82
+ adue = adue && (env->henvcfg & HENVCFG_ADUE);
50
+ env->hstatus = set_field(env->hstatus, HSTATUS_GVA, 1);
83
}
51
+ } else {
84
52
+ /* For other HS-mode traps, we set this to 0. */
85
int ptshift = (levels - 1) * ptidxbits;
53
+ env->hstatus = set_field(env->hstatus, HSTATUS_GVA, 0);
86
@@ -XXX,XX +XXX,XX @@ restart:
54
+ }
87
55
+
88
/* Page table updates need to be atomic with MTTCG enabled */
56
if (riscv_cpu_virt_enabled(env) && ((hdeleg >> cause) & 1) &&
89
if (updated_pte != pte && !is_debug) {
57
!force_hs_execp) {
90
- if (!hade) {
58
/*
91
+ if (!adue) {
59
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_do_interrupt(CPUState *cs)
92
return TRANSLATE_FAIL;
60
cause == IRQ_VS_EXT)
93
}
61
cause = cause - 1;
94
62
/* Trap to VS mode */
63
+ env->hstatus = set_field(env->hstatus, HSTATUS_GVA, 0);
64
} else if (riscv_cpu_virt_enabled(env)) {
65
/* Trap into HS mode, from virt */
66
riscv_cpu_swap_hypervisor_regs(env);
67
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_do_interrupt(CPUState *cs)
68
#ifdef TARGET_RISCV32
69
env->mstatush = set_field(env->mstatush, MSTATUS_MPV,
70
riscv_cpu_virt_enabled(env));
71
- env->mstatush = set_field(env->mstatush, MSTATUS_MTL,
72
- riscv_cpu_force_hs_excep_enabled(env));
73
+ if (riscv_cpu_virt_enabled(env) && tval) {
74
+ env->mstatush = set_field(env->mstatush, MSTATUS_GVA, 1);
75
+ }
76
#else
77
env->mstatus = set_field(env->mstatus, MSTATUS_MPV,
78
riscv_cpu_virt_enabled(env));
79
- env->mstatus = set_field(env->mstatus, MSTATUS_MTL,
80
- riscv_cpu_force_hs_excep_enabled(env));
81
+ if (riscv_cpu_virt_enabled(env) && tval) {
82
+ env->mstatus = set_field(env->mstatus, MSTATUS_GVA, 1);
83
+ }
84
#endif
85
86
mtval2 = env->guest_phys_fault_addr;
87
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
95
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
88
index XXXXXXX..XXXXXXX 100644
96
index XXXXXXX..XXXXXXX 100644
89
--- a/target/riscv/csr.c
97
--- a/target/riscv/csr.c
90
+++ b/target/riscv/csr.c
98
+++ b/target/riscv/csr.c
91
@@ -XXX,XX +XXX,XX @@ static int write_mstatus(CPURISCVState *env, int csrno, target_ulong val)
99
@@ -XXX,XX +XXX,XX @@ static RISCVException write_menvcfg(CPURISCVState *env, int csrno,
92
MSTATUS_TW;
100
if (riscv_cpu_mxl(env) == MXL_RV64) {
93
#if defined(TARGET_RISCV64)
101
mask |= (cfg->ext_svpbmt ? MENVCFG_PBMTE : 0) |
94
/*
102
(cfg->ext_sstc ? MENVCFG_STCE : 0) |
95
- * RV32: MPV and MTL are not in mstatus. The current plan is to
103
- (cfg->ext_svadu ? MENVCFG_HADE : 0);
96
+ * RV32: MPV and GVA are not in mstatus. The current plan is to
104
+ (cfg->ext_svadu ? MENVCFG_ADUE : 0);
97
* add them to mstatush. For now, we just don't support it.
105
}
106
env->menvcfg = (env->menvcfg & ~mask) | (val & mask);
107
108
@@ -XXX,XX +XXX,XX @@ static RISCVException write_menvcfgh(CPURISCVState *env, int csrno,
109
const RISCVCPUConfig *cfg = riscv_cpu_cfg(env);
110
uint64_t mask = (cfg->ext_svpbmt ? MENVCFG_PBMTE : 0) |
111
(cfg->ext_sstc ? MENVCFG_STCE : 0) |
112
- (cfg->ext_svadu ? MENVCFG_HADE : 0);
113
+ (cfg->ext_svadu ? MENVCFG_ADUE : 0);
114
uint64_t valh = (uint64_t)val << 32;
115
116
env->menvcfg = (env->menvcfg & ~mask) | (valh & mask);
117
@@ -XXX,XX +XXX,XX @@ static RISCVException read_henvcfg(CPURISCVState *env, int csrno,
118
* henvcfg.stce is read_only 0 when menvcfg.stce = 0
119
* henvcfg.hade is read_only 0 when menvcfg.hade = 0
98
*/
120
*/
99
- mask |= MSTATUS_MTL | MSTATUS_MPV;
121
- *val = env->henvcfg & (~(HENVCFG_PBMTE | HENVCFG_STCE | HENVCFG_HADE) |
100
+ mask |= MSTATUS_MPV | MSTATUS_GVA;
122
+ *val = env->henvcfg & (~(HENVCFG_PBMTE | HENVCFG_STCE | HENVCFG_ADUE) |
101
#endif
123
env->menvcfg);
102
124
return RISCV_EXCP_NONE;
103
mstatus = (mstatus & ~mask) | (val & mask);
125
}
104
@@ -XXX,XX +XXX,XX @@ static int write_mstatush(CPURISCVState *env, int csrno, target_ulong val)
126
@@ -XXX,XX +XXX,XX @@ static RISCVException write_henvcfg(CPURISCVState *env, int csrno,
105
tlb_flush(env_cpu(env));
106
}
127
}
107
128
108
- val &= MSTATUS_MPV | MSTATUS_MTL;
129
if (riscv_cpu_mxl(env) == MXL_RV64) {
109
+ val &= MSTATUS_MPV | MSTATUS_GVA;
130
- mask |= env->menvcfg & (HENVCFG_PBMTE | HENVCFG_STCE | HENVCFG_HADE);
110
131
+ mask |= env->menvcfg & (HENVCFG_PBMTE | HENVCFG_STCE | HENVCFG_ADUE);
111
env->mstatush = val;
132
}
133
134
env->henvcfg = (env->henvcfg & ~mask) | (val & mask);
135
@@ -XXX,XX +XXX,XX @@ static RISCVException read_henvcfgh(CPURISCVState *env, int csrno,
136
return ret;
137
}
138
139
- *val = (env->henvcfg & (~(HENVCFG_PBMTE | HENVCFG_STCE | HENVCFG_HADE) |
140
+ *val = (env->henvcfg & (~(HENVCFG_PBMTE | HENVCFG_STCE | HENVCFG_ADUE) |
141
env->menvcfg)) >> 32;
142
return RISCV_EXCP_NONE;
143
}
144
@@ -XXX,XX +XXX,XX @@ static RISCVException write_henvcfgh(CPURISCVState *env, int csrno,
145
target_ulong val)
146
{
147
uint64_t mask = env->menvcfg & (HENVCFG_PBMTE | HENVCFG_STCE |
148
- HENVCFG_HADE);
149
+ HENVCFG_ADUE);
150
uint64_t valh = (uint64_t)val << 32;
151
RISCVException ret;
112
152
113
--
153
--
114
2.28.0
154
2.41.0
115
116
diff view generated by jsdifflib
New patch
1
From: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
1
2
3
In the same emulated RISC-V host, the 'host' KVM CPU takes 4 times
4
longer to boot than the 'rv64' KVM CPU.
5
6
The reason is an unintended behavior of riscv_cpu_satp_mode_finalize()
7
when satp_mode.supported = 0, i.e. when cpu_init() does not set
8
satp_mode_max_supported(). satp_mode_max_from_map(map) does:
9
10
31 - __builtin_clz(map)
11
12
This means that, if satp_mode.supported = 0, satp_mode_supported_max
13
wil be '31 - 32'. But this is C, so satp_mode_supported_max will gladly
14
set it to UINT_MAX (4294967295). After that, if the user didn't set a
15
satp_mode, set_satp_mode_default_map(cpu) will make
16
17
cfg.satp_mode.map = cfg.satp_mode.supported
18
19
So satp_mode.map = 0. And then satp_mode_map_max will be set to
20
satp_mode_max_from_map(cpu->cfg.satp_mode.map), i.e. also UINT_MAX. The
21
guard "satp_mode_map_max > satp_mode_supported_max" doesn't protect us
22
here since both are UINT_MAX.
23
24
And finally we have 2 loops:
25
26
for (int i = satp_mode_map_max - 1; i >= 0; --i) {
27
28
Which are, in fact, 2 loops from UINT_MAX -1 to -1. This is where the
29
extra delay when booting the 'host' CPU is coming from.
30
31
Commit 43d1de32f8 already set a precedence for satp_mode.supported = 0
32
in a different manner. We're doing the same here. If supported == 0,
33
interpret as 'the CPU wants the OS to handle satp mode alone' and skip
34
satp_mode_finalize().
35
36
We'll also put a guard in satp_mode_max_from_map() to assert out if map
37
is 0 since the function is not ready to deal with it.
38
39
Cc: Alexandre Ghiti <alexghiti@rivosinc.com>
40
Fixes: 6f23aaeb9b ("riscv: Allow user to set the satp mode")
41
Signed-off-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
42
Reviewed-by: Andrew Jones <ajones@ventanamicro.com>
43
Message-ID: <20230817152903.694926-1-dbarboza@ventanamicro.com>
44
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
45
---
46
target/riscv/cpu.c | 23 ++++++++++++++++++++---
47
1 file changed, 20 insertions(+), 3 deletions(-)
48
49
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
50
index XXXXXXX..XXXXXXX 100644
51
--- a/target/riscv/cpu.c
52
+++ b/target/riscv/cpu.c
53
@@ -XXX,XX +XXX,XX @@ static uint8_t satp_mode_from_str(const char *satp_mode_str)
54
55
uint8_t satp_mode_max_from_map(uint32_t map)
56
{
57
+ /*
58
+ * 'map = 0' will make us return (31 - 32), which C will
59
+ * happily overflow to UINT_MAX. There's no good result to
60
+ * return if 'map = 0' (e.g. returning 0 will be ambiguous
61
+ * with the result for 'map = 1').
62
+ *
63
+ * Assert out if map = 0. Callers will have to deal with
64
+ * it outside of this function.
65
+ */
66
+ g_assert(map > 0);
67
+
68
/* map here has at least one bit set, so no problem with clz */
69
return 31 - __builtin_clz(map);
70
}
71
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_validate_set_extensions(RISCVCPU *cpu, Error **errp)
72
static void riscv_cpu_satp_mode_finalize(RISCVCPU *cpu, Error **errp)
73
{
74
bool rv32 = riscv_cpu_mxl(&cpu->env) == MXL_RV32;
75
- uint8_t satp_mode_map_max;
76
- uint8_t satp_mode_supported_max =
77
- satp_mode_max_from_map(cpu->cfg.satp_mode.supported);
78
+ uint8_t satp_mode_map_max, satp_mode_supported_max;
79
+
80
+ /* The CPU wants the OS to decide which satp mode to use */
81
+ if (cpu->cfg.satp_mode.supported == 0) {
82
+ return;
83
+ }
84
+
85
+ satp_mode_supported_max =
86
+ satp_mode_max_from_map(cpu->cfg.satp_mode.supported);
87
88
if (cpu->cfg.satp_mode.map == 0) {
89
if (cpu->cfg.satp_mode.init == 0) {
90
--
91
2.41.0
diff view generated by jsdifflib
New patch
1
From: Vineet Gupta <vineetg@rivosinc.com>
1
2
3
zicond is now codegen supported in both llvm and gcc.
4
5
This change allows seamless enabling/testing of zicond in downstream
6
projects. e.g. currently riscv-gnu-toolchain parses elf attributes
7
to create a cmdline for qemu but fails short of enabling it because of
8
the "x-" prefix.
9
10
Signed-off-by: Vineet Gupta <vineetg@rivosinc.com>
11
Message-ID: <20230808181715.436395-1-vineetg@rivosinc.com>
12
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
13
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
14
---
15
target/riscv/cpu.c | 2 +-
16
1 file changed, 1 insertion(+), 1 deletion(-)
17
18
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
19
index XXXXXXX..XXXXXXX 100644
20
--- a/target/riscv/cpu.c
21
+++ b/target/riscv/cpu.c
22
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
23
DEFINE_PROP_BOOL("zcf", RISCVCPU, cfg.ext_zcf, false),
24
DEFINE_PROP_BOOL("zcmp", RISCVCPU, cfg.ext_zcmp, false),
25
DEFINE_PROP_BOOL("zcmt", RISCVCPU, cfg.ext_zcmt, false),
26
+ DEFINE_PROP_BOOL("zicond", RISCVCPU, cfg.ext_zicond, false),
27
28
/* Vendor-specific custom extensions */
29
DEFINE_PROP_BOOL("xtheadba", RISCVCPU, cfg.ext_xtheadba, false),
30
@@ -XXX,XX +XXX,XX @@ static Property riscv_cpu_extensions[] = {
31
DEFINE_PROP_BOOL("xventanacondops", RISCVCPU, cfg.ext_XVentanaCondOps, false),
32
33
/* These are experimental so mark with 'x-' */
34
- DEFINE_PROP_BOOL("x-zicond", RISCVCPU, cfg.ext_zicond, false),
35
36
/* ePMP 0.9.3 */
37
DEFINE_PROP_BOOL("x-epmp", RISCVCPU, cfg.epmp, false),
38
--
39
2.41.0
diff view generated by jsdifflib
1
From: Anup Patel <anup.patel@wdc.com>
1
From: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
2
2
3
We extend PLIC emulation to allow multiple instances of PLIC in
3
A build with --enable-debug and without KVM will fail as follows:
4
a QEMU RISC-V machine. To achieve this, we remove first HART id
5
zero assumption from PLIC emulation.
6
4
7
Signed-off-by: Anup Patel <anup.patel@wdc.com>
5
/usr/bin/ld: libqemu-riscv64-softmmu.fa.p/hw_riscv_virt.c.o: in function `virt_machine_init':
8
Reviewed-by: Palmer Dabbelt <palmerdabbelt@google.com>
6
./qemu/build/../hw/riscv/virt.c:1465: undefined reference to `kvm_riscv_aia_create'
9
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
7
10
Message-Id: <20200616032229.766089-3-anup.patel@wdc.com>
8
This happens because the code block with "if virt_use_kvm_aia(s)" isn't
9
being ignored by the debug build, resulting in an undefined reference to
10
a KVM only function.
11
12
Add a 'kvm_enabled()' conditional together with virt_use_kvm_aia() will
13
make the compiler crop the kvm_riscv_aia_create() call entirely from a
14
non-KVM build. Note that adding the 'kvm_enabled()' conditional inside
15
virt_use_kvm_aia() won't fix the build because this function would need
16
to be inlined multiple times to make the compiler zero out the entire
17
block.
18
19
While we're at it, use kvm_enabled() in all instances where
20
virt_use_kvm_aia() is checked to allow the compiler to elide these other
21
kvm-only instances as well.
22
23
Suggested-by: Richard Henderson <richard.henderson@linaro.org>
24
Fixes: dbdb99948e ("target/riscv: select KVM AIA in riscv virt machine")
25
Signed-off-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
26
Reviewed-by: Andrew Jones <ajones@ventanamicro.com>
27
Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org>
28
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
29
Message-ID: <20230830133503.711138-2-dbarboza@ventanamicro.com>
11
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
30
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
12
---
31
---
13
include/hw/riscv/sifive_plic.h | 12 +++++++-----
32
hw/riscv/virt.c | 6 +++---
14
hw/riscv/sifive_e.c | 2 +-
33
1 file changed, 3 insertions(+), 3 deletions(-)
15
hw/riscv/sifive_plic.c | 24 +++++++++++++-----------
16
hw/riscv/sifive_u.c | 2 +-
17
hw/riscv/virt.c | 2 +-
18
5 files changed, 23 insertions(+), 19 deletions(-)
19
34
20
diff --git a/include/hw/riscv/sifive_plic.h b/include/hw/riscv/sifive_plic.h
21
index XXXXXXX..XXXXXXX 100644
22
--- a/include/hw/riscv/sifive_plic.h
23
+++ b/include/hw/riscv/sifive_plic.h
24
@@ -XXX,XX +XXX,XX @@ typedef struct SiFivePLICState {
25
/*< public >*/
26
MemoryRegion mmio;
27
uint32_t num_addrs;
28
+ uint32_t num_harts;
29
uint32_t bitfield_words;
30
PLICAddr *addr_config;
31
uint32_t *source_priority;
32
@@ -XXX,XX +XXX,XX @@ typedef struct SiFivePLICState {
33
34
/* config */
35
char *hart_config;
36
+ uint32_t hartid_base;
37
uint32_t num_sources;
38
uint32_t num_priorities;
39
uint32_t priority_base;
40
@@ -XXX,XX +XXX,XX @@ typedef struct SiFivePLICState {
41
} SiFivePLICState;
42
43
DeviceState *sifive_plic_create(hwaddr addr, char *hart_config,
44
- uint32_t num_sources, uint32_t num_priorities,
45
- uint32_t priority_base, uint32_t pending_base,
46
- uint32_t enable_base, uint32_t enable_stride,
47
- uint32_t context_base, uint32_t context_stride,
48
- uint32_t aperture_size);
49
+ uint32_t hartid_base, uint32_t num_sources,
50
+ uint32_t num_priorities, uint32_t priority_base,
51
+ uint32_t pending_base, uint32_t enable_base,
52
+ uint32_t enable_stride, uint32_t context_base,
53
+ uint32_t context_stride, uint32_t aperture_size);
54
55
#endif
56
diff --git a/hw/riscv/sifive_e.c b/hw/riscv/sifive_e.c
57
index XXXXXXX..XXXXXXX 100644
58
--- a/hw/riscv/sifive_e.c
59
+++ b/hw/riscv/sifive_e.c
60
@@ -XXX,XX +XXX,XX @@ static void sifive_e_soc_realize(DeviceState *dev, Error **errp)
61
62
/* MMIO */
63
s->plic = sifive_plic_create(memmap[SIFIVE_E_PLIC].base,
64
- (char *)SIFIVE_E_PLIC_HART_CONFIG,
65
+ (char *)SIFIVE_E_PLIC_HART_CONFIG, 0,
66
SIFIVE_E_PLIC_NUM_SOURCES,
67
SIFIVE_E_PLIC_NUM_PRIORITIES,
68
SIFIVE_E_PLIC_PRIORITY_BASE,
69
diff --git a/hw/riscv/sifive_plic.c b/hw/riscv/sifive_plic.c
70
index XXXXXXX..XXXXXXX 100644
71
--- a/hw/riscv/sifive_plic.c
72
+++ b/hw/riscv/sifive_plic.c
73
@@ -XXX,XX +XXX,XX @@ static const MemoryRegionOps sifive_plic_ops = {
74
75
static Property sifive_plic_properties[] = {
76
DEFINE_PROP_STRING("hart-config", SiFivePLICState, hart_config),
77
+ DEFINE_PROP_UINT32("hartid-base", SiFivePLICState, hartid_base, 0),
78
DEFINE_PROP_UINT32("num-sources", SiFivePLICState, num_sources, 0),
79
DEFINE_PROP_UINT32("num-priorities", SiFivePLICState, num_priorities, 0),
80
DEFINE_PROP_UINT32("priority-base", SiFivePLICState, priority_base, 0),
81
@@ -XXX,XX +XXX,XX @@ static void parse_hart_config(SiFivePLICState *plic)
82
}
83
hartid++;
84
85
- /* store hart/mode combinations */
86
plic->num_addrs = addrid;
87
+ plic->num_harts = hartid;
88
+
89
+ /* store hart/mode combinations */
90
plic->addr_config = g_new(PLICAddr, plic->num_addrs);
91
- addrid = 0, hartid = 0;
92
+ addrid = 0, hartid = plic->hartid_base;
93
p = plic->hart_config;
94
while ((c = *p++)) {
95
if (c == ',') {
96
@@ -XXX,XX +XXX,XX @@ static void sifive_plic_irq_request(void *opaque, int irq, int level)
97
98
static void sifive_plic_realize(DeviceState *dev, Error **errp)
99
{
100
- MachineState *ms = MACHINE(qdev_get_machine());
101
- unsigned int smp_cpus = ms->smp.cpus;
102
SiFivePLICState *plic = SIFIVE_PLIC(dev);
103
int i;
104
105
@@ -XXX,XX +XXX,XX @@ static void sifive_plic_realize(DeviceState *dev, Error **errp)
106
* lost a interrupt in the case a PLIC is attached. The SEIP bit must be
107
* hardware controlled when a PLIC is attached.
108
*/
109
- for (i = 0; i < smp_cpus; i++) {
110
- RISCVCPU *cpu = RISCV_CPU(qemu_get_cpu(i));
111
+ for (i = 0; i < plic->num_harts; i++) {
112
+ RISCVCPU *cpu = RISCV_CPU(qemu_get_cpu(plic->hartid_base + i));
113
if (riscv_cpu_claim_interrupts(cpu, MIP_SEIP) < 0) {
114
error_report("SEIP already claimed");
115
exit(1);
116
@@ -XXX,XX +XXX,XX @@ type_init(sifive_plic_register_types)
117
* Create PLIC device.
118
*/
119
DeviceState *sifive_plic_create(hwaddr addr, char *hart_config,
120
- uint32_t num_sources, uint32_t num_priorities,
121
- uint32_t priority_base, uint32_t pending_base,
122
- uint32_t enable_base, uint32_t enable_stride,
123
- uint32_t context_base, uint32_t context_stride,
124
- uint32_t aperture_size)
125
+ uint32_t hartid_base, uint32_t num_sources,
126
+ uint32_t num_priorities, uint32_t priority_base,
127
+ uint32_t pending_base, uint32_t enable_base,
128
+ uint32_t enable_stride, uint32_t context_base,
129
+ uint32_t context_stride, uint32_t aperture_size)
130
{
131
DeviceState *dev = qdev_new(TYPE_SIFIVE_PLIC);
132
assert(enable_stride == (enable_stride & -enable_stride));
133
assert(context_stride == (context_stride & -context_stride));
134
qdev_prop_set_string(dev, "hart-config", hart_config);
135
+ qdev_prop_set_uint32(dev, "hartid-base", hartid_base);
136
qdev_prop_set_uint32(dev, "num-sources", num_sources);
137
qdev_prop_set_uint32(dev, "num-priorities", num_priorities);
138
qdev_prop_set_uint32(dev, "priority-base", priority_base);
139
diff --git a/hw/riscv/sifive_u.c b/hw/riscv/sifive_u.c
140
index XXXXXXX..XXXXXXX 100644
141
--- a/hw/riscv/sifive_u.c
142
+++ b/hw/riscv/sifive_u.c
143
@@ -XXX,XX +XXX,XX @@ static void sifive_u_soc_realize(DeviceState *dev, Error **errp)
144
145
/* MMIO */
146
s->plic = sifive_plic_create(memmap[SIFIVE_U_PLIC].base,
147
- plic_hart_config,
148
+ plic_hart_config, 0,
149
SIFIVE_U_PLIC_NUM_SOURCES,
150
SIFIVE_U_PLIC_NUM_PRIORITIES,
151
SIFIVE_U_PLIC_PRIORITY_BASE,
152
diff --git a/hw/riscv/virt.c b/hw/riscv/virt.c
35
diff --git a/hw/riscv/virt.c b/hw/riscv/virt.c
153
index XXXXXXX..XXXXXXX 100644
36
index XXXXXXX..XXXXXXX 100644
154
--- a/hw/riscv/virt.c
37
--- a/hw/riscv/virt.c
155
+++ b/hw/riscv/virt.c
38
+++ b/hw/riscv/virt.c
39
@@ -XXX,XX +XXX,XX @@ static void create_fdt_sockets(RISCVVirtState *s, const MemMapEntry *memmap,
40
}
41
42
/* KVM AIA only has one APLIC instance */
43
- if (virt_use_kvm_aia(s)) {
44
+ if (kvm_enabled() && virt_use_kvm_aia(s)) {
45
create_fdt_socket_aplic(s, memmap, 0,
46
msi_m_phandle, msi_s_phandle, phandle,
47
&intc_phandles[0], xplic_phandles,
48
@@ -XXX,XX +XXX,XX @@ static void create_fdt_sockets(RISCVVirtState *s, const MemMapEntry *memmap,
49
50
g_free(intc_phandles);
51
52
- if (virt_use_kvm_aia(s)) {
53
+ if (kvm_enabled() && virt_use_kvm_aia(s)) {
54
*irq_mmio_phandle = xplic_phandles[0];
55
*irq_virtio_phandle = xplic_phandles[0];
56
*irq_pcie_phandle = xplic_phandles[0];
156
@@ -XXX,XX +XXX,XX @@ static void virt_machine_init(MachineState *machine)
57
@@ -XXX,XX +XXX,XX @@ static void virt_machine_init(MachineState *machine)
157
58
}
158
/* MMIO */
59
}
159
s->plic = sifive_plic_create(memmap[VIRT_PLIC].base,
60
160
- plic_hart_config,
61
- if (virt_use_kvm_aia(s)) {
161
+ plic_hart_config, 0,
62
+ if (kvm_enabled() && virt_use_kvm_aia(s)) {
162
VIRT_PLIC_NUM_SOURCES,
63
kvm_riscv_aia_create(machine, IMSIC_MMIO_GROUP_MIN_SHIFT,
163
VIRT_PLIC_NUM_PRIORITIES,
64
VIRT_IRQCHIP_NUM_SOURCES, VIRT_IRQCHIP_NUM_MSIS,
164
VIRT_PLIC_PRIORITY_BASE,
65
memmap[VIRT_APLIC_S].base,
165
--
66
--
166
2.28.0
67
2.41.0
167
68
168
69
diff view generated by jsdifflib
1
From: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
2
3
Commit 6df0b37e2ab breaks a --enable-debug build in a non-KVM
4
environment with the following error:
5
6
/usr/bin/ld: libqemu-riscv64-softmmu.fa.p/hw_intc_riscv_aplic.c.o: in function `riscv_kvm_aplic_request':
7
./qemu/build/../hw/intc/riscv_aplic.c:486: undefined reference to `kvm_set_irq'
8
collect2: error: ld returned 1 exit status
9
10
This happens because the debug build will poke into the
11
'if (is_kvm_aia(aplic->msimode))' block and fail to find a reference to
12
the KVM only function riscv_kvm_aplic_request().
13
14
There are multiple solutions to fix this. We'll go with the same
15
solution from the previous patch, i.e. add a kvm_enabled() conditional
16
to filter out the block. But there's a catch: riscv_kvm_aplic_request()
17
is a local function that would end up being used if the compiler crops
18
the block, and this won't work. Quoting Richard Henderson's explanation
19
in [1]:
20
21
"(...) the compiler won't eliminate entire unused functions with -O0"
22
23
We'll solve it by moving riscv_kvm_aplic_request() to kvm.c and add its
24
declaration in kvm_riscv.h, where all other KVM specific public
25
functions are already declared. Other archs handles KVM specific code in
26
this manner and we expect to do the same from now on.
27
28
[1] https://lore.kernel.org/qemu-riscv/d2f1ad02-eb03-138f-9d08-db676deeed05@linaro.org/
29
30
Signed-off-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com>
31
Reviewed-by: Andrew Jones <ajones@ventanamicro.com>
32
Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org>
33
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
34
Message-ID: <20230830133503.711138-3-dbarboza@ventanamicro.com>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
35
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: 85b7fdba8abd87adb83275cdc3043ce35a1ed5c3.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <85b7fdba8abd87adb83275cdc3043ce35a1ed5c3.1597259519.git.alistair.francis@wdc.com>
4
---
36
---
5
target/riscv/cpu_helper.c | 5 +++--
37
target/riscv/kvm_riscv.h | 1 +
6
1 file changed, 3 insertions(+), 2 deletions(-)
38
hw/intc/riscv_aplic.c | 8 ++------
39
target/riscv/kvm.c | 5 +++++
40
3 files changed, 8 insertions(+), 6 deletions(-)
7
41
8
diff --git a/target/riscv/cpu_helper.c b/target/riscv/cpu_helper.c
42
diff --git a/target/riscv/kvm_riscv.h b/target/riscv/kvm_riscv.h
9
index XXXXXXX..XXXXXXX 100644
43
index XXXXXXX..XXXXXXX 100644
10
--- a/target/riscv/cpu_helper.c
44
--- a/target/riscv/kvm_riscv.h
11
+++ b/target/riscv/cpu_helper.c
45
+++ b/target/riscv/kvm_riscv.h
12
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_do_interrupt(CPUState *cs)
46
@@ -XXX,XX +XXX,XX @@ void kvm_riscv_aia_create(MachineState *machine, uint64_t group_shift,
13
47
uint64_t aia_irq_num, uint64_t aia_msi_num,
14
if (riscv_cpu_virt_enabled(env) && ((hdeleg >> cause) & 1) &&
48
uint64_t aplic_base, uint64_t imsic_base,
15
!force_hs_execp) {
49
uint64_t guest_num);
16
+ /* Trap to VS mode */
50
+void riscv_kvm_aplic_request(void *opaque, int irq, int level);
17
/*
51
18
* See if we need to adjust cause. Yes if its VS mode interrupt
52
#endif
19
* no if hypervisor has delegated one of hs mode's interrupt
53
diff --git a/hw/intc/riscv_aplic.c b/hw/intc/riscv_aplic.c
20
*/
54
index XXXXXXX..XXXXXXX 100644
21
if (cause == IRQ_VS_TIMER || cause == IRQ_VS_SOFT ||
55
--- a/hw/intc/riscv_aplic.c
22
- cause == IRQ_VS_EXT)
56
+++ b/hw/intc/riscv_aplic.c
23
+ cause == IRQ_VS_EXT) {
57
@@ -XXX,XX +XXX,XX @@
24
cause = cause - 1;
58
#include "target/riscv/cpu.h"
25
- /* Trap to VS mode */
59
#include "sysemu/sysemu.h"
26
+ }
60
#include "sysemu/kvm.h"
27
env->hstatus = set_field(env->hstatus, HSTATUS_GVA, 0);
61
+#include "kvm_riscv.h"
28
} else if (riscv_cpu_virt_enabled(env)) {
62
#include "migration/vmstate.h"
29
/* Trap into HS mode, from virt */
63
64
#define APLIC_MAX_IDC (1UL << 14)
65
@@ -XXX,XX +XXX,XX @@ static uint32_t riscv_aplic_idc_claimi(RISCVAPLICState *aplic, uint32_t idc)
66
return topi;
67
}
68
69
-static void riscv_kvm_aplic_request(void *opaque, int irq, int level)
70
-{
71
- kvm_set_irq(kvm_state, irq, !!level);
72
-}
73
-
74
static void riscv_aplic_request(void *opaque, int irq, int level)
75
{
76
bool update = false;
77
@@ -XXX,XX +XXX,XX @@ static void riscv_aplic_realize(DeviceState *dev, Error **errp)
78
* have IRQ lines delegated by their parent APLIC.
79
*/
80
if (!aplic->parent) {
81
- if (is_kvm_aia(aplic->msimode)) {
82
+ if (kvm_enabled() && is_kvm_aia(aplic->msimode)) {
83
qdev_init_gpio_in(dev, riscv_kvm_aplic_request, aplic->num_irqs);
84
} else {
85
qdev_init_gpio_in(dev, riscv_aplic_request, aplic->num_irqs);
86
diff --git a/target/riscv/kvm.c b/target/riscv/kvm.c
87
index XXXXXXX..XXXXXXX 100644
88
--- a/target/riscv/kvm.c
89
+++ b/target/riscv/kvm.c
90
@@ -XXX,XX +XXX,XX @@
91
#include "sysemu/runstate.h"
92
#include "hw/riscv/numa.h"
93
94
+void riscv_kvm_aplic_request(void *opaque, int irq, int level)
95
+{
96
+ kvm_set_irq(kvm_state, irq, !!level);
97
+}
98
+
99
static uint64_t kvm_riscv_reg_id(CPURISCVState *env, uint64_t type,
100
uint64_t idx)
101
{
30
--
102
--
31
2.28.0
103
2.41.0
32
104
33
105
diff view generated by jsdifflib
New patch
1
From: Robbin Ehn <rehn@rivosinc.com>
1
2
3
This patch adds the new extensions in
4
linux 6.5 to the hwprobe syscall.
5
6
And fixes RVC check to OR with correct value.
7
The previous variable contains 0 therefore it
8
did work.
9
10
Signed-off-by: Robbin Ehn <rehn@rivosinc.com>
11
Acked-by: Richard Henderson <richard.henderson@linaro.org>
12
Acked-by: Alistair Francis <alistair.francis@wdc.com>
13
Message-ID: <bc82203b72d7efb30f1b4a8f9eb3d94699799dc8.camel@rivosinc.com>
14
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
15
---
16
linux-user/syscall.c | 14 +++++++++++++-
17
1 file changed, 13 insertions(+), 1 deletion(-)
18
19
diff --git a/linux-user/syscall.c b/linux-user/syscall.c
20
index XXXXXXX..XXXXXXX 100644
21
--- a/linux-user/syscall.c
22
+++ b/linux-user/syscall.c
23
@@ -XXX,XX +XXX,XX @@ static int do_getdents64(abi_long dirfd, abi_long arg2, abi_long count)
24
#define RISCV_HWPROBE_KEY_IMA_EXT_0 4
25
#define RISCV_HWPROBE_IMA_FD (1 << 0)
26
#define RISCV_HWPROBE_IMA_C (1 << 1)
27
+#define RISCV_HWPROBE_IMA_V (1 << 2)
28
+#define RISCV_HWPROBE_EXT_ZBA (1 << 3)
29
+#define RISCV_HWPROBE_EXT_ZBB (1 << 4)
30
+#define RISCV_HWPROBE_EXT_ZBS (1 << 5)
31
32
#define RISCV_HWPROBE_KEY_CPUPERF_0 5
33
#define RISCV_HWPROBE_MISALIGNED_UNKNOWN (0 << 0)
34
@@ -XXX,XX +XXX,XX @@ static void risc_hwprobe_fill_pairs(CPURISCVState *env,
35
riscv_has_ext(env, RVD) ?
36
RISCV_HWPROBE_IMA_FD : 0;
37
value |= riscv_has_ext(env, RVC) ?
38
- RISCV_HWPROBE_IMA_C : pair->value;
39
+ RISCV_HWPROBE_IMA_C : 0;
40
+ value |= riscv_has_ext(env, RVV) ?
41
+ RISCV_HWPROBE_IMA_V : 0;
42
+ value |= cfg->ext_zba ?
43
+ RISCV_HWPROBE_EXT_ZBA : 0;
44
+ value |= cfg->ext_zbb ?
45
+ RISCV_HWPROBE_EXT_ZBB : 0;
46
+ value |= cfg->ext_zbs ?
47
+ RISCV_HWPROBE_EXT_ZBS : 0;
48
__put_user(value, &pair->value);
49
break;
50
case RISCV_HWPROBE_KEY_CPUPERF_0:
51
--
52
2.41.0
diff view generated by jsdifflib
1
From: Anup Patel <anup.patel@wdc.com>
1
From: Ard Biesheuvel <ardb@kernel.org>
2
2
3
We extend CLINT emulation to allow multiple instances of CLINT in
3
Use the accelerated SubBytes/ShiftRows/AddRoundKey AES helper to
4
a QEMU RISC-V machine. To achieve this, we remove first HART id
4
implement the first half of the key schedule derivation. This does not
5
zero assumption from CLINT emulation.
5
actually involve shifting rows, so clone the same value into all four
6
columns of the AES vector to counter that operation.
6
7
7
Signed-off-by: Anup Patel <anup.patel@wdc.com>
8
Cc: Richard Henderson <richard.henderson@linaro.org>
8
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
9
Cc: Philippe Mathieu-Daudé <philmd@linaro.org>
9
Reviewed-by: Palmer Dabbelt <palmerdabbelt@google.com>
10
Cc: Palmer Dabbelt <palmer@dabbelt.com>
10
Message-Id: <20200616032229.766089-2-anup.patel@wdc.com>
11
Cc: Alistair Francis <alistair.francis@wdc.com>
12
Signed-off-by: Ard Biesheuvel <ardb@kernel.org>
13
Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org>
14
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
15
Message-ID: <20230831154118.138727-1-ardb@kernel.org>
11
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
16
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
12
---
17
---
13
include/hw/riscv/sifive_clint.h | 7 ++++---
18
target/riscv/crypto_helper.c | 17 +++++------------
14
hw/riscv/sifive_clint.c | 20 ++++++++++++--------
19
1 file changed, 5 insertions(+), 12 deletions(-)
15
hw/riscv/sifive_e.c | 2 +-
16
hw/riscv/sifive_u.c | 2 +-
17
hw/riscv/spike.c | 2 +-
18
hw/riscv/virt.c | 2 +-
19
6 files changed, 20 insertions(+), 15 deletions(-)
20
20
21
diff --git a/include/hw/riscv/sifive_clint.h b/include/hw/riscv/sifive_clint.h
21
diff --git a/target/riscv/crypto_helper.c b/target/riscv/crypto_helper.c
22
index XXXXXXX..XXXXXXX 100644
22
index XXXXXXX..XXXXXXX 100644
23
--- a/include/hw/riscv/sifive_clint.h
23
--- a/target/riscv/crypto_helper.c
24
+++ b/include/hw/riscv/sifive_clint.h
24
+++ b/target/riscv/crypto_helper.c
25
@@ -XXX,XX +XXX,XX @@ typedef struct SiFiveCLINTState {
25
@@ -XXX,XX +XXX,XX @@ target_ulong HELPER(aes64ks1i)(target_ulong rs1, target_ulong rnum)
26
26
27
/*< public >*/
27
uint8_t enc_rnum = rnum;
28
MemoryRegion mmio;
28
uint32_t temp = (RS1 >> 32) & 0xFFFFFFFF;
29
+ uint32_t hartid_base;
29
- uint8_t rcon_ = 0;
30
uint32_t num_harts;
30
- target_ulong result;
31
uint32_t sip_base;
31
+ AESState t, rc = {};
32
uint32_t timecmp_base;
32
33
@@ -XXX,XX +XXX,XX @@ typedef struct SiFiveCLINTState {
33
if (enc_rnum != 0xA) {
34
uint32_t aperture_size;
34
temp = ror32(temp, 8); /* Rotate right by 8 */
35
} SiFiveCLINTState;
35
- rcon_ = round_consts[enc_rnum];
36
36
+ rc.w[0] = rc.w[1] = round_consts[enc_rnum];
37
-DeviceState *sifive_clint_create(hwaddr addr, hwaddr size, uint32_t num_harts,
38
- uint32_t sip_base, uint32_t timecmp_base, uint32_t time_base,
39
- bool provide_rdtime);
40
+DeviceState *sifive_clint_create(hwaddr addr, hwaddr size,
41
+ uint32_t hartid_base, uint32_t num_harts, uint32_t sip_base,
42
+ uint32_t timecmp_base, uint32_t time_base, bool provide_rdtime);
43
44
enum {
45
SIFIVE_SIP_BASE = 0x0,
46
diff --git a/hw/riscv/sifive_clint.c b/hw/riscv/sifive_clint.c
47
index XXXXXXX..XXXXXXX 100644
48
--- a/hw/riscv/sifive_clint.c
49
+++ b/hw/riscv/sifive_clint.c
50
@@ -XXX,XX +XXX,XX @@ static uint64_t sifive_clint_read(void *opaque, hwaddr addr, unsigned size)
51
SiFiveCLINTState *clint = opaque;
52
if (addr >= clint->sip_base &&
53
addr < clint->sip_base + (clint->num_harts << 2)) {
54
- size_t hartid = (addr - clint->sip_base) >> 2;
55
+ size_t hartid = clint->hartid_base + ((addr - clint->sip_base) >> 2);
56
CPUState *cpu = qemu_get_cpu(hartid);
57
CPURISCVState *env = cpu ? cpu->env_ptr : NULL;
58
if (!env) {
59
@@ -XXX,XX +XXX,XX @@ static uint64_t sifive_clint_read(void *opaque, hwaddr addr, unsigned size)
60
}
61
} else if (addr >= clint->timecmp_base &&
62
addr < clint->timecmp_base + (clint->num_harts << 3)) {
63
- size_t hartid = (addr - clint->timecmp_base) >> 3;
64
+ size_t hartid = clint->hartid_base +
65
+ ((addr - clint->timecmp_base) >> 3);
66
CPUState *cpu = qemu_get_cpu(hartid);
67
CPURISCVState *env = cpu ? cpu->env_ptr : NULL;
68
if (!env) {
69
@@ -XXX,XX +XXX,XX @@ static void sifive_clint_write(void *opaque, hwaddr addr, uint64_t value,
70
71
if (addr >= clint->sip_base &&
72
addr < clint->sip_base + (clint->num_harts << 2)) {
73
- size_t hartid = (addr - clint->sip_base) >> 2;
74
+ size_t hartid = clint->hartid_base + ((addr - clint->sip_base) >> 2);
75
CPUState *cpu = qemu_get_cpu(hartid);
76
CPURISCVState *env = cpu ? cpu->env_ptr : NULL;
77
if (!env) {
78
@@ -XXX,XX +XXX,XX @@ static void sifive_clint_write(void *opaque, hwaddr addr, uint64_t value,
79
return;
80
} else if (addr >= clint->timecmp_base &&
81
addr < clint->timecmp_base + (clint->num_harts << 3)) {
82
- size_t hartid = (addr - clint->timecmp_base) >> 3;
83
+ size_t hartid = clint->hartid_base +
84
+ ((addr - clint->timecmp_base) >> 3);
85
CPUState *cpu = qemu_get_cpu(hartid);
86
CPURISCVState *env = cpu ? cpu->env_ptr : NULL;
87
if (!env) {
88
@@ -XXX,XX +XXX,XX @@ static const MemoryRegionOps sifive_clint_ops = {
89
};
90
91
static Property sifive_clint_properties[] = {
92
+ DEFINE_PROP_UINT32("hartid-base", SiFiveCLINTState, hartid_base, 0),
93
DEFINE_PROP_UINT32("num-harts", SiFiveCLINTState, num_harts, 0),
94
DEFINE_PROP_UINT32("sip-base", SiFiveCLINTState, sip_base, 0),
95
DEFINE_PROP_UINT32("timecmp-base", SiFiveCLINTState, timecmp_base, 0),
96
@@ -XXX,XX +XXX,XX @@ type_init(sifive_clint_register_types)
97
/*
98
* Create CLINT device.
99
*/
100
-DeviceState *sifive_clint_create(hwaddr addr, hwaddr size, uint32_t num_harts,
101
- uint32_t sip_base, uint32_t timecmp_base, uint32_t time_base,
102
- bool provide_rdtime)
103
+DeviceState *sifive_clint_create(hwaddr addr, hwaddr size,
104
+ uint32_t hartid_base, uint32_t num_harts, uint32_t sip_base,
105
+ uint32_t timecmp_base, uint32_t time_base, bool provide_rdtime)
106
{
107
int i;
108
for (i = 0; i < num_harts; i++) {
109
- CPUState *cpu = qemu_get_cpu(i);
110
+ CPUState *cpu = qemu_get_cpu(hartid_base + i);
111
CPURISCVState *env = cpu ? cpu->env_ptr : NULL;
112
if (!env) {
113
continue;
114
@@ -XXX,XX +XXX,XX @@ DeviceState *sifive_clint_create(hwaddr addr, hwaddr size, uint32_t num_harts,
115
}
37
}
116
38
117
DeviceState *dev = qdev_new(TYPE_SIFIVE_CLINT);
39
- temp = ((uint32_t)AES_sbox[(temp >> 24) & 0xFF] << 24) |
118
+ qdev_prop_set_uint32(dev, "hartid-base", hartid_base);
40
- ((uint32_t)AES_sbox[(temp >> 16) & 0xFF] << 16) |
119
qdev_prop_set_uint32(dev, "num-harts", num_harts);
41
- ((uint32_t)AES_sbox[(temp >> 8) & 0xFF] << 8) |
120
qdev_prop_set_uint32(dev, "sip-base", sip_base);
42
- ((uint32_t)AES_sbox[(temp >> 0) & 0xFF] << 0);
121
qdev_prop_set_uint32(dev, "timecmp-base", timecmp_base);
43
+ t.w[0] = t.w[1] = t.w[2] = t.w[3] = temp;
122
diff --git a/hw/riscv/sifive_e.c b/hw/riscv/sifive_e.c
44
+ aesenc_SB_SR_AK(&t, &t, &rc, false);
123
index XXXXXXX..XXXXXXX 100644
45
124
--- a/hw/riscv/sifive_e.c
46
- temp ^= rcon_;
125
+++ b/hw/riscv/sifive_e.c
47
-
126
@@ -XXX,XX +XXX,XX @@ static void sifive_e_soc_realize(DeviceState *dev, Error **errp)
48
- result = ((uint64_t)temp << 32) | temp;
127
SIFIVE_E_PLIC_CONTEXT_STRIDE,
49
-
128
memmap[SIFIVE_E_PLIC].size);
50
- return result;
129
sifive_clint_create(memmap[SIFIVE_E_CLINT].base,
51
+ return t.d[0];
130
- memmap[SIFIVE_E_CLINT].size, ms->smp.cpus,
131
+ memmap[SIFIVE_E_CLINT].size, 0, ms->smp.cpus,
132
SIFIVE_SIP_BASE, SIFIVE_TIMECMP_BASE, SIFIVE_TIME_BASE, false);
133
create_unimplemented_device("riscv.sifive.e.aon",
134
memmap[SIFIVE_E_AON].base, memmap[SIFIVE_E_AON].size);
135
diff --git a/hw/riscv/sifive_u.c b/hw/riscv/sifive_u.c
136
index XXXXXXX..XXXXXXX 100644
137
--- a/hw/riscv/sifive_u.c
138
+++ b/hw/riscv/sifive_u.c
139
@@ -XXX,XX +XXX,XX @@ static void sifive_u_soc_realize(DeviceState *dev, Error **errp)
140
sifive_uart_create(system_memory, memmap[SIFIVE_U_UART1].base,
141
serial_hd(1), qdev_get_gpio_in(DEVICE(s->plic), SIFIVE_U_UART1_IRQ));
142
sifive_clint_create(memmap[SIFIVE_U_CLINT].base,
143
- memmap[SIFIVE_U_CLINT].size, ms->smp.cpus,
144
+ memmap[SIFIVE_U_CLINT].size, 0, ms->smp.cpus,
145
SIFIVE_SIP_BASE, SIFIVE_TIMECMP_BASE, SIFIVE_TIME_BASE, false);
146
147
if (!sysbus_realize(SYS_BUS_DEVICE(&s->prci), errp)) {
148
diff --git a/hw/riscv/spike.c b/hw/riscv/spike.c
149
index XXXXXXX..XXXXXXX 100644
150
--- a/hw/riscv/spike.c
151
+++ b/hw/riscv/spike.c
152
@@ -XXX,XX +XXX,XX @@ static void spike_board_init(MachineState *machine)
153
154
/* Core Local Interruptor (timer and IPI) */
155
sifive_clint_create(memmap[SPIKE_CLINT].base, memmap[SPIKE_CLINT].size,
156
- smp_cpus, SIFIVE_SIP_BASE, SIFIVE_TIMECMP_BASE, SIFIVE_TIME_BASE,
157
+ 0, smp_cpus, SIFIVE_SIP_BASE, SIFIVE_TIMECMP_BASE, SIFIVE_TIME_BASE,
158
false);
159
}
52
}
160
53
161
diff --git a/hw/riscv/virt.c b/hw/riscv/virt.c
54
target_ulong HELPER(aes64im)(target_ulong rs1)
162
index XXXXXXX..XXXXXXX 100644
163
--- a/hw/riscv/virt.c
164
+++ b/hw/riscv/virt.c
165
@@ -XXX,XX +XXX,XX @@ static void virt_machine_init(MachineState *machine)
166
VIRT_PLIC_CONTEXT_STRIDE,
167
memmap[VIRT_PLIC].size);
168
sifive_clint_create(memmap[VIRT_CLINT].base,
169
- memmap[VIRT_CLINT].size, smp_cpus,
170
+ memmap[VIRT_CLINT].size, 0, smp_cpus,
171
SIFIVE_SIP_BASE, SIFIVE_TIMECMP_BASE, SIFIVE_TIME_BASE, true);
172
sifive_test_create(memmap[VIRT_TEST].base);
173
174
--
55
--
175
2.28.0
56
2.41.0
176
57
177
58
diff view generated by jsdifflib
1
From: Akihiko Odaki <akihiko.odaki@daynix.com>
2
3
riscv_trigger_init() had been called on reset events that can happen
4
several times for a CPU and it allocated timers for itrigger. If old
5
timers were present, they were simply overwritten by the new timers,
6
resulting in a memory leak.
7
8
Divide riscv_trigger_init() into two functions, namely
9
riscv_trigger_realize() and riscv_trigger_reset() and call them in
10
appropriate timing. The timer allocation will happen only once for a
11
CPU in riscv_trigger_realize().
12
13
Fixes: 5a4ae64cac ("target/riscv: Add itrigger support when icount is enabled")
14
Signed-off-by: Akihiko Odaki <akihiko.odaki@daynix.com>
15
Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org>
16
Reviewed-by: LIU Zhiwei <zhiwei_liu@linux.alibaba.com>
17
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
18
Message-ID: <20230818034059.9146-1-akihiko.odaki@daynix.com>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
19
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: f3f4fd2ec22a07cc1d750e96895d6813f131de4d.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <f3f4fd2ec22a07cc1d750e96895d6813f131de4d.1597259519.git.alistair.francis@wdc.com>
4
---
20
---
5
target/riscv/csr.c | 9 +++++++++
21
target/riscv/debug.h | 3 ++-
6
1 file changed, 9 insertions(+)
22
target/riscv/cpu.c | 8 +++++++-
23
target/riscv/debug.c | 15 ++++++++++++---
24
3 files changed, 21 insertions(+), 5 deletions(-)
7
25
8
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
26
diff --git a/target/riscv/debug.h b/target/riscv/debug.h
9
index XXXXXXX..XXXXXXX 100644
27
index XXXXXXX..XXXXXXX 100644
10
--- a/target/riscv/csr.c
28
--- a/target/riscv/debug.h
11
+++ b/target/riscv/csr.c
29
+++ b/target/riscv/debug.h
12
@@ -XXX,XX +XXX,XX @@ static int write_satp(CPURISCVState *env, int csrno, target_ulong val)
30
@@ -XXX,XX +XXX,XX @@ void riscv_cpu_debug_excp_handler(CPUState *cs);
13
static int read_hstatus(CPURISCVState *env, int csrno, target_ulong *val)
31
bool riscv_cpu_debug_check_breakpoint(CPUState *cs);
14
{
32
bool riscv_cpu_debug_check_watchpoint(CPUState *cs, CPUWatchpoint *wp);
15
*val = env->hstatus;
33
16
+#ifdef TARGET_RISCV64
34
-void riscv_trigger_init(CPURISCVState *env);
17
+ /* We only support 64-bit VSXL */
35
+void riscv_trigger_realize(CPURISCVState *env);
18
+ *val = set_field(*val, HSTATUS_VSXL, 2);
36
+void riscv_trigger_reset_hold(CPURISCVState *env);
19
+#endif
37
20
return 0;
38
bool riscv_itrigger_enabled(CPURISCVState *env);
21
}
39
void riscv_itrigger_update_priv(CPURISCVState *env);
22
40
diff --git a/target/riscv/cpu.c b/target/riscv/cpu.c
23
static int write_hstatus(CPURISCVState *env, int csrno, target_ulong val)
41
index XXXXXXX..XXXXXXX 100644
24
{
42
--- a/target/riscv/cpu.c
25
env->hstatus = val;
43
+++ b/target/riscv/cpu.c
26
+#ifdef TARGET_RISCV64
44
@@ -XXX,XX +XXX,XX @@ static void riscv_cpu_reset_hold(Object *obj)
27
+ if (get_field(val, HSTATUS_VSXL) != 2) {
45
28
+ qemu_log_mask(LOG_UNIMP, "QEMU does not support mixed HSXLEN options.");
46
#ifndef CONFIG_USER_ONLY
47
if (cpu->cfg.debug) {
48
- riscv_trigger_init(env);
49
+ riscv_trigger_reset_hold(env);
50
}
51
52
if (kvm_enabled()) {
53
@@ -XXX,XX +XXX,XX @@ static void riscv_cpu_realize(DeviceState *dev, Error **errp)
54
55
riscv_cpu_register_gdb_regs_for_features(cs);
56
57
+#ifndef CONFIG_USER_ONLY
58
+ if (cpu->cfg.debug) {
59
+ riscv_trigger_realize(&cpu->env);
29
+ }
60
+ }
30
+#endif
61
+#endif
31
return 0;
62
+
63
qemu_init_vcpu(cs);
64
cpu_reset(cs);
65
66
diff --git a/target/riscv/debug.c b/target/riscv/debug.c
67
index XXXXXXX..XXXXXXX 100644
68
--- a/target/riscv/debug.c
69
+++ b/target/riscv/debug.c
70
@@ -XXX,XX +XXX,XX @@ bool riscv_cpu_debug_check_watchpoint(CPUState *cs, CPUWatchpoint *wp)
71
return false;
32
}
72
}
33
73
74
-void riscv_trigger_init(CPURISCVState *env)
75
+void riscv_trigger_realize(CPURISCVState *env)
76
+{
77
+ int i;
78
+
79
+ for (i = 0; i < RV_MAX_TRIGGERS; i++) {
80
+ env->itrigger_timer[i] = timer_new_ns(QEMU_CLOCK_VIRTUAL,
81
+ riscv_itrigger_timer_cb, env);
82
+ }
83
+}
84
+
85
+void riscv_trigger_reset_hold(CPURISCVState *env)
86
{
87
target_ulong tdata1 = build_tdata1(env, TRIGGER_TYPE_AD_MATCH, 0, 0);
88
int i;
89
@@ -XXX,XX +XXX,XX @@ void riscv_trigger_init(CPURISCVState *env)
90
env->tdata3[i] = 0;
91
env->cpu_breakpoint[i] = NULL;
92
env->cpu_watchpoint[i] = NULL;
93
- env->itrigger_timer[i] = timer_new_ns(QEMU_CLOCK_VIRTUAL,
94
- riscv_itrigger_timer_cb, env);
95
+ timer_del(env->itrigger_timer[i]);
96
}
97
}
34
--
98
--
35
2.28.0
99
2.41.0
36
100
37
101
diff view generated by jsdifflib
New patch
1
From: Leon Schuermann <leons@opentitan.org>
1
2
3
When the rule-lock bypass (RLB) bit is set in the mseccfg CSR, the PMP
4
configuration lock bits must not apply. While this behavior is
5
implemented for the pmpcfgX CSRs, this bit is not respected for
6
changes to the pmpaddrX CSRs. This patch ensures that pmpaddrX CSR
7
writes work even on locked regions when the global rule-lock bypass is
8
enabled.
9
10
Signed-off-by: Leon Schuermann <leons@opentitan.org>
11
Reviewed-by: Mayuresh Chitale <mchitale@ventanamicro.com>
12
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
13
Message-ID: <20230829215046.1430463-1-leon@is.currently.online>
14
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
15
---
16
target/riscv/pmp.c | 4 ++++
17
1 file changed, 4 insertions(+)
18
19
diff --git a/target/riscv/pmp.c b/target/riscv/pmp.c
20
index XXXXXXX..XXXXXXX 100644
21
--- a/target/riscv/pmp.c
22
+++ b/target/riscv/pmp.c
23
@@ -XXX,XX +XXX,XX @@ static inline uint8_t pmp_get_a_field(uint8_t cfg)
24
*/
25
static inline int pmp_is_locked(CPURISCVState *env, uint32_t pmp_index)
26
{
27
+ /* mseccfg.RLB is set */
28
+ if (MSECCFG_RLB_ISSET(env)) {
29
+ return 0;
30
+ }
31
32
if (env->pmp_state.pmp[pmp_index].cfg_reg & PMP_LOCK) {
33
return 1;
34
--
35
2.41.0
diff view generated by jsdifflib
1
When performing a CSR access let's return a negative exception value on
1
From: Tommy Wu <tommy.wu@sifive.com>
2
an error instead of -1. This will allow us to specify the exception in
3
future patches.
4
2
3
According to the new spec, when vsiselect has a reserved value, attempts
4
from M-mode or HS-mode to access vsireg, or from VS-mode to access
5
sireg, should preferably raise an illegal instruction exception.
6
7
Signed-off-by: Tommy Wu <tommy.wu@sifive.com>
8
Reviewed-by: Frank Chang <frank.chang@sifive.com>
9
Message-ID: <20230816061647.600672-1-tommy.wu@sifive.com>
5
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
10
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
6
Message-id: a487dad60c9b8fe7a2b992c5e0dcc2504a9000a7.1597259519.git.alistair.francis@wdc.com
7
Message-Id: <a487dad60c9b8fe7a2b992c5e0dcc2504a9000a7.1597259519.git.alistair.francis@wdc.com>
8
---
11
---
9
target/riscv/csr.c | 46 ++++++++++++++++++++--------------------
12
target/riscv/csr.c | 7 +++++--
10
target/riscv/op_helper.c | 18 ++++++++++------
13
1 file changed, 5 insertions(+), 2 deletions(-)
11
2 files changed, 35 insertions(+), 29 deletions(-)
12
14
13
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
15
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
14
index XXXXXXX..XXXXXXX 100644
16
index XXXXXXX..XXXXXXX 100644
15
--- a/target/riscv/csr.c
17
--- a/target/riscv/csr.c
16
+++ b/target/riscv/csr.c
18
+++ b/target/riscv/csr.c
17
@@ -XXX,XX +XXX,XX @@ static int fs(CPURISCVState *env, int csrno)
19
@@ -XXX,XX +XXX,XX @@ static int rmw_iprio(target_ulong xlen,
18
return 0;
20
static int rmw_xireg(CPURISCVState *env, int csrno, target_ulong *val,
21
target_ulong new_val, target_ulong wr_mask)
22
{
23
- bool virt;
24
+ bool virt, isel_reserved;
25
uint8_t *iprio;
26
int ret = -EINVAL;
27
target_ulong priv, isel, vgein;
28
@@ -XXX,XX +XXX,XX @@ static int rmw_xireg(CPURISCVState *env, int csrno, target_ulong *val,
29
30
/* Decode register details from CSR number */
31
virt = false;
32
+ isel_reserved = false;
33
switch (csrno) {
34
case CSR_MIREG:
35
iprio = env->miprio;
36
@@ -XXX,XX +XXX,XX @@ static int rmw_xireg(CPURISCVState *env, int csrno, target_ulong *val,
37
riscv_cpu_mxl_bits(env)),
38
val, new_val, wr_mask);
39
}
40
+ } else {
41
+ isel_reserved = true;
19
}
42
}
20
if (!env->debugger && !riscv_cpu_fp_enabled(env)) {
43
21
- return -1;
44
done:
22
+ return -RISCV_EXCP_ILLEGAL_INST;
45
if (ret) {
46
- return (env->virt_enabled && virt) ?
47
+ return (env->virt_enabled && virt && !isel_reserved) ?
48
RISCV_EXCP_VIRT_INSTRUCTION_FAULT : RISCV_EXCP_ILLEGAL_INST;
23
}
49
}
24
#endif
50
return RISCV_EXCP_NONE;
25
return 0;
26
@@ -XXX,XX +XXX,XX @@ static int ctr(CPURISCVState *env, int csrno)
27
28
if (!cpu->cfg.ext_counters) {
29
/* The Counters extensions is not enabled */
30
- return -1;
31
+ return -RISCV_EXCP_ILLEGAL_INST;
32
}
33
#endif
34
return 0;
35
@@ -XXX,XX +XXX,XX @@ static int hmode(CPURISCVState *env, int csrno)
36
}
37
}
38
39
- return -1;
40
+ return -RISCV_EXCP_ILLEGAL_INST;
41
}
42
43
static int pmp(CPURISCVState *env, int csrno)
44
@@ -XXX,XX +XXX,XX @@ static int read_fflags(CPURISCVState *env, int csrno, target_ulong *val)
45
{
46
#if !defined(CONFIG_USER_ONLY)
47
if (!env->debugger && !riscv_cpu_fp_enabled(env)) {
48
- return -1;
49
+ return -RISCV_EXCP_ILLEGAL_INST;
50
}
51
#endif
52
*val = riscv_cpu_get_fflags(env);
53
@@ -XXX,XX +XXX,XX @@ static int write_fflags(CPURISCVState *env, int csrno, target_ulong val)
54
{
55
#if !defined(CONFIG_USER_ONLY)
56
if (!env->debugger && !riscv_cpu_fp_enabled(env)) {
57
- return -1;
58
+ return -RISCV_EXCP_ILLEGAL_INST;
59
}
60
env->mstatus |= MSTATUS_FS;
61
#endif
62
@@ -XXX,XX +XXX,XX @@ static int read_frm(CPURISCVState *env, int csrno, target_ulong *val)
63
{
64
#if !defined(CONFIG_USER_ONLY)
65
if (!env->debugger && !riscv_cpu_fp_enabled(env)) {
66
- return -1;
67
+ return -RISCV_EXCP_ILLEGAL_INST;
68
}
69
#endif
70
*val = env->frm;
71
@@ -XXX,XX +XXX,XX @@ static int write_frm(CPURISCVState *env, int csrno, target_ulong val)
72
{
73
#if !defined(CONFIG_USER_ONLY)
74
if (!env->debugger && !riscv_cpu_fp_enabled(env)) {
75
- return -1;
76
+ return -RISCV_EXCP_ILLEGAL_INST;
77
}
78
env->mstatus |= MSTATUS_FS;
79
#endif
80
@@ -XXX,XX +XXX,XX @@ static int read_fcsr(CPURISCVState *env, int csrno, target_ulong *val)
81
{
82
#if !defined(CONFIG_USER_ONLY)
83
if (!env->debugger && !riscv_cpu_fp_enabled(env)) {
84
- return -1;
85
+ return -RISCV_EXCP_ILLEGAL_INST;
86
}
87
#endif
88
*val = (riscv_cpu_get_fflags(env) << FSR_AEXC_SHIFT)
89
@@ -XXX,XX +XXX,XX @@ static int write_fcsr(CPURISCVState *env, int csrno, target_ulong val)
90
{
91
#if !defined(CONFIG_USER_ONLY)
92
if (!env->debugger && !riscv_cpu_fp_enabled(env)) {
93
- return -1;
94
+ return -RISCV_EXCP_ILLEGAL_INST;
95
}
96
env->mstatus |= MSTATUS_FS;
97
#endif
98
@@ -XXX,XX +XXX,XX @@ static int read_time(CPURISCVState *env, int csrno, target_ulong *val)
99
uint64_t delta = riscv_cpu_virt_enabled(env) ? env->htimedelta : 0;
100
101
if (!env->rdtime_fn) {
102
- return -1;
103
+ return -RISCV_EXCP_ILLEGAL_INST;
104
}
105
106
*val = env->rdtime_fn() + delta;
107
@@ -XXX,XX +XXX,XX @@ static int read_timeh(CPURISCVState *env, int csrno, target_ulong *val)
108
uint64_t delta = riscv_cpu_virt_enabled(env) ? env->htimedelta : 0;
109
110
if (!env->rdtime_fn) {
111
- return -1;
112
+ return -RISCV_EXCP_ILLEGAL_INST;
113
}
114
115
*val = (env->rdtime_fn() + delta) >> 32;
116
@@ -XXX,XX +XXX,XX @@ static int write_mcounteren(CPURISCVState *env, int csrno, target_ulong val)
117
static int read_mscounteren(CPURISCVState *env, int csrno, target_ulong *val)
118
{
119
if (env->priv_ver < PRIV_VERSION_1_11_0) {
120
- return -1;
121
+ return -RISCV_EXCP_ILLEGAL_INST;
122
}
123
*val = env->mcounteren;
124
return 0;
125
@@ -XXX,XX +XXX,XX @@ static int read_mscounteren(CPURISCVState *env, int csrno, target_ulong *val)
126
static int write_mscounteren(CPURISCVState *env, int csrno, target_ulong val)
127
{
128
if (env->priv_ver < PRIV_VERSION_1_11_0) {
129
- return -1;
130
+ return -RISCV_EXCP_ILLEGAL_INST;
131
}
132
env->mcounteren = val;
133
return 0;
134
@@ -XXX,XX +XXX,XX @@ static int read_satp(CPURISCVState *env, int csrno, target_ulong *val)
135
}
136
137
if (env->priv == PRV_S && get_field(env->mstatus, MSTATUS_TVM)) {
138
- return -1;
139
+ return -RISCV_EXCP_ILLEGAL_INST;
140
} else {
141
*val = env->satp;
142
}
143
@@ -XXX,XX +XXX,XX @@ static int write_satp(CPURISCVState *env, int csrno, target_ulong val)
144
((val ^ env->satp) & (SATP_MODE | SATP_ASID | SATP_PPN)))
145
{
146
if (env->priv == PRV_S && get_field(env->mstatus, MSTATUS_TVM)) {
147
- return -1;
148
+ return -RISCV_EXCP_ILLEGAL_INST;
149
} else {
150
if((val ^ env->satp) & SATP_ASID) {
151
tlb_flush(env_cpu(env));
152
@@ -XXX,XX +XXX,XX @@ static int write_hgatp(CPURISCVState *env, int csrno, target_ulong val)
153
static int read_htimedelta(CPURISCVState *env, int csrno, target_ulong *val)
154
{
155
if (!env->rdtime_fn) {
156
- return -1;
157
+ return -RISCV_EXCP_ILLEGAL_INST;
158
}
159
160
#if defined(TARGET_RISCV32)
161
@@ -XXX,XX +XXX,XX @@ static int read_htimedelta(CPURISCVState *env, int csrno, target_ulong *val)
162
static int write_htimedelta(CPURISCVState *env, int csrno, target_ulong val)
163
{
164
if (!env->rdtime_fn) {
165
- return -1;
166
+ return -RISCV_EXCP_ILLEGAL_INST;
167
}
168
169
#if defined(TARGET_RISCV32)
170
@@ -XXX,XX +XXX,XX @@ static int write_htimedelta(CPURISCVState *env, int csrno, target_ulong val)
171
static int read_htimedeltah(CPURISCVState *env, int csrno, target_ulong *val)
172
{
173
if (!env->rdtime_fn) {
174
- return -1;
175
+ return -RISCV_EXCP_ILLEGAL_INST;
176
}
177
178
*val = env->htimedelta >> 32;
179
@@ -XXX,XX +XXX,XX @@ static int read_htimedeltah(CPURISCVState *env, int csrno, target_ulong *val)
180
static int write_htimedeltah(CPURISCVState *env, int csrno, target_ulong val)
181
{
182
if (!env->rdtime_fn) {
183
- return -1;
184
+ return -RISCV_EXCP_ILLEGAL_INST;
185
}
186
187
env->htimedelta = deposit64(env->htimedelta, 32, 32, (uint64_t)val);
188
@@ -XXX,XX +XXX,XX @@ int riscv_csrrw(CPURISCVState *env, int csrno, target_ulong *ret_value,
189
190
if ((write_mask && read_only) ||
191
(!env->debugger && (effective_priv < get_field(csrno, 0x300)))) {
192
- return -1;
193
+ return -RISCV_EXCP_ILLEGAL_INST;
194
}
195
#endif
196
197
/* ensure the CSR extension is enabled. */
198
if (!cpu->cfg.ext_icsr) {
199
- return -1;
200
+ return -RISCV_EXCP_ILLEGAL_INST;
201
}
202
203
/* check predicate */
204
if (!csr_ops[csrno].predicate || csr_ops[csrno].predicate(env, csrno) < 0) {
205
- return -1;
206
+ return -RISCV_EXCP_ILLEGAL_INST;
207
}
208
209
/* execute combined read/write operation if it exists */
210
@@ -XXX,XX +XXX,XX @@ int riscv_csrrw(CPURISCVState *env, int csrno, target_ulong *ret_value,
211
212
/* if no accessor exists then return failure */
213
if (!csr_ops[csrno].read) {
214
- return -1;
215
+ return -RISCV_EXCP_ILLEGAL_INST;
216
}
217
218
/* read old value */
219
diff --git a/target/riscv/op_helper.c b/target/riscv/op_helper.c
220
index XXXXXXX..XXXXXXX 100644
221
--- a/target/riscv/op_helper.c
222
+++ b/target/riscv/op_helper.c
223
@@ -XXX,XX +XXX,XX @@ target_ulong helper_csrrw(CPURISCVState *env, target_ulong src,
224
target_ulong csr)
225
{
226
target_ulong val = 0;
227
- if (riscv_csrrw(env, csr, &val, src, -1) < 0) {
228
- riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
229
+ int ret = riscv_csrrw(env, csr, &val, src, -1);
230
+
231
+ if (ret < 0) {
232
+ riscv_raise_exception(env, -ret, GETPC());
233
}
234
return val;
235
}
236
@@ -XXX,XX +XXX,XX @@ target_ulong helper_csrrs(CPURISCVState *env, target_ulong src,
237
target_ulong csr, target_ulong rs1_pass)
238
{
239
target_ulong val = 0;
240
- if (riscv_csrrw(env, csr, &val, -1, rs1_pass ? src : 0) < 0) {
241
- riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
242
+ int ret = riscv_csrrw(env, csr, &val, -1, rs1_pass ? src : 0);
243
+
244
+ if (ret < 0) {
245
+ riscv_raise_exception(env, -ret, GETPC());
246
}
247
return val;
248
}
249
@@ -XXX,XX +XXX,XX @@ target_ulong helper_csrrc(CPURISCVState *env, target_ulong src,
250
target_ulong csr, target_ulong rs1_pass)
251
{
252
target_ulong val = 0;
253
- if (riscv_csrrw(env, csr, &val, 0, rs1_pass ? src : 0) < 0) {
254
- riscv_raise_exception(env, RISCV_EXCP_ILLEGAL_INST, GETPC());
255
+ int ret = riscv_csrrw(env, csr, &val, 0, rs1_pass ? src : 0);
256
+
257
+ if (ret < 0) {
258
+ riscv_raise_exception(env, -ret, GETPC());
259
}
260
return val;
261
}
262
--
51
--
263
2.28.0
52
2.41.0
264
265
diff view generated by jsdifflib
1
From: Nikita Shubin <n.shubin@yadro.com>
2
3
As per ISA:
4
5
"For CSRRWI, if rd=x0, then the instruction shall not read the CSR and
6
shall not cause any of the side effects that might occur on a CSR read."
7
8
trans_csrrwi() and trans_csrrw() call do_csrw() if rd=x0, do_csrw() calls
9
riscv_csrrw_do64(), via helper_csrw() passing NULL as *ret_value.
10
11
Signed-off-by: Nikita Shubin <n.shubin@yadro.com>
12
Reviewed-by: Alistair Francis <alistair.francis@wdc.com>
13
Message-ID: <20230808090914.17634-1-nikita.shubin@maquefel.me>
1
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
14
Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
2
Message-id: 93e5d4f13eca0d2a588e407187f33c6437aeaaf9.1597259519.git.alistair.francis@wdc.com
3
Message-Id: <93e5d4f13eca0d2a588e407187f33c6437aeaaf9.1597259519.git.alistair.francis@wdc.com>
4
---
15
---
5
target/riscv/csr.c | 5 +++++
16
target/riscv/csr.c | 24 +++++++++++++++---------
6
1 file changed, 5 insertions(+)
17
1 file changed, 15 insertions(+), 9 deletions(-)
7
18
8
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
19
diff --git a/target/riscv/csr.c b/target/riscv/csr.c
9
index XXXXXXX..XXXXXXX 100644
20
index XXXXXXX..XXXXXXX 100644
10
--- a/target/riscv/csr.c
21
--- a/target/riscv/csr.c
11
+++ b/target/riscv/csr.c
22
+++ b/target/riscv/csr.c
12
@@ -XXX,XX +XXX,XX @@ static int read_hstatus(CPURISCVState *env, int csrno, target_ulong *val)
23
@@ -XXX,XX +XXX,XX @@ static RISCVException riscv_csrrw_do64(CPURISCVState *env, int csrno,
13
/* We only support 64-bit VSXL */
24
target_ulong write_mask)
14
*val = set_field(*val, HSTATUS_VSXL, 2);
25
{
15
#endif
26
RISCVException ret;
16
+ /* We only support little endian */
27
- target_ulong old_value;
17
+ *val = set_field(*val, HSTATUS_VSBE, 0);
28
+ target_ulong old_value = 0;
18
return 0;
29
19
}
30
/* execute combined read/write operation if it exists */
20
31
if (csr_ops[csrno].op) {
21
@@ -XXX,XX +XXX,XX @@ static int write_hstatus(CPURISCVState *env, int csrno, target_ulong val)
32
return csr_ops[csrno].op(env, csrno, ret_value, new_value, write_mask);
22
qemu_log_mask(LOG_UNIMP, "QEMU does not support mixed HSXLEN options.");
23
}
33
}
24
#endif
34
25
+ if (get_field(val, HSTATUS_VSBE) != 0) {
35
- /* if no accessor exists then return failure */
26
+ qemu_log_mask(LOG_UNIMP, "QEMU does not support big endian guests.");
36
- if (!csr_ops[csrno].read) {
27
+ }
37
- return RISCV_EXCP_ILLEGAL_INST;
28
return 0;
38
- }
29
}
39
- /* read old value */
30
40
- ret = csr_ops[csrno].read(env, csrno, &old_value);
41
- if (ret != RISCV_EXCP_NONE) {
42
- return ret;
43
+ /*
44
+ * ret_value == NULL means that rd=x0 and we're coming from helper_csrw()
45
+ * and we can't throw side effects caused by CSR reads.
46
+ */
47
+ if (ret_value) {
48
+ /* if no accessor exists then return failure */
49
+ if (!csr_ops[csrno].read) {
50
+ return RISCV_EXCP_ILLEGAL_INST;
51
+ }
52
+ /* read old value */
53
+ ret = csr_ops[csrno].read(env, csrno, &old_value);
54
+ if (ret != RISCV_EXCP_NONE) {
55
+ return ret;
56
+ }
57
}
58
59
/* write value if writable and write mask set, otherwise drop writes */
31
--
60
--
32
2.28.0
61
2.41.0
33
34
diff view generated by jsdifflib