The RMPREAD instruction returns an architecture-defined format of an
RMP entry. This is the preferred method for examining RMP entries.
In preparation for using the RMPREAD instruction, convert the existing
code that directly accesses the RMP to map the raw RMP information into
the architecture-defined format.
The RMPREAD output includes a status bit for the 2MB region. If the
input page address is 2MB aligned and any other pages within the 2MB
region are assigned, then the 2MB region status will be set to 1. Otherwise,
the 2MB region status will be set to 0. For systems that do not support
RMPREAD, calculating this value would require looping over all of the RMP
table entries within that range until one is found with the assigned bit
set. Since this bit is not defined in the current format, and so is not used
today, do not incur the overhead associated with calculating it.
Signed-off-by: Tom Lendacky <thomas.lendacky@amd.com>
Reviewed-by: Nikunj A Dadhania <nikunj@amd.com>
Reviewed-by: Neeraj Upadhyay <Neeraj.Upadhyay@amd.com>
---
arch/x86/virt/svm/sev.c | 144 ++++++++++++++++++++++++++++------------
1 file changed, 100 insertions(+), 44 deletions(-)
diff --git a/arch/x86/virt/svm/sev.c b/arch/x86/virt/svm/sev.c
index 9a6a943d8e41..cf64e9384ea0 100644
--- a/arch/x86/virt/svm/sev.c
+++ b/arch/x86/virt/svm/sev.c
@@ -31,10 +31,29 @@
#include <asm/iommu.h>
/*
- * The RMP entry format is not architectural. The format is defined in PPR
- * Family 19h Model 01h, Rev B1 processor.
+ * The RMP entry information as returned by the RMPREAD instruction.
*/
struct rmpentry {
+ u64 gpa;
+ u8 assigned :1,
+ rsvd1 :7;
+ u8 pagesize :1,
+ hpage_region_status :1,
+ rsvd2 :6;
+ u8 immutable :1,
+ rsvd3 :7;
+ u8 rsvd4;
+ u32 asid;
+} __packed;
+
+/*
+ * The raw RMP entry format is not architectural. The format is defined in PPR
+ * Family 19h Model 01h, Rev B1 processor. This format represents the actual
+ * entry in the RMP table memory. The bitfield definitions are used for machines
+ * without the RMPREAD instruction (Zen3 and Zen4), otherwise the "hi" and "lo"
+ * fields are only used for dumping the raw data.
+ */
+struct rmpentry_raw {
union {
struct {
u64 assigned : 1,
@@ -62,7 +81,7 @@ struct rmpentry {
#define PFN_PMD_MASK GENMASK_ULL(63, PMD_SHIFT - PAGE_SHIFT)
static u64 probed_rmp_base, probed_rmp_size;
-static struct rmpentry *rmptable __ro_after_init;
+static struct rmpentry_raw *rmptable __ro_after_init;
static u64 rmptable_max_pfn __ro_after_init;
static LIST_HEAD(snp_leaked_pages_list);
@@ -249,8 +268,8 @@ static int __init snp_rmptable_init(void)
rmptable_start += RMPTABLE_CPU_BOOKKEEPING_SZ;
rmptable_size = probed_rmp_size - RMPTABLE_CPU_BOOKKEEPING_SZ;
- rmptable = (struct rmpentry *)rmptable_start;
- rmptable_max_pfn = rmptable_size / sizeof(struct rmpentry) - 1;
+ rmptable = (struct rmpentry_raw *)rmptable_start;
+ rmptable_max_pfn = rmptable_size / sizeof(struct rmpentry_raw) - 1;
cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "x86/rmptable_init:online", __snp_enable, NULL);
@@ -272,48 +291,77 @@ static int __init snp_rmptable_init(void)
*/
device_initcall(snp_rmptable_init);
-static struct rmpentry *get_rmpentry(u64 pfn)
+static struct rmpentry_raw *get_raw_rmpentry(u64 pfn)
{
- if (WARN_ON_ONCE(pfn > rmptable_max_pfn))
- return ERR_PTR(-EFAULT);
-
- return &rmptable[pfn];
-}
-
-static struct rmpentry *__snp_lookup_rmpentry(u64 pfn, int *level)
-{
- struct rmpentry *large_entry, *entry;
-
- if (!cc_platform_has(CC_ATTR_HOST_SEV_SNP))
+ if (!rmptable)
return ERR_PTR(-ENODEV);
- entry = get_rmpentry(pfn);
- if (IS_ERR(entry))
- return entry;
+ if (unlikely(pfn > rmptable_max_pfn))
+ return ERR_PTR(-EFAULT);
+
+ return rmptable + pfn;
+}
+
+static int get_rmpentry(u64 pfn, struct rmpentry *e)
+{
+ struct rmpentry_raw *e_raw;
+
+ e_raw = get_raw_rmpentry(pfn);
+ if (IS_ERR(e_raw))
+ return PTR_ERR(e_raw);
+
+ /*
+ * Map the raw RMP table entry onto the RMPREAD output format.
+ * The 2MB region status indicator (hpage_region_status field) is not
+ * calculated, since the overhead could be significant and the field
+ * is not used.
+ */
+ memset(e, 0, sizeof(*e));
+ e->gpa = e_raw->gpa << PAGE_SHIFT;
+ e->asid = e_raw->asid;
+ e->assigned = e_raw->assigned;
+ e->pagesize = e_raw->pagesize;
+ e->immutable = e_raw->immutable;
+
+ return 0;
+}
+
+static int __snp_lookup_rmpentry(u64 pfn, struct rmpentry *e, int *level)
+{
+ struct rmpentry e_large;
+ int ret;
+
+ if (!cc_platform_has(CC_ATTR_HOST_SEV_SNP))
+ return -ENODEV;
+
+ ret = get_rmpentry(pfn, e);
+ if (ret)
+ return ret;
/*
* Find the authoritative RMP entry for a PFN. This can be either a 4K
* RMP entry or a special large RMP entry that is authoritative for a
* whole 2M area.
*/
- large_entry = get_rmpentry(pfn & PFN_PMD_MASK);
- if (IS_ERR(large_entry))
- return large_entry;
+ ret = get_rmpentry(pfn & PFN_PMD_MASK, &e_large);
+ if (ret)
+ return ret;
- *level = RMP_TO_PG_LEVEL(large_entry->pagesize);
+ *level = RMP_TO_PG_LEVEL(e_large.pagesize);
- return entry;
+ return 0;
}
int snp_lookup_rmpentry(u64 pfn, bool *assigned, int *level)
{
- struct rmpentry *e;
+ struct rmpentry e;
+ int ret;
- e = __snp_lookup_rmpentry(pfn, level);
- if (IS_ERR(e))
- return PTR_ERR(e);
+ ret = __snp_lookup_rmpentry(pfn, &e, level);
+ if (ret)
+ return ret;
- *assigned = !!e->assigned;
+ *assigned = !!e.assigned;
return 0;
}
EXPORT_SYMBOL_GPL(snp_lookup_rmpentry);
@@ -326,20 +374,28 @@ EXPORT_SYMBOL_GPL(snp_lookup_rmpentry);
*/
static void dump_rmpentry(u64 pfn)
{
+ struct rmpentry_raw *e_raw;
u64 pfn_i, pfn_end;
- struct rmpentry *e;
- int level;
+ struct rmpentry e;
+ int level, ret;
- e = __snp_lookup_rmpentry(pfn, &level);
- if (IS_ERR(e)) {
- pr_err("Failed to read RMP entry for PFN 0x%llx, error %ld\n",
- pfn, PTR_ERR(e));
+ ret = __snp_lookup_rmpentry(pfn, &e, &level);
+ if (ret) {
+ pr_err("Failed to read RMP entry for PFN 0x%llx, error %d\n",
+ pfn, ret);
return;
}
- if (e->assigned) {
+ if (e.assigned) {
+ e_raw = get_raw_rmpentry(pfn);
+ if (IS_ERR(e_raw)) {
+ pr_err("Failed to read RMP contents for PFN 0x%llx, error %ld\n",
+ pfn, PTR_ERR(e_raw));
+ return;
+ }
+
pr_info("PFN 0x%llx, RMP entry: [0x%016llx - 0x%016llx]\n",
- pfn, e->lo, e->hi);
+ pfn, e_raw->lo, e_raw->hi);
return;
}
@@ -358,16 +414,16 @@ static void dump_rmpentry(u64 pfn)
pfn, pfn_i, pfn_end);
while (pfn_i < pfn_end) {
- e = __snp_lookup_rmpentry(pfn_i, &level);
- if (IS_ERR(e)) {
- pr_err("Error %ld reading RMP entry for PFN 0x%llx\n",
- PTR_ERR(e), pfn_i);
+ e_raw = get_raw_rmpentry(pfn_i);
+ if (IS_ERR(e_raw)) {
+ pr_err("Error %ld reading RMP contents for PFN 0x%llx\n",
+ PTR_ERR(e_raw), pfn_i);
pfn_i++;
continue;
}
- if (e->lo || e->hi)
- pr_info("PFN: 0x%llx, [0x%016llx - 0x%016llx]\n", pfn_i, e->lo, e->hi);
+ if (e_raw->lo || e_raw->hi)
+ pr_info("PFN: 0x%llx, [0x%016llx - 0x%016llx]\n", pfn_i, e_raw->lo, e_raw->hi);
pfn_i++;
}
}
--
2.46.2
On Mon, Dec 02, 2024 at 02:50:46PM -0600, Tom Lendacky wrote: > +static int __snp_lookup_rmpentry(u64 pfn, struct rmpentry *e, int *level) > +{ > + struct rmpentry e_large; > + int ret; > + > + if (!cc_platform_has(CC_ATTR_HOST_SEV_SNP)) Btw, just a side note: this is AMD-specific and x86 code so we probably should use: if (!cpu_feature_enabled(X86_FEATURE_SEV_SNP)) For another series. > + return -ENODEV; > + > + ret = get_rmpentry(pfn, e); > + if (ret) > + return ret; > > /* > * Find the authoritative RMP entry for a PFN. This can be either a 4K > * RMP entry or a special large RMP entry that is authoritative for a > * whole 2M area. > */ > - large_entry = get_rmpentry(pfn & PFN_PMD_MASK); > - if (IS_ERR(large_entry)) > - return large_entry; > + ret = get_rmpentry(pfn & PFN_PMD_MASK, &e_large); > + if (ret) > + return ret; > > - *level = RMP_TO_PG_LEVEL(large_entry->pagesize); > + *level = RMP_TO_PG_LEVEL(e_large.pagesize); > > - return entry; > + return 0; > } ... > static void dump_rmpentry(u64 pfn) > { > + struct rmpentry_raw *e_raw; > u64 pfn_i, pfn_end; > - struct rmpentry *e; > - int level; > + struct rmpentry e; > + int level, ret; > > - e = __snp_lookup_rmpentry(pfn, &level); > - if (IS_ERR(e)) { > - pr_err("Failed to read RMP entry for PFN 0x%llx, error %ld\n", > - pfn, PTR_ERR(e)); > + ret = __snp_lookup_rmpentry(pfn, &e, &level); > + if (ret) { > + pr_err("Failed to read RMP entry for PFN 0x%llx, error %d\n", > + pfn, ret); > return; > } > > - if (e->assigned) { > + if (e.assigned) { > + e_raw = get_raw_rmpentry(pfn); > + if (IS_ERR(e_raw)) { > + pr_err("Failed to read RMP contents for PFN 0x%llx, error %ld\n", > + pfn, PTR_ERR(e_raw)); > + return; > + } > + > pr_info("PFN 0x%llx, RMP entry: [0x%016llx - 0x%016llx]\n", > - pfn, e->lo, e->hi); > + pfn, e_raw->lo, e_raw->hi); > return; > } Do I see it correctly that we don't really need to call that get_raw_rmpentry() again for that @pfn because __snp_lookup_rmpentry() returned the whole thing in @e 
already? IOW: diff --git a/arch/x86/virt/svm/sev.c b/arch/x86/virt/svm/sev.c index cf64e9384ea0..2e1833426b08 100644 --- a/arch/x86/virt/svm/sev.c +++ b/arch/x86/virt/svm/sev.c @@ -387,15 +387,8 @@ static void dump_rmpentry(u64 pfn) } if (e.assigned) { - e_raw = get_raw_rmpentry(pfn); - if (IS_ERR(e_raw)) { - pr_err("Failed to read RMP contents for PFN 0x%llx, error %ld\n", - pfn, PTR_ERR(e_raw)); - return; - } - - pr_info("PFN 0x%llx, RMP entry: [0x%016llx - 0x%016llx]\n", - pfn, e_raw->lo, e_raw->hi); + pr_info("PFN 0x%llx, RMP entry: [ASID: 0x%x, pagesize: 0x%x, immutable: %d]\n", + e.gpa, e.asid, e.pagesize, e.immutable); return; } -- Regards/Gruss, Boris. https://people.kernel.org/tglx/notes-about-netiquette
On 12/3/24 10:01, Borislav Petkov wrote: > On Mon, Dec 02, 2024 at 02:50:46PM -0600, Tom Lendacky wrote: >> +static int __snp_lookup_rmpentry(u64 pfn, struct rmpentry *e, int *level) >> +{ >> + struct rmpentry e_large; >> + int ret; >> + >> + if (!cc_platform_has(CC_ATTR_HOST_SEV_SNP)) > > Btw, just a side note: this is AMD-specific and x86 code so we probably should > use: > > if (!cpu_feature_enabled(X86_FEATURE_SEV_SNP)) > > For another series. > >> + return -ENODEV; >> + >> + ret = get_rmpentry(pfn, e); >> + if (ret) >> + return ret; >> >> /* >> * Find the authoritative RMP entry for a PFN. This can be either a 4K >> * RMP entry or a special large RMP entry that is authoritative for a >> * whole 2M area. >> */ >> - large_entry = get_rmpentry(pfn & PFN_PMD_MASK); >> - if (IS_ERR(large_entry)) >> - return large_entry; >> + ret = get_rmpentry(pfn & PFN_PMD_MASK, &e_large); >> + if (ret) >> + return ret; >> >> - *level = RMP_TO_PG_LEVEL(large_entry->pagesize); >> + *level = RMP_TO_PG_LEVEL(e_large.pagesize); >> >> - return entry; >> + return 0; >> } > > ... 
> >> static void dump_rmpentry(u64 pfn) >> { >> + struct rmpentry_raw *e_raw; >> u64 pfn_i, pfn_end; >> - struct rmpentry *e; >> - int level; >> + struct rmpentry e; >> + int level, ret; >> >> - e = __snp_lookup_rmpentry(pfn, &level); >> - if (IS_ERR(e)) { >> - pr_err("Failed to read RMP entry for PFN 0x%llx, error %ld\n", >> - pfn, PTR_ERR(e)); >> + ret = __snp_lookup_rmpentry(pfn, &e, &level); >> + if (ret) { >> + pr_err("Failed to read RMP entry for PFN 0x%llx, error %d\n", >> + pfn, ret); >> return; >> } >> >> - if (e->assigned) { >> + if (e.assigned) { >> + e_raw = get_raw_rmpentry(pfn); >> + if (IS_ERR(e_raw)) { >> + pr_err("Failed to read RMP contents for PFN 0x%llx, error %ld\n", >> + pfn, PTR_ERR(e_raw)); >> + return; >> + } >> + >> pr_info("PFN 0x%llx, RMP entry: [0x%016llx - 0x%016llx]\n", >> - pfn, e->lo, e->hi); >> + pfn, e_raw->lo, e_raw->hi); >> return; >> } > > Do I see it correctly that we don't really need to call that > get_raw_rmpentry() again for that @pfn because __snp_lookup_rmpentry() > returned the whole thing in @e already? The idea is to dump the actual RMP contents that exist in memory. The @e value only contains what the RMPREAD instruction chooses to expose. Thanks, Tom > > IOW: > > diff --git a/arch/x86/virt/svm/sev.c b/arch/x86/virt/svm/sev.c > index cf64e9384ea0..2e1833426b08 100644 > --- a/arch/x86/virt/svm/sev.c > +++ b/arch/x86/virt/svm/sev.c > @@ -387,15 +387,8 @@ static void dump_rmpentry(u64 pfn) > } > > if (e.assigned) { > - e_raw = get_raw_rmpentry(pfn); > - if (IS_ERR(e_raw)) { > - pr_err("Failed to read RMP contents for PFN 0x%llx, error %ld\n", > - pfn, PTR_ERR(e_raw)); > - return; > - } > - > - pr_info("PFN 0x%llx, RMP entry: [0x%016llx - 0x%016llx]\n", > - pfn, e_raw->lo, e_raw->hi); > + pr_info("PFN 0x%llx, RMP entry: [ASID: 0x%x, pagesize: 0x%x, immutable: %d]\n", > + e.gpa, e.asid, e.pagesize, e.immutable); > return; > } >
On Tue, Dec 03, 2024 at 10:08:59AM -0600, Tom Lendacky wrote:
> The idea is to dump the actual RMP contents that exist in memory. The @e
> value only contains what the RMPREAD instruction chooses to expose.

Aha, ok. Oh well, get_raw_rmpentry() is fast enough so we can call it again.

Thx.

--
Regards/Gruss,
Boris.

https://people.kernel.org/tglx/notes-about-netiquette
© 2016 - 2024 Red Hat, Inc.