Introduces the function is_breg_access_indirect to determine whether a
memory access involving a DW_OP_breg* operation refers to the variable's
value directly or requires dereferencing the variable's type as a
pointer based on the DWARF expression. Previously, all breg based
accesses were assumed to directly access the variable's value
(is_pointer = false).
The is_breg_access_indirect function handles three cases:
1. Base register + offset only: (e.g., DW_OP_breg7 RSP+88) The
calculated address is the location of the variable. The access is
direct, so no type dereference is needed. Returns false.
2. Base register + offset, followed by other operations ending in
DW_OP_stack_value, including DW_OP_deref: (e.g., DW_OP_breg*,
DW_OP_deref, DW_OP_stack_value) The DWARF expression computes the
variable's value, but that value requires a dereference. The memory
access is fetching that value, so no type dereference is needed.
Returns false.
3. Base register + offset, followed only by DW_OP_stack_value: (e.g.,
DW_OP_breg13 R13+256, DW_OP_stack_value) This indicates the value at
the base + offset is the variable's value. Since this value is being
used as an address in the memory access, the variable's type is
treated as a pointer and requires a type dereference. Returns true.
The is_pointer argument passed to match_var_offset is now set by
is_breg_access_indirect for breg accesses.
There are more complex expressions that include multiple operations and
may require additional handling, such as DW_OP_deref without a
DW_OP_stack_value, or including multiple base registers. They are less
common in the Linux kernel dwarf and are skipped in check_allowed_ops.
Signed-off-by: Zecheng Li <zecheng@google.com>
---
tools/perf/util/dwarf-aux.c | 38 ++++++++++++++++++++++++++++++++-----
1 file changed, 33 insertions(+), 5 deletions(-)
diff --git a/tools/perf/util/dwarf-aux.c b/tools/perf/util/dwarf-aux.c
index 920054425578..449bc9ad7aff 100644
--- a/tools/perf/util/dwarf-aux.c
+++ b/tools/perf/util/dwarf-aux.c
@@ -1423,6 +1423,34 @@ static bool match_var_offset(Dwarf_Die *die_mem, struct find_var_data *data,
return true;
}
+/**
+ * is_breg_access_indirect - Check if breg based access implies type
+ * dereference
+ * @ops: DWARF operations array
+ * @nops: Number of operations in @ops
+ *
+ * Returns true if the DWARF expression evaluates to the variable's
+ * value, so the memory access on that register needs type dereference.
+ * Returns false if the expression evaluates to the variable's address.
+ * This is called after check_allowed_ops.
+ */
+static bool is_breg_access_indirect(Dwarf_Op *ops, size_t nops)
+{
+ /* only the base register */
+ if (nops == 1)
+ return false;
+
+ if (nops == 2 && ops[1].atom == DW_OP_stack_value)
+ return true;
+
+ if (nops == 3 && (ops[1].atom == DW_OP_deref ||
+ ops[1].atom == DW_OP_deref_size) &&
+ ops[2].atom == DW_OP_stack_value)
+ return false;
+ /* unreachable, OP not supported */
+ return false;
+}
+
/* Only checks direct child DIEs in the given scope. */
static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
{
@@ -1451,7 +1479,7 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
if (data->is_fbreg && ops->atom == DW_OP_fbreg &&
check_allowed_ops(ops, nops) &&
match_var_offset(die_mem, data, data->offset, ops->number,
- /*is_pointer=*/false))
+ is_breg_access_indirect(ops, nops)))
return DIE_FIND_CB_END;
/* Only match with a simple case */
@@ -1463,11 +1491,11 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
/*is_pointer=*/true))
return DIE_FIND_CB_END;
- /* Local variables accessed by a register + offset */
+ /* variables accessed by a register + offset */
if (ops->atom == (DW_OP_breg0 + data->reg) &&
check_allowed_ops(ops, nops) &&
match_var_offset(die_mem, data, data->offset, ops->number,
- /*is_pointer=*/false))
+ is_breg_access_indirect(ops, nops)))
return DIE_FIND_CB_END;
} else {
/* pointer variables saved in a register 32 or above */
@@ -1477,11 +1505,11 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
/*is_pointer=*/true))
return DIE_FIND_CB_END;
- /* Local variables accessed by a register + offset */
+ /* variables accessed by a register + offset */
if (ops->atom == DW_OP_bregx && data->reg == ops->number &&
check_allowed_ops(ops, nops) &&
match_var_offset(die_mem, data, data->offset, ops->number2,
- /*is_poitner=*/false))
+ is_breg_access_indirect(ops, nops)))
return DIE_FIND_CB_END;
}
}
--
2.51.0.261.g7ce5a0a67e-goog
On Mon, Aug 25, 2025 at 07:54:04PM +0000, Zecheng Li wrote:
> Introduces the function is_breg_access_indirect to determine whether a
> memory access involving a DW_OP_breg* operation refers to the variable's
> value directly or requires dereferencing the variable's type as a
> pointer based on the DWARF expression. Previously, all breg based
> accesses were assumed to directly access the variable's value
> (is_pointer = false).
>
> The is_breg_access_indirect function handles three cases:
>
> 1. Base register + offset only: (e.g., DW_OP_breg7 RSP+88) The
> calculated address is the location of the variable. The access is
> direct, so no type dereference is needed. Returns false.
I'm afraid there may be cases where the base register doesn't point to
the stack. In that case it may return true, right?
I think struct find_var_data already has 'is_fbreg' field. Maybe you
can add an 'is_stack' or 'is_stack_reg' field for the target. Currently we
hardcode X86_REG_SP but it should be arch-dependent.
>
> 2. Base register + offset, followed by other operations ending in
> DW_OP_stack_value, including DW_OP_deref: (e.g., DW_OP_breg*,
> DW_OP_deref, DW_OP_stack_value) The DWARF expression computes the
> variable's value, but that value requires a dereference. The memory
> access is fetching that value, so no type dereference is needed.
> Returns false.
>
> 3. Base register + offset, followed only by DW_OP_stack_value: (e.g.,
> DW_OP_breg13 R13+256, DW_OP_stack_value) This indicates the value at
> the base + offset is the variable's value. Since this value is being
> used as an address in the memory access, the variable's type is
> treated as a pointer and requires a type dereference. Returns true.
>
> The is_pointer argument passed to match_var_offset is now set by
> is_breg_access_indirect for breg accesses.
>
> There are more complex expressions that includes multiple operations and
> may require additional handling, such as DW_OP_deref without a
> DW_OP_stack_value, or including multiple base registers. They are less
> common in the Linux kernel dwarf and are skipped in check_allowed_ops.
>
> Signed-off-by: Zecheng Li <zecheng@google.com>
> ---
> tools/perf/util/dwarf-aux.c | 38 ++++++++++++++++++++++++++++++++-----
> 1 file changed, 33 insertions(+), 5 deletions(-)
>
> diff --git a/tools/perf/util/dwarf-aux.c b/tools/perf/util/dwarf-aux.c
> index 920054425578..449bc9ad7aff 100644
> --- a/tools/perf/util/dwarf-aux.c
> +++ b/tools/perf/util/dwarf-aux.c
> @@ -1423,6 +1423,34 @@ static bool match_var_offset(Dwarf_Die *die_mem, struct find_var_data *data,
> return true;
> }
>
> +/**
> + * is_breg_access_indirect - Check if breg based access implies type
> + * dereference
> + * @ops: DWARF operations array
> + * @nops: Number of operations in @ops
> + *
> + * Returns true if the DWARF expression evaluates to the variable's
> + * value, so the memory access on that register needs type dereference.
> + * Returns false if the expression evaluates to the variable's address.
> + * This is called after check_allowed_ops.
> + */
> +static bool is_breg_access_indirect(Dwarf_Op *ops, size_t nops)
> +{
> + /* only the base register */
> + if (nops == 1)
> + return false;
Then it could be like below:
if (nops == 1) {
int reg = reg_from_dwarf_op(ops);
return !(reg == DWARF_REG_FB || data->is_fbreg || reg == data->is_stack);
}
Thanks,
Namhyung
> +
> + if (nops == 2 && ops[1].atom == DW_OP_stack_value)
> + return true;
> +
> + if (nops == 3 && (ops[1].atom == DW_OP_deref ||
> + ops[1].atom == DW_OP_deref_size) &&
> + ops[2].atom == DW_OP_stack_value)
> + return false;
> + /* unreachable, OP not supported */
> + return false;
> +}
> +
> /* Only checks direct child DIEs in the given scope. */
> static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> {
> @@ -1451,7 +1479,7 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> if (data->is_fbreg && ops->atom == DW_OP_fbreg &&
> check_allowed_ops(ops, nops) &&
> match_var_offset(die_mem, data, data->offset, ops->number,
> - /*is_pointer=*/false))
> + is_breg_access_indirect(ops, nops)))
> return DIE_FIND_CB_END;
>
> /* Only match with a simple case */
> @@ -1463,11 +1491,11 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> /*is_pointer=*/true))
> return DIE_FIND_CB_END;
>
> - /* Local variables accessed by a register + offset */
> + /* variables accessed by a register + offset */
> if (ops->atom == (DW_OP_breg0 + data->reg) &&
> check_allowed_ops(ops, nops) &&
> match_var_offset(die_mem, data, data->offset, ops->number,
> - /*is_pointer=*/false))
> + is_breg_access_indirect(ops, nops)))
> return DIE_FIND_CB_END;
> } else {
> /* pointer variables saved in a register 32 or above */
> @@ -1477,11 +1505,11 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> /*is_pointer=*/true))
> return DIE_FIND_CB_END;
>
> - /* Local variables accessed by a register + offset */
> + /* variables accessed by a register + offset */
> if (ops->atom == DW_OP_bregx && data->reg == ops->number &&
> check_allowed_ops(ops, nops) &&
> match_var_offset(die_mem, data, data->offset, ops->number2,
> - /*is_poitner=*/false))
> + is_breg_access_indirect(ops, nops)))
> return DIE_FIND_CB_END;
> }
> }
> --
> 2.51.0.261.g7ce5a0a67e-goog
>
On Thu, Aug 28, 2025 at 3:19 AM Namhyung Kim <namhyung@kernel.org> wrote:
>
> On Mon, Aug 25, 2025 at 07:54:04PM +0000, Zecheng Li wrote:
> > Introduces the function is_breg_access_indirect to determine whether a
> > memory access involving a DW_OP_breg* operation refers to the variable's
> > value directly or requires dereferencing the variable's type as a
> > pointer based on the DWARF expression. Previously, all breg based
> > accesses were assumed to directly access the variable's value
> > (is_pointer = false).
> >
> > The is_breg_access_indirect function handles three cases:
> >
> > 1. Base register + offset only: (e.g., DW_OP_breg7 RSP+88) The
> > calculated address is the location of the variable. The access is
> > direct, so no type dereference is needed. Returns false.
>
> I'm afraid there may be cases that the base register doesn't point to
> the stack. In that case it may return true, right?
Hi Namhyung,
In this case, the DWARF specification for a DW_OP_breg* operation is
to always calculate a memory address. So, even if the base register
isn't the stack pointer, the expression still resolves to the
variable's location, meaning the access is direct (is_pointer =
false).
> I think struct find_var_data already has 'is_fbreg' field. Maybe you
> can add 'is_stack' or 'is_stack_reg' field if the target. Currently we
> hardcoded X86_REG_SP but it should be arch-dependent.
Therefore we don't need to check if the register is a stack or frame base.
> >
> > 2. Base register + offset, followed by other operations ending in
> > DW_OP_stack_value, including DW_OP_deref: (e.g., DW_OP_breg*,
> > DW_OP_deref, DW_OP_stack_value) The DWARF expression computes the
> > variable's value, but that value requires a dereference. The memory
> > access is fetching that value, so no type dereference is needed.
> > Returns false.
> >
> > 3. Base register + offset, followed only by DW_OP_stack_value: (e.g.,
> > DW_OP_breg13 R13+256, DW_OP_stack_value) This indicates the value at
> > the base + offset is the variable's value. Since this value is being
> > used as an address in the memory access, the variable's type is
> > treated as a pointer and requires a type dereference. Returns true.
> >
> > The is_pointer argument passed to match_var_offset is now set by
> > is_breg_access_indirect for breg accesses.
> >
> > There are more complex expressions that includes multiple operations and
> > may require additional handling, such as DW_OP_deref without a
> > DW_OP_stack_value, or including multiple base registers. They are less
> > common in the Linux kernel dwarf and are skipped in check_allowed_ops.
> >
> > Signed-off-by: Zecheng Li <zecheng@google.com>
> > ---
> > tools/perf/util/dwarf-aux.c | 38 ++++++++++++++++++++++++++++++++-----
> > 1 file changed, 33 insertions(+), 5 deletions(-)
> >
> > diff --git a/tools/perf/util/dwarf-aux.c b/tools/perf/util/dwarf-aux.c
> > index 920054425578..449bc9ad7aff 100644
> > --- a/tools/perf/util/dwarf-aux.c
> > +++ b/tools/perf/util/dwarf-aux.c
> > @@ -1423,6 +1423,34 @@ static bool match_var_offset(Dwarf_Die *die_mem, struct find_var_data *data,
> > return true;
> > }
> >
> > +/**
> > + * is_breg_access_indirect - Check if breg based access implies type
> > + * dereference
> > + * @ops: DWARF operations array
> > + * @nops: Number of operations in @ops
> > + *
> > + * Returns true if the DWARF expression evaluates to the variable's
> > + * value, so the memory access on that register needs type dereference.
> > + * Returns false if the expression evaluates to the variable's address.
> > + * This is called after check_allowed_ops.
> > + */
> > +static bool is_breg_access_indirect(Dwarf_Op *ops, size_t nops)
> > +{
> > + /* only the base register */
> > + if (nops == 1)
> > + return false;
>
> Then it could be like below:
>
> if (nops == 1) {
> int reg = reg_from_dwarf_op(ops);
> return !(reg == DWARF_REG_FB || data->is_fbreg || reg == data->is_stack);
> }
>
> Thanks,
> Namhyung
>
> > +
> > + if (nops == 2 && ops[1].atom == DW_OP_stack_value)
> > + return true;
> > +
> > + if (nops == 3 && (ops[1].atom == DW_OP_deref ||
> > + ops[1].atom == DW_OP_deref_size) &&
> > + ops[2].atom == DW_OP_stack_value)
> > + return false;
> > + /* unreachable, OP not supported */
> > + return false;
> > +}
> > +
> > /* Only checks direct child DIEs in the given scope. */
> > static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> > {
> > @@ -1451,7 +1479,7 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> > if (data->is_fbreg && ops->atom == DW_OP_fbreg &&
> > check_allowed_ops(ops, nops) &&
> > match_var_offset(die_mem, data, data->offset, ops->number,
> > - /*is_pointer=*/false))
> > + is_breg_access_indirect(ops, nops)))
> > return DIE_FIND_CB_END;
> >
> > /* Only match with a simple case */
> > @@ -1463,11 +1491,11 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> > /*is_pointer=*/true))
> > return DIE_FIND_CB_END;
> >
> > - /* Local variables accessed by a register + offset */
> > + /* variables accessed by a register + offset */
> > if (ops->atom == (DW_OP_breg0 + data->reg) &&
> > check_allowed_ops(ops, nops) &&
> > match_var_offset(die_mem, data, data->offset, ops->number,
> > - /*is_pointer=*/false))
> > + is_breg_access_indirect(ops, nops)))
> > return DIE_FIND_CB_END;
> > } else {
> > /* pointer variables saved in a register 32 or above */
> > @@ -1477,11 +1505,11 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> > /*is_pointer=*/true))
> > return DIE_FIND_CB_END;
> >
> > - /* Local variables accessed by a register + offset */
> > + /* variables accessed by a register + offset */
> > if (ops->atom == DW_OP_bregx && data->reg == ops->number &&
> > check_allowed_ops(ops, nops) &&
> > match_var_offset(die_mem, data, data->offset, ops->number2,
> > - /*is_poitner=*/false))
> > + is_breg_access_indirect(ops, nops)))
> > return DIE_FIND_CB_END;
> > }
> > }
> > --
> > 2.51.0.261.g7ce5a0a67e-goog
> >
Hello,
On Thu, Aug 28, 2025 at 02:36:32PM -0400, Zecheng Li wrote:
> On Thu, Aug 28, 2025 at 3:19 AM Namhyung Kim <namhyung@kernel.org> wrote:
> >
> > On Mon, Aug 25, 2025 at 07:54:04PM +0000, Zecheng Li wrote:
> > > Introduces the function is_breg_access_indirect to determine whether a
> > > memory access involving a DW_OP_breg* operation refers to the variable's
> > > value directly or requires dereferencing the variable's type as a
> > > pointer based on the DWARF expression. Previously, all breg based
> > > accesses were assumed to directly access the variable's value
> > > (is_pointer = false).
> > >
> > > The is_breg_access_indirect function handles three cases:
> > >
> > > 1. Base register + offset only: (e.g., DW_OP_breg7 RSP+88) The
> > > calculated address is the location of the variable. The access is
> > > direct, so no type dereference is needed. Returns false.
> >
> > I'm afraid there may be cases that the base register doesn't point to
> > the stack. In that case it may return true, right?
>
> Hi Namhyung,
>
> In this case, the DWARF specification for a DW_OP_breg* operation is
> to always calculate a memory address. So, even if the base register
> isn't the stack pointer, the expression still resolves to the
> variable's location, meaning the access is direct (is_pointer =
> false).
I've re-read the DWARF spec and I think you're right. :)
>
> > I think struct find_var_data already has 'is_fbreg' field. Maybe you
> > can add 'is_stack' or 'is_stack_reg' field if the target. Currently we
> > hardcoded X86_REG_SP but it should be arch-dependent.
>
> Therefore we don't need to check if the register is a stack or frame base.
Fair enough.
>
> > >
> > > 2. Base register + offset, followed by other operations ending in
> > > DW_OP_stack_value, including DW_OP_deref: (e.g., DW_OP_breg*,
> > > DW_OP_deref, DW_OP_stack_value) The DWARF expression computes the
> > > variable's value, but that value requires a dereference. The memory
> > > access is fetching that value, so no type dereference is needed.
> > > Returns false.
> > >
> > > 3. Base register + offset, followed only by DW_OP_stack_value: (e.g.,
> > > DW_OP_breg13 R13+256, DW_OP_stack_value) This indicates the value at
> > > the base + offset is the variable's value. Since this value is being
> > > used as an address in the memory access, the variable's type is
> > > treated as a pointer and requires a type dereference. Returns true.
> > >
> > > The is_pointer argument passed to match_var_offset is now set by
> > > is_breg_access_indirect for breg accesses.
> > >
> > > There are more complex expressions that includes multiple operations and
> > > may require additional handling, such as DW_OP_deref without a
> > > DW_OP_stack_value, or including multiple base registers. They are less
> > > common in the Linux kernel dwarf and are skipped in check_allowed_ops.
> > >
> > > Signed-off-by: Zecheng Li <zecheng@google.com>
This also improved the data quality!
Reviewed-by: Namhyung Kim <namhyung@kernel.org>
Thanks,
Namhyung
> > > ---
> > > tools/perf/util/dwarf-aux.c | 38 ++++++++++++++++++++++++++++++++-----
> > > 1 file changed, 33 insertions(+), 5 deletions(-)
> > >
> > > diff --git a/tools/perf/util/dwarf-aux.c b/tools/perf/util/dwarf-aux.c
> > > index 920054425578..449bc9ad7aff 100644
> > > --- a/tools/perf/util/dwarf-aux.c
> > > +++ b/tools/perf/util/dwarf-aux.c
> > > @@ -1423,6 +1423,34 @@ static bool match_var_offset(Dwarf_Die *die_mem, struct find_var_data *data,
> > > return true;
> > > }
> > >
> > > +/**
> > > + * is_breg_access_indirect - Check if breg based access implies type
> > > + * dereference
> > > + * @ops: DWARF operations array
> > > + * @nops: Number of operations in @ops
> > > + *
> > > + * Returns true if the DWARF expression evaluates to the variable's
> > > + * value, so the memory access on that register needs type dereference.
> > > + * Returns false if the expression evaluates to the variable's address.
> > > + * This is called after check_allowed_ops.
> > > + */
> > > +static bool is_breg_access_indirect(Dwarf_Op *ops, size_t nops)
> > > +{
> > > + /* only the base register */
> > > + if (nops == 1)
> > > + return false;
> >
> > Then it could be like below:
> >
> > if (nops == 1) {
> > int reg = reg_from_dwarf_op(ops);
> > return !(reg == DWARF_REG_FB || data->is_fbreg || reg == data->is_stack);
> > }
> >
> > Thanks,
> > Namhyung
> >
> > > +
> > > + if (nops == 2 && ops[1].atom == DW_OP_stack_value)
> > > + return true;
> > > +
> > > + if (nops == 3 && (ops[1].atom == DW_OP_deref ||
> > > + ops[1].atom == DW_OP_deref_size) &&
> > > + ops[2].atom == DW_OP_stack_value)
> > > + return false;
> > > + /* unreachable, OP not supported */
> > > + return false;
> > > +}
> > > +
> > > /* Only checks direct child DIEs in the given scope. */
> > > static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> > > {
> > > @@ -1451,7 +1479,7 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> > > if (data->is_fbreg && ops->atom == DW_OP_fbreg &&
> > > check_allowed_ops(ops, nops) &&
> > > match_var_offset(die_mem, data, data->offset, ops->number,
> > > - /*is_pointer=*/false))
> > > + is_breg_access_indirect(ops, nops)))
> > > return DIE_FIND_CB_END;
> > >
> > > /* Only match with a simple case */
> > > @@ -1463,11 +1491,11 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> > > /*is_pointer=*/true))
> > > return DIE_FIND_CB_END;
> > >
> > > - /* Local variables accessed by a register + offset */
> > > + /* variables accessed by a register + offset */
> > > if (ops->atom == (DW_OP_breg0 + data->reg) &&
> > > check_allowed_ops(ops, nops) &&
> > > match_var_offset(die_mem, data, data->offset, ops->number,
> > > - /*is_pointer=*/false))
> > > + is_breg_access_indirect(ops, nops)))
> > > return DIE_FIND_CB_END;
> > > } else {
> > > /* pointer variables saved in a register 32 or above */
> > > @@ -1477,11 +1505,11 @@ static int __die_find_var_reg_cb(Dwarf_Die *die_mem, void *arg)
> > > /*is_pointer=*/true))
> > > return DIE_FIND_CB_END;
> > >
> > > - /* Local variables accessed by a register + offset */
> > > + /* variables accessed by a register + offset */
> > > if (ops->atom == DW_OP_bregx && data->reg == ops->number &&
> > > check_allowed_ops(ops, nops) &&
> > > match_var_offset(die_mem, data, data->offset, ops->number2,
> > > - /*is_poitner=*/false))
> > > + is_breg_access_indirect(ops, nops)))
> > > return DIE_FIND_CB_END;
> > > }
> > > }
> > > --
> > > 2.51.0.261.g7ce5a0a67e-goog
> > >
© 2016 - 2026 Red Hat, Inc.