This patch provides a new feature (i.e., "tunsrc") for the tunnel (i.e.,
"encap") mode of ioam6. Just like seg6 already does, except it is
attached to a route. The "tunsrc" is optional: when not provided (by
default), the automatic resolution is applied. Using "tunsrc" when
possible has a benefit: performance.
Signed-off-by: Justin Iurman <justin.iurman@uliege.be>
---
include/uapi/linux/ioam6_iptunnel.h | 7 +++++
net/ipv6/ioam6_iptunnel.c | 48 ++++++++++++++++++++++++++---
2 files changed, 51 insertions(+), 4 deletions(-)
diff --git a/include/uapi/linux/ioam6_iptunnel.h b/include/uapi/linux/ioam6_iptunnel.h
index 38f6a8fdfd34..6cdbd0da7ad8 100644
--- a/include/uapi/linux/ioam6_iptunnel.h
+++ b/include/uapi/linux/ioam6_iptunnel.h
@@ -50,6 +50,13 @@ enum {
IOAM6_IPTUNNEL_FREQ_K, /* u32 */
IOAM6_IPTUNNEL_FREQ_N, /* u32 */
+ /* Tunnel src address.
+ * For encap,auto modes.
+ * Optional (automatic if
+ * not provided).
+ */
+ IOAM6_IPTUNNEL_SRC, /* struct in6_addr */
+
__IOAM6_IPTUNNEL_MAX,
};
diff --git a/net/ipv6/ioam6_iptunnel.c b/net/ipv6/ioam6_iptunnel.c
index cd2522f04edf..e0e73faf9969 100644
--- a/net/ipv6/ioam6_iptunnel.c
+++ b/net/ipv6/ioam6_iptunnel.c
@@ -42,6 +42,8 @@ struct ioam6_lwt {
struct ioam6_lwt_freq freq;
atomic_t pkt_cnt;
u8 mode;
+ bool has_tunsrc;
+ struct in6_addr tunsrc;
struct in6_addr tundst;
struct ioam6_lwt_encap tuninfo;
};
@@ -72,6 +74,7 @@ static const struct nla_policy ioam6_iptunnel_policy[IOAM6_IPTUNNEL_MAX + 1] = {
[IOAM6_IPTUNNEL_MODE] = NLA_POLICY_RANGE(NLA_U8,
IOAM6_IPTUNNEL_MODE_MIN,
IOAM6_IPTUNNEL_MODE_MAX),
+ [IOAM6_IPTUNNEL_SRC] = NLA_POLICY_EXACT_LEN(sizeof(struct in6_addr)),
[IOAM6_IPTUNNEL_DST] = NLA_POLICY_EXACT_LEN(sizeof(struct in6_addr)),
[IOAM6_IPTUNNEL_TRACE] = NLA_POLICY_EXACT_LEN(
sizeof(struct ioam6_trace_hdr)),
@@ -144,6 +147,11 @@ static int ioam6_build_state(struct net *net, struct nlattr *nla,
else
mode = nla_get_u8(tb[IOAM6_IPTUNNEL_MODE]);
+ if (tb[IOAM6_IPTUNNEL_SRC] && mode == IOAM6_IPTUNNEL_MODE_INLINE) {
+ NL_SET_ERR_MSG(extack, "no tunnel source expected in this mode");
+ return -EINVAL;
+ }
+
if (!tb[IOAM6_IPTUNNEL_DST] && mode != IOAM6_IPTUNNEL_MODE_INLINE) {
NL_SET_ERR_MSG(extack, "this mode needs a tunnel destination");
return -EINVAL;
@@ -178,6 +186,14 @@ static int ioam6_build_state(struct net *net, struct nlattr *nla,
ilwt->freq.n = freq_n;
ilwt->mode = mode;
+
+ if (!tb[IOAM6_IPTUNNEL_SRC]) {
+ ilwt->has_tunsrc = false;
+ } else {
+ ilwt->has_tunsrc = true;
+ ilwt->tunsrc = nla_get_in6_addr(tb[IOAM6_IPTUNNEL_SRC]);
+ }
+
if (tb[IOAM6_IPTUNNEL_DST])
ilwt->tundst = nla_get_in6_addr(tb[IOAM6_IPTUNNEL_DST]);
@@ -257,6 +273,8 @@ static int ioam6_do_inline(struct net *net, struct sk_buff *skb,
static int ioam6_do_encap(struct net *net, struct sk_buff *skb,
struct ioam6_lwt_encap *tuninfo,
+ bool has_tunsrc,
+ struct in6_addr *tunsrc,
struct in6_addr *tundst)
{
struct dst_entry *dst = skb_dst(skb);
@@ -286,8 +304,13 @@ static int ioam6_do_encap(struct net *net, struct sk_buff *skb,
hdr->nexthdr = NEXTHDR_HOP;
hdr->payload_len = cpu_to_be16(skb->len - sizeof(*hdr));
hdr->daddr = *tundst;
- ipv6_dev_get_saddr(net, dst->dev, &hdr->daddr,
- IPV6_PREFER_SRC_PUBLIC, &hdr->saddr);
+
+ if (has_tunsrc && !ipv6_addr_any(tunsrc)) {
+ memcpy(&hdr->saddr, tunsrc, sizeof(*tunsrc));
+ } else {
+ ipv6_dev_get_saddr(net, dst->dev, &hdr->daddr,
+ IPV6_PREFER_SRC_PUBLIC, &hdr->saddr);
+ }
skb_postpush_rcsum(skb, hdr, len);
@@ -329,7 +352,9 @@ static int ioam6_output(struct net *net, struct sock *sk, struct sk_buff *skb)
case IOAM6_IPTUNNEL_MODE_ENCAP:
do_encap:
/* Encapsulation (ip6ip6) */
- err = ioam6_do_encap(net, skb, &ilwt->tuninfo, &ilwt->tundst);
+ err = ioam6_do_encap(net, skb, &ilwt->tuninfo,
+ ilwt->has_tunsrc, &ilwt->tunsrc,
+ &ilwt->tundst);
if (unlikely(err))
goto drop;
@@ -415,6 +440,13 @@ static int ioam6_fill_encap_info(struct sk_buff *skb,
goto ret;
if (ilwt->mode != IOAM6_IPTUNNEL_MODE_INLINE) {
+ if (ilwt->has_tunsrc) {
+ err = nla_put_in6_addr(skb, IOAM6_IPTUNNEL_SRC,
+ &ilwt->tunsrc);
+ if (err)
+ goto ret;
+ }
+
err = nla_put_in6_addr(skb, IOAM6_IPTUNNEL_DST, &ilwt->tundst);
if (err)
goto ret;
@@ -436,8 +468,12 @@ static int ioam6_encap_nlsize(struct lwtunnel_state *lwtstate)
nla_total_size(sizeof(ilwt->mode)) +
nla_total_size(sizeof(ilwt->tuninfo.traceh));
- if (ilwt->mode != IOAM6_IPTUNNEL_MODE_INLINE)
+ if (ilwt->mode != IOAM6_IPTUNNEL_MODE_INLINE) {
+ if (ilwt->has_tunsrc)
+ nlsize += nla_total_size(sizeof(ilwt->tunsrc));
+
nlsize += nla_total_size(sizeof(ilwt->tundst));
+ }
return nlsize;
}
@@ -452,8 +488,12 @@ static int ioam6_encap_cmp(struct lwtunnel_state *a, struct lwtunnel_state *b)
return (ilwt_a->freq.k != ilwt_b->freq.k ||
ilwt_a->freq.n != ilwt_b->freq.n ||
ilwt_a->mode != ilwt_b->mode ||
+ ilwt_a->has_tunsrc != ilwt_b->has_tunsrc ||
(ilwt_a->mode != IOAM6_IPTUNNEL_MODE_INLINE &&
!ipv6_addr_equal(&ilwt_a->tundst, &ilwt_b->tundst)) ||
+ (ilwt_a->mode != IOAM6_IPTUNNEL_MODE_INLINE &&
+ ilwt_a->has_tunsrc &&
+ !ipv6_addr_equal(&ilwt_a->tunsrc, &ilwt_b->tunsrc)) ||
trace_a->namespace_id != trace_b->namespace_id);
}
--
2.34.1
On 8/9/24 14:39, Justin Iurman wrote:
> This patch provides a new feature (i.e., "tunsrc") for the tunnel (i.e.,
> "encap") mode of ioam6. Just like seg6 already does, except it is
> attached to a route. The "tunsrc" is optional: when not provided (by
> default), the automatic resolution is applied. Using "tunsrc" when
> possible has a benefit: performance.
It's customary to include performances figures in performance related
changeset ;)
>
> Signed-off-by: Justin Iurman <justin.iurman@uliege.be>
> ---
> include/uapi/linux/ioam6_iptunnel.h | 7 +++++
> net/ipv6/ioam6_iptunnel.c | 48 ++++++++++++++++++++++++++---
> 2 files changed, 51 insertions(+), 4 deletions(-)
>
> diff --git a/include/uapi/linux/ioam6_iptunnel.h b/include/uapi/linux/ioam6_iptunnel.h
> index 38f6a8fdfd34..6cdbd0da7ad8 100644
> --- a/include/uapi/linux/ioam6_iptunnel.h
> +++ b/include/uapi/linux/ioam6_iptunnel.h
> @@ -50,6 +50,13 @@ enum {
> IOAM6_IPTUNNEL_FREQ_K, /* u32 */
> IOAM6_IPTUNNEL_FREQ_N, /* u32 */
>
> + /* Tunnel src address.
> + * For encap,auto modes.
> + * Optional (automatic if
> + * not provided).
> + */
> + IOAM6_IPTUNNEL_SRC, /* struct in6_addr */
> +
> __IOAM6_IPTUNNEL_MAX,
> };
>
> diff --git a/net/ipv6/ioam6_iptunnel.c b/net/ipv6/ioam6_iptunnel.c
> index cd2522f04edf..e0e73faf9969 100644
> --- a/net/ipv6/ioam6_iptunnel.c
> +++ b/net/ipv6/ioam6_iptunnel.c
> @@ -42,6 +42,8 @@ struct ioam6_lwt {
> struct ioam6_lwt_freq freq;
> atomic_t pkt_cnt;
> u8 mode;
> + bool has_tunsrc;
> + struct in6_addr tunsrc;
> struct in6_addr tundst;
> struct ioam6_lwt_encap tuninfo;
> };
> @@ -72,6 +74,7 @@ static const struct nla_policy ioam6_iptunnel_policy[IOAM6_IPTUNNEL_MAX + 1] = {
> [IOAM6_IPTUNNEL_MODE] = NLA_POLICY_RANGE(NLA_U8,
> IOAM6_IPTUNNEL_MODE_MIN,
> IOAM6_IPTUNNEL_MODE_MAX),
> + [IOAM6_IPTUNNEL_SRC] = NLA_POLICY_EXACT_LEN(sizeof(struct in6_addr)),
> [IOAM6_IPTUNNEL_DST] = NLA_POLICY_EXACT_LEN(sizeof(struct in6_addr)),
> [IOAM6_IPTUNNEL_TRACE] = NLA_POLICY_EXACT_LEN(
> sizeof(struct ioam6_trace_hdr)),
> @@ -144,6 +147,11 @@ static int ioam6_build_state(struct net *net, struct nlattr *nla,
> else
> mode = nla_get_u8(tb[IOAM6_IPTUNNEL_MODE]);
>
> + if (tb[IOAM6_IPTUNNEL_SRC] && mode == IOAM6_IPTUNNEL_MODE_INLINE) {
> + NL_SET_ERR_MSG(extack, "no tunnel source expected in this mode");
> + return -EINVAL;
> + }
when mode is IOAM6_IPTUNNEL_MODE_AUTO, the data path could still add the
encapsulation for forwarded packets, why explicitly preventing this
optimization in such scenario?
> +
> if (!tb[IOAM6_IPTUNNEL_DST] && mode != IOAM6_IPTUNNEL_MODE_INLINE) {
> NL_SET_ERR_MSG(extack, "this mode needs a tunnel destination");
> return -EINVAL;
> @@ -178,6 +186,14 @@ static int ioam6_build_state(struct net *net, struct nlattr *nla,
> ilwt->freq.n = freq_n;
>
> ilwt->mode = mode;
> +
> + if (!tb[IOAM6_IPTUNNEL_SRC]) {
> + ilwt->has_tunsrc = false;
> + } else {
> + ilwt->has_tunsrc = true;
> + ilwt->tunsrc = nla_get_in6_addr(tb[IOAM6_IPTUNNEL_SRC]);
Since you are going to use the source address only if != ANY, I think it
would be cleaner to refuse such addresses here. That will avoid an
additional check in the datapath.
Cheers,
Paolo
On 8/13/24 13:06, Paolo Abeni wrote:
> On 8/9/24 14:39, Justin Iurman wrote:
>> This patch provides a new feature (i.e., "tunsrc") for the tunnel (i.e.,
>> "encap") mode of ioam6. Just like seg6 already does, except it is
>> attached to a route. The "tunsrc" is optional: when not provided (by
>> default), the automatic resolution is applied. Using "tunsrc" when
>> possible has a benefit: performance.
>
> It's customary to include performances figures in performance related
> changeset ;)
>
>>
>> Signed-off-by: Justin Iurman <justin.iurman@uliege.be>
>> ---
>> include/uapi/linux/ioam6_iptunnel.h | 7 +++++
>> net/ipv6/ioam6_iptunnel.c | 48 ++++++++++++++++++++++++++---
>> 2 files changed, 51 insertions(+), 4 deletions(-)
>>
>> diff --git a/include/uapi/linux/ioam6_iptunnel.h
>> b/include/uapi/linux/ioam6_iptunnel.h
>> index 38f6a8fdfd34..6cdbd0da7ad8 100644
>> --- a/include/uapi/linux/ioam6_iptunnel.h
>> +++ b/include/uapi/linux/ioam6_iptunnel.h
>> @@ -50,6 +50,13 @@ enum {
>> IOAM6_IPTUNNEL_FREQ_K, /* u32 */
>> IOAM6_IPTUNNEL_FREQ_N, /* u32 */
>> + /* Tunnel src address.
>> + * For encap,auto modes.
>> + * Optional (automatic if
>> + * not provided).
>> + */
>> + IOAM6_IPTUNNEL_SRC, /* struct in6_addr */
>> +
>> __IOAM6_IPTUNNEL_MAX,
>> };
>> diff --git a/net/ipv6/ioam6_iptunnel.c b/net/ipv6/ioam6_iptunnel.c
>> index cd2522f04edf..e0e73faf9969 100644
>> --- a/net/ipv6/ioam6_iptunnel.c
>> +++ b/net/ipv6/ioam6_iptunnel.c
>> @@ -42,6 +42,8 @@ struct ioam6_lwt {
>> struct ioam6_lwt_freq freq;
>> atomic_t pkt_cnt;
>> u8 mode;
>> + bool has_tunsrc;
>> + struct in6_addr tunsrc;
>> struct in6_addr tundst;
>> struct ioam6_lwt_encap tuninfo;
>> };
>> @@ -72,6 +74,7 @@ static const struct nla_policy
>> ioam6_iptunnel_policy[IOAM6_IPTUNNEL_MAX + 1] = {
>> [IOAM6_IPTUNNEL_MODE] = NLA_POLICY_RANGE(NLA_U8,
>> IOAM6_IPTUNNEL_MODE_MIN,
>> IOAM6_IPTUNNEL_MODE_MAX),
>> + [IOAM6_IPTUNNEL_SRC] = NLA_POLICY_EXACT_LEN(sizeof(struct
>> in6_addr)),
>> [IOAM6_IPTUNNEL_DST] = NLA_POLICY_EXACT_LEN(sizeof(struct
>> in6_addr)),
>> [IOAM6_IPTUNNEL_TRACE] = NLA_POLICY_EXACT_LEN(
>> sizeof(struct ioam6_trace_hdr)),
>> @@ -144,6 +147,11 @@ static int ioam6_build_state(struct net *net,
>> struct nlattr *nla,
>> else
>> mode = nla_get_u8(tb[IOAM6_IPTUNNEL_MODE]);
>> + if (tb[IOAM6_IPTUNNEL_SRC] && mode == IOAM6_IPTUNNEL_MODE_INLINE) {
>> + NL_SET_ERR_MSG(extack, "no tunnel source expected in this
>> mode");
>> + return -EINVAL;
>> + }
>
> when mode is IOAM6_IPTUNNEL_MODE_AUTO, the data path could still add the
> encapsulation for forwarded packets, why explicitly preventing this
> optimization in such scenario?
Actually, this check is correct. We don't want the "tunsrc" with
"inline" mode since it's useless. If the "auto" mode is chosen, then
it's fine (same for the "encap" mode). Preventing "tunsrc" for the
"inline" mode does *not* impact the auto mode. Basically:
tb[IOAM6_IPTUNNEL_SRC] && mode == IOAM6_IPTUNNEL_MODE_INLINE -> error
tb[IOAM6_IPTUNNEL_SRC] && mode == IOAM6_IPTUNNEL_MODE_ENCAP -> OK
tb[IOAM6_IPTUNNEL_SRC] && mode == IOAM6_IPTUNNEL_MODE_AUTO -> OK
It aligns better with the semantics of "tundst", which is a MUST for
"encap"/"auto" modes (and forbidden for the "inline" mode). In the case
of "tunsrc", it is a MAY for "encap"/"auto" modes (and forbidden for the
"inline" mode).
>> +
>> if (!tb[IOAM6_IPTUNNEL_DST] && mode !=
>> IOAM6_IPTUNNEL_MODE_INLINE) {
>> NL_SET_ERR_MSG(extack, "this mode needs a tunnel destination");
>> return -EINVAL;
>> @@ -178,6 +186,14 @@ static int ioam6_build_state(struct net *net,
>> struct nlattr *nla,
>> ilwt->freq.n = freq_n;
>> ilwt->mode = mode;
>> +
>> + if (!tb[IOAM6_IPTUNNEL_SRC]) {
>> + ilwt->has_tunsrc = false;
>> + } else {
>> + ilwt->has_tunsrc = true;
>> + ilwt->tunsrc = nla_get_in6_addr(tb[IOAM6_IPTUNNEL_SRC]);
>
> Since you are going to use the source address only if != ANY, I think it
> would be cleaner to refuse such addresses here. That will avoid an
> additional check in the datapath.
>
> Cheers,
>
> Paolo
>
On 8/13/24 13:06, Paolo Abeni wrote:
> On 8/9/24 14:39, Justin Iurman wrote:
>> This patch provides a new feature (i.e., "tunsrc") for the tunnel (i.e.,
>> "encap") mode of ioam6. Just like seg6 already does, except it is
>> attached to a route. The "tunsrc" is optional: when not provided (by
>> default), the automatic resolution is applied. Using "tunsrc" when
>> possible has a benefit: performance.
>
> It's customary to include performances figures in performance related
> changeset ;)
Indeed, I realized it too late... thx for the reminder!
Before (= "encap" mode): https://ibb.co/bNCzvf7
After (= "encap" mode with "tunsrc"): https://ibb.co/PT8L6yq
I'll add these again to -v2.
>> Signed-off-by: Justin Iurman <justin.iurman@uliege.be>
>> ---
>> include/uapi/linux/ioam6_iptunnel.h | 7 +++++
>> net/ipv6/ioam6_iptunnel.c | 48 ++++++++++++++++++++++++++---
>> 2 files changed, 51 insertions(+), 4 deletions(-)
>>
>> diff --git a/include/uapi/linux/ioam6_iptunnel.h
>> b/include/uapi/linux/ioam6_iptunnel.h
>> index 38f6a8fdfd34..6cdbd0da7ad8 100644
>> --- a/include/uapi/linux/ioam6_iptunnel.h
>> +++ b/include/uapi/linux/ioam6_iptunnel.h
>> @@ -50,6 +50,13 @@ enum {
>> IOAM6_IPTUNNEL_FREQ_K, /* u32 */
>> IOAM6_IPTUNNEL_FREQ_N, /* u32 */
>> + /* Tunnel src address.
>> + * For encap,auto modes.
>> + * Optional (automatic if
>> + * not provided).
>> + */
>> + IOAM6_IPTUNNEL_SRC, /* struct in6_addr */
>> +
>> __IOAM6_IPTUNNEL_MAX,
>> };
>> diff --git a/net/ipv6/ioam6_iptunnel.c b/net/ipv6/ioam6_iptunnel.c
>> index cd2522f04edf..e0e73faf9969 100644
>> --- a/net/ipv6/ioam6_iptunnel.c
>> +++ b/net/ipv6/ioam6_iptunnel.c
>> @@ -42,6 +42,8 @@ struct ioam6_lwt {
>> struct ioam6_lwt_freq freq;
>> atomic_t pkt_cnt;
>> u8 mode;
>> + bool has_tunsrc;
>> + struct in6_addr tunsrc;
>> struct in6_addr tundst;
>> struct ioam6_lwt_encap tuninfo;
>> };
>> @@ -72,6 +74,7 @@ static const struct nla_policy
>> ioam6_iptunnel_policy[IOAM6_IPTUNNEL_MAX + 1] = {
>> [IOAM6_IPTUNNEL_MODE] = NLA_POLICY_RANGE(NLA_U8,
>> IOAM6_IPTUNNEL_MODE_MIN,
>> IOAM6_IPTUNNEL_MODE_MAX),
>> + [IOAM6_IPTUNNEL_SRC] = NLA_POLICY_EXACT_LEN(sizeof(struct
>> in6_addr)),
>> [IOAM6_IPTUNNEL_DST] = NLA_POLICY_EXACT_LEN(sizeof(struct
>> in6_addr)),
>> [IOAM6_IPTUNNEL_TRACE] = NLA_POLICY_EXACT_LEN(
>> sizeof(struct ioam6_trace_hdr)),
>> @@ -144,6 +147,11 @@ static int ioam6_build_state(struct net *net,
>> struct nlattr *nla,
>> else
>> mode = nla_get_u8(tb[IOAM6_IPTUNNEL_MODE]);
>> + if (tb[IOAM6_IPTUNNEL_SRC] && mode == IOAM6_IPTUNNEL_MODE_INLINE) {
>> + NL_SET_ERR_MSG(extack, "no tunnel source expected in this
>> mode");
>> + return -EINVAL;
>> + }
>
> when mode is IOAM6_IPTUNNEL_MODE_AUTO, the data path could still add the
> encapsulation for forwarded packets, why explicitly preventing this
> optimization in such scenario?
Good catch! I guess we can just ignore "tunsrc" if provided with inline
mode, instead of returning an error.
>> +
>> if (!tb[IOAM6_IPTUNNEL_DST] && mode !=
>> IOAM6_IPTUNNEL_MODE_INLINE) {
>> NL_SET_ERR_MSG(extack, "this mode needs a tunnel destination");
>> return -EINVAL;
>> @@ -178,6 +186,14 @@ static int ioam6_build_state(struct net *net,
>> struct nlattr *nla,
>> ilwt->freq.n = freq_n;
>> ilwt->mode = mode;
>> +
>> + if (!tb[IOAM6_IPTUNNEL_SRC]) {
>> + ilwt->has_tunsrc = false;
>> + } else {
>> + ilwt->has_tunsrc = true;
>> + ilwt->tunsrc = nla_get_in6_addr(tb[IOAM6_IPTUNNEL_SRC]);
>
> Since you are going to use the source address only if != ANY, I think it
> would be cleaner to refuse such addresses here. That will avoid an
> additional check in the datapath.
+1.
Thanks,
Justin
> Cheers,
>
> Paolo
>
© 2016 - 2026 Red Hat, Inc.