1 | From: Geliang Tang <tanggeliang@kylinos.cn> | 1 | From: Geliang Tang <tanggeliang@kylinos.cn> |
---|---|---|---|
2 | 2 | ||
3 | get_addr() and dump_addr() interfaces of BPF userspace pm are dropped | 3 | Some path manager related refactoring and cleanups. |
4 | as Matt suggested. | ||
5 | 4 | ||
6 | Based-on: <cover.1736924314.git.tanggeliang@kylinos.cn> | 5 | Geliang Tang (6): |
6 | mptcp: pm: in-kernel: avoid access entry without lock | ||
7 | mptcp: pm: in-kernel: reduce parameters of set_flags | ||
8 | mptcp: pm: use addr entry for get_local_id | ||
9 | mptcp: pm: in-kernel: use kmemdup helper | ||
10 | sock: add sock_kmemdup helper | ||
11 | mptcp: pm: userspace: use sock_kmemdup helper | ||
7 | 12 | ||
8 | In order to implement BPF userspace path manager, it is necessary to | 13 | include/net/sock.h | 1 + |
9 | unify the interfaces of the path manager. This set contains some | 14 | net/core/sock.c | 23 +++++++++++++++++++++++ |
10 | cleanups and refactoring to unify the interfaces in kernel space. | 15 | net/mptcp/pm.c | 9 ++++++--- |
11 | Finally, define a struct mptcp_pm_ops for a userspace path manager | 16 | net/mptcp/pm_netlink.c | 30 +++++++++++++----------------- |
12 | like this: | 17 | net/mptcp/pm_userspace.c | 20 +++++++------------- |
13 | 18 | net/mptcp/protocol.h | 6 ++++-- | |
14 | struct mptcp_pm_ops { | 19 | 6 files changed, 54 insertions(+), 35 deletions(-) |
15 | int (*address_announce)(struct mptcp_sock *msk, | ||
16 | struct mptcp_pm_addr_entry *local); | ||
17 | int (*address_remove)(struct mptcp_sock *msk, u8 id); | ||
18 | int (*subflow_create)(struct mptcp_sock *msk, | ||
19 | struct mptcp_pm_addr_entry *local, | ||
20 | struct mptcp_addr_info *remote); | ||
21 | int (*subflow_destroy)(struct mptcp_sock *msk, | ||
22 | struct mptcp_pm_addr_entry *local, | ||
23 | struct mptcp_addr_info *remote); | ||
24 | int (*get_local_id)(struct mptcp_sock *msk, | ||
25 | struct mptcp_pm_addr_entry *local); | ||
26 | u8 (*get_flags)(struct mptcp_sock *msk, | ||
27 | struct mptcp_addr_info *skc); | ||
28 | int (*set_flags)(struct mptcp_sock *msk, | ||
29 | struct mptcp_pm_addr_entry *local, | ||
30 | struct mptcp_addr_info *remote); | ||
31 | |||
32 | u8 type; | ||
33 | struct module *owner; | ||
34 | struct list_head list; | ||
35 | |||
36 | void (*init)(struct mptcp_sock *msk); | ||
37 | void (*release)(struct mptcp_sock *msk); | ||
38 | } ____cacheline_aligned_in_smp; | ||
39 | |||
40 | Closes: https://github.com/multipath-tcp/mptcp_net-next/issues/74 | ||
41 | |||
42 | Geliang Tang (3): | ||
43 | mptcp: define struct mptcp_pm_ops | ||
44 | mptcp: register default userspace pm | ||
45 | mptcp: init and release mptcp_pm_ops | ||
46 | |||
47 | include/net/mptcp.h | 27 +++ | ||
48 | net/mptcp/pm.c | 8 + | ||
49 | net/mptcp/pm_userspace.c | 362 ++++++++++++++++++++++++++++----------- | ||
50 | net/mptcp/protocol.c | 1 + | ||
51 | net/mptcp/protocol.h | 9 + | ||
52 | 5 files changed, 309 insertions(+), 98 deletions(-) | ||
53 | 20 | ||
54 | -- | 21 | -- |
55 | 2.43.0 | 22 | 2.43.0 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | From: Geliang Tang <tanggeliang@kylinos.cn> | ||
1 | 2 | ||
3 | In mptcp_pm_nl_set_flags(), "entry" is copied to "local" when pernet->lock | ||
4 | is held to avoid direct access to entry without pernet->lock. | ||
5 | |||
6 | Therefore, "local->flags" should be passed to mptcp_nl_set_flags instead | ||
7 | of "entry->flags" when pernet->lock is not held, so as to avoid access to | ||
8 | entry. | ||
9 | |||
10 | Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn> | ||
11 | --- | ||
12 | net/mptcp/pm_netlink.c | 2 +- | ||
13 | 1 file changed, 1 insertion(+), 1 deletion(-) | ||
14 | |||
15 | diff --git a/net/mptcp/pm_netlink.c b/net/mptcp/pm_netlink.c | ||
16 | index XXXXXXX..XXXXXXX 100644 | ||
17 | --- a/net/mptcp/pm_netlink.c | ||
18 | +++ b/net/mptcp/pm_netlink.c | ||
19 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_set_flags(struct mptcp_pm_addr_entry *local, | ||
20 | *local = *entry; | ||
21 | spin_unlock_bh(&pernet->lock); | ||
22 | |||
23 | - mptcp_nl_set_flags(net, &local->addr, entry->flags, changed); | ||
24 | + mptcp_nl_set_flags(net, &local->addr, local->flags, changed); | ||
25 | return 0; | ||
26 | } | ||
27 | |||
28 | -- | ||
29 | 2.43.0 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | From: Geliang Tang <tanggeliang@kylinos.cn> | ||
1 | 2 | ||
3 | The number of parameters in mptcp_nl_set_flags() can be reduced. | ||
4 | Only need to pass a "local" parameter to it instead of "local->addr" | ||
5 | and "local->flags". | ||
6 | |||
7 | Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn> | ||
8 | --- | ||
9 | net/mptcp/pm_netlink.c | 15 ++++++++------- | ||
10 | 1 file changed, 8 insertions(+), 7 deletions(-) | ||
11 | |||
12 | diff --git a/net/mptcp/pm_netlink.c b/net/mptcp/pm_netlink.c | ||
13 | index XXXXXXX..XXXXXXX 100644 | ||
14 | --- a/net/mptcp/pm_netlink.c | ||
15 | +++ b/net/mptcp/pm_netlink.c | ||
16 | @@ -XXX,XX +XXX,XX @@ static void mptcp_pm_nl_fullmesh(struct mptcp_sock *msk, | ||
17 | spin_unlock_bh(&msk->pm.lock); | ||
18 | } | ||
19 | |||
20 | -static void mptcp_nl_set_flags(struct net *net, struct mptcp_addr_info *addr, | ||
21 | - u8 flags, u8 changed) | ||
22 | +static void mptcp_nl_set_flags(struct net *net, | ||
23 | + struct mptcp_pm_addr_entry *local, | ||
24 | + u8 changed) | ||
25 | { | ||
26 | - u8 is_subflow = !!(flags & MPTCP_PM_ADDR_FLAG_SUBFLOW); | ||
27 | - u8 bkup = !!(flags & MPTCP_PM_ADDR_FLAG_BACKUP); | ||
28 | + u8 is_subflow = !!(local->flags & MPTCP_PM_ADDR_FLAG_SUBFLOW); | ||
29 | + u8 bkup = !!(local->flags & MPTCP_PM_ADDR_FLAG_BACKUP); | ||
30 | long s_slot = 0, s_num = 0; | ||
31 | struct mptcp_sock *msk; | ||
32 | |||
33 | @@ -XXX,XX +XXX,XX @@ static void mptcp_nl_set_flags(struct net *net, struct mptcp_addr_info *addr, | ||
34 | |||
35 | lock_sock(sk); | ||
36 | if (changed & MPTCP_PM_ADDR_FLAG_BACKUP) | ||
37 | - mptcp_pm_nl_mp_prio_send_ack(msk, addr, NULL, bkup); | ||
38 | + mptcp_pm_nl_mp_prio_send_ack(msk, &local->addr, NULL, bkup); | ||
39 | /* Subflows will only be recreated if the SUBFLOW flag is set */ | ||
40 | if (is_subflow && (changed & MPTCP_PM_ADDR_FLAG_FULLMESH)) | ||
41 | - mptcp_pm_nl_fullmesh(msk, addr); | ||
42 | + mptcp_pm_nl_fullmesh(msk, &local->addr); | ||
43 | release_sock(sk); | ||
44 | |||
45 | next: | ||
46 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_set_flags(struct mptcp_pm_addr_entry *local, | ||
47 | *local = *entry; | ||
48 | spin_unlock_bh(&pernet->lock); | ||
49 | |||
50 | - mptcp_nl_set_flags(net, &local->addr, local->flags, changed); | ||
51 | + mptcp_nl_set_flags(net, local, changed); | ||
52 | return 0; | ||
53 | } | ||
54 | |||
55 | -- | ||
56 | 2.43.0 | diff view generated by jsdifflib |
1 | From: Geliang Tang <tanggeliang@kylinos.cn> | 1 | From: Geliang Tang <tanggeliang@kylinos.cn> |
---|---|---|---|
2 | 2 | ||
3 | This patch defines the original userspace pm as the default path manager, | 3 | The following code in mptcp_userspace_pm_get_local_id() that assigns "skc" |
4 | named mptcp_userspace_pm, and register it in mptcp_pm_data_init(). | 4 | to "new_entry" is not allowed in BPF if we use the same code to implement |
5 | the get_local_id() interface of a BPF path manager: | ||
5 | 6 | ||
6 | Extract address_announce() interface of the userspace PM from the handler | 7 | memset(&new_entry, 0, sizeof(struct mptcp_pm_addr_entry)); |
7 | of netlink command MPTCP_PM_CMD_ANNOUNCE mptcp_pm_nl_announce_doit(), only | 8 | new_entry.addr = *skc; |
8 | leave the code for obtaining msk through "info" and parsing address entry | 9 | new_entry.addr.id = 0; |
9 | in the handler. | 10 | new_entry.flags = MPTCP_PM_ADDR_FLAG_IMPLICIT; |
10 | 11 | ||
11 | Extract address_remove() interface of the userspace PM from the handler | 12 | To solve the issue, this patch moves this assignment to "new_entry" forward |
12 | of netlink command MPTCP_PM_CMD_REMOVE mptcp_pm_nl_remove_doit(), only | 13 | to mptcp_pm_get_local_id(), and then passes "new_entry" as a parameter to |
13 | leave the code for parsing address id and obtaining msk through "info" | 14 | both mptcp_pm_nl_get_local_id() and mptcp_userspace_pm_get_local_id(). |
14 | in the handler. | ||
15 | |||
16 | Extract subflow_create() interface of the userspace PM from the handler of | ||
17 | netlink command MPTCP_PM_CMD_SUBFLOW_CREATE | ||
18 | |||
19 | mptcp_pm_nl_subflow_create_doit(), | ||
20 | |||
21 | only leave the code for obtaining msk through "info", parsing local address | ||
22 | entry and parsing remote address info in the handler. | ||
23 | |||
24 | Extract subflow_destroy() interface of the userspace PM from the handler of | ||
25 | netlink command MPTCP_PM_CMD_SUBFLOW_DESTROY | ||
26 | |||
27 | mptcp_pm_nl_subflow_destroy_doit(), | ||
28 | |||
29 | only leave the code for obtaining msk through "info", parsing local address | ||
30 | entry and parsing remote address info in the handler. | ||
31 | |||
32 | Extract set_flags() interface of the userspace PM from function | ||
33 | mptcp_userspace_pm_set_flags(), only leave the code for obtaining | ||
34 | msk through "info" in this function. | ||
35 | |||
36 | All five interfaces are invoked while holding the msk socket lock. | ||
37 | |||
38 | Other interfaces get_local_id() and get_flags() are only defined as | ||
39 | wrappers. | ||
40 | 15 | ||
41 | Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn> | 16 | Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn> |
42 | --- | 17 | --- |
43 | net/mptcp/pm.c | 1 + | 18 | net/mptcp/pm.c | 9 ++++++--- |
44 | net/mptcp/pm_userspace.c | 261 ++++++++++++++++++++++++--------------- | 19 | net/mptcp/pm_netlink.c | 11 ++++------- |
45 | net/mptcp/protocol.h | 1 + | 20 | net/mptcp/pm_userspace.c | 17 ++++++----------- |
46 | 3 files changed, 165 insertions(+), 98 deletions(-) | 21 | net/mptcp/protocol.h | 6 ++++-- |
22 | 4 files changed, 20 insertions(+), 23 deletions(-) | ||
47 | 23 | ||
48 | diff --git a/net/mptcp/pm.c b/net/mptcp/pm.c | 24 | diff --git a/net/mptcp/pm.c b/net/mptcp/pm.c |
49 | index XXXXXXX..XXXXXXX 100644 | 25 | index XXXXXXX..XXXXXXX 100644 |
50 | --- a/net/mptcp/pm.c | 26 | --- a/net/mptcp/pm.c |
51 | +++ b/net/mptcp/pm.c | 27 | +++ b/net/mptcp/pm.c |
52 | @@ -XXX,XX +XXX,XX @@ void mptcp_pm_data_init(struct mptcp_sock *msk) | 28 | @@ -XXX,XX +XXX,XX @@ bool mptcp_pm_rm_addr_signal(struct mptcp_sock *msk, unsigned int remaining, |
53 | void __init mptcp_pm_init(void) | 29 | |
30 | int mptcp_pm_get_local_id(struct mptcp_sock *msk, struct sock_common *skc) | ||
54 | { | 31 | { |
55 | mptcp_pm_nl_init(); | 32 | - struct mptcp_addr_info skc_local; |
56 | + mptcp_userspace_pm_init(); | 33 | + struct mptcp_pm_addr_entry skc_local = { 0 }; |
34 | struct mptcp_addr_info msk_local; | ||
35 | |||
36 | if (WARN_ON_ONCE(!msk)) | ||
37 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_get_local_id(struct mptcp_sock *msk, struct sock_common *skc) | ||
38 | * addr | ||
39 | */ | ||
40 | mptcp_local_address((struct sock_common *)msk, &msk_local); | ||
41 | - mptcp_local_address((struct sock_common *)skc, &skc_local); | ||
42 | - if (mptcp_addresses_equal(&msk_local, &skc_local, false)) | ||
43 | + mptcp_local_address((struct sock_common *)skc, &skc_local.addr); | ||
44 | + if (mptcp_addresses_equal(&msk_local, &skc_local.addr, false)) | ||
45 | return 0; | ||
46 | |||
47 | + skc_local.addr.id = 0; | ||
48 | + skc_local.flags = MPTCP_PM_ADDR_FLAG_IMPLICIT; | ||
49 | + | ||
50 | if (mptcp_pm_is_userspace(msk)) | ||
51 | return mptcp_userspace_pm_get_local_id(msk, &skc_local); | ||
52 | return mptcp_pm_nl_get_local_id(msk, &skc_local); | ||
53 | diff --git a/net/mptcp/pm_netlink.c b/net/mptcp/pm_netlink.c | ||
54 | index XXXXXXX..XXXXXXX 100644 | ||
55 | --- a/net/mptcp/pm_netlink.c | ||
56 | +++ b/net/mptcp/pm_netlink.c | ||
57 | @@ -XXX,XX +XXX,XX @@ static int mptcp_pm_nl_create_listen_socket(struct sock *sk, | ||
58 | return err; | ||
57 | } | 59 | } |
60 | |||
61 | -int mptcp_pm_nl_get_local_id(struct mptcp_sock *msk, struct mptcp_addr_info *skc) | ||
62 | +int mptcp_pm_nl_get_local_id(struct mptcp_sock *msk, | ||
63 | + struct mptcp_pm_addr_entry *skc) | ||
64 | { | ||
65 | struct mptcp_pm_addr_entry *entry; | ||
66 | struct pm_nl_pernet *pernet; | ||
67 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_get_local_id(struct mptcp_sock *msk, struct mptcp_addr_info *skc | ||
68 | pernet = pm_nl_get_pernet_from_msk(msk); | ||
69 | |||
70 | rcu_read_lock(); | ||
71 | - entry = __lookup_addr(pernet, skc); | ||
72 | + entry = __lookup_addr(pernet, &skc->addr); | ||
73 | ret = entry ? entry->addr.id : -1; | ||
74 | rcu_read_unlock(); | ||
75 | if (ret >= 0) | ||
76 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_get_local_id(struct mptcp_sock *msk, struct mptcp_addr_info *skc | ||
77 | if (!entry) | ||
78 | return -ENOMEM; | ||
79 | |||
80 | - entry->addr = *skc; | ||
81 | - entry->addr.id = 0; | ||
82 | + *entry = *skc; | ||
83 | entry->addr.port = 0; | ||
84 | - entry->ifindex = 0; | ||
85 | - entry->flags = MPTCP_PM_ADDR_FLAG_IMPLICIT; | ||
86 | - entry->lsk = NULL; | ||
87 | ret = mptcp_pm_nl_append_new_local_addr(pernet, entry, true); | ||
88 | if (ret < 0) | ||
89 | kfree(entry); | ||
58 | diff --git a/net/mptcp/pm_userspace.c b/net/mptcp/pm_userspace.c | 90 | diff --git a/net/mptcp/pm_userspace.c b/net/mptcp/pm_userspace.c |
59 | index XXXXXXX..XXXXXXX 100644 | 91 | index XXXXXXX..XXXXXXX 100644 |
60 | --- a/net/mptcp/pm_userspace.c | 92 | --- a/net/mptcp/pm_userspace.c |
61 | +++ b/net/mptcp/pm_userspace.c | 93 | +++ b/net/mptcp/pm_userspace.c |
62 | @@ -XXX,XX +XXX,XX @@ mptcp_userspace_pm_lookup_addr_by_id(struct mptcp_sock *msk, unsigned int id) | 94 | @@ -XXX,XX +XXX,XX @@ mptcp_userspace_pm_lookup_addr_by_id(struct mptcp_sock *msk, unsigned int id) |
63 | return NULL; | ||
64 | } | 95 | } |
65 | 96 | ||
66 | -int mptcp_userspace_pm_get_local_id(struct mptcp_sock *msk, | 97 | int mptcp_userspace_pm_get_local_id(struct mptcp_sock *msk, |
67 | - struct mptcp_pm_addr_entry *local) | 98 | - struct mptcp_addr_info *skc) |
68 | +static int userspace_pm_get_local_id(struct mptcp_sock *msk, | 99 | + struct mptcp_pm_addr_entry *skc) |
69 | + struct mptcp_pm_addr_entry *local) | ||
70 | { | 100 | { |
101 | - struct mptcp_pm_addr_entry *entry = NULL, new_entry; | ||
71 | __be16 msk_sport = ((struct inet_sock *) | 102 | __be16 msk_sport = ((struct inet_sock *) |
72 | inet_sk((struct sock *)msk))->inet_sport; | 103 | inet_sk((struct sock *)msk))->inet_sport; |
73 | @@ -XXX,XX +XXX,XX @@ int mptcp_userspace_pm_get_local_id(struct mptcp_sock *msk, | 104 | + struct mptcp_pm_addr_entry *entry; |
74 | return mptcp_userspace_pm_append_new_local_addr(msk, local, true); | 105 | |
106 | spin_lock_bh(&msk->pm.lock); | ||
107 | - entry = mptcp_userspace_pm_lookup_addr(msk, skc); | ||
108 | + entry = mptcp_userspace_pm_lookup_addr(msk, &skc->addr); | ||
109 | spin_unlock_bh(&msk->pm.lock); | ||
110 | if (entry) | ||
111 | return entry->addr.id; | ||
112 | |||
113 | - memset(&new_entry, 0, sizeof(struct mptcp_pm_addr_entry)); | ||
114 | - new_entry.addr = *skc; | ||
115 | - new_entry.addr.id = 0; | ||
116 | - new_entry.flags = MPTCP_PM_ADDR_FLAG_IMPLICIT; | ||
117 | - | ||
118 | - if (new_entry.addr.port == msk_sport) | ||
119 | - new_entry.addr.port = 0; | ||
120 | + if (skc->addr.port == msk_sport) | ||
121 | + skc->addr.port = 0; | ||
122 | |||
123 | - return mptcp_userspace_pm_append_new_local_addr(msk, &new_entry, true); | ||
124 | + return mptcp_userspace_pm_append_new_local_addr(msk, skc, true); | ||
75 | } | 125 | } |
76 | 126 | ||
77 | -u8 mptcp_userspace_pm_get_flags(struct mptcp_sock *msk, | 127 | bool mptcp_userspace_pm_is_backup(struct mptcp_sock *msk, |
78 | - struct mptcp_addr_info *skc) | ||
79 | +int mptcp_userspace_pm_get_local_id(struct mptcp_sock *msk, | ||
80 | + struct mptcp_pm_addr_entry *local) | ||
81 | +{ | ||
82 | + return userspace_pm_get_local_id(msk, local); | ||
83 | +} | ||
84 | + | ||
85 | +static u8 userspace_pm_get_flags(struct mptcp_sock *msk, | ||
86 | + struct mptcp_addr_info *skc) | ||
87 | { | ||
88 | struct mptcp_pm_addr_entry *entry; | ||
89 | u8 flags; | ||
90 | @@ -XXX,XX +XXX,XX @@ u8 mptcp_userspace_pm_get_flags(struct mptcp_sock *msk, | ||
91 | return flags; | ||
92 | } | ||
93 | |||
94 | +u8 mptcp_userspace_pm_get_flags(struct mptcp_sock *msk, | ||
95 | + struct mptcp_addr_info *skc) | ||
96 | +{ | ||
97 | + return userspace_pm_get_flags(msk, skc); | ||
98 | +} | ||
99 | + | ||
100 | static struct mptcp_sock *mptcp_userspace_pm_get_sock(const struct genl_info *info) | ||
101 | { | ||
102 | struct mptcp_sock *msk; | ||
103 | @@ -XXX,XX +XXX,XX @@ static struct mptcp_sock *mptcp_userspace_pm_get_sock(const struct genl_info *in | ||
104 | return msk; | ||
105 | } | ||
106 | |||
107 | +static int userspace_pm_address_announce(struct mptcp_sock *msk, | ||
108 | + struct mptcp_pm_addr_entry *local) | ||
109 | +{ | ||
110 | + int err; | ||
111 | + | ||
112 | + err = mptcp_userspace_pm_append_new_local_addr(msk, local, false); | ||
113 | + if (err < 0) | ||
114 | + return err; | ||
115 | + | ||
116 | + spin_lock_bh(&msk->pm.lock); | ||
117 | + | ||
118 | + if (mptcp_pm_alloc_anno_list(msk, &local->addr)) { | ||
119 | + msk->pm.add_addr_signaled++; | ||
120 | + mptcp_pm_announce_addr(msk, &local->addr, false); | ||
121 | + mptcp_pm_nl_addr_send_ack(msk); | ||
122 | + } | ||
123 | + | ||
124 | + spin_unlock_bh(&msk->pm.lock); | ||
125 | + | ||
126 | + return 0; | ||
127 | +} | ||
128 | + | ||
129 | int mptcp_pm_nl_announce_doit(struct sk_buff *skb, struct genl_info *info) | ||
130 | { | ||
131 | struct mptcp_pm_addr_entry addr_val; | ||
132 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_announce_doit(struct sk_buff *skb, struct genl_info *info) | ||
133 | goto announce_err; | ||
134 | } | ||
135 | |||
136 | - err = mptcp_userspace_pm_append_new_local_addr(msk, &addr_val, false); | ||
137 | - if (err < 0) { | ||
138 | - NL_SET_ERR_MSG_ATTR(info->extack, addr, | ||
139 | - "did not match address and id"); | ||
140 | - goto announce_err; | ||
141 | - } | ||
142 | - | ||
143 | lock_sock(sk); | ||
144 | - spin_lock_bh(&msk->pm.lock); | ||
145 | - | ||
146 | - if (mptcp_pm_alloc_anno_list(msk, &addr_val.addr)) { | ||
147 | - msk->pm.add_addr_signaled++; | ||
148 | - mptcp_pm_announce_addr(msk, &addr_val.addr, false); | ||
149 | - mptcp_pm_nl_addr_send_ack(msk); | ||
150 | - } | ||
151 | - | ||
152 | - spin_unlock_bh(&msk->pm.lock); | ||
153 | + err = userspace_pm_address_announce(msk, &addr_val); | ||
154 | release_sock(sk); | ||
155 | + if (err) | ||
156 | + NL_SET_ERR_MSG_ATTR(info->extack, addr, | ||
157 | + "did not match address and id"); | ||
158 | |||
159 | - err = 0; | ||
160 | announce_err: | ||
161 | sock_put(sk); | ||
162 | return err; | ||
163 | @@ -XXX,XX +XXX,XX @@ void mptcp_pm_remove_addr_entry(struct mptcp_sock *msk, | ||
164 | spin_unlock_bh(&msk->pm.lock); | ||
165 | } | ||
166 | |||
167 | +static int userspace_pm_address_remove(struct mptcp_sock *msk, u8 id) | ||
168 | +{ | ||
169 | + struct mptcp_pm_addr_entry *entry; | ||
170 | + | ||
171 | + if (id == 0) | ||
172 | + return mptcp_userspace_pm_remove_id_zero_address(msk); | ||
173 | + | ||
174 | + spin_lock_bh(&msk->pm.lock); | ||
175 | + entry = mptcp_userspace_pm_lookup_addr_by_id(msk, id); | ||
176 | + if (!entry) { | ||
177 | + spin_unlock_bh(&msk->pm.lock); | ||
178 | + return -EINVAL; | ||
179 | + } | ||
180 | + | ||
181 | + list_del_rcu(&entry->list); | ||
182 | + spin_unlock_bh(&msk->pm.lock); | ||
183 | + | ||
184 | + mptcp_pm_remove_addr_entry(msk, entry); | ||
185 | + | ||
186 | + sock_kfree_s((struct sock *)msk, entry, sizeof(*entry)); | ||
187 | + | ||
188 | + return 0; | ||
189 | +} | ||
190 | + | ||
191 | int mptcp_pm_nl_remove_doit(struct sk_buff *skb, struct genl_info *info) | ||
192 | { | ||
193 | - struct mptcp_pm_addr_entry *match; | ||
194 | struct mptcp_sock *msk; | ||
195 | struct nlattr *id; | ||
196 | int err = -EINVAL; | ||
197 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_remove_doit(struct sk_buff *skb, struct genl_info *info) | ||
198 | sk = (struct sock *)msk; | ||
199 | |||
200 | lock_sock(sk); | ||
201 | - | ||
202 | - if (id_val == 0) { | ||
203 | - err = mptcp_userspace_pm_remove_id_zero_address(msk); | ||
204 | - release_sock(sk); | ||
205 | - goto out; | ||
206 | - } | ||
207 | - | ||
208 | - spin_lock_bh(&msk->pm.lock); | ||
209 | - match = mptcp_userspace_pm_lookup_addr_by_id(msk, id_val); | ||
210 | - if (!match) { | ||
211 | - spin_unlock_bh(&msk->pm.lock); | ||
212 | - release_sock(sk); | ||
213 | - goto out; | ||
214 | - } | ||
215 | - | ||
216 | - list_del_rcu(&match->list); | ||
217 | - spin_unlock_bh(&msk->pm.lock); | ||
218 | - | ||
219 | - mptcp_pm_remove_addr_entry(msk, match); | ||
220 | - | ||
221 | + err = userspace_pm_address_remove(msk, id_val); | ||
222 | release_sock(sk); | ||
223 | - | ||
224 | - sock_kfree_s(sk, match, sizeof(*match)); | ||
225 | - | ||
226 | - err = 0; | ||
227 | -out: | ||
228 | if (err) | ||
229 | NL_SET_ERR_MSG_ATTR_FMT(info->extack, id, | ||
230 | "address with id %u not found", | ||
231 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_remove_doit(struct sk_buff *skb, struct genl_info *info) | ||
232 | return err; | ||
233 | } | ||
234 | |||
235 | +static int userspace_pm_subflow_create(struct mptcp_sock *msk, | ||
236 | + struct mptcp_pm_addr_entry *entry, | ||
237 | + struct mptcp_addr_info *remote) | ||
238 | +{ | ||
239 | + struct sock *sk = (struct sock *)msk; | ||
240 | + struct mptcp_pm_local local; | ||
241 | + int err; | ||
242 | + | ||
243 | + err = mptcp_userspace_pm_append_new_local_addr(msk, entry, false); | ||
244 | + if (err < 0) | ||
245 | + return err; | ||
246 | + | ||
247 | + local.addr = entry->addr; | ||
248 | + local.flags = entry->flags; | ||
249 | + local.ifindex = entry->ifindex; | ||
250 | + | ||
251 | + err = __mptcp_subflow_connect(sk, &local, remote); | ||
252 | + spin_lock_bh(&msk->pm.lock); | ||
253 | + if (err) | ||
254 | + mptcp_userspace_pm_delete_local_addr(msk, entry); | ||
255 | + else | ||
256 | + msk->pm.subflows++; | ||
257 | + spin_unlock_bh(&msk->pm.lock); | ||
258 | + | ||
259 | + return 0; | ||
260 | +} | ||
261 | + | ||
262 | int mptcp_pm_nl_subflow_create_doit(struct sk_buff *skb, struct genl_info *info) | ||
263 | { | ||
264 | struct mptcp_pm_addr_entry entry = { 0 }; | ||
265 | struct mptcp_addr_info addr_r; | ||
266 | struct nlattr *raddr, *laddr; | ||
267 | - struct mptcp_pm_local local; | ||
268 | struct mptcp_sock *msk; | ||
269 | int err = -EINVAL; | ||
270 | struct sock *sk; | ||
271 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_subflow_create_doit(struct sk_buff *skb, struct genl_info *info) | ||
272 | goto create_err; | ||
273 | } | ||
274 | |||
275 | - err = mptcp_userspace_pm_append_new_local_addr(msk, &entry, false); | ||
276 | - if (err < 0) { | ||
277 | - NL_SET_ERR_MSG_ATTR(info->extack, laddr, | ||
278 | - "did not match address and id"); | ||
279 | - goto create_err; | ||
280 | - } | ||
281 | - | ||
282 | - local.addr = entry.addr; | ||
283 | - local.flags = entry.flags; | ||
284 | - local.ifindex = entry.ifindex; | ||
285 | - | ||
286 | lock_sock(sk); | ||
287 | - err = __mptcp_subflow_connect(sk, &local, &addr_r); | ||
288 | + err = userspace_pm_subflow_create(msk, &entry, &addr_r); | ||
289 | release_sock(sk); | ||
290 | |||
291 | if (err) | ||
292 | GENL_SET_ERR_MSG_FMT(info, "connect error: %d", err); | ||
293 | |||
294 | - spin_lock_bh(&msk->pm.lock); | ||
295 | - if (err) | ||
296 | - mptcp_userspace_pm_delete_local_addr(msk, &entry); | ||
297 | - else | ||
298 | - msk->pm.subflows++; | ||
299 | - spin_unlock_bh(&msk->pm.lock); | ||
300 | - | ||
301 | create_err: | ||
302 | sock_put(sk); | ||
303 | return err; | ||
304 | @@ -XXX,XX +XXX,XX @@ static struct sock *mptcp_nl_find_ssk(struct mptcp_sock *msk, | ||
305 | return NULL; | ||
306 | } | ||
307 | |||
308 | +static int userspace_pm_subflow_destroy(struct mptcp_sock *msk, | ||
309 | + struct mptcp_pm_addr_entry *local, | ||
310 | + struct mptcp_addr_info *remote) | ||
311 | +{ | ||
312 | + struct sock *ssk, *sk = (struct sock *)msk; | ||
313 | + | ||
314 | + ssk = mptcp_nl_find_ssk(msk, &local->addr, remote); | ||
315 | + if (!ssk) | ||
316 | + return -ESRCH; | ||
317 | + | ||
318 | + spin_lock_bh(&msk->pm.lock); | ||
319 | + mptcp_userspace_pm_delete_local_addr(msk, local); | ||
320 | + spin_unlock_bh(&msk->pm.lock); | ||
321 | + mptcp_subflow_shutdown(sk, ssk, RCV_SHUTDOWN | SEND_SHUTDOWN); | ||
322 | + mptcp_close_ssk(sk, ssk, mptcp_subflow_ctx(ssk)); | ||
323 | + MPTCP_INC_STATS(sock_net(sk), MPTCP_MIB_RMSUBFLOW); | ||
324 | + | ||
325 | + return 0; | ||
326 | +} | ||
327 | + | ||
328 | int mptcp_pm_nl_subflow_destroy_doit(struct sk_buff *skb, struct genl_info *info) | ||
329 | { | ||
330 | struct mptcp_pm_addr_entry addr_l; | ||
331 | struct mptcp_addr_info addr_r; | ||
332 | struct nlattr *raddr, *laddr; | ||
333 | struct mptcp_sock *msk; | ||
334 | - struct sock *sk, *ssk; | ||
335 | int err = -EINVAL; | ||
336 | + struct sock *sk; | ||
337 | |||
338 | if (GENL_REQ_ATTR_CHECK(info, MPTCP_PM_ATTR_ADDR) || | ||
339 | GENL_REQ_ATTR_CHECK(info, MPTCP_PM_ATTR_ADDR_REMOTE)) | ||
340 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_subflow_destroy_doit(struct sk_buff *skb, struct genl_info *info | ||
341 | } | ||
342 | |||
343 | lock_sock(sk); | ||
344 | - ssk = mptcp_nl_find_ssk(msk, &addr_l.addr, &addr_r); | ||
345 | - if (!ssk) { | ||
346 | - GENL_SET_ERR_MSG(info, "subflow not found"); | ||
347 | - err = -ESRCH; | ||
348 | - goto release_sock; | ||
349 | - } | ||
350 | - | ||
351 | - spin_lock_bh(&msk->pm.lock); | ||
352 | - mptcp_userspace_pm_delete_local_addr(msk, &addr_l); | ||
353 | - spin_unlock_bh(&msk->pm.lock); | ||
354 | - mptcp_subflow_shutdown(sk, ssk, RCV_SHUTDOWN | SEND_SHUTDOWN); | ||
355 | - mptcp_close_ssk(sk, ssk, mptcp_subflow_ctx(ssk)); | ||
356 | - MPTCP_INC_STATS(sock_net(sk), MPTCP_MIB_RMSUBFLOW); | ||
357 | -release_sock: | ||
358 | + err = userspace_pm_subflow_destroy(msk, &addr_l, &addr_r); | ||
359 | release_sock(sk); | ||
360 | + if (err) | ||
361 | + GENL_SET_ERR_MSG(info, "subflow not found"); | ||
362 | |||
363 | destroy_err: | ||
364 | sock_put(sk); | ||
365 | return err; | ||
366 | } | ||
367 | |||
368 | +static int userspace_pm_set_flags(struct mptcp_sock *msk, | ||
369 | + struct mptcp_pm_addr_entry *local, | ||
370 | + struct mptcp_addr_info *remote) | ||
371 | +{ | ||
372 | + struct mptcp_pm_addr_entry *entry; | ||
373 | + u8 bkup = 0; | ||
374 | + | ||
375 | + if (local->flags & MPTCP_PM_ADDR_FLAG_BACKUP) | ||
376 | + bkup = 1; | ||
377 | + | ||
378 | + spin_lock_bh(&msk->pm.lock); | ||
379 | + entry = mptcp_userspace_pm_lookup_addr(msk, &local->addr); | ||
380 | + if (entry) { | ||
381 | + if (bkup) | ||
382 | + entry->flags |= MPTCP_PM_ADDR_FLAG_BACKUP; | ||
383 | + else | ||
384 | + entry->flags &= ~MPTCP_PM_ADDR_FLAG_BACKUP; | ||
385 | + } | ||
386 | + spin_unlock_bh(&msk->pm.lock); | ||
387 | + | ||
388 | + return mptcp_pm_nl_mp_prio_send_ack(msk, &local->addr, remote, bkup); | ||
389 | +} | ||
390 | + | ||
391 | int mptcp_userspace_pm_set_flags(struct mptcp_pm_addr_entry *local, | ||
392 | struct genl_info *info) | ||
393 | { | ||
394 | struct mptcp_addr_info rem = { .family = AF_UNSPEC, }; | ||
395 | - struct mptcp_pm_addr_entry *entry; | ||
396 | struct nlattr *attr, *attr_rem; | ||
397 | struct mptcp_sock *msk; | ||
398 | int ret = -EINVAL; | ||
399 | struct sock *sk; | ||
400 | - u8 bkup = 0; | ||
401 | |||
402 | if (GENL_REQ_ATTR_CHECK(info, MPTCP_PM_ATTR_ADDR_REMOTE)) | ||
403 | return ret; | ||
404 | @@ -XXX,XX +XXX,XX @@ int mptcp_userspace_pm_set_flags(struct mptcp_pm_addr_entry *local, | ||
405 | goto set_flags_err; | ||
406 | } | ||
407 | |||
408 | - if (local->flags & MPTCP_PM_ADDR_FLAG_BACKUP) | ||
409 | - bkup = 1; | ||
410 | - | ||
411 | - spin_lock_bh(&msk->pm.lock); | ||
412 | - entry = mptcp_userspace_pm_lookup_addr(msk, &local->addr); | ||
413 | - if (entry) { | ||
414 | - if (bkup) | ||
415 | - entry->flags |= MPTCP_PM_ADDR_FLAG_BACKUP; | ||
416 | - else | ||
417 | - entry->flags &= ~MPTCP_PM_ADDR_FLAG_BACKUP; | ||
418 | - } | ||
419 | - spin_unlock_bh(&msk->pm.lock); | ||
420 | - | ||
421 | lock_sock(sk); | ||
422 | - ret = mptcp_pm_nl_mp_prio_send_ack(msk, &local->addr, &rem, bkup); | ||
423 | + ret = userspace_pm_set_flags(msk, local, &rem); | ||
424 | release_sock(sk); | ||
425 | |||
426 | /* mptcp_pm_nl_mp_prio_send_ack() only fails in one case */ | ||
427 | @@ -XXX,XX +XXX,XX @@ int mptcp_userspace_pm_get_addr(u8 id, struct mptcp_pm_addr_entry *addr, | ||
428 | return ret; | ||
429 | } | ||
430 | |||
431 | +static struct mptcp_pm_ops mptcp_userspace_pm = { | ||
432 | + .address_announce = userspace_pm_address_announce, | ||
433 | + .address_remove = userspace_pm_address_remove, | ||
434 | + .subflow_create = userspace_pm_subflow_create, | ||
435 | + .subflow_destroy = userspace_pm_subflow_destroy, | ||
436 | + .get_local_id = userspace_pm_get_local_id, | ||
437 | + .get_flags = userspace_pm_get_flags, | ||
438 | + .set_flags = userspace_pm_set_flags, | ||
439 | + .type = MPTCP_PM_TYPE_USERSPACE, | ||
440 | + .owner = THIS_MODULE, | ||
441 | +}; | ||
442 | + | ||
443 | /* Must be called with rcu read lock held */ | ||
444 | struct mptcp_pm_ops *mptcp_pm_find(enum mptcp_pm_type type) | ||
445 | { | ||
446 | @@ -XXX,XX +XXX,XX @@ int mptcp_register_path_manager(struct mptcp_pm_ops *pm) | ||
447 | |||
448 | void mptcp_unregister_path_manager(struct mptcp_pm_ops *pm) | ||
449 | { | ||
450 | + if (pm == &mptcp_userspace_pm) | ||
451 | + return; | ||
452 | + | ||
453 | spin_lock(&mptcp_pm_list_lock); | ||
454 | list_del_rcu(&pm->list); | ||
455 | spin_unlock(&mptcp_pm_list_lock); | ||
456 | } | ||
457 | + | ||
458 | +void __init mptcp_userspace_pm_init(void) | ||
459 | +{ | ||
460 | + mptcp_register_path_manager(&mptcp_userspace_pm); | ||
461 | +} | ||
462 | diff --git a/net/mptcp/protocol.h b/net/mptcp/protocol.h | 128 | diff --git a/net/mptcp/protocol.h b/net/mptcp/protocol.h |
463 | index XXXXXXX..XXXXXXX 100644 | 129 | index XXXXXXX..XXXXXXX 100644 |
464 | --- a/net/mptcp/protocol.h | 130 | --- a/net/mptcp/protocol.h |
465 | +++ b/net/mptcp/protocol.h | 131 | +++ b/net/mptcp/protocol.h |
466 | @@ -XXX,XX +XXX,XX @@ static inline u8 subflow_get_local_id(const struct mptcp_subflow_context *subflo | 132 | @@ -XXX,XX +XXX,XX @@ bool mptcp_pm_add_addr_signal(struct mptcp_sock *msk, const struct sk_buff *skb, |
467 | } | 133 | bool mptcp_pm_rm_addr_signal(struct mptcp_sock *msk, unsigned int remaining, |
468 | 134 | struct mptcp_rm_list *rm_list); | |
469 | void __init mptcp_pm_nl_init(void); | 135 | int mptcp_pm_get_local_id(struct mptcp_sock *msk, struct sock_common *skc); |
470 | +void __init mptcp_userspace_pm_init(void); | 136 | -int mptcp_pm_nl_get_local_id(struct mptcp_sock *msk, struct mptcp_addr_info *skc); |
471 | void mptcp_pm_nl_work(struct mptcp_sock *msk); | 137 | -int mptcp_userspace_pm_get_local_id(struct mptcp_sock *msk, struct mptcp_addr_info *skc); |
472 | unsigned int mptcp_pm_get_add_addr_signal_max(const struct mptcp_sock *msk); | 138 | +int mptcp_pm_nl_get_local_id(struct mptcp_sock *msk, |
473 | unsigned int mptcp_pm_get_add_addr_accept_max(const struct mptcp_sock *msk); | 139 | + struct mptcp_pm_addr_entry *skc); |
140 | +int mptcp_userspace_pm_get_local_id(struct mptcp_sock *msk, | ||
141 | + struct mptcp_pm_addr_entry *skc); | ||
142 | bool mptcp_pm_is_backup(struct mptcp_sock *msk, struct sock_common *skc); | ||
143 | bool mptcp_pm_nl_is_backup(struct mptcp_sock *msk, struct mptcp_addr_info *skc); | ||
144 | bool mptcp_userspace_pm_is_backup(struct mptcp_sock *msk, struct mptcp_addr_info *skc); | ||
474 | -- | 145 | -- |
475 | 2.43.0 | 146 | 2.43.0 | diff view generated by jsdifflib |
1 | From: Geliang Tang <tanggeliang@kylinos.cn> | 1 | From: Geliang Tang <tanggeliang@kylinos.cn> |
---|---|---|---|
2 | 2 | ||
3 | Add a struct mptcp_pm_ops pointer "ops" in struct mptcp_pm_data, and two | 3 | Instead of using kmalloc() or kzalloc() to allocate an entry and |
4 | functions mptcp_init_pm() and mptcp_release_pm(), to set and release this | 4 | then immediately duplicate another entry to the newly allocated |
5 | pointer. mptcp_init_pm() is invoked in mptcp_pm_data_reset(), while | 5 | one, kmemdup() helper can be used to simplify the code. |
6 | mptcp_release_pm() is invoked in __mptcp_destroy_sock(). | ||
7 | |||
8 | In this way, different userspace path managers can be initialized through | ||
9 | the pm_type sysctl, and then called into their respective interfaces | ||
10 | through "ops" of "msk->pm". | ||
11 | 6 | ||
12 | Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn> | 7 | Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn> |
13 | --- | 8 | --- |
14 | net/mptcp/pm.c | 7 +++++ | 9 | net/mptcp/pm_netlink.c | 6 ++---- |
15 | net/mptcp/pm_userspace.c | 58 +++++++++++++++++++++++++++++++++++----- | 10 | 1 file changed, 2 insertions(+), 4 deletions(-) |
16 | net/mptcp/protocol.c | 1 + | ||
17 | net/mptcp/protocol.h | 3 +++ | ||
18 | 4 files changed, 62 insertions(+), 7 deletions(-) | ||
19 | 11 | ||
20 | diff --git a/net/mptcp/pm.c b/net/mptcp/pm.c | 12 | diff --git a/net/mptcp/pm_netlink.c b/net/mptcp/pm_netlink.c |
21 | index XXXXXXX..XXXXXXX 100644 | 13 | index XXXXXXX..XXXXXXX 100644 |
22 | --- a/net/mptcp/pm.c | 14 | --- a/net/mptcp/pm_netlink.c |
23 | +++ b/net/mptcp/pm.c | 15 | +++ b/net/mptcp/pm_netlink.c |
24 | @@ -XXX,XX +XXX,XX @@ void mptcp_pm_data_reset(struct mptcp_sock *msk) | 16 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_get_local_id(struct mptcp_sock *msk, |
25 | { | 17 | return ret; |
26 | u8 pm_type = mptcp_get_pm_type(sock_net((struct sock *)msk)); | 18 | |
27 | struct mptcp_pm_data *pm = &msk->pm; | 19 | /* address not found, add to local list */ |
28 | + int ret; | 20 | - entry = kmalloc(sizeof(*entry), GFP_ATOMIC); |
29 | 21 | + entry = kmemdup(skc, sizeof(*skc), GFP_ATOMIC); | |
30 | pm->add_addr_signaled = 0; | 22 | if (!entry) |
31 | pm->add_addr_accepted = 0; | 23 | return -ENOMEM; |
32 | @@ -XXX,XX +XXX,XX @@ void mptcp_pm_data_reset(struct mptcp_sock *msk) | 24 | |
33 | WRITE_ONCE(pm->work_pending, 0); | 25 | - *entry = *skc; |
34 | WRITE_ONCE(pm->accept_addr, 0); | 26 | entry->addr.port = 0; |
35 | WRITE_ONCE(pm->accept_subflow, 0); | 27 | ret = mptcp_pm_nl_append_new_local_addr(pernet, entry, true); |
36 | + | 28 | if (ret < 0) |
37 | + rcu_read_lock(); | 29 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_add_addr_doit(struct sk_buff *skb, struct genl_info *info) |
38 | + ret = mptcp_init_pm(msk, mptcp_pm_find(pm_type)); | 30 | return -EINVAL; |
39 | + rcu_read_unlock(); | ||
40 | + if (ret) | ||
41 | + return; | ||
42 | } | 31 | } |
43 | 32 | ||
44 | WRITE_ONCE(pm->addr_signal, 0); | 33 | - entry = kzalloc(sizeof(*entry), GFP_KERNEL_ACCOUNT); |
45 | diff --git a/net/mptcp/pm_userspace.c b/net/mptcp/pm_userspace.c | 34 | + entry = kmemdup(&addr, sizeof(addr), GFP_KERNEL_ACCOUNT); |
46 | index XXXXXXX..XXXXXXX 100644 | 35 | if (!entry) { |
47 | --- a/net/mptcp/pm_userspace.c | 36 | GENL_SET_ERR_MSG(info, "can't allocate addr"); |
48 | +++ b/net/mptcp/pm_userspace.c | 37 | return -ENOMEM; |
49 | @@ -XXX,XX +XXX,XX @@ static int userspace_pm_get_local_id(struct mptcp_sock *msk, | ||
50 | int mptcp_userspace_pm_get_local_id(struct mptcp_sock *msk, | ||
51 | struct mptcp_pm_addr_entry *local) | ||
52 | { | ||
53 | - return userspace_pm_get_local_id(msk, local); | ||
54 | + return msk->pm.ops->get_local_id ? | ||
55 | + msk->pm.ops->get_local_id(msk, local) : | ||
56 | + userspace_pm_get_local_id(msk, local); | ||
57 | } | ||
58 | |||
59 | static u8 userspace_pm_get_flags(struct mptcp_sock *msk, | ||
60 | @@ -XXX,XX +XXX,XX @@ static u8 userspace_pm_get_flags(struct mptcp_sock *msk, | ||
61 | u8 mptcp_userspace_pm_get_flags(struct mptcp_sock *msk, | ||
62 | struct mptcp_addr_info *skc) | ||
63 | { | ||
64 | - return userspace_pm_get_flags(msk, skc); | ||
65 | + return msk->pm.ops->get_flags ? | ||
66 | + msk->pm.ops->get_flags(msk, skc) : | ||
67 | + userspace_pm_get_flags(msk, skc); | ||
68 | } | ||
69 | |||
70 | static struct mptcp_sock *mptcp_userspace_pm_get_sock(const struct genl_info *info) | ||
71 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_announce_doit(struct sk_buff *skb, struct genl_info *info) | ||
72 | } | 38 | } |
73 | 39 | ||
74 | lock_sock(sk); | 40 | - *entry = addr; |
75 | - err = userspace_pm_address_announce(msk, &addr_val); | 41 | if (entry->addr.port) { |
76 | + err = msk->pm.ops->address_announce ? | 42 | ret = mptcp_pm_nl_create_listen_socket(skb->sk, entry); |
77 | + msk->pm.ops->address_announce(msk, &addr_val) : | 43 | if (ret) { |
78 | + userspace_pm_address_announce(msk, &addr_val); | ||
79 | release_sock(sk); | ||
80 | if (err) | ||
81 | NL_SET_ERR_MSG_ATTR(info->extack, addr, | ||
82 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_remove_doit(struct sk_buff *skb, struct genl_info *info) | ||
83 | sk = (struct sock *)msk; | ||
84 | |||
85 | lock_sock(sk); | ||
86 | - err = userspace_pm_address_remove(msk, id_val); | ||
87 | + err = msk->pm.ops->address_remove ? | ||
88 | + msk->pm.ops->address_remove(msk, id_val) : | ||
89 | + userspace_pm_address_remove(msk, id_val); | ||
90 | release_sock(sk); | ||
91 | if (err) | ||
92 | NL_SET_ERR_MSG_ATTR_FMT(info->extack, id, | ||
93 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_subflow_create_doit(struct sk_buff *skb, struct genl_info *info) | ||
94 | } | ||
95 | |||
96 | lock_sock(sk); | ||
97 | - err = userspace_pm_subflow_create(msk, &entry, &addr_r); | ||
98 | + err = msk->pm.ops->subflow_create ? | ||
99 | + msk->pm.ops->subflow_create(msk, &entry, &addr_r) : | ||
100 | + userspace_pm_subflow_create(msk, &entry, &addr_r); | ||
101 | release_sock(sk); | ||
102 | |||
103 | if (err) | ||
104 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_nl_subflow_destroy_doit(struct sk_buff *skb, struct genl_info *info | ||
105 | } | ||
106 | |||
107 | lock_sock(sk); | ||
108 | - err = userspace_pm_subflow_destroy(msk, &addr_l, &addr_r); | ||
109 | + err = msk->pm.ops->subflow_destroy ? | ||
110 | + msk->pm.ops->subflow_destroy(msk, &addr_l, &addr_r) : | ||
111 | + userspace_pm_subflow_destroy(msk, &addr_l, &addr_r); | ||
112 | release_sock(sk); | ||
113 | if (err) | ||
114 | GENL_SET_ERR_MSG(info, "subflow not found"); | ||
115 | @@ -XXX,XX +XXX,XX @@ int mptcp_userspace_pm_set_flags(struct mptcp_pm_addr_entry *local, | ||
116 | } | ||
117 | |||
118 | lock_sock(sk); | ||
119 | - ret = userspace_pm_set_flags(msk, local, &rem); | ||
120 | + ret = msk->pm.ops->set_flags ? | ||
121 | + msk->pm.ops->set_flags(msk, local, &rem) : | ||
122 | + userspace_pm_set_flags(msk, local, &rem); | ||
123 | release_sock(sk); | ||
124 | |||
125 | /* mptcp_pm_nl_mp_prio_send_ack() only fails in one case */ | ||
126 | @@ -XXX,XX +XXX,XX @@ void mptcp_unregister_path_manager(struct mptcp_pm_ops *pm) | ||
127 | spin_unlock(&mptcp_pm_list_lock); | ||
128 | } | ||
129 | |||
130 | +int mptcp_init_pm(struct mptcp_sock *msk, struct mptcp_pm_ops *pm) | ||
131 | +{ | ||
132 | + if (!pm) | ||
133 | + pm = &mptcp_userspace_pm; | ||
134 | + | ||
135 | + if (!bpf_try_module_get(pm, pm->owner)) | ||
136 | + return -EBUSY; | ||
137 | + | ||
138 | + msk->pm.ops = pm; | ||
139 | + if (msk->pm.ops->init) | ||
140 | + msk->pm.ops->init(msk); | ||
141 | + | ||
142 | + pr_debug("userspace_pm type %u initialized\n", msk->pm.ops->type); | ||
143 | + return 0; | ||
144 | +} | ||
145 | + | ||
146 | +void mptcp_release_pm(struct mptcp_sock *msk) | ||
147 | +{ | ||
148 | + struct mptcp_pm_ops *pm = msk->pm.ops; | ||
149 | + | ||
150 | + if (!pm) | ||
151 | + return; | ||
152 | + | ||
153 | + msk->pm.ops = NULL; | ||
154 | + if (pm->release) | ||
155 | + pm->release(msk); | ||
156 | + | ||
157 | + bpf_module_put(pm, pm->owner); | ||
158 | +} | ||
159 | + | ||
160 | void __init mptcp_userspace_pm_init(void) | ||
161 | { | ||
162 | mptcp_register_path_manager(&mptcp_userspace_pm); | ||
163 | diff --git a/net/mptcp/protocol.c b/net/mptcp/protocol.c | ||
164 | index XXXXXXX..XXXXXXX 100644 | ||
165 | --- a/net/mptcp/protocol.c | ||
166 | +++ b/net/mptcp/protocol.c | ||
167 | @@ -XXX,XX +XXX,XX @@ static void __mptcp_destroy_sock(struct sock *sk) | ||
168 | sk_stop_timer(sk, &sk->sk_timer); | ||
169 | msk->pm.status = 0; | ||
170 | mptcp_release_sched(msk); | ||
171 | + mptcp_release_pm(msk); | ||
172 | |||
173 | sk->sk_prot->destroy(sk); | ||
174 | |||
175 | diff --git a/net/mptcp/protocol.h b/net/mptcp/protocol.h | ||
176 | index XXXXXXX..XXXXXXX 100644 | ||
177 | --- a/net/mptcp/protocol.h | ||
178 | +++ b/net/mptcp/protocol.h | ||
179 | @@ -XXX,XX +XXX,XX @@ struct mptcp_pm_data { | ||
180 | struct mptcp_addr_info remote; | ||
181 | struct list_head anno_list; | ||
182 | struct list_head userspace_pm_local_addr_list; | ||
183 | + struct mptcp_pm_ops *ops; | ||
184 | |||
185 | spinlock_t lock; /*protects the whole PM data */ | ||
186 | |||
187 | @@ -XXX,XX +XXX,XX @@ struct mptcp_pm_ops *mptcp_pm_find(enum mptcp_pm_type type); | ||
188 | int mptcp_validate_path_manager(struct mptcp_pm_ops *pm); | ||
189 | int mptcp_register_path_manager(struct mptcp_pm_ops *pm); | ||
190 | void mptcp_unregister_path_manager(struct mptcp_pm_ops *pm); | ||
191 | +int mptcp_init_pm(struct mptcp_sock *msk, struct mptcp_pm_ops *pm); | ||
192 | +void mptcp_release_pm(struct mptcp_sock *msk); | ||
193 | |||
194 | void mptcp_free_local_addr_list(struct mptcp_sock *msk); | ||
195 | |||
196 | -- | 44 | -- |
197 | 2.43.0 | 45 | 2.43.0 | diff view generated by jsdifflib |
New patch | |||
---|---|---|---|
1 | From: Geliang Tang <tanggeliang@kylinos.cn> | ||
1 | 2 | ||
3 | This patch adds the sock version of kmemdup() helper, named sock_kmemdup(), | ||
4 | to duplicate a memory block using the socket's option memory buffer. | ||
5 | |||
6 | Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn> | ||
7 | --- | ||
8 | include/net/sock.h | 1 + | ||
9 | net/core/sock.c | 23 +++++++++++++++++++++++ | ||
10 | 2 files changed, 24 insertions(+) | ||
11 | |||
12 | diff --git a/include/net/sock.h b/include/net/sock.h | ||
13 | index XXXXXXX..XXXXXXX 100644 | ||
14 | --- a/include/net/sock.h | ||
15 | +++ b/include/net/sock.h | ||
16 | @@ -XXX,XX +XXX,XX @@ static inline struct sk_buff *sock_alloc_send_skb(struct sock *sk, | ||
17 | } | ||
18 | |||
19 | void *sock_kmalloc(struct sock *sk, int size, gfp_t priority); | ||
20 | +void *sock_kmemdup(struct sock *sk, const void *src, int size, gfp_t priority); | ||
21 | void sock_kfree_s(struct sock *sk, void *mem, int size); | ||
22 | void sock_kzfree_s(struct sock *sk, void *mem, int size); | ||
23 | void sk_send_sigurg(struct sock *sk); | ||
24 | diff --git a/net/core/sock.c b/net/core/sock.c | ||
25 | index XXXXXXX..XXXXXXX 100644 | ||
26 | --- a/net/core/sock.c | ||
27 | +++ b/net/core/sock.c | ||
28 | @@ -XXX,XX +XXX,XX @@ void *sock_kmalloc(struct sock *sk, int size, gfp_t priority) | ||
29 | } | ||
30 | EXPORT_SYMBOL(sock_kmalloc); | ||
31 | |||
32 | +/* | ||
33 | + * Duplicate a memory block using the socket's option memory buffer. | ||
34 | + */ | ||
35 | +void *sock_kmemdup(struct sock *sk, const void *src, int size, gfp_t priority) | ||
36 | +{ | ||
37 | + int optmem_max = READ_ONCE(sock_net(sk)->core.sysctl_optmem_max); | ||
38 | + | ||
39 | + if ((unsigned int)size <= optmem_max && | ||
40 | + atomic_read(&sk->sk_omem_alloc) + size < optmem_max) { | ||
41 | + void *mem; | ||
42 | + /* First do the add, to avoid the race if kmalloc | ||
43 | + * might sleep. | ||
44 | + */ | ||
45 | + atomic_add(size, &sk->sk_omem_alloc); | ||
46 | + mem = kmemdup(src, size, priority); | ||
47 | + if (mem) | ||
48 | + return mem; | ||
49 | + atomic_sub(size, &sk->sk_omem_alloc); | ||
50 | + } | ||
51 | + return NULL; | ||
52 | +} | ||
53 | +EXPORT_SYMBOL(sock_kmemdup); | ||
54 | + | ||
55 | /* Free an option memory block. Note, we actually want the inline | ||
56 | * here as this allows gcc to detect the nullify and fold away the | ||
57 | * condition entirely. | ||
58 | -- | ||
59 | 2.43.0 | diff view generated by jsdifflib |
1 | From: Geliang Tang <tanggeliang@kylinos.cn> | 1 | From: Geliang Tang <tanggeliang@kylinos.cn> |
---|---|---|---|
2 | 2 | ||
3 | In order to allow users to develop their own BPF-based path manager, | 3 | Instead of using sock_kmalloc() to allocate an entry and then |
4 | this patch defines a struct ops "mptcp_pm_ops" for a userspace path | 4 | immediately duplicate another entry to the newly allocated one, |
5 | manager, which contains a set of interfaces. | 5 | sock_kmemdup() helper can be used to simplify the code. |
6 | 6 | ||
7 | Add a set of functions to register, unregister, find and validate a | 7 | More importantly, the code "*e = *entry;" that assigns "entry" |
8 | given struct ops. | 8 | to "e" is not easy to implement in BPF if we use the same code |
9 | to implement an append_new_local_addr() helper of a BPF path | ||
10 | manager. This patch avoids this type of memory assignment | ||
11 | operation. | ||
9 | 12 | ||
10 | Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn> | 13 | Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn> |
11 | --- | 14 | --- |
12 | include/net/mptcp.h | 27 +++++++++++++++++++ | 15 | net/mptcp/pm_userspace.c | 3 +-- |
13 | net/mptcp/pm_userspace.c | 57 ++++++++++++++++++++++++++++++++++++++++ | 16 | 1 file changed, 1 insertion(+), 2 deletions(-) |
14 | net/mptcp/protocol.h | 5 ++++ | ||
15 | 3 files changed, 89 insertions(+) | ||
16 | 17 | ||
17 | diff --git a/include/net/mptcp.h b/include/net/mptcp.h | ||
18 | index XXXXXXX..XXXXXXX 100644 | ||
19 | --- a/include/net/mptcp.h | ||
20 | +++ b/include/net/mptcp.h | ||
21 | @@ -XXX,XX +XXX,XX @@ | ||
22 | |||
23 | struct mptcp_info; | ||
24 | struct mptcp_sock; | ||
25 | +struct mptcp_pm_addr_entry; | ||
26 | struct seq_file; | ||
27 | |||
28 | /* MPTCP sk_buff extension data */ | ||
29 | @@ -XXX,XX +XXX,XX @@ struct mptcp_sched_ops { | ||
30 | void (*release)(struct mptcp_sock *msk); | ||
31 | } ____cacheline_aligned_in_smp; | ||
32 | |||
33 | +struct mptcp_pm_ops { | ||
34 | + int (*address_announce)(struct mptcp_sock *msk, | ||
35 | + struct mptcp_pm_addr_entry *local); | ||
36 | + int (*address_remove)(struct mptcp_sock *msk, u8 id); | ||
37 | + int (*subflow_create)(struct mptcp_sock *msk, | ||
38 | + struct mptcp_pm_addr_entry *local, | ||
39 | + struct mptcp_addr_info *remote); | ||
40 | + int (*subflow_destroy)(struct mptcp_sock *msk, | ||
41 | + struct mptcp_pm_addr_entry *local, | ||
42 | + struct mptcp_addr_info *remote); | ||
43 | + int (*get_local_id)(struct mptcp_sock *msk, | ||
44 | + struct mptcp_pm_addr_entry *local); | ||
45 | + u8 (*get_flags)(struct mptcp_sock *msk, | ||
46 | + struct mptcp_addr_info *skc); | ||
47 | + int (*set_flags)(struct mptcp_sock *msk, | ||
48 | + struct mptcp_pm_addr_entry *local, | ||
49 | + struct mptcp_addr_info *remote); | ||
50 | + | ||
51 | + u8 type; | ||
52 | + struct module *owner; | ||
53 | + struct list_head list; | ||
54 | + | ||
55 | + void (*init)(struct mptcp_sock *msk); | ||
56 | + void (*release)(struct mptcp_sock *msk); | ||
57 | +} ____cacheline_aligned_in_smp; | ||
58 | + | ||
59 | #ifdef CONFIG_MPTCP | ||
60 | void mptcp_init(void); | ||
61 | |||
62 | diff --git a/net/mptcp/pm_userspace.c b/net/mptcp/pm_userspace.c | 18 | diff --git a/net/mptcp/pm_userspace.c b/net/mptcp/pm_userspace.c |
63 | index XXXXXXX..XXXXXXX 100644 | 19 | index XXXXXXX..XXXXXXX 100644 |
64 | --- a/net/mptcp/pm_userspace.c | 20 | --- a/net/mptcp/pm_userspace.c |
65 | +++ b/net/mptcp/pm_userspace.c | 21 | +++ b/net/mptcp/pm_userspace.c |
66 | @@ -XXX,XX +XXX,XX @@ | 22 | @@ -XXX,XX +XXX,XX @@ static int mptcp_userspace_pm_append_new_local_addr(struct mptcp_sock *msk, |
67 | * Copyright (c) 2022, Intel Corporation. | 23 | /* Memory for the entry is allocated from the |
68 | */ | 24 | * sock option buffer. |
69 | 25 | */ | |
70 | +#include <linux/rculist.h> | 26 | - e = sock_kmalloc(sk, sizeof(*e), GFP_ATOMIC); |
71 | +#include <linux/spinlock.h> | 27 | + e = sock_kmemdup(sk, entry, sizeof(*entry), GFP_ATOMIC); |
72 | #include "protocol.h" | 28 | if (!e) { |
73 | #include "mib.h" | 29 | ret = -ENOMEM; |
74 | #include "mptcp_pm_gen.h" | 30 | goto append_err; |
75 | @@ -XXX,XX +XXX,XX @@ | 31 | } |
76 | list_for_each_entry(__entry, \ | 32 | |
77 | &((__msk)->pm.userspace_pm_local_addr_list), list) | 33 | - *e = *entry; |
78 | 34 | if (!e->addr.id && needs_id) | |
79 | +static DEFINE_SPINLOCK(mptcp_pm_list_lock); | 35 | e->addr.id = find_next_zero_bit(id_bitmap, |
80 | +static LIST_HEAD(mptcp_pm_list); | 36 | MPTCP_PM_MAX_ADDR_ID + 1, |
81 | + | ||
82 | void mptcp_free_local_addr_list(struct mptcp_sock *msk) | ||
83 | { | ||
84 | struct mptcp_pm_addr_entry *entry, *tmp; | ||
85 | @@ -XXX,XX +XXX,XX @@ int mptcp_userspace_pm_get_addr(u8 id, struct mptcp_pm_addr_entry *addr, | ||
86 | sock_put(sk); | ||
87 | return ret; | ||
88 | } | ||
89 | + | ||
90 | +/* Must be called with rcu read lock held */ | ||
91 | +struct mptcp_pm_ops *mptcp_pm_find(enum mptcp_pm_type type) | ||
92 | +{ | ||
93 | + struct mptcp_pm_ops *pm; | ||
94 | + | ||
95 | + list_for_each_entry_rcu(pm, &mptcp_pm_list, list) { | ||
96 | + if (pm->type == type) | ||
97 | + return pm; | ||
98 | + } | ||
99 | + | ||
100 | + return NULL; | ||
101 | +} | ||
102 | + | ||
103 | +int mptcp_validate_path_manager(struct mptcp_pm_ops *pm) | ||
104 | +{ | ||
105 | + if (!pm->address_announce && !pm->address_remove && | ||
106 | + !pm->subflow_create && !pm->subflow_destroy && | ||
107 | + !pm->get_local_id && !pm->get_flags && !pm->set_flags) { | ||
108 | + pr_err("%u does not implement required ops\n", pm->type); | ||
109 | + return -EINVAL; | ||
110 | + } | ||
111 | + | ||
112 | + return 0; | ||
113 | +} | ||
114 | + | ||
115 | +int mptcp_register_path_manager(struct mptcp_pm_ops *pm) | ||
116 | +{ | ||
117 | + int ret; | ||
118 | + | ||
119 | + ret = mptcp_validate_path_manager(pm); | ||
120 | + if (ret) | ||
121 | + return ret; | ||
122 | + | ||
123 | + spin_lock(&mptcp_pm_list_lock); | ||
124 | + if (mptcp_pm_find(pm->type)) { | ||
125 | + spin_unlock(&mptcp_pm_list_lock); | ||
126 | + return -EEXIST; | ||
127 | + } | ||
128 | + list_add_tail_rcu(&pm->list, &mptcp_pm_list); | ||
129 | + spin_unlock(&mptcp_pm_list_lock); | ||
130 | + | ||
131 | + pr_debug("userspace_pm type %u registered\n", pm->type); | ||
132 | + return 0; | ||
133 | +} | ||
134 | + | ||
135 | +void mptcp_unregister_path_manager(struct mptcp_pm_ops *pm) | ||
136 | +{ | ||
137 | + spin_lock(&mptcp_pm_list_lock); | ||
138 | + list_del_rcu(&pm->list); | ||
139 | + spin_unlock(&mptcp_pm_list_lock); | ||
140 | +} | ||
141 | diff --git a/net/mptcp/protocol.h b/net/mptcp/protocol.h | ||
142 | index XXXXXXX..XXXXXXX 100644 | ||
143 | --- a/net/mptcp/protocol.h | ||
144 | +++ b/net/mptcp/protocol.h | ||
145 | @@ -XXX,XX +XXX,XX @@ int mptcp_pm_remove_addr(struct mptcp_sock *msk, const struct mptcp_rm_list *rm_ | ||
146 | void mptcp_pm_remove_addr_entry(struct mptcp_sock *msk, | ||
147 | struct mptcp_pm_addr_entry *entry); | ||
148 | |||
149 | +struct mptcp_pm_ops *mptcp_pm_find(enum mptcp_pm_type type); | ||
150 | +int mptcp_validate_path_manager(struct mptcp_pm_ops *pm); | ||
151 | +int mptcp_register_path_manager(struct mptcp_pm_ops *pm); | ||
152 | +void mptcp_unregister_path_manager(struct mptcp_pm_ops *pm); | ||
153 | + | ||
154 | void mptcp_free_local_addr_list(struct mptcp_sock *msk); | ||
155 | |||
156 | void mptcp_event(enum mptcp_event_type type, const struct mptcp_sock *msk, | ||
157 | -- | 37 | -- |
158 | 2.43.0 | 38 | 2.43.0 | diff view generated by jsdifflib |