From: Geliang Tang <tanggeliang@kylinos.cn>
An MPTCP-specific version of struct nvme_tcp_proto is implemented,
and it is assigned to ctrl->proto when the transport string is "mptcp".
The socket option setting logic is similar to the target side, except that
mptcp_sock_set_syncnt is newly defined for the host side.
It sets the value on the first subflow socket of an MPTCP connection.
The value is then synchronized to other newly created subflows in
sync_socket_options().
A separate nvme_mptcp_ctrl_ops structure with .name = "mptcp" is defined
and used for MPTCP controllers.
Cc: Hannes Reinecke <hare@suse.de>
Co-developed-by: zhenwei pi <zhenwei.pi@linux.dev>
Signed-off-by: zhenwei pi <zhenwei.pi@linux.dev>
Co-developed-by: Hui Zhu <zhuhui@kylinos.cn>
Signed-off-by: Hui Zhu <zhuhui@kylinos.cn>
Co-developed-by: Gang Yan <yangang@kylinos.cn>
Signed-off-by: Gang Yan <yangang@kylinos.cn>
Signed-off-by: Geliang Tang <tanggeliang@kylinos.cn>
---
drivers/nvme/host/tcp.c | 34 ++++++++++++++++++++++++++++++++++
include/net/mptcp.h | 7 +++++++
net/mptcp/protocol.h | 1 +
net/mptcp/sockopt.c | 25 +++++++++++++++++++++++++
4 files changed, 67 insertions(+)
diff --git a/drivers/nvme/host/tcp.c b/drivers/nvme/host/tcp.c
index 30ff6e03b32f..54d27acdd4b5 100644
--- a/drivers/nvme/host/tcp.c
+++ b/drivers/nvme/host/tcp.c
@@ -2889,6 +2889,24 @@ static const struct nvme_ctrl_ops nvme_tcp_ctrl_ops = {
.get_virt_boundary = nvmf_get_virt_boundary,
};
+#ifdef CONFIG_MPTCP
+static const struct nvme_ctrl_ops nvme_mptcp_ctrl_ops = {
+ .name = "mptcp",
+ .module = THIS_MODULE,
+ .flags = NVME_F_FABRICS | NVME_F_BLOCKING,
+ .reg_read32 = nvmf_reg_read32,
+ .reg_read64 = nvmf_reg_read64,
+ .reg_write32 = nvmf_reg_write32,
+ .subsystem_reset = nvmf_subsystem_reset,
+ .free_ctrl = nvme_tcp_free_ctrl,
+ .submit_async_event = nvme_tcp_submit_async_event,
+ .delete_ctrl = nvme_tcp_delete_ctrl,
+ .get_address = nvme_tcp_get_address,
+ .stop_ctrl = nvme_tcp_stop_ctrl,
+ .get_virt_boundary = nvmf_get_virt_boundary,
+};
+#endif
+
static bool
nvme_tcp_existing_controller(struct nvmf_ctrl_options *opts)
{
@@ -2916,6 +2934,18 @@ static const struct nvme_tcp_proto nvme_tcp_proto = {
.ops = &nvme_tcp_ctrl_ops,
};
+#ifdef CONFIG_MPTCP
+static const struct nvme_tcp_proto nvme_mptcp_proto = {
+ .protocol = IPPROTO_MPTCP,
+ .set_syncnt = mptcp_sock_set_syncnt,
+ .set_nodelay = mptcp_sock_set_nodelay,
+ .no_linger = mptcp_sock_no_linger,
+ .set_priority = mptcp_sock_set_priority,
+ .set_tos = mptcp_sock_set_tos,
+ .ops = &nvme_mptcp_ctrl_ops,
+};
+#endif
+
static struct nvme_tcp_ctrl *nvme_tcp_alloc_ctrl(struct device *dev,
struct nvmf_ctrl_options *opts)
{
@@ -2982,6 +3012,10 @@ static struct nvme_tcp_ctrl *nvme_tcp_alloc_ctrl(struct device *dev,
if (!strcmp(ctrl->ctrl.opts->transport, "tcp")) {
rcu_assign_pointer(ctrl->proto, &nvme_tcp_proto);
+#ifdef CONFIG_MPTCP
+ } else if (!strcmp(ctrl->ctrl.opts->transport, "mptcp")) {
+ rcu_assign_pointer(ctrl->proto, &nvme_mptcp_proto);
+#endif
} else {
ret = -EINVAL;
goto out_free_ctrl;
diff --git a/include/net/mptcp.h b/include/net/mptcp.h
index 91ce7b9b639d..49031a111e69 100644
--- a/include/net/mptcp.h
+++ b/include/net/mptcp.h
@@ -247,6 +247,8 @@ void mptcp_sock_set_priority(struct sock *sk, u32 priority);
void mptcp_sock_no_linger(struct sock *sk);
void mptcp_sock_set_tos(struct sock *sk, int val);
+
+int mptcp_sock_set_syncnt(struct sock *sk, int val);
#else
static inline void mptcp_init(void)
@@ -343,6 +345,11 @@ static inline void mptcp_sock_set_priority(struct sock *sk, u32 priority) { }
static inline void mptcp_sock_no_linger(struct sock *sk) { }
static inline void mptcp_sock_set_tos(struct sock *sk, int val) { }
+
+static inline int mptcp_sock_set_syncnt(struct sock *sk, int val)
+{
+ return 0;
+}
#endif /* CONFIG_MPTCP */
#if IS_ENABLED(CONFIG_MPTCP_IPV6)
diff --git a/net/mptcp/protocol.h b/net/mptcp/protocol.h
index f5d4d7d030f2..84e80816b2a4 100644
--- a/net/mptcp/protocol.h
+++ b/net/mptcp/protocol.h
@@ -335,6 +335,7 @@ struct mptcp_sock {
int keepalive_idle;
int keepalive_intvl;
int maxseg;
+ int icsk_syn_retries;
struct work_struct work;
struct sk_buff *ooo_last_skb;
struct rb_root out_of_order_queue;
diff --git a/net/mptcp/sockopt.c b/net/mptcp/sockopt.c
index 0f18398932a0..814cebc9125f 100644
--- a/net/mptcp/sockopt.c
+++ b/net/mptcp/sockopt.c
@@ -1592,6 +1592,7 @@ static void sync_socket_options(struct mptcp_sock *msk, struct sock *ssk)
priority = READ_ONCE(sk->sk_priority);
if (priority > 0)
sock_set_priority(ssk, priority);
+ tcp_sock_set_syncnt(ssk, msk->icsk_syn_retries);
}
void mptcp_sockopt_sync_locked(struct mptcp_sock *msk, struct sock *ssk)
@@ -1743,3 +1744,27 @@ void mptcp_sock_set_tos(struct sock *sk, int val)
release_sock(sk);
}
EXPORT_SYMBOL(mptcp_sock_set_tos);
+
+int mptcp_sock_set_syncnt(struct sock *sk, int val)
+{
+ struct mptcp_sock *msk = mptcp_sk(sk);
+ struct sock *ssk;
+ int ret = 0;
+
+ if (val < 1 || val > MAX_TCP_SYNCNT)
+ return -EINVAL;
+
+ lock_sock(sk);
+ sockopt_seq_inc(msk);
+ msk->icsk_syn_retries = val;
+ ssk = __mptcp_nmpc_sk(msk);
+ if (IS_ERR(ssk)) {
+ ret = PTR_ERR(ssk);
+ goto unlock;
+ }
+ tcp_sock_set_syncnt(ssk, val);
+unlock:
+ release_sock(sk);
+ return ret;
+}
+EXPORT_SYMBOL(mptcp_sock_set_syncnt);
--
2.51.0