Commit 46c28dbd authored by Ursula Braun's avatar Ursula Braun Committed by David S. Miller

net/smc: no socket state changes in tasklet context

Several state changes occur during SMC socket closing. Currently
state changes triggered locally occur in process context with
lock_sock() taken while state changes triggered by peer occur in
tasklet context with bh_lock_sock() taken. bh_lock_sock() does not
wait till a lock_sock(() task in process context is finished. This
may lead to races in socket state transitions resulting in dangling
SMC-sockets, or it may lead to duplicate SMC socket freeing.
This patch introduces a closing worker to run all state changes under
lock_sock().
Signed-off-by: default avatarUrsula Braun <ubraun@linux.vnet.ibm.com>
Reviewed-by: default avatarThomas Richter <tmricht@linux.vnet.ibm.com>
Reported-by: default avatarDave Jones <davej@codemonkey.org.uk>
Signed-off-by: default avatarDavid S. Miller <davem@davemloft.net>
parent 90e9517e
...@@ -451,6 +451,9 @@ static int smc_connect_rdma(struct smc_sock *smc) ...@@ -451,6 +451,9 @@ static int smc_connect_rdma(struct smc_sock *smc)
goto decline_rdma_unlock; goto decline_rdma_unlock;
} }
smc_close_init(smc);
smc_rx_init(smc);
if (local_contact == SMC_FIRST_CONTACT) { if (local_contact == SMC_FIRST_CONTACT) {
rc = smc_ib_ready_link(link); rc = smc_ib_ready_link(link);
if (rc) { if (rc) {
...@@ -477,7 +480,6 @@ static int smc_connect_rdma(struct smc_sock *smc) ...@@ -477,7 +480,6 @@ static int smc_connect_rdma(struct smc_sock *smc)
mutex_unlock(&smc_create_lgr_pending); mutex_unlock(&smc_create_lgr_pending);
smc_tx_init(smc); smc_tx_init(smc);
smc_rx_init(smc);
out_connected: out_connected:
smc_copy_sock_settings_to_clc(smc); smc_copy_sock_settings_to_clc(smc);
...@@ -800,6 +802,9 @@ static void smc_listen_work(struct work_struct *work) ...@@ -800,6 +802,9 @@ static void smc_listen_work(struct work_struct *work)
goto decline_rdma; goto decline_rdma;
} }
smc_close_init(new_smc);
smc_rx_init(new_smc);
rc = smc_clc_send_accept(new_smc, local_contact); rc = smc_clc_send_accept(new_smc, local_contact);
if (rc) if (rc)
goto out_err; goto out_err;
...@@ -839,7 +844,6 @@ static void smc_listen_work(struct work_struct *work) ...@@ -839,7 +844,6 @@ static void smc_listen_work(struct work_struct *work)
} }
smc_tx_init(new_smc); smc_tx_init(new_smc);
smc_rx_init(new_smc);
out_connected: out_connected:
sk_refcnt_debug_inc(newsmcsk); sk_refcnt_debug_inc(newsmcsk);
......
...@@ -164,6 +164,7 @@ struct smc_connection { ...@@ -164,6 +164,7 @@ struct smc_connection {
#ifndef KERNEL_HAS_ATOMIC64 #ifndef KERNEL_HAS_ATOMIC64
spinlock_t acurs_lock; /* protect cursors */ spinlock_t acurs_lock; /* protect cursors */
#endif #endif
struct work_struct close_work; /* peer sent some closing */
}; };
struct smc_sock { /* smc sock container */ struct smc_sock { /* smc sock container */
......
...@@ -217,8 +217,13 @@ static void smc_cdc_msg_recv_action(struct smc_sock *smc, ...@@ -217,8 +217,13 @@ static void smc_cdc_msg_recv_action(struct smc_sock *smc,
smc->sk.sk_err = ECONNRESET; smc->sk.sk_err = ECONNRESET;
conn->local_tx_ctrl.conn_state_flags.peer_conn_abort = 1; conn->local_tx_ctrl.conn_state_flags.peer_conn_abort = 1;
} }
if (smc_cdc_rxed_any_close_or_senddone(conn)) if (smc_cdc_rxed_any_close_or_senddone(conn)) {
smc_close_passive_received(smc); smc->sk.sk_shutdown |= RCV_SHUTDOWN;
if (smc->clcsock && smc->clcsock->sk)
smc->clcsock->sk->sk_shutdown |= RCV_SHUTDOWN;
sock_set_flag(&smc->sk, SOCK_DONE);
schedule_work(&conn->close_work);
}
/* piggy backed tx info */ /* piggy backed tx info */
/* trigger sndbuf consumer: RDMA write into peer RMBE and CDC */ /* trigger sndbuf consumer: RDMA write into peer RMBE and CDC */
......
...@@ -117,7 +117,6 @@ void smc_close_active_abort(struct smc_sock *smc) ...@@ -117,7 +117,6 @@ void smc_close_active_abort(struct smc_sock *smc)
struct smc_cdc_conn_state_flags *txflags = struct smc_cdc_conn_state_flags *txflags =
&smc->conn.local_tx_ctrl.conn_state_flags; &smc->conn.local_tx_ctrl.conn_state_flags;
bh_lock_sock(&smc->sk);
smc->sk.sk_err = ECONNABORTED; smc->sk.sk_err = ECONNABORTED;
if (smc->clcsock && smc->clcsock->sk) { if (smc->clcsock && smc->clcsock->sk) {
smc->clcsock->sk->sk_err = ECONNABORTED; smc->clcsock->sk->sk_err = ECONNABORTED;
...@@ -125,6 +124,7 @@ void smc_close_active_abort(struct smc_sock *smc) ...@@ -125,6 +124,7 @@ void smc_close_active_abort(struct smc_sock *smc)
} }
switch (smc->sk.sk_state) { switch (smc->sk.sk_state) {
case SMC_INIT: case SMC_INIT:
case SMC_ACTIVE:
smc->sk.sk_state = SMC_PEERABORTWAIT; smc->sk.sk_state = SMC_PEERABORTWAIT;
break; break;
case SMC_APPCLOSEWAIT1: case SMC_APPCLOSEWAIT1:
...@@ -161,7 +161,6 @@ void smc_close_active_abort(struct smc_sock *smc) ...@@ -161,7 +161,6 @@ void smc_close_active_abort(struct smc_sock *smc)
} }
sock_set_flag(&smc->sk, SOCK_DEAD); sock_set_flag(&smc->sk, SOCK_DEAD);
bh_unlock_sock(&smc->sk);
smc->sk.sk_state_change(&smc->sk); smc->sk.sk_state_change(&smc->sk);
} }
...@@ -185,7 +184,7 @@ int smc_close_active(struct smc_sock *smc) ...@@ -185,7 +184,7 @@ int smc_close_active(struct smc_sock *smc)
case SMC_INIT: case SMC_INIT:
sk->sk_state = SMC_CLOSED; sk->sk_state = SMC_CLOSED;
if (smc->smc_listen_work.func) if (smc->smc_listen_work.func)
flush_work(&smc->smc_listen_work); cancel_work_sync(&smc->smc_listen_work);
sock_put(sk); sock_put(sk);
break; break;
case SMC_LISTEN: case SMC_LISTEN:
...@@ -198,7 +197,7 @@ int smc_close_active(struct smc_sock *smc) ...@@ -198,7 +197,7 @@ int smc_close_active(struct smc_sock *smc)
} }
release_sock(sk); release_sock(sk);
smc_close_cleanup_listen(sk); smc_close_cleanup_listen(sk);
flush_work(&smc->tcp_listen_work); cancel_work_sync(&smc->smc_listen_work);
lock_sock(sk); lock_sock(sk);
break; break;
case SMC_ACTIVE: case SMC_ACTIVE:
...@@ -306,22 +305,27 @@ static void smc_close_passive_abort_received(struct smc_sock *smc) ...@@ -306,22 +305,27 @@ static void smc_close_passive_abort_received(struct smc_sock *smc)
/* Some kind of closing has been received: peer_conn_closed, peer_conn_abort, /* Some kind of closing has been received: peer_conn_closed, peer_conn_abort,
* or peer_done_writing. * or peer_done_writing.
* Called under tasklet context.
*/ */
void smc_close_passive_received(struct smc_sock *smc) static void smc_close_passive_work(struct work_struct *work)
{ {
struct smc_cdc_conn_state_flags *rxflags = struct smc_connection *conn = container_of(work,
&smc->conn.local_rx_ctrl.conn_state_flags; struct smc_connection,
close_work);
struct smc_sock *smc = container_of(conn, struct smc_sock, conn);
struct smc_cdc_conn_state_flags *rxflags;
struct sock *sk = &smc->sk; struct sock *sk = &smc->sk;
int old_state; int old_state;
sk->sk_shutdown |= RCV_SHUTDOWN; lock_sock(&smc->sk);
if (smc->clcsock && smc->clcsock->sk)
smc->clcsock->sk->sk_shutdown |= RCV_SHUTDOWN;
sock_set_flag(&smc->sk, SOCK_DONE);
old_state = sk->sk_state; old_state = sk->sk_state;
if (!conn->alert_token_local) {
/* abnormal termination */
smc_close_active_abort(smc);
goto wakeup;
}
rxflags = &smc->conn.local_rx_ctrl.conn_state_flags;
if (rxflags->peer_conn_abort) { if (rxflags->peer_conn_abort) {
smc_close_passive_abort_received(smc); smc_close_passive_abort_received(smc);
goto wakeup; goto wakeup;
...@@ -373,11 +377,12 @@ void smc_close_passive_received(struct smc_sock *smc) ...@@ -373,11 +377,12 @@ void smc_close_passive_received(struct smc_sock *smc)
sk->sk_write_space(sk); /* wakeup blocked sndbuf producers */ sk->sk_write_space(sk); /* wakeup blocked sndbuf producers */
if ((sk->sk_state == SMC_CLOSED) && if ((sk->sk_state == SMC_CLOSED) &&
(sock_flag(sk, SOCK_DEAD) || (old_state == SMC_INIT))) { (sock_flag(sk, SOCK_DEAD) || !sk->sk_socket)) {
smc_conn_free(&smc->conn); smc_conn_free(&smc->conn);
schedule_delayed_work(&smc->sock_put_work, schedule_delayed_work(&smc->sock_put_work,
SMC_CLOSE_SOCK_PUT_DELAY); SMC_CLOSE_SOCK_PUT_DELAY);
} }
release_sock(&smc->sk);
} }
void smc_close_sock_put_work(struct work_struct *work) void smc_close_sock_put_work(struct work_struct *work)
...@@ -442,3 +447,9 @@ int smc_close_shutdown_write(struct smc_sock *smc) ...@@ -442,3 +447,9 @@ int smc_close_shutdown_write(struct smc_sock *smc)
sk->sk_state_change(&smc->sk); sk->sk_state_change(&smc->sk);
return rc; return rc;
} }
/* Initialize close properties on connection establishment. */
void smc_close_init(struct smc_sock *smc)
{
INIT_WORK(&smc->conn.close_work, smc_close_passive_work);
}
...@@ -21,8 +21,8 @@ ...@@ -21,8 +21,8 @@
void smc_close_wake_tx_prepared(struct smc_sock *smc); void smc_close_wake_tx_prepared(struct smc_sock *smc);
void smc_close_active_abort(struct smc_sock *smc); void smc_close_active_abort(struct smc_sock *smc);
int smc_close_active(struct smc_sock *smc); int smc_close_active(struct smc_sock *smc);
void smc_close_passive_received(struct smc_sock *smc);
void smc_close_sock_put_work(struct work_struct *work); void smc_close_sock_put_work(struct work_struct *work);
int smc_close_shutdown_write(struct smc_sock *smc); int smc_close_shutdown_write(struct smc_sock *smc);
void smc_close_init(struct smc_sock *smc);
#endif /* SMC_CLOSE_H */ #endif /* SMC_CLOSE_H */
...@@ -316,7 +316,7 @@ void smc_lgr_terminate(struct smc_link_group *lgr) ...@@ -316,7 +316,7 @@ void smc_lgr_terminate(struct smc_link_group *lgr)
smc = container_of(conn, struct smc_sock, conn); smc = container_of(conn, struct smc_sock, conn);
sock_hold(&smc->sk); sock_hold(&smc->sk);
__smc_lgr_unregister_conn(conn); __smc_lgr_unregister_conn(conn);
smc_close_active_abort(smc); schedule_work(&conn->close_work);
sock_put(&smc->sk); sock_put(&smc->sk);
node = rb_first(&lgr->conns_all); node = rb_first(&lgr->conns_all);
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment