Commit bc5e3a54 authored by David Howells's avatar David Howells

rxrpc: Use MSG_WAITALL to tell sendmsg() to temporarily ignore signals

Make AF_RXRPC accept MSG_WAITALL as a flag to sendmsg() to tell it to
ignore signals whilst loading up the message queue, provided progress is
being made in emptying the queue at the other side.

Progress is defined as the base of the transmit window having being
advanced within 2 RTT periods.  If the period is exceeded with no progress,
sendmsg() will return anyway, indicating how much data has been copied, if
any.

Once the supplied buffer is entirely decanted, the sendmsg() will return.
Signed-off-by: default avatarDavid Howells <dhowells@redhat.com>
parent f4d15fb6
...@@ -280,6 +280,18 @@ Interaction with the user of the RxRPC socket: ...@@ -280,6 +280,18 @@ Interaction with the user of the RxRPC socket:
nominated by a socket option. nominated by a socket option.
Notes on sendmsg:
(*) MSG_WAITALL can be set to tell sendmsg to ignore signals if the peer is
making progress at accepting packets within a reasonable time such that we
manage to queue up all the data for transmission. This requires the
client to accept at least one packet per 2*RTT time period.
If this isn't set, sendmsg() will return immediately, either returning
EINTR/ERESTARTSYS if nothing was consumed or returning the amount of data
consumed.
Notes on recvmsg: Notes on recvmsg:
(*) If there's a sequence of data messages belonging to a particular call on (*) If there's a sequence of data messages belonging to a particular call on
......
...@@ -407,7 +407,7 @@ int afs_make_call(struct in_addr *addr, struct afs_call *call, gfp_t gfp, ...@@ -407,7 +407,7 @@ int afs_make_call(struct in_addr *addr, struct afs_call *call, gfp_t gfp,
call->request_size); call->request_size);
msg.msg_control = NULL; msg.msg_control = NULL;
msg.msg_controllen = 0; msg.msg_controllen = 0;
msg.msg_flags = (call->send_pages ? MSG_MORE : 0); msg.msg_flags = MSG_WAITALL | (call->send_pages ? MSG_MORE : 0);
/* We have to change the state *before* sending the last packet as /* We have to change the state *before* sending the last packet as
* rxrpc might give us the reply before it returns from sending the * rxrpc might give us the reply before it returns from sending the
...@@ -538,15 +538,26 @@ static void afs_deliver_to_call(struct afs_call *call) ...@@ -538,15 +538,26 @@ static void afs_deliver_to_call(struct afs_call *call)
*/ */
static int afs_wait_for_call_to_complete(struct afs_call *call) static int afs_wait_for_call_to_complete(struct afs_call *call)
{ {
signed long rtt2, timeout;
int ret; int ret;
u64 rtt;
u32 life, last_life;
DECLARE_WAITQUEUE(myself, current); DECLARE_WAITQUEUE(myself, current);
_enter(""); _enter("");
rtt = rxrpc_kernel_get_rtt(afs_socket, call->rxcall);
rtt2 = nsecs_to_jiffies64(rtt) * 2;
if (rtt2 < 2)
rtt2 = 2;
timeout = rtt2;
last_life = rxrpc_kernel_check_life(afs_socket, call->rxcall);
add_wait_queue(&call->waitq, &myself); add_wait_queue(&call->waitq, &myself);
for (;;) { for (;;) {
set_current_state(TASK_INTERRUPTIBLE); set_current_state(TASK_UNINTERRUPTIBLE);
/* deliver any messages that are in the queue */ /* deliver any messages that are in the queue */
if (call->state < AFS_CALL_COMPLETE && call->need_attention) { if (call->state < AFS_CALL_COMPLETE && call->need_attention) {
...@@ -556,10 +567,20 @@ static int afs_wait_for_call_to_complete(struct afs_call *call) ...@@ -556,10 +567,20 @@ static int afs_wait_for_call_to_complete(struct afs_call *call)
continue; continue;
} }
if (call->state == AFS_CALL_COMPLETE || if (call->state == AFS_CALL_COMPLETE)
signal_pending(current))
break; break;
schedule();
life = rxrpc_kernel_check_life(afs_socket, call->rxcall);
if (timeout == 0 &&
life == last_life && signal_pending(current))
break;
if (life != last_life) {
timeout = rtt2;
last_life = life;
}
timeout = schedule_timeout(timeout);
} }
remove_wait_queue(&call->waitq, &myself); remove_wait_queue(&call->waitq, &myself);
......
...@@ -38,46 +38,100 @@ struct rxrpc_send_params { ...@@ -38,46 +38,100 @@ struct rxrpc_send_params {
}; };
/* /*
* wait for space to appear in the transmit/ACK window * Wait for space to appear in the Tx queue or a signal to occur.
* - caller holds the socket locked
*/ */
static int rxrpc_wait_for_tx_window(struct rxrpc_sock *rx, static int rxrpc_wait_for_tx_window_intr(struct rxrpc_sock *rx,
struct rxrpc_call *call, struct rxrpc_call *call,
long *timeo) long *timeo)
{ {
DECLARE_WAITQUEUE(myself, current);
int ret;
_enter(",{%u,%u,%u}",
call->tx_hard_ack, call->tx_top, call->tx_winsize);
add_wait_queue(&call->waitq, &myself);
for (;;) { for (;;) {
set_current_state(TASK_INTERRUPTIBLE); set_current_state(TASK_INTERRUPTIBLE);
ret = 0;
if (call->tx_top - call->tx_hard_ack < if (call->tx_top - call->tx_hard_ack <
min_t(unsigned int, call->tx_winsize, min_t(unsigned int, call->tx_winsize,
call->cong_cwnd + call->cong_extra)) call->cong_cwnd + call->cong_extra))
break; return 0;
if (call->state >= RXRPC_CALL_COMPLETE) {
ret = call->error; if (call->state >= RXRPC_CALL_COMPLETE)
break; return call->error;
}
if (signal_pending(current)) { if (signal_pending(current))
ret = sock_intr_errno(*timeo); return sock_intr_errno(*timeo);
break;
}
trace_rxrpc_transmit(call, rxrpc_transmit_wait); trace_rxrpc_transmit(call, rxrpc_transmit_wait);
mutex_unlock(&call->user_mutex); mutex_unlock(&call->user_mutex);
*timeo = schedule_timeout(*timeo); *timeo = schedule_timeout(*timeo);
if (mutex_lock_interruptible(&call->user_mutex) < 0) { if (mutex_lock_interruptible(&call->user_mutex) < 0)
ret = sock_intr_errno(*timeo); return sock_intr_errno(*timeo);
break;
} }
}
/*
* Wait for space to appear in the Tx queue uninterruptibly, but with
* a timeout of 2*RTT if no progress was made and a signal occurred.
*/
static int rxrpc_wait_for_tx_window_nonintr(struct rxrpc_sock *rx,
struct rxrpc_call *call)
{
rxrpc_seq_t tx_start, tx_win;
signed long rtt2, timeout;
u64 rtt;
rtt = READ_ONCE(call->peer->rtt);
rtt2 = nsecs_to_jiffies64(rtt) * 2;
if (rtt2 < 1)
rtt2 = 1;
timeout = rtt2;
tx_start = READ_ONCE(call->tx_hard_ack);
for (;;) {
set_current_state(TASK_UNINTERRUPTIBLE);
tx_win = READ_ONCE(call->tx_hard_ack);
if (call->tx_top - tx_win <
min_t(unsigned int, call->tx_winsize,
call->cong_cwnd + call->cong_extra))
return 0;
if (call->state >= RXRPC_CALL_COMPLETE)
return call->error;
if (timeout == 0 &&
tx_win == tx_start && signal_pending(current))
return -EINTR;
if (tx_win != tx_start) {
timeout = rtt2;
tx_start = tx_win;
} }
trace_rxrpc_transmit(call, rxrpc_transmit_wait);
timeout = schedule_timeout(timeout);
}
}
/*
* wait for space to appear in the transmit/ACK window
* - caller holds the socket locked
*/
static int rxrpc_wait_for_tx_window(struct rxrpc_sock *rx,
struct rxrpc_call *call,
long *timeo,
bool waitall)
{
DECLARE_WAITQUEUE(myself, current);
int ret;
_enter(",{%u,%u,%u}",
call->tx_hard_ack, call->tx_top, call->tx_winsize);
add_wait_queue(&call->waitq, &myself);
if (waitall)
ret = rxrpc_wait_for_tx_window_nonintr(rx, call);
else
ret = rxrpc_wait_for_tx_window_intr(rx, call, timeo);
remove_wait_queue(&call->waitq, &myself); remove_wait_queue(&call->waitq, &myself);
set_current_state(TASK_RUNNING); set_current_state(TASK_RUNNING);
_leave(" = %d", ret); _leave(" = %d", ret);
...@@ -254,7 +308,8 @@ static int rxrpc_send_data(struct rxrpc_sock *rx, ...@@ -254,7 +308,8 @@ static int rxrpc_send_data(struct rxrpc_sock *rx,
if (msg->msg_flags & MSG_DONTWAIT) if (msg->msg_flags & MSG_DONTWAIT)
goto maybe_error; goto maybe_error;
ret = rxrpc_wait_for_tx_window(rx, call, ret = rxrpc_wait_for_tx_window(rx, call,
&timeo); &timeo,
msg->msg_flags & MSG_WAITALL);
if (ret < 0) if (ret < 0)
goto maybe_error; goto maybe_error;
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment