// SPDX-License-Identifier: GPL-2.0-or-later
/* Management of Tx window, Tx resend, ACKs and out-of-sequence reception
 *
 * Copyright (C) 2007 Red Hat, Inc. All Rights Reserved.
 * Written by David Howells (dhowells@redhat.com)
 */
8 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
10 #include <linux/module.h>
11 #include <linux/circ_buf.h>
12 #include <linux/net.h>
13 #include <linux/skbuff.h>
14 #include <linux/slab.h>
15 #include <linux/udp.h>
17 #include <net/af_rxrpc.h>
18 #include "ar-internal.h"
21 * Propose a PING ACK be sent.
23 static void rxrpc_propose_ping(struct rxrpc_call
*call
,
24 bool immediate
, bool background
)
28 !test_and_set_bit(RXRPC_CALL_EV_PING
, &call
->events
))
29 rxrpc_queue_call(call
);
31 unsigned long now
= jiffies
;
32 unsigned long ping_at
= now
+ rxrpc_idle_ack_delay
;
34 if (time_before(ping_at
, call
->ping_at
)) {
35 WRITE_ONCE(call
->ping_at
, ping_at
);
36 rxrpc_reduce_call_timer(call
, ping_at
, now
,
37 rxrpc_timer_set_for_ping
);
43 * propose an ACK be sent
45 static void __rxrpc_propose_ACK(struct rxrpc_call
*call
, u8 ack_reason
,
46 u32 serial
, bool immediate
, bool background
,
47 enum rxrpc_propose_ack_trace why
)
49 enum rxrpc_propose_ack_outcome outcome
= rxrpc_propose_ack_use
;
50 unsigned long expiry
= rxrpc_soft_ack_delay
;
51 s8 prior
= rxrpc_ack_priority
[ack_reason
];
53 /* Pings are handled specially because we don't want to accidentally
54 * lose a ping response by subsuming it into a ping.
56 if (ack_reason
== RXRPC_ACK_PING
) {
57 rxrpc_propose_ping(call
, immediate
, background
);
61 /* Update DELAY, IDLE, REQUESTED and PING_RESPONSE ACK serial
62 * numbers, but we don't alter the timeout.
64 _debug("prior %u %u vs %u %u",
66 call
->ackr_reason
, rxrpc_ack_priority
[call
->ackr_reason
]);
67 if (ack_reason
== call
->ackr_reason
) {
68 if (RXRPC_ACK_UPDATEABLE
& (1 << ack_reason
)) {
69 outcome
= rxrpc_propose_ack_update
;
70 call
->ackr_serial
= serial
;
74 } else if (prior
> rxrpc_ack_priority
[call
->ackr_reason
]) {
75 call
->ackr_reason
= ack_reason
;
76 call
->ackr_serial
= serial
;
78 outcome
= rxrpc_propose_ack_subsume
;
82 case RXRPC_ACK_REQUESTED
:
83 if (rxrpc_requested_ack_delay
< expiry
)
84 expiry
= rxrpc_requested_ack_delay
;
90 if (rxrpc_soft_ack_delay
< expiry
)
91 expiry
= rxrpc_soft_ack_delay
;
95 if (rxrpc_idle_ack_delay
< expiry
)
96 expiry
= rxrpc_idle_ack_delay
;
104 if (test_bit(RXRPC_CALL_EV_ACK
, &call
->events
)) {
105 _debug("already scheduled");
106 } else if (immediate
|| expiry
== 0) {
107 _debug("immediate ACK %lx", call
->events
);
108 if (!test_and_set_bit(RXRPC_CALL_EV_ACK
, &call
->events
) &&
110 rxrpc_queue_call(call
);
112 unsigned long now
= jiffies
, ack_at
;
114 if (call
->peer
->rtt_usage
> 0)
115 ack_at
= nsecs_to_jiffies(call
->peer
->rtt
);
119 ack_at
+= READ_ONCE(call
->tx_backoff
);
121 if (time_before(ack_at
, call
->ack_at
)) {
122 WRITE_ONCE(call
->ack_at
, ack_at
);
123 rxrpc_reduce_call_timer(call
, ack_at
, now
,
124 rxrpc_timer_set_for_ack
);
129 trace_rxrpc_propose_ack(call
, why
, ack_reason
, serial
, immediate
,
130 background
, outcome
);
134 * propose an ACK be sent, locking the call structure
136 void rxrpc_propose_ACK(struct rxrpc_call
*call
, u8 ack_reason
,
137 u32 serial
, bool immediate
, bool background
,
138 enum rxrpc_propose_ack_trace why
)
140 spin_lock_bh(&call
->lock
);
141 __rxrpc_propose_ACK(call
, ack_reason
, serial
,
142 immediate
, background
, why
);
143 spin_unlock_bh(&call
->lock
);
147 * Handle congestion being detected by the retransmit timeout.
149 static void rxrpc_congestion_timeout(struct rxrpc_call
*call
)
151 set_bit(RXRPC_CALL_RETRANS_TIMEOUT
, &call
->flags
);
155 * Perform retransmission of NAK'd and unack'd packets.
157 static void rxrpc_resend(struct rxrpc_call
*call
, unsigned long now_j
)
160 unsigned long resend_at
;
161 rxrpc_seq_t cursor
, seq
, top
;
162 ktime_t now
, max_age
, oldest
, ack_ts
, timeout
, min_timeo
;
164 u8 annotation
, anno_type
, retrans
= 0, unacked
= 0;
166 _enter("{%d,%d}", call
->tx_hard_ack
, call
->tx_top
);
168 if (call
->peer
->rtt_usage
> 1)
169 timeout
= ns_to_ktime(call
->peer
->rtt
* 3 / 2);
171 timeout
= ms_to_ktime(rxrpc_resend_timeout
);
172 min_timeo
= ns_to_ktime((1000000000 / HZ
) * 4);
173 if (ktime_before(timeout
, min_timeo
))
176 now
= ktime_get_real();
177 max_age
= ktime_sub(now
, timeout
);
179 spin_lock_bh(&call
->lock
);
181 cursor
= call
->tx_hard_ack
;
183 ASSERT(before_eq(cursor
, top
));
187 /* Scan the packet list without dropping the lock and decide which of
188 * the packets in the Tx buffer we're going to resend and what the new
189 * resend timeout will be.
191 trace_rxrpc_resend(call
, (cursor
+ 1) & RXRPC_RXTX_BUFF_MASK
);
193 for (seq
= cursor
+ 1; before_eq(seq
, top
); seq
++) {
194 ix
= seq
& RXRPC_RXTX_BUFF_MASK
;
195 annotation
= call
->rxtx_annotations
[ix
];
196 anno_type
= annotation
& RXRPC_TX_ANNO_MASK
;
197 annotation
&= ~RXRPC_TX_ANNO_MASK
;
198 if (anno_type
== RXRPC_TX_ANNO_ACK
)
201 skb
= call
->rxtx_buffer
[ix
];
202 rxrpc_see_skb(skb
, rxrpc_skb_seen
);
204 if (anno_type
== RXRPC_TX_ANNO_UNACK
) {
205 if (ktime_after(skb
->tstamp
, max_age
)) {
206 if (ktime_before(skb
->tstamp
, oldest
))
207 oldest
= skb
->tstamp
;
210 if (!(annotation
& RXRPC_TX_ANNO_RESENT
))
214 /* Okay, we need to retransmit a packet. */
215 call
->rxtx_annotations
[ix
] = RXRPC_TX_ANNO_RETRANS
| annotation
;
217 trace_rxrpc_retransmit(call
, seq
, annotation
| anno_type
,
218 ktime_to_ns(ktime_sub(skb
->tstamp
, max_age
)));
221 resend_at
= nsecs_to_jiffies(ktime_to_ns(ktime_sub(now
, oldest
)));
222 resend_at
+= jiffies
+ rxrpc_resend_timeout
;
223 WRITE_ONCE(call
->resend_at
, resend_at
);
226 rxrpc_congestion_timeout(call
);
228 /* If there was nothing that needed retransmission then it's likely
229 * that an ACK got lost somewhere. Send a ping to find out instead of
230 * retransmitting data.
233 rxrpc_reduce_call_timer(call
, resend_at
, now_j
,
234 rxrpc_timer_set_for_resend
);
235 spin_unlock_bh(&call
->lock
);
236 ack_ts
= ktime_sub(now
, call
->acks_latest_ts
);
237 if (ktime_to_ns(ack_ts
) < call
->peer
->rtt
)
239 rxrpc_propose_ACK(call
, RXRPC_ACK_PING
, 0, true, false,
240 rxrpc_propose_ack_ping_for_lost_ack
);
241 rxrpc_send_ack_packet(call
, true, NULL
);
245 /* Now go through the Tx window and perform the retransmissions. We
246 * have to drop the lock for each send. If an ACK comes in whilst the
247 * lock is dropped, it may clear some of the retransmission markers for
248 * packets that it soft-ACKs.
250 for (seq
= cursor
+ 1; before_eq(seq
, top
); seq
++) {
251 ix
= seq
& RXRPC_RXTX_BUFF_MASK
;
252 annotation
= call
->rxtx_annotations
[ix
];
253 anno_type
= annotation
& RXRPC_TX_ANNO_MASK
;
254 if (anno_type
!= RXRPC_TX_ANNO_RETRANS
)
257 skb
= call
->rxtx_buffer
[ix
];
258 rxrpc_get_skb(skb
, rxrpc_skb_got
);
259 spin_unlock_bh(&call
->lock
);
261 if (rxrpc_send_data_packet(call
, skb
, true) < 0) {
262 rxrpc_free_skb(skb
, rxrpc_skb_freed
);
266 if (rxrpc_is_client_call(call
))
267 rxrpc_expose_client_call(call
);
269 rxrpc_free_skb(skb
, rxrpc_skb_freed
);
270 spin_lock_bh(&call
->lock
);
272 /* We need to clear the retransmit state, but there are two
273 * things we need to be aware of: A new ACK/NAK might have been
274 * received and the packet might have been hard-ACK'd (in which
275 * case it will no longer be in the buffer).
277 if (after(seq
, call
->tx_hard_ack
)) {
278 annotation
= call
->rxtx_annotations
[ix
];
279 anno_type
= annotation
& RXRPC_TX_ANNO_MASK
;
280 if (anno_type
== RXRPC_TX_ANNO_RETRANS
||
281 anno_type
== RXRPC_TX_ANNO_NAK
) {
282 annotation
&= ~RXRPC_TX_ANNO_MASK
;
283 annotation
|= RXRPC_TX_ANNO_UNACK
;
285 annotation
|= RXRPC_TX_ANNO_RESENT
;
286 call
->rxtx_annotations
[ix
] = annotation
;
289 if (after(call
->tx_hard_ack
, seq
))
290 seq
= call
->tx_hard_ack
;
294 spin_unlock_bh(&call
->lock
);
300 * Handle retransmission and deferred ACK/abort generation.
302 void rxrpc_process_call(struct work_struct
*work
)
304 struct rxrpc_call
*call
=
305 container_of(work
, struct rxrpc_call
, processor
);
306 rxrpc_serial_t
*send_ack
;
307 unsigned long now
, next
, t
;
308 unsigned int iterations
= 0;
310 rxrpc_see_call(call
);
312 //printk("\n--------------------\n");
313 _enter("{%d,%s,%lx}",
314 call
->debug_id
, rxrpc_call_states
[call
->state
], call
->events
);
317 /* Limit the number of times we do this before returning to the manager */
322 if (test_and_clear_bit(RXRPC_CALL_EV_ABORT
, &call
->events
)) {
323 rxrpc_send_abort_packet(call
);
327 if (call
->state
== RXRPC_CALL_COMPLETE
) {
328 del_timer_sync(&call
->timer
);
329 rxrpc_notify_socket(call
);
333 /* Work out if any timeouts tripped */
335 t
= READ_ONCE(call
->expect_rx_by
);
336 if (time_after_eq(now
, t
)) {
337 trace_rxrpc_timer(call
, rxrpc_timer_exp_normal
, now
);
338 set_bit(RXRPC_CALL_EV_EXPIRED
, &call
->events
);
341 t
= READ_ONCE(call
->expect_req_by
);
342 if (call
->state
== RXRPC_CALL_SERVER_RECV_REQUEST
&&
343 time_after_eq(now
, t
)) {
344 trace_rxrpc_timer(call
, rxrpc_timer_exp_idle
, now
);
345 set_bit(RXRPC_CALL_EV_EXPIRED
, &call
->events
);
348 t
= READ_ONCE(call
->expect_term_by
);
349 if (time_after_eq(now
, t
)) {
350 trace_rxrpc_timer(call
, rxrpc_timer_exp_hard
, now
);
351 set_bit(RXRPC_CALL_EV_EXPIRED
, &call
->events
);
354 t
= READ_ONCE(call
->ack_at
);
355 if (time_after_eq(now
, t
)) {
356 trace_rxrpc_timer(call
, rxrpc_timer_exp_ack
, now
);
357 cmpxchg(&call
->ack_at
, t
, now
+ MAX_JIFFY_OFFSET
);
358 set_bit(RXRPC_CALL_EV_ACK
, &call
->events
);
361 t
= READ_ONCE(call
->ack_lost_at
);
362 if (time_after_eq(now
, t
)) {
363 trace_rxrpc_timer(call
, rxrpc_timer_exp_lost_ack
, now
);
364 cmpxchg(&call
->ack_lost_at
, t
, now
+ MAX_JIFFY_OFFSET
);
365 set_bit(RXRPC_CALL_EV_ACK_LOST
, &call
->events
);
368 t
= READ_ONCE(call
->keepalive_at
);
369 if (time_after_eq(now
, t
)) {
370 trace_rxrpc_timer(call
, rxrpc_timer_exp_keepalive
, now
);
371 cmpxchg(&call
->keepalive_at
, t
, now
+ MAX_JIFFY_OFFSET
);
372 rxrpc_propose_ACK(call
, RXRPC_ACK_PING
, 0, true, true,
373 rxrpc_propose_ack_ping_for_keepalive
);
374 set_bit(RXRPC_CALL_EV_PING
, &call
->events
);
377 t
= READ_ONCE(call
->ping_at
);
378 if (time_after_eq(now
, t
)) {
379 trace_rxrpc_timer(call
, rxrpc_timer_exp_ping
, now
);
380 cmpxchg(&call
->ping_at
, t
, now
+ MAX_JIFFY_OFFSET
);
381 set_bit(RXRPC_CALL_EV_PING
, &call
->events
);
384 t
= READ_ONCE(call
->resend_at
);
385 if (time_after_eq(now
, t
)) {
386 trace_rxrpc_timer(call
, rxrpc_timer_exp_resend
, now
);
387 cmpxchg(&call
->resend_at
, t
, now
+ MAX_JIFFY_OFFSET
);
388 set_bit(RXRPC_CALL_EV_RESEND
, &call
->events
);
392 if (test_and_clear_bit(RXRPC_CALL_EV_EXPIRED
, &call
->events
)) {
393 if (test_bit(RXRPC_CALL_RX_HEARD
, &call
->flags
) &&
394 (int)call
->conn
->hi_serial
- (int)call
->rx_serial
> 0) {
395 trace_rxrpc_call_reset(call
);
396 rxrpc_abort_call("EXP", call
, 0, RX_USER_ABORT
, -ECONNRESET
);
398 rxrpc_abort_call("EXP", call
, 0, RX_USER_ABORT
, -ETIME
);
400 set_bit(RXRPC_CALL_EV_ABORT
, &call
->events
);
405 if (test_and_clear_bit(RXRPC_CALL_EV_ACK_LOST
, &call
->events
)) {
406 call
->acks_lost_top
= call
->tx_top
;
407 rxrpc_propose_ACK(call
, RXRPC_ACK_PING
, 0, true, false,
408 rxrpc_propose_ack_ping_for_lost_ack
);
409 send_ack
= &call
->acks_lost_ping
;
412 if (test_and_clear_bit(RXRPC_CALL_EV_ACK
, &call
->events
) ||
414 if (call
->ackr_reason
) {
415 rxrpc_send_ack_packet(call
, false, send_ack
);
420 if (test_and_clear_bit(RXRPC_CALL_EV_PING
, &call
->events
)) {
421 rxrpc_send_ack_packet(call
, true, NULL
);
425 if (test_and_clear_bit(RXRPC_CALL_EV_RESEND
, &call
->events
)) {
426 rxrpc_resend(call
, now
);
430 /* Make sure the timer is restarted */
431 next
= call
->expect_rx_by
;
433 #define set(T) { t = READ_ONCE(T); if (time_before(t, next)) next = t; }
435 set(call
->expect_req_by
);
436 set(call
->expect_term_by
);
438 set(call
->ack_lost_at
);
439 set(call
->resend_at
);
440 set(call
->keepalive_at
);
444 if (time_after_eq(now
, next
))
447 rxrpc_reduce_call_timer(call
, next
, now
, rxrpc_timer_restart
);
449 /* other events may have been raised since we started checking */
450 if (call
->events
&& call
->state
< RXRPC_CALL_COMPLETE
)
454 rxrpc_put_call(call
, rxrpc_call_put
);
460 __rxrpc_queue_call(call
);