1 /* Management of Tx window, Tx resend, ACKs and out-of-sequence reception
3 * Copyright (C) 2007 Red Hat, Inc. All Rights Reserved.
4 * Written by David Howells (dhowells@redhat.com)
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
12 #include <linux/module.h>
13 #include <linux/circ_buf.h>
14 #include <linux/net.h>
15 #include <linux/skbuff.h>
16 #include <linux/slab.h>
17 #include <linux/udp.h>
19 #include <net/af_rxrpc.h>
20 #include "ar-internal.h"
22 static unsigned rxrpc_ack_defer
= 1;
24 static const char *const rxrpc_acks
[] = {
25 "---", "REQ", "DUP", "OOS", "WIN", "MEM", "PNG", "PNR", "DLY", "IDL",
29 static const s8 rxrpc_ack_priority
[] = {
31 [RXRPC_ACK_DELAY
] = 1,
32 [RXRPC_ACK_REQUESTED
] = 2,
34 [RXRPC_ACK_PING_RESPONSE
] = 4,
35 [RXRPC_ACK_DUPLICATE
] = 5,
36 [RXRPC_ACK_OUT_OF_SEQUENCE
] = 6,
37 [RXRPC_ACK_EXCEEDS_WINDOW
] = 7,
38 [RXRPC_ACK_NOSPACE
] = 8,
42 * propose an ACK be sent
44 void __rxrpc_propose_ACK(struct rxrpc_call
*call
, u8 ack_reason
,
45 __be32 serial
, bool immediate
)
48 s8 prior
= rxrpc_ack_priority
[ack_reason
];
50 ASSERTCMP(prior
, >, 0);
52 _enter("{%d},%s,%%%x,%u",
53 call
->debug_id
, rxrpc_acks
[ack_reason
], ntohl(serial
),
56 if (prior
< rxrpc_ack_priority
[call
->ackr_reason
]) {
62 /* update DELAY, IDLE, REQUESTED and PING_RESPONSE ACK serial
64 if (prior
== rxrpc_ack_priority
[call
->ackr_reason
]) {
66 call
->ackr_serial
= serial
;
72 call
->ackr_reason
= ack_reason
;
73 call
->ackr_serial
= serial
;
77 _debug("run delay timer");
78 call
->ack_timer
.expires
= jiffies
+ rxrpc_ack_timeout
* HZ
;
79 add_timer(&call
->ack_timer
);
84 _debug("run defer timer");
90 case RXRPC_ACK_REQUESTED
:
93 if (!immediate
|| serial
== cpu_to_be32(1)) {
94 _debug("run defer timer");
95 expiry
= rxrpc_ack_defer
;
100 _debug("immediate ACK");
106 if (!timer_pending(&call
->ack_timer
) ||
107 time_after(call
->ack_timer
.expires
, expiry
))
108 mod_timer(&call
->ack_timer
, expiry
);
112 _debug("cancel timer %%%u", ntohl(serial
));
113 try_to_del_timer_sync(&call
->ack_timer
);
114 read_lock_bh(&call
->state_lock
);
115 if (call
->state
<= RXRPC_CALL_COMPLETE
&&
116 !test_and_set_bit(RXRPC_CALL_ACK
, &call
->events
))
117 rxrpc_queue_call(call
);
118 read_unlock_bh(&call
->state_lock
);
122 * propose an ACK be sent, locking the call structure
124 void rxrpc_propose_ACK(struct rxrpc_call
*call
, u8 ack_reason
,
125 __be32 serial
, bool immediate
)
127 s8 prior
= rxrpc_ack_priority
[ack_reason
];
129 if (prior
> rxrpc_ack_priority
[call
->ackr_reason
]) {
130 spin_lock_bh(&call
->lock
);
131 __rxrpc_propose_ACK(call
, ack_reason
, serial
, immediate
);
132 spin_unlock_bh(&call
->lock
);
137 * set the resend timer
139 static void rxrpc_set_resend(struct rxrpc_call
*call
, u8 resend
,
140 unsigned long resend_at
)
142 read_lock_bh(&call
->state_lock
);
143 if (call
->state
>= RXRPC_CALL_COMPLETE
)
147 _debug("SET RESEND");
148 set_bit(RXRPC_CALL_RESEND
, &call
->events
);
152 _debug("MODIFY RESEND TIMER");
153 set_bit(RXRPC_CALL_RUN_RTIMER
, &call
->flags
);
154 mod_timer(&call
->resend_timer
, resend_at
);
156 _debug("KILL RESEND TIMER");
157 del_timer_sync(&call
->resend_timer
);
158 clear_bit(RXRPC_CALL_RESEND_TIMER
, &call
->events
);
159 clear_bit(RXRPC_CALL_RUN_RTIMER
, &call
->flags
);
161 read_unlock_bh(&call
->state_lock
);
167 static void rxrpc_resend(struct rxrpc_call
*call
)
169 struct rxrpc_skb_priv
*sp
;
170 struct rxrpc_header
*hdr
;
172 unsigned long *p_txb
, resend_at
;
176 _enter("{%d,%d,%d,%d},",
177 call
->acks_hard
, call
->acks_unacked
,
178 atomic_read(&call
->sequence
),
179 CIRC_CNT(call
->acks_head
, call
->acks_tail
, call
->acks_winsz
));
185 for (loop
= call
->acks_tail
;
186 loop
!= call
->acks_head
|| stop
;
187 loop
= (loop
+ 1) & (call
->acks_winsz
- 1)
189 p_txb
= call
->acks_window
+ loop
;
190 smp_read_barrier_depends();
194 txb
= (struct sk_buff
*) *p_txb
;
197 if (sp
->need_resend
) {
200 /* each Tx packet has a new serial number */
202 htonl(atomic_inc_return(&call
->conn
->serial
));
204 hdr
= (struct rxrpc_header
*) txb
->head
;
205 hdr
->serial
= sp
->hdr
.serial
;
207 _proto("Tx DATA %%%u { #%d }",
208 ntohl(sp
->hdr
.serial
), ntohl(sp
->hdr
.seq
));
209 if (rxrpc_send_packet(call
->conn
->trans
, txb
) < 0) {
211 sp
->resend_at
= jiffies
+ 3;
214 jiffies
+ rxrpc_resend_timeout
* HZ
;
218 if (time_after_eq(jiffies
+ 1, sp
->resend_at
)) {
221 } else if (resend
& 2) {
222 if (time_before(sp
->resend_at
, resend_at
))
223 resend_at
= sp
->resend_at
;
225 resend_at
= sp
->resend_at
;
230 rxrpc_set_resend(call
, resend
, resend_at
);
235 * handle resend timer expiry
237 static void rxrpc_resend_timer(struct rxrpc_call
*call
)
239 struct rxrpc_skb_priv
*sp
;
241 unsigned long *p_txb
, resend_at
;
246 call
->acks_tail
, call
->acks_unacked
, call
->acks_head
);
251 for (loop
= call
->acks_unacked
;
252 loop
!= call
->acks_head
;
253 loop
= (loop
+ 1) & (call
->acks_winsz
- 1)
255 p_txb
= call
->acks_window
+ loop
;
256 smp_read_barrier_depends();
257 txb
= (struct sk_buff
*) (*p_txb
& ~1);
260 ASSERT(!(*p_txb
& 1));
262 if (sp
->need_resend
) {
264 } else if (time_after_eq(jiffies
+ 1, sp
->resend_at
)) {
267 } else if (resend
& 2) {
268 if (time_before(sp
->resend_at
, resend_at
))
269 resend_at
= sp
->resend_at
;
271 resend_at
= sp
->resend_at
;
276 rxrpc_set_resend(call
, resend
, resend_at
);
281 * process soft ACKs of our transmitted packets
282 * - these indicate packets the peer has or has not received, but hasn't yet
283 * given to the consumer, and so can still be discarded and re-requested
285 static int rxrpc_process_soft_ACKs(struct rxrpc_call
*call
,
286 struct rxrpc_ackpacket
*ack
,
289 struct rxrpc_skb_priv
*sp
;
291 unsigned long *p_txb
, resend_at
;
293 u8 sacks
[RXRPC_MAXACKS
], resend
;
295 _enter("{%d,%d},{%d},",
297 CIRC_CNT(call
->acks_head
, call
->acks_tail
, call
->acks_winsz
),
300 if (skb_copy_bits(skb
, 0, sacks
, ack
->nAcks
) < 0)
305 for (loop
= 0; loop
< ack
->nAcks
; loop
++) {
306 p_txb
= call
->acks_window
;
307 p_txb
+= (call
->acks_tail
+ loop
) & (call
->acks_winsz
- 1);
308 smp_read_barrier_depends();
309 txb
= (struct sk_buff
*) (*p_txb
& ~1);
312 switch (sacks
[loop
]) {
313 case RXRPC_ACK_TYPE_ACK
:
317 case RXRPC_ACK_TYPE_NACK
:
323 _debug("Unsupported ACK type %d", sacks
[loop
]);
329 call
->acks_unacked
= (call
->acks_tail
+ loop
) & (call
->acks_winsz
- 1);
331 /* anything not explicitly ACK'd is implicitly NACK'd, but may just not
332 * have been received or processed yet by the far end */
333 for (loop
= call
->acks_unacked
;
334 loop
!= call
->acks_head
;
335 loop
= (loop
+ 1) & (call
->acks_winsz
- 1)
337 p_txb
= call
->acks_window
+ loop
;
338 smp_read_barrier_depends();
339 txb
= (struct sk_buff
*) (*p_txb
& ~1);
343 /* packet must have been discarded */
347 } else if (sp
->need_resend
) {
349 } else if (time_after_eq(jiffies
+ 1, sp
->resend_at
)) {
352 } else if (resend
& 2) {
353 if (time_before(sp
->resend_at
, resend_at
))
354 resend_at
= sp
->resend_at
;
356 resend_at
= sp
->resend_at
;
361 rxrpc_set_resend(call
, resend
, resend_at
);
366 _leave(" = -EPROTO");
371 * discard hard-ACK'd packets from the Tx window
373 static void rxrpc_rotate_tx_window(struct rxrpc_call
*call
, u32 hard
)
375 struct rxrpc_skb_priv
*sp
;
377 int tail
= call
->acks_tail
, old_tail
;
378 int win
= CIRC_CNT(call
->acks_head
, tail
, call
->acks_winsz
);
380 _enter("{%u,%u},%u", call
->acks_hard
, win
, hard
);
382 ASSERTCMP(hard
- call
->acks_hard
, <=, win
);
384 while (call
->acks_hard
< hard
) {
385 smp_read_barrier_depends();
386 _skb
= call
->acks_window
[tail
] & ~1;
387 sp
= rxrpc_skb((struct sk_buff
*) _skb
);
388 rxrpc_free_skb((struct sk_buff
*) _skb
);
390 tail
= (tail
+ 1) & (call
->acks_winsz
- 1);
391 call
->acks_tail
= tail
;
392 if (call
->acks_unacked
== old_tail
)
393 call
->acks_unacked
= tail
;
397 wake_up(&call
->tx_waitq
);
401 * clear the Tx window in the event of a failure
403 static void rxrpc_clear_tx_window(struct rxrpc_call
*call
)
405 rxrpc_rotate_tx_window(call
, atomic_read(&call
->sequence
));
409 * drain the out of sequence received packet queue into the packet Rx queue
411 static int rxrpc_drain_rx_oos_queue(struct rxrpc_call
*call
)
413 struct rxrpc_skb_priv
*sp
;
418 _enter("{%d,%d}", call
->rx_data_post
, call
->rx_first_oos
);
420 spin_lock_bh(&call
->lock
);
423 if (test_bit(RXRPC_CALL_RELEASED
, &call
->flags
))
424 goto socket_unavailable
;
426 skb
= skb_dequeue(&call
->rx_oos_queue
);
430 _debug("drain OOS packet %d [%d]",
431 ntohl(sp
->hdr
.seq
), call
->rx_first_oos
);
433 if (ntohl(sp
->hdr
.seq
) != call
->rx_first_oos
) {
434 skb_queue_head(&call
->rx_oos_queue
, skb
);
435 call
->rx_first_oos
= ntohl(rxrpc_skb(skb
)->hdr
.seq
);
436 _debug("requeue %p {%u}", skb
, call
->rx_first_oos
);
438 skb
->mark
= RXRPC_SKB_MARK_DATA
;
439 terminal
= ((sp
->hdr
.flags
& RXRPC_LAST_PACKET
) &&
440 !(sp
->hdr
.flags
& RXRPC_CLIENT_INITIATED
));
441 ret
= rxrpc_queue_rcv_skb(call
, skb
, true, terminal
);
443 _debug("drain #%u", call
->rx_data_post
);
444 call
->rx_data_post
++;
446 /* find out what the next packet is */
447 skb
= skb_peek(&call
->rx_oos_queue
);
450 ntohl(rxrpc_skb(skb
)->hdr
.seq
);
452 call
->rx_first_oos
= 0;
453 _debug("peek %p {%u}", skb
, call
->rx_first_oos
);
459 spin_unlock_bh(&call
->lock
);
460 _leave(" = %d", ret
);
465 * insert an out of sequence packet into the buffer
467 static void rxrpc_insert_oos_packet(struct rxrpc_call
*call
,
470 struct rxrpc_skb_priv
*sp
, *psp
;
475 seq
= ntohl(sp
->hdr
.seq
);
476 _enter(",,{%u}", seq
);
478 skb
->destructor
= rxrpc_packet_destructor
;
479 ASSERTCMP(sp
->call
, ==, NULL
);
481 rxrpc_get_call(call
);
483 /* insert into the buffer in sequence order */
484 spin_lock_bh(&call
->lock
);
486 skb_queue_walk(&call
->rx_oos_queue
, p
) {
488 if (ntohl(psp
->hdr
.seq
) > seq
) {
489 _debug("insert oos #%u before #%u",
490 seq
, ntohl(psp
->hdr
.seq
));
491 skb_insert(p
, skb
, &call
->rx_oos_queue
);
496 _debug("append oos #%u", seq
);
497 skb_queue_tail(&call
->rx_oos_queue
, skb
);
500 /* we might now have a new front to the queue */
501 if (call
->rx_first_oos
== 0 || seq
< call
->rx_first_oos
)
502 call
->rx_first_oos
= seq
;
504 read_lock(&call
->state_lock
);
505 if (call
->state
< RXRPC_CALL_COMPLETE
&&
506 call
->rx_data_post
== call
->rx_first_oos
) {
507 _debug("drain rx oos now");
508 set_bit(RXRPC_CALL_DRAIN_RX_OOS
, &call
->events
);
510 read_unlock(&call
->state_lock
);
512 spin_unlock_bh(&call
->lock
);
513 _leave(" [stored #%u]", call
->rx_first_oos
);
517 * clear the Tx window on final ACK reception
519 static void rxrpc_zap_tx_window(struct rxrpc_call
*call
)
521 struct rxrpc_skb_priv
*sp
;
523 unsigned long _skb
, *acks_window
;
524 u8 winsz
= call
->acks_winsz
;
527 acks_window
= call
->acks_window
;
528 call
->acks_window
= NULL
;
530 while (CIRC_CNT(call
->acks_head
, call
->acks_tail
, winsz
) > 0) {
531 tail
= call
->acks_tail
;
532 smp_read_barrier_depends();
533 _skb
= acks_window
[tail
] & ~1;
535 call
->acks_tail
= (call
->acks_tail
+ 1) & (winsz
- 1);
537 skb
= (struct sk_buff
*) _skb
;
539 _debug("+++ clear Tx %u", ntohl(sp
->hdr
.seq
));
547 * process the extra information that may be appended to an ACK packet
549 static void rxrpc_extract_ackinfo(struct rxrpc_call
*call
, struct sk_buff
*skb
,
550 unsigned latest
, int nAcks
)
552 struct rxrpc_ackinfo ackinfo
;
553 struct rxrpc_peer
*peer
;
556 if (skb_copy_bits(skb
, nAcks
+ 3, &ackinfo
, sizeof(ackinfo
)) < 0) {
557 _leave(" [no ackinfo]");
561 _proto("Rx ACK %%%u Info { rx=%u max=%u rwin=%u jm=%u }",
563 ntohl(ackinfo
.rxMTU
), ntohl(ackinfo
.maxMTU
),
564 ntohl(ackinfo
.rwind
), ntohl(ackinfo
.jumbo_max
));
566 mtu
= min(ntohl(ackinfo
.rxMTU
), ntohl(ackinfo
.maxMTU
));
568 peer
= call
->conn
->trans
->peer
;
569 if (mtu
< peer
->maxdata
) {
570 spin_lock_bh(&peer
->lock
);
572 peer
->mtu
= mtu
+ peer
->hdrsize
;
573 spin_unlock_bh(&peer
->lock
);
574 _net("Net MTU %u (maxdata %u)", peer
->mtu
, peer
->maxdata
);
579 * process packets in the reception queue
581 static int rxrpc_process_rx_queue(struct rxrpc_call
*call
,
584 struct rxrpc_ackpacket ack
;
585 struct rxrpc_skb_priv
*sp
;
594 skb
= skb_dequeue(&call
->rx_queue
);
598 _net("deferred skb %p", skb
);
602 _debug("process %s [st %d]", rxrpc_pkts
[sp
->hdr
.type
], call
->state
);
606 switch (sp
->hdr
.type
) {
607 /* data packets that wind up here have been received out of
608 * order, need security processing or are jumbo packets */
609 case RXRPC_PACKET_TYPE_DATA
:
610 _proto("OOSQ DATA %%%u { #%u }",
611 ntohl(sp
->hdr
.serial
), ntohl(sp
->hdr
.seq
));
613 /* secured packets must be verified and possibly decrypted */
614 if (rxrpc_verify_packet(call
, skb
, _abort_code
) < 0)
617 rxrpc_insert_oos_packet(call
, skb
);
618 goto process_further
;
620 /* partial ACK to process */
621 case RXRPC_PACKET_TYPE_ACK
:
622 if (skb_copy_bits(skb
, 0, &ack
, sizeof(ack
)) < 0) {
623 _debug("extraction failure");
626 if (!skb_pull(skb
, sizeof(ack
)))
629 latest
= ntohl(sp
->hdr
.serial
);
630 hard
= ntohl(ack
.firstPacket
);
631 tx
= atomic_read(&call
->sequence
);
633 _proto("Rx ACK %%%u { m=%hu f=#%u p=#%u s=%%%u r=%s n=%u }",
637 ntohl(ack
.previousPacket
),
639 rxrpc_acks
[ack
.reason
],
642 rxrpc_extract_ackinfo(call
, skb
, latest
, ack
.nAcks
);
644 if (ack
.reason
== RXRPC_ACK_PING
) {
645 _proto("Rx ACK %%%u PING Request", latest
);
646 rxrpc_propose_ACK(call
, RXRPC_ACK_PING_RESPONSE
,
647 sp
->hdr
.serial
, true);
650 /* discard any out-of-order or duplicate ACKs */
651 if (latest
- call
->acks_latest
<= 0) {
652 _debug("discard ACK %d <= %d",
653 latest
, call
->acks_latest
);
656 call
->acks_latest
= latest
;
658 if (call
->state
!= RXRPC_CALL_CLIENT_SEND_REQUEST
&&
659 call
->state
!= RXRPC_CALL_CLIENT_AWAIT_REPLY
&&
660 call
->state
!= RXRPC_CALL_SERVER_SEND_REPLY
&&
661 call
->state
!= RXRPC_CALL_SERVER_AWAIT_ACK
)
664 _debug("Tx=%d H=%u S=%d", tx
, call
->acks_hard
, call
->state
);
668 _debug("hard-ACK'd packet %d not transmitted"
674 if ((call
->state
== RXRPC_CALL_CLIENT_AWAIT_REPLY
||
675 call
->state
== RXRPC_CALL_SERVER_AWAIT_ACK
) &&
680 rxrpc_rotate_tx_window(call
, hard
- 1);
684 if (hard
- 1 + ack
.nAcks
> tx
) {
685 _debug("soft-ACK'd packet %d+%d not"
686 " transmitted (%d top)",
687 hard
- 1, ack
.nAcks
, tx
);
691 if (rxrpc_process_soft_ACKs(call
, &ack
, skb
) < 0)
696 /* complete ACK to process */
697 case RXRPC_PACKET_TYPE_ACKALL
:
700 /* abort and busy are handled elsewhere */
701 case RXRPC_PACKET_TYPE_BUSY
:
702 case RXRPC_PACKET_TYPE_ABORT
:
705 /* connection level events - also handled elsewhere */
706 case RXRPC_PACKET_TYPE_CHALLENGE
:
707 case RXRPC_PACKET_TYPE_RESPONSE
:
708 case RXRPC_PACKET_TYPE_DEBUG
:
712 /* if we've had a hard ACK that covers all the packets we've sent, then
713 * that ends that phase of the operation */
715 write_lock_bh(&call
->state_lock
);
716 _debug("ack all %d", call
->state
);
718 switch (call
->state
) {
719 case RXRPC_CALL_CLIENT_AWAIT_REPLY
:
720 call
->state
= RXRPC_CALL_CLIENT_RECV_REPLY
;
722 case RXRPC_CALL_SERVER_AWAIT_ACK
:
723 _debug("srv complete");
724 call
->state
= RXRPC_CALL_COMPLETE
;
727 case RXRPC_CALL_CLIENT_SEND_REQUEST
:
728 case RXRPC_CALL_SERVER_RECV_REQUEST
:
729 goto protocol_error_unlock
; /* can't occur yet */
731 write_unlock_bh(&call
->state_lock
);
732 goto discard
; /* assume packet left over from earlier phase */
735 write_unlock_bh(&call
->state_lock
);
737 /* if all the packets we sent are hard-ACK'd, then we can discard
738 * whatever we've got left */
739 _debug("clear Tx %d",
740 CIRC_CNT(call
->acks_head
, call
->acks_tail
, call
->acks_winsz
));
742 del_timer_sync(&call
->resend_timer
);
743 clear_bit(RXRPC_CALL_RUN_RTIMER
, &call
->flags
);
744 clear_bit(RXRPC_CALL_RESEND_TIMER
, &call
->events
);
746 if (call
->acks_window
)
747 rxrpc_zap_tx_window(call
);
750 /* post the final ACK message for userspace to pick up */
752 skb
->mark
= RXRPC_SKB_MARK_FINAL_ACK
;
754 rxrpc_get_call(call
);
755 spin_lock_bh(&call
->lock
);
756 if (rxrpc_queue_rcv_skb(call
, skb
, true, true) < 0)
758 spin_unlock_bh(&call
->lock
);
759 goto process_further
;
764 goto process_further
;
766 protocol_error_unlock
:
767 write_unlock_bh(&call
->state_lock
);
770 _leave(" = -EPROTO");
775 * post a message to the socket Rx queue for recvmsg() to pick up
777 static int rxrpc_post_message(struct rxrpc_call
*call
, u32 mark
, u32 error
,
780 struct rxrpc_skb_priv
*sp
;
784 _enter("{%d,%lx},%u,%u,%d",
785 call
->debug_id
, call
->flags
, mark
, error
, fatal
);
787 /* remove timers and things for fatal messages */
789 del_timer_sync(&call
->resend_timer
);
790 del_timer_sync(&call
->ack_timer
);
791 clear_bit(RXRPC_CALL_RUN_RTIMER
, &call
->flags
);
794 if (mark
!= RXRPC_SKB_MARK_NEW_CALL
&&
795 !test_bit(RXRPC_CALL_HAS_USERID
, &call
->flags
)) {
796 _leave("[no userid]");
800 if (!test_bit(RXRPC_CALL_TERMINAL_MSG
, &call
->flags
)) {
801 skb
= alloc_skb(0, GFP_NOFS
);
810 memset(sp
, 0, sizeof(*sp
));
813 rxrpc_get_call(call
);
815 spin_lock_bh(&call
->lock
);
816 ret
= rxrpc_queue_rcv_skb(call
, skb
, true, fatal
);
817 spin_unlock_bh(&call
->lock
);
825 * handle background processing of incoming call packets and ACK / abort
828 void rxrpc_process_call(struct work_struct
*work
)
830 struct rxrpc_call
*call
=
831 container_of(work
, struct rxrpc_call
, processor
);
832 struct rxrpc_ackpacket ack
;
833 struct rxrpc_ackinfo ackinfo
;
834 struct rxrpc_header hdr
;
840 int genbit
, loop
, nbit
, ioc
, ret
, mtu
;
841 u32 abort_code
= RX_PROTOCOL_ERROR
;
844 //printk("\n--------------------\n");
845 _enter("{%d,%s,%lx} [%lu]",
846 call
->debug_id
, rxrpc_call_states
[call
->state
], call
->events
,
847 (jiffies
- call
->creation_jif
) / (HZ
/ 10));
849 if (test_and_set_bit(RXRPC_CALL_PROC_BUSY
, &call
->flags
)) {
850 _debug("XXXXXXXXXXXXX RUNNING ON MULTIPLE CPUS XXXXXXXXXXXXX");
854 /* there's a good chance we're going to have to send a message, so set
855 * one up in advance */
856 msg
.msg_name
= &call
->conn
->trans
->peer
->srx
.transport
.sin
;
857 msg
.msg_namelen
= sizeof(call
->conn
->trans
->peer
->srx
.transport
.sin
);
858 msg
.msg_control
= NULL
;
859 msg
.msg_controllen
= 0;
862 hdr
.epoch
= call
->conn
->epoch
;
864 hdr
.callNumber
= call
->call_id
;
866 hdr
.type
= RXRPC_PACKET_TYPE_ACK
;
867 hdr
.flags
= call
->conn
->out_clientflag
;
869 hdr
.securityIndex
= call
->conn
->security_ix
;
871 hdr
.serviceId
= call
->conn
->service_id
;
873 memset(iov
, 0, sizeof(iov
));
874 iov
[0].iov_base
= &hdr
;
875 iov
[0].iov_len
= sizeof(hdr
);
877 /* deal with events of a final nature */
878 if (test_bit(RXRPC_CALL_RELEASE
, &call
->events
)) {
879 rxrpc_release_call(call
);
880 clear_bit(RXRPC_CALL_RELEASE
, &call
->events
);
883 if (test_bit(RXRPC_CALL_RCVD_ERROR
, &call
->events
)) {
886 clear_bit(RXRPC_CALL_CONN_ABORT
, &call
->events
);
887 clear_bit(RXRPC_CALL_REJECT_BUSY
, &call
->events
);
888 clear_bit(RXRPC_CALL_ABORT
, &call
->events
);
890 error
= call
->conn
->trans
->peer
->net_error
;
891 _debug("post net error %d", error
);
893 if (rxrpc_post_message(call
, RXRPC_SKB_MARK_NET_ERROR
,
896 clear_bit(RXRPC_CALL_RCVD_ERROR
, &call
->events
);
900 if (test_bit(RXRPC_CALL_CONN_ABORT
, &call
->events
)) {
901 ASSERTCMP(call
->state
, >, RXRPC_CALL_COMPLETE
);
903 clear_bit(RXRPC_CALL_REJECT_BUSY
, &call
->events
);
904 clear_bit(RXRPC_CALL_ABORT
, &call
->events
);
906 _debug("post conn abort");
908 if (rxrpc_post_message(call
, RXRPC_SKB_MARK_LOCAL_ERROR
,
909 call
->conn
->error
, true) < 0)
911 clear_bit(RXRPC_CALL_CONN_ABORT
, &call
->events
);
915 if (test_bit(RXRPC_CALL_REJECT_BUSY
, &call
->events
)) {
916 hdr
.type
= RXRPC_PACKET_TYPE_BUSY
;
917 genbit
= RXRPC_CALL_REJECT_BUSY
;
921 if (test_bit(RXRPC_CALL_ABORT
, &call
->events
)) {
922 ASSERTCMP(call
->state
, >, RXRPC_CALL_COMPLETE
);
924 if (rxrpc_post_message(call
, RXRPC_SKB_MARK_LOCAL_ERROR
,
925 ECONNABORTED
, true) < 0)
927 hdr
.type
= RXRPC_PACKET_TYPE_ABORT
;
928 data
= htonl(call
->abort_code
);
929 iov
[1].iov_base
= &data
;
930 iov
[1].iov_len
= sizeof(data
);
931 genbit
= RXRPC_CALL_ABORT
;
935 if (test_bit(RXRPC_CALL_ACK_FINAL
, &call
->events
)) {
936 genbit
= RXRPC_CALL_ACK_FINAL
;
938 ack
.bufferSpace
= htons(8);
941 ack
.reason
= RXRPC_ACK_IDLE
;
943 call
->ackr_reason
= 0;
945 spin_lock_bh(&call
->lock
);
946 ack
.serial
= call
->ackr_serial
;
947 ack
.previousPacket
= call
->ackr_prev_seq
;
948 ack
.firstPacket
= htonl(call
->rx_data_eaten
+ 1);
949 spin_unlock_bh(&call
->lock
);
953 iov
[1].iov_base
= &ack
;
954 iov
[1].iov_len
= sizeof(ack
);
955 iov
[2].iov_base
= &pad
;
957 iov
[3].iov_base
= &ackinfo
;
958 iov
[3].iov_len
= sizeof(ackinfo
);
962 if (call
->events
& ((1 << RXRPC_CALL_RCVD_BUSY
) |
963 (1 << RXRPC_CALL_RCVD_ABORT
))
967 if (test_bit(RXRPC_CALL_RCVD_ABORT
, &call
->events
))
968 mark
= RXRPC_SKB_MARK_REMOTE_ABORT
;
970 mark
= RXRPC_SKB_MARK_BUSY
;
972 _debug("post abort/busy");
973 rxrpc_clear_tx_window(call
);
974 if (rxrpc_post_message(call
, mark
, ECONNABORTED
, true) < 0)
977 clear_bit(RXRPC_CALL_RCVD_BUSY
, &call
->events
);
978 clear_bit(RXRPC_CALL_RCVD_ABORT
, &call
->events
);
982 if (test_and_clear_bit(RXRPC_CALL_RCVD_ACKALL
, &call
->events
)) {
983 _debug("do implicit ackall");
984 rxrpc_clear_tx_window(call
);
987 if (test_bit(RXRPC_CALL_LIFE_TIMER
, &call
->events
)) {
988 write_lock_bh(&call
->state_lock
);
989 if (call
->state
<= RXRPC_CALL_COMPLETE
) {
990 call
->state
= RXRPC_CALL_LOCALLY_ABORTED
;
991 call
->abort_code
= RX_CALL_TIMEOUT
;
992 set_bit(RXRPC_CALL_ABORT
, &call
->events
);
994 write_unlock_bh(&call
->state_lock
);
996 _debug("post timeout");
997 if (rxrpc_post_message(call
, RXRPC_SKB_MARK_LOCAL_ERROR
,
1001 clear_bit(RXRPC_CALL_LIFE_TIMER
, &call
->events
);
1005 /* deal with assorted inbound messages */
1006 if (!skb_queue_empty(&call
->rx_queue
)) {
1007 switch (rxrpc_process_rx_queue(call
, &abort_code
)) {
1016 rxrpc_abort_call(call
, abort_code
);
1021 /* handle resending */
1022 if (test_and_clear_bit(RXRPC_CALL_RESEND_TIMER
, &call
->events
))
1023 rxrpc_resend_timer(call
);
1024 if (test_and_clear_bit(RXRPC_CALL_RESEND
, &call
->events
))
1027 /* consider sending an ordinary ACK */
1028 if (test_bit(RXRPC_CALL_ACK
, &call
->events
)) {
1029 _debug("send ACK: window: %d - %d { %lx }",
1030 call
->rx_data_eaten
, call
->ackr_win_top
,
1031 call
->ackr_window
[0]);
1033 if (call
->state
> RXRPC_CALL_SERVER_ACK_REQUEST
&&
1034 call
->ackr_reason
!= RXRPC_ACK_PING_RESPONSE
) {
1035 /* ACK by sending reply DATA packet in this state */
1036 clear_bit(RXRPC_CALL_ACK
, &call
->events
);
1037 goto maybe_reschedule
;
1040 genbit
= RXRPC_CALL_ACK
;
1042 acks
= kzalloc(call
->ackr_win_top
- call
->rx_data_eaten
,
1047 //hdr.flags = RXRPC_SLOW_START_OK;
1048 ack
.bufferSpace
= htons(8);
1053 spin_lock_bh(&call
->lock
);
1054 ack
.reason
= call
->ackr_reason
;
1055 ack
.serial
= call
->ackr_serial
;
1056 ack
.previousPacket
= call
->ackr_prev_seq
;
1057 ack
.firstPacket
= htonl(call
->rx_data_eaten
+ 1);
1060 for (loop
= 0; loop
< RXRPC_ACKR_WINDOW_ASZ
; loop
++) {
1061 nbit
= loop
* BITS_PER_LONG
;
1062 for (bits
= call
->ackr_window
[loop
]; bits
; bits
>>= 1
1064 _debug("- l=%d n=%d b=%lx", loop
, nbit
, bits
);
1066 acks
[nbit
] = RXRPC_ACK_TYPE_ACK
;
1067 ack
.nAcks
= nbit
+ 1;
1072 call
->ackr_reason
= 0;
1073 spin_unlock_bh(&call
->lock
);
1077 iov
[1].iov_base
= &ack
;
1078 iov
[1].iov_len
= sizeof(ack
);
1079 iov
[2].iov_base
= acks
;
1080 iov
[2].iov_len
= ack
.nAcks
;
1081 iov
[3].iov_base
= &pad
;
1083 iov
[4].iov_base
= &ackinfo
;
1084 iov
[4].iov_len
= sizeof(ackinfo
);
1086 switch (ack
.reason
) {
1087 case RXRPC_ACK_REQUESTED
:
1088 case RXRPC_ACK_DUPLICATE
:
1089 case RXRPC_ACK_OUT_OF_SEQUENCE
:
1090 case RXRPC_ACK_EXCEEDS_WINDOW
:
1091 case RXRPC_ACK_NOSPACE
:
1092 case RXRPC_ACK_PING
:
1093 case RXRPC_ACK_PING_RESPONSE
:
1094 goto send_ACK_with_skew
;
1095 case RXRPC_ACK_DELAY
:
1096 case RXRPC_ACK_IDLE
:
1101 /* handle completion of security negotiations on an incoming
1103 if (test_and_clear_bit(RXRPC_CALL_SECURED
, &call
->events
)) {
1105 spin_lock_bh(&call
->lock
);
1107 if (call
->state
== RXRPC_CALL_SERVER_SECURING
) {
1109 write_lock(&call
->conn
->lock
);
1110 if (!test_bit(RXRPC_CALL_RELEASED
, &call
->flags
) &&
1111 !test_bit(RXRPC_CALL_RELEASE
, &call
->events
)) {
1112 _debug("not released");
1113 call
->state
= RXRPC_CALL_SERVER_ACCEPTING
;
1114 list_move_tail(&call
->accept_link
,
1115 &call
->socket
->acceptq
);
1117 write_unlock(&call
->conn
->lock
);
1118 read_lock(&call
->state_lock
);
1119 if (call
->state
< RXRPC_CALL_COMPLETE
)
1120 set_bit(RXRPC_CALL_POST_ACCEPT
, &call
->events
);
1121 read_unlock(&call
->state_lock
);
1124 spin_unlock_bh(&call
->lock
);
1125 if (!test_bit(RXRPC_CALL_POST_ACCEPT
, &call
->events
))
1126 goto maybe_reschedule
;
1129 /* post a notification of an acceptable connection to the app */
1130 if (test_bit(RXRPC_CALL_POST_ACCEPT
, &call
->events
)) {
1131 _debug("post accept");
1132 if (rxrpc_post_message(call
, RXRPC_SKB_MARK_NEW_CALL
,
1135 clear_bit(RXRPC_CALL_POST_ACCEPT
, &call
->events
);
1136 goto maybe_reschedule
;
1139 /* handle incoming call acceptance */
1140 if (test_and_clear_bit(RXRPC_CALL_ACCEPTED
, &call
->events
)) {
1142 ASSERTCMP(call
->rx_data_post
, ==, 0);
1143 call
->rx_data_post
= 1;
1144 read_lock_bh(&call
->state_lock
);
1145 if (call
->state
< RXRPC_CALL_COMPLETE
)
1146 set_bit(RXRPC_CALL_DRAIN_RX_OOS
, &call
->events
);
1147 read_unlock_bh(&call
->state_lock
);
1150 /* drain the out of sequence received packet queue into the packet Rx
1152 if (test_and_clear_bit(RXRPC_CALL_DRAIN_RX_OOS
, &call
->events
)) {
1153 while (call
->rx_data_post
== call
->rx_first_oos
)
1154 if (rxrpc_drain_rx_oos_queue(call
) < 0)
1156 goto maybe_reschedule
;
1159 /* other events may have been raised since we started checking */
1160 goto maybe_reschedule
;
1163 ack
.maxSkew
= htons(atomic_read(&call
->conn
->hi_serial
) -
1166 mtu
= call
->conn
->trans
->peer
->if_mtu
;
1167 mtu
-= call
->conn
->trans
->peer
->hdrsize
;
1168 ackinfo
.maxMTU
= htonl(mtu
);
1169 ackinfo
.rwind
= htonl(32);
1171 /* permit the peer to send us jumbo packets if it wants to */
1172 ackinfo
.rxMTU
= htonl(5692);
1173 ackinfo
.jumbo_max
= htonl(4);
1175 hdr
.serial
= htonl(atomic_inc_return(&call
->conn
->serial
));
1176 _proto("Tx ACK %%%u { m=%hu f=#%u p=#%u s=%%%u r=%s n=%u }",
1179 ntohl(ack
.firstPacket
),
1180 ntohl(ack
.previousPacket
),
1182 rxrpc_acks
[ack
.reason
],
1185 del_timer_sync(&call
->ack_timer
);
1187 set_bit(RXRPC_CALL_TX_SOFT_ACK
, &call
->flags
);
1188 goto send_message_2
;
1191 _debug("send message");
1193 hdr
.serial
= htonl(atomic_inc_return(&call
->conn
->serial
));
1194 _proto("Tx %s %%%u", rxrpc_pkts
[hdr
.type
], ntohl(hdr
.serial
));
1197 len
= iov
[0].iov_len
;
1199 if (iov
[4].iov_len
) {
1201 len
+= iov
[4].iov_len
;
1202 len
+= iov
[3].iov_len
;
1203 len
+= iov
[2].iov_len
;
1204 len
+= iov
[1].iov_len
;
1205 } else if (iov
[3].iov_len
) {
1207 len
+= iov
[3].iov_len
;
1208 len
+= iov
[2].iov_len
;
1209 len
+= iov
[1].iov_len
;
1210 } else if (iov
[2].iov_len
) {
1212 len
+= iov
[2].iov_len
;
1213 len
+= iov
[1].iov_len
;
1214 } else if (iov
[1].iov_len
) {
1216 len
+= iov
[1].iov_len
;
1219 ret
= kernel_sendmsg(call
->conn
->trans
->local
->socket
,
1220 &msg
, iov
, ioc
, len
);
1222 _debug("sendmsg failed: %d", ret
);
1223 read_lock_bh(&call
->state_lock
);
1224 if (call
->state
< RXRPC_CALL_DEAD
)
1225 rxrpc_queue_call(call
);
1226 read_unlock_bh(&call
->state_lock
);
1231 case RXRPC_CALL_ABORT
:
1232 clear_bit(genbit
, &call
->events
);
1233 clear_bit(RXRPC_CALL_RCVD_ABORT
, &call
->events
);
1236 case RXRPC_CALL_ACK_FINAL
:
1237 write_lock_bh(&call
->state_lock
);
1238 if (call
->state
== RXRPC_CALL_CLIENT_FINAL_ACK
)
1239 call
->state
= RXRPC_CALL_COMPLETE
;
1240 write_unlock_bh(&call
->state_lock
);
1244 clear_bit(genbit
, &call
->events
);
1245 switch (call
->state
) {
1246 case RXRPC_CALL_CLIENT_AWAIT_REPLY
:
1247 case RXRPC_CALL_CLIENT_RECV_REPLY
:
1248 case RXRPC_CALL_SERVER_RECV_REQUEST
:
1249 case RXRPC_CALL_SERVER_ACK_REQUEST
:
1250 _debug("start ACK timer");
1251 rxrpc_propose_ACK(call
, RXRPC_ACK_DELAY
,
1252 call
->ackr_serial
, false);
1256 goto maybe_reschedule
;
1260 del_timer_sync(&call
->ack_timer
);
1261 if (test_and_clear_bit(RXRPC_CALL_ACK_FINAL
, &call
->events
))
1262 rxrpc_put_call(call
);
1263 clear_bit(RXRPC_CALL_ACK
, &call
->events
);
1266 if (call
->events
|| !skb_queue_empty(&call
->rx_queue
)) {
1267 read_lock_bh(&call
->state_lock
);
1268 if (call
->state
< RXRPC_CALL_DEAD
)
1269 rxrpc_queue_call(call
);
1270 read_unlock_bh(&call
->state_lock
);
1273 /* don't leave aborted connections on the accept queue */
1274 if (call
->state
>= RXRPC_CALL_COMPLETE
&&
1275 !list_empty(&call
->accept_link
)) {
1276 _debug("X unlinking once-pending call %p { e=%lx f=%lx c=%x }",
1277 call
, call
->events
, call
->flags
,
1278 ntohl(call
->conn
->cid
));
1280 read_lock_bh(&call
->state_lock
);
1281 if (!test_bit(RXRPC_CALL_RELEASED
, &call
->flags
) &&
1282 !test_and_set_bit(RXRPC_CALL_RELEASE
, &call
->events
))
1283 rxrpc_queue_call(call
);
1284 read_unlock_bh(&call
->state_lock
);
1288 clear_bit(RXRPC_CALL_PROC_BUSY
, &call
->flags
);
1291 /* because we don't want two CPUs both processing the work item for one
1292 * call at the same time, we use a flag to note when it's busy; however
1293 * this means there's a race between clearing the flag and setting the
1294 * work pending bit and the work item being processed again */
1295 if (call
->events
&& !work_pending(&call
->processor
)) {
1296 _debug("jumpstart %x", ntohl(call
->conn
->cid
));
1297 rxrpc_queue_call(call
);
1304 _debug("out of memory");
1305 goto maybe_reschedule
;