Linux Audio

Check our new training course

Loading...
v5.4
   1// SPDX-License-Identifier: GPL-2.0-or-later
   2/* RxRPC packet reception
   3 *
   4 * Copyright (C) 2007, 2016 Red Hat, Inc. All Rights Reserved.
   5 * Written by David Howells (dhowells@redhat.com)
 
 
 
 
 
   6 */
   7
   8#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
   9
  10#include <linux/module.h>
  11#include <linux/net.h>
  12#include <linux/skbuff.h>
  13#include <linux/errqueue.h>
  14#include <linux/udp.h>
  15#include <linux/in.h>
  16#include <linux/in6.h>
  17#include <linux/icmp.h>
  18#include <linux/gfp.h>
  19#include <net/sock.h>
  20#include <net/af_rxrpc.h>
  21#include <net/ip.h>
  22#include <net/udp.h>
  23#include <net/net_namespace.h>
  24#include "ar-internal.h"
  25
  26static void rxrpc_proto_abort(const char *why,
  27			      struct rxrpc_call *call, rxrpc_seq_t seq)
  28{
  29	if (rxrpc_abort_call(why, call, seq, RX_PROTOCOL_ERROR, -EBADMSG)) {
  30		set_bit(RXRPC_CALL_EV_ABORT, &call->events);
  31		rxrpc_queue_call(call);
  32	}
  33}
  34
  35/*
  36 * Do TCP-style congestion management [RFC 5681].
  37 */
  38static void rxrpc_congestion_management(struct rxrpc_call *call,
  39					struct sk_buff *skb,
  40					struct rxrpc_ack_summary *summary,
  41					rxrpc_serial_t acked_serial)
  42{
  43	enum rxrpc_congest_change change = rxrpc_cong_no_change;
  44	unsigned int cumulative_acks = call->cong_cumul_acks;
  45	unsigned int cwnd = call->cong_cwnd;
  46	bool resend = false;
  47
  48	summary->flight_size =
  49		(call->tx_top - call->tx_hard_ack) - summary->nr_acks;
  50
  51	if (test_and_clear_bit(RXRPC_CALL_RETRANS_TIMEOUT, &call->flags)) {
  52		summary->retrans_timeo = true;
  53		call->cong_ssthresh = max_t(unsigned int,
  54					    summary->flight_size / 2, 2);
  55		cwnd = 1;
  56		if (cwnd >= call->cong_ssthresh &&
  57		    call->cong_mode == RXRPC_CALL_SLOW_START) {
  58			call->cong_mode = RXRPC_CALL_CONGEST_AVOIDANCE;
  59			call->cong_tstamp = skb->tstamp;
  60			cumulative_acks = 0;
  61		}
  62	}
  63
  64	cumulative_acks += summary->nr_new_acks;
  65	cumulative_acks += summary->nr_rot_new_acks;
  66	if (cumulative_acks > 255)
  67		cumulative_acks = 255;
  68
  69	summary->mode = call->cong_mode;
  70	summary->cwnd = call->cong_cwnd;
  71	summary->ssthresh = call->cong_ssthresh;
  72	summary->cumulative_acks = cumulative_acks;
  73	summary->dup_acks = call->cong_dup_acks;
  74
  75	switch (call->cong_mode) {
  76	case RXRPC_CALL_SLOW_START:
  77		if (summary->nr_nacks > 0)
  78			goto packet_loss_detected;
  79		if (summary->cumulative_acks > 0)
  80			cwnd += 1;
  81		if (cwnd >= call->cong_ssthresh) {
  82			call->cong_mode = RXRPC_CALL_CONGEST_AVOIDANCE;
  83			call->cong_tstamp = skb->tstamp;
  84		}
  85		goto out;
  86
  87	case RXRPC_CALL_CONGEST_AVOIDANCE:
  88		if (summary->nr_nacks > 0)
  89			goto packet_loss_detected;
  90
  91		/* We analyse the number of packets that get ACK'd per RTT
  92		 * period and increase the window if we managed to fill it.
  93		 */
  94		if (call->peer->rtt_usage == 0)
  95			goto out;
  96		if (ktime_before(skb->tstamp,
  97				 ktime_add_ns(call->cong_tstamp,
  98					      call->peer->rtt)))
  99			goto out_no_clear_ca;
 100		change = rxrpc_cong_rtt_window_end;
 101		call->cong_tstamp = skb->tstamp;
 102		if (cumulative_acks >= cwnd)
 103			cwnd++;
 104		goto out;
 105
 106	case RXRPC_CALL_PACKET_LOSS:
 107		if (summary->nr_nacks == 0)
 108			goto resume_normality;
 109
 110		if (summary->new_low_nack) {
 111			change = rxrpc_cong_new_low_nack;
 112			call->cong_dup_acks = 1;
 113			if (call->cong_extra > 1)
 114				call->cong_extra = 1;
 115			goto send_extra_data;
 116		}
 117
 118		call->cong_dup_acks++;
 119		if (call->cong_dup_acks < 3)
 120			goto send_extra_data;
 121
 122		change = rxrpc_cong_begin_retransmission;
 123		call->cong_mode = RXRPC_CALL_FAST_RETRANSMIT;
 124		call->cong_ssthresh = max_t(unsigned int,
 125					    summary->flight_size / 2, 2);
 126		cwnd = call->cong_ssthresh + 3;
 127		call->cong_extra = 0;
 128		call->cong_dup_acks = 0;
 129		resend = true;
 130		goto out;
 131
 132	case RXRPC_CALL_FAST_RETRANSMIT:
 133		if (!summary->new_low_nack) {
 134			if (summary->nr_new_acks == 0)
 135				cwnd += 1;
 136			call->cong_dup_acks++;
 137			if (call->cong_dup_acks == 2) {
 138				change = rxrpc_cong_retransmit_again;
 139				call->cong_dup_acks = 0;
 140				resend = true;
 141			}
 142		} else {
 143			change = rxrpc_cong_progress;
 144			cwnd = call->cong_ssthresh;
 145			if (summary->nr_nacks == 0)
 146				goto resume_normality;
 147		}
 148		goto out;
 149
 150	default:
 151		BUG();
 152		goto out;
 153	}
 154
 155resume_normality:
 156	change = rxrpc_cong_cleared_nacks;
 157	call->cong_dup_acks = 0;
 158	call->cong_extra = 0;
 159	call->cong_tstamp = skb->tstamp;
 160	if (cwnd < call->cong_ssthresh)
 161		call->cong_mode = RXRPC_CALL_SLOW_START;
 162	else
 163		call->cong_mode = RXRPC_CALL_CONGEST_AVOIDANCE;
 164out:
 165	cumulative_acks = 0;
 166out_no_clear_ca:
 167	if (cwnd >= RXRPC_RXTX_BUFF_SIZE - 1)
 168		cwnd = RXRPC_RXTX_BUFF_SIZE - 1;
 169	call->cong_cwnd = cwnd;
 170	call->cong_cumul_acks = cumulative_acks;
 171	trace_rxrpc_congest(call, summary, acked_serial, change);
 172	if (resend && !test_and_set_bit(RXRPC_CALL_EV_RESEND, &call->events))
 173		rxrpc_queue_call(call);
 174	return;
 175
 176packet_loss_detected:
 177	change = rxrpc_cong_saw_nack;
 178	call->cong_mode = RXRPC_CALL_PACKET_LOSS;
 179	call->cong_dup_acks = 0;
 180	goto send_extra_data;
 181
 182send_extra_data:
 183	/* Send some previously unsent DATA if we have some to advance the ACK
 184	 * state.
 185	 */
 186	if (call->rxtx_annotations[call->tx_top & RXRPC_RXTX_BUFF_MASK] &
 187	    RXRPC_TX_ANNO_LAST ||
 188	    summary->nr_acks != call->tx_top - call->tx_hard_ack) {
 189		call->cong_extra++;
 190		wake_up(&call->waitq);
 191	}
 192	goto out_no_clear_ca;
 193}
 194
 195/*
 196 * Ping the other end to fill our RTT cache and to retrieve the rwind
 197 * and MTU parameters.
 198 */
 199static void rxrpc_send_ping(struct rxrpc_call *call, struct sk_buff *skb)
 
 200{
 201	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 202	ktime_t now = skb->tstamp;
 203
 204	if (call->peer->rtt_usage < 3 ||
 205	    ktime_before(ktime_add_ms(call->peer->rtt_last_req, 1000), now))
 206		rxrpc_propose_ACK(call, RXRPC_ACK_PING, sp->hdr.serial,
 207				  true, true,
 208				  rxrpc_propose_ack_ping_for_params);
 209}
 210
 211/*
 212 * Apply a hard ACK by advancing the Tx window.
 213 */
 214static bool rxrpc_rotate_tx_window(struct rxrpc_call *call, rxrpc_seq_t to,
 215				   struct rxrpc_ack_summary *summary)
 216{
 217	struct sk_buff *skb, *list = NULL;
 218	bool rot_last = false;
 219	int ix;
 220	u8 annotation;
 221
 222	if (call->acks_lowest_nak == call->tx_hard_ack) {
 223		call->acks_lowest_nak = to;
 224	} else if (before_eq(call->acks_lowest_nak, to)) {
 225		summary->new_low_nack = true;
 226		call->acks_lowest_nak = to;
 227	}
 228
 229	spin_lock(&call->lock);
 230
 231	while (before(call->tx_hard_ack, to)) {
 232		call->tx_hard_ack++;
 233		ix = call->tx_hard_ack & RXRPC_RXTX_BUFF_MASK;
 234		skb = call->rxtx_buffer[ix];
 235		annotation = call->rxtx_annotations[ix];
 236		rxrpc_see_skb(skb, rxrpc_skb_rotated);
 237		call->rxtx_buffer[ix] = NULL;
 238		call->rxtx_annotations[ix] = 0;
 239		skb->next = list;
 240		list = skb;
 241
 242		if (annotation & RXRPC_TX_ANNO_LAST) {
 243			set_bit(RXRPC_CALL_TX_LAST, &call->flags);
 244			rot_last = true;
 245		}
 246		if ((annotation & RXRPC_TX_ANNO_MASK) != RXRPC_TX_ANNO_ACK)
 247			summary->nr_rot_new_acks++;
 248	}
 249
 250	spin_unlock(&call->lock);
 251
 252	trace_rxrpc_transmit(call, (rot_last ?
 253				    rxrpc_transmit_rotate_last :
 254				    rxrpc_transmit_rotate));
 255	wake_up(&call->waitq);
 256
 257	while (list) {
 258		skb = list;
 259		list = skb->next;
 260		skb_mark_not_on_list(skb);
 261		rxrpc_free_skb(skb, rxrpc_skb_freed);
 262	}
 263
 264	return rot_last;
 265}
 266
 267/*
 268 * End the transmission phase of a call.
 269 *
 270 * This occurs when we get an ACKALL packet, the first DATA packet of a reply,
 271 * or a final ACK packet.
 272 */
 273static bool rxrpc_end_tx_phase(struct rxrpc_call *call, bool reply_begun,
 274			       const char *abort_why)
 275{
 276	unsigned int state;
 277
 278	ASSERT(test_bit(RXRPC_CALL_TX_LAST, &call->flags));
 279
 280	write_lock(&call->state_lock);
 281
 282	state = call->state;
 283	switch (state) {
 284	case RXRPC_CALL_CLIENT_SEND_REQUEST:
 285	case RXRPC_CALL_CLIENT_AWAIT_REPLY:
 286		if (reply_begun)
 287			call->state = state = RXRPC_CALL_CLIENT_RECV_REPLY;
 288		else
 289			call->state = state = RXRPC_CALL_CLIENT_AWAIT_REPLY;
 290		break;
 291
 292	case RXRPC_CALL_SERVER_AWAIT_ACK:
 293		__rxrpc_call_completed(call);
 294		rxrpc_notify_socket(call);
 295		state = call->state;
 296		break;
 297
 298	default:
 299		goto bad_state;
 300	}
 301
 302	write_unlock(&call->state_lock);
 303	if (state == RXRPC_CALL_CLIENT_AWAIT_REPLY)
 304		trace_rxrpc_transmit(call, rxrpc_transmit_await_reply);
 305	else
 306		trace_rxrpc_transmit(call, rxrpc_transmit_end);
 
 307	_leave(" = ok");
 308	return true;
 309
 310bad_state:
 311	write_unlock(&call->state_lock);
 312	kdebug("end_tx %s", rxrpc_call_states[call->state]);
 313	rxrpc_proto_abort(abort_why, call, call->tx_top);
 314	return false;
 315}
 316
 317/*
 318 * Begin the reply reception phase of a call.
 319 */
 320static bool rxrpc_receiving_reply(struct rxrpc_call *call)
 321{
 322	struct rxrpc_ack_summary summary = { 0 };
 323	unsigned long now, timo;
 324	rxrpc_seq_t top = READ_ONCE(call->tx_top);
 325
 326	if (call->ackr_reason) {
 327		spin_lock_bh(&call->lock);
 328		call->ackr_reason = 0;
 329		spin_unlock_bh(&call->lock);
 330		now = jiffies;
 331		timo = now + MAX_JIFFY_OFFSET;
 332		WRITE_ONCE(call->resend_at, timo);
 333		WRITE_ONCE(call->ack_at, timo);
 334		trace_rxrpc_timer(call, rxrpc_timer_init_for_reply, now);
 335	}
 336
 
 
 337	if (!test_bit(RXRPC_CALL_TX_LAST, &call->flags)) {
 338		if (!rxrpc_rotate_tx_window(call, top, &summary)) {
 339			rxrpc_proto_abort("TXL", call, top);
 340			return false;
 341		}
 342	}
 343	if (!rxrpc_end_tx_phase(call, true, "ETD"))
 344		return false;
 345	call->tx_phase = false;
 346	return true;
 347}
 348
 349/*
 350 * Scan a data packet to validate its structure and to work out how many
 351 * subpackets it contains.
 352 *
 353 * A jumbo packet is a collection of consecutive packets glued together with
 354 * little headers between that indicate how to change the initial header for
 355 * each subpacket.
 356 *
 357 * RXRPC_JUMBO_PACKET must be set on all but the last subpacket - and all but
 358 * the last are RXRPC_JUMBO_DATALEN in size.  The last subpacket may be of any
 359 * size.
 360 */
 361static bool rxrpc_validate_data(struct sk_buff *skb)
 362{
 363	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 364	unsigned int offset = sizeof(struct rxrpc_wire_header);
 365	unsigned int len = skb->len;
 
 366	u8 flags = sp->hdr.flags;
 367
 368	for (;;) {
 369		if (flags & RXRPC_REQUEST_ACK)
 370			__set_bit(sp->nr_subpackets, sp->rx_req_ack);
 371		sp->nr_subpackets++;
 372
 373		if (!(flags & RXRPC_JUMBO_PACKET))
 374			break;
 375
 376		if (len - offset < RXRPC_JUMBO_SUBPKTLEN)
 377			goto protocol_error;
 378		if (flags & RXRPC_LAST_PACKET)
 379			goto protocol_error;
 380		offset += RXRPC_JUMBO_DATALEN;
 381		if (skb_copy_bits(skb, offset, &flags, 1) < 0)
 382			goto protocol_error;
 383		offset += sizeof(struct rxrpc_jumbo_header);
 384	}
 385
 386	if (flags & RXRPC_LAST_PACKET)
 387		sp->rx_flags |= RXRPC_SKB_INCL_LAST;
 388	return true;
 389
 390protocol_error:
 391	return false;
 392}
 393
 394/*
 395 * Handle reception of a duplicate packet.
 396 *
 397 * We have to take care to avoid an attack here whereby we're given a series of
 398 * jumbograms, each with a sequence number one before the preceding one and
 399 * filled up to maximum UDP size.  If they never send us the first packet in
 400 * the sequence, they can cause us to have to hold on to around 2MiB of kernel
 401 * space until the call times out.
 402 *
 403 * We limit the space usage by only accepting three duplicate jumbo packets per
 404 * call.  After that, we tell the other side we're no longer accepting jumbos
 405 * (that information is encoded in the ACK packet).
 406 */
 407static void rxrpc_input_dup_data(struct rxrpc_call *call, rxrpc_seq_t seq,
 408				 bool is_jumbo, bool *_jumbo_bad)
 409{
 410	/* Discard normal packets that are duplicates. */
 411	if (is_jumbo)
 412		return;
 413
 414	/* Skip jumbo subpackets that are duplicates.  When we've had three or
 415	 * more partially duplicate jumbo packets, we refuse to take any more
 416	 * jumbos for this call.
 417	 */
 418	if (!*_jumbo_bad) {
 419		call->nr_jumbo_bad++;
 420		*_jumbo_bad = true;
 421	}
 422}
 423
 424/*
 425 * Process a DATA packet, adding the packet to the Rx ring.  The caller's
 426 * packet ref must be passed on or discarded.
 427 */
 428static void rxrpc_input_data(struct rxrpc_call *call, struct sk_buff *skb)
 
 429{
 430	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 431	enum rxrpc_call_state state;
 432	unsigned int j;
 
 433	rxrpc_serial_t serial = sp->hdr.serial, ack_serial = 0;
 434	rxrpc_seq_t seq0 = sp->hdr.seq, hard_ack;
 435	bool immediate_ack = false, jumbo_bad = false;
 436	u8 ack = 0;
 
 437
 438	_enter("{%u,%u},{%u,%u}",
 439	       call->rx_hard_ack, call->rx_top, skb->len, seq0);
 440
 441	_proto("Rx DATA %%%u { #%u f=%02x n=%u }",
 442	       sp->hdr.serial, seq0, sp->hdr.flags, sp->nr_subpackets);
 443
 444	state = READ_ONCE(call->state);
 445	if (state >= RXRPC_CALL_COMPLETE) {
 446		rxrpc_free_skb(skb, rxrpc_skb_freed);
 447		return;
 448	}
 449
 450	if (call->state == RXRPC_CALL_SERVER_RECV_REQUEST) {
 451		unsigned long timo = READ_ONCE(call->next_req_timo);
 452		unsigned long now, expect_req_by;
 453
 454		if (timo) {
 455			now = jiffies;
 456			expect_req_by = now + timo;
 457			WRITE_ONCE(call->expect_req_by, expect_req_by);
 458			rxrpc_reduce_call_timer(call, expect_req_by, now,
 459						rxrpc_timer_set_for_idle);
 460		}
 461	}
 462
 463	spin_lock(&call->input_lock);
 464
 465	/* Received data implicitly ACKs all of the request packets we sent
 466	 * when we're acting as a client.
 467	 */
 468	if ((state == RXRPC_CALL_CLIENT_SEND_REQUEST ||
 469	     state == RXRPC_CALL_CLIENT_AWAIT_REPLY) &&
 470	    !rxrpc_receiving_reply(call))
 471		goto unlock;
 
 
 472
 473	call->ackr_prev_seq = seq0;
 474	hard_ack = READ_ONCE(call->rx_hard_ack);
 
 
 
 
 
 475
 476	if (sp->nr_subpackets > 1) {
 
 477		if (call->nr_jumbo_bad > 3) {
 478			ack = RXRPC_ACK_NOSPACE;
 479			ack_serial = serial;
 480			goto ack;
 481		}
 
 482	}
 483
 484	for (j = 0; j < sp->nr_subpackets; j++) {
 485		rxrpc_serial_t serial = sp->hdr.serial + j;
 486		rxrpc_seq_t seq = seq0 + j;
 487		unsigned int ix = seq & RXRPC_RXTX_BUFF_MASK;
 488		bool terminal = (j == sp->nr_subpackets - 1);
 489		bool last = terminal && (sp->rx_flags & RXRPC_SKB_INCL_LAST);
 490		u8 flags, annotation = j;
 491
 492		_proto("Rx DATA+%u %%%u { #%x t=%u l=%u }",
 493		     j, serial, seq, terminal, last);
 494
 495		if (last) {
 496			if (test_bit(RXRPC_CALL_RX_LAST, &call->flags) &&
 497			    seq != call->rx_top) {
 498				rxrpc_proto_abort("LSN", call, seq);
 499				goto unlock;
 500			}
 501		} else {
 502			if (test_bit(RXRPC_CALL_RX_LAST, &call->flags) &&
 503			    after_eq(seq, call->rx_top)) {
 504				rxrpc_proto_abort("LSA", call, seq);
 505				goto unlock;
 506			}
 507		}
 508
 509		flags = 0;
 510		if (last)
 511			flags |= RXRPC_LAST_PACKET;
 512		if (!terminal)
 513			flags |= RXRPC_JUMBO_PACKET;
 514		if (test_bit(j, sp->rx_req_ack))
 515			flags |= RXRPC_REQUEST_ACK;
 516		trace_rxrpc_rx_data(call->debug_id, seq, serial, flags, annotation);
 517
 518		if (before_eq(seq, hard_ack)) {
 
 
 519			ack = RXRPC_ACK_DUPLICATE;
 520			ack_serial = serial;
 521			continue;
 522		}
 523
 524		if (call->rxtx_buffer[ix]) {
 525			rxrpc_input_dup_data(call, seq, sp->nr_subpackets > 1,
 526					     &jumbo_bad);
 527			if (ack != RXRPC_ACK_DUPLICATE) {
 528				ack = RXRPC_ACK_DUPLICATE;
 529				ack_serial = serial;
 530			}
 531			immediate_ack = true;
 532			continue;
 533		}
 
 
 
 534
 535		if (after(seq, hard_ack + call->rx_winsize)) {
 536			ack = RXRPC_ACK_EXCEEDS_WINDOW;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 537			ack_serial = serial;
 538			if (flags & RXRPC_JUMBO_PACKET) {
 539				if (!jumbo_bad) {
 540					call->nr_jumbo_bad++;
 541					jumbo_bad = true;
 542				}
 543			}
 544
 545			goto ack;
 546		}
 
 
 
 
 
 
 
 
 
 547
 548		if (flags & RXRPC_REQUEST_ACK && !ack) {
 549			ack = RXRPC_ACK_REQUESTED;
 
 
 550			ack_serial = serial;
 551		}
 
 
 552
 553		/* Queue the packet.  We use a couple of memory barriers here as need
 554		 * to make sure that rx_top is perceived to be set after the buffer
 555		 * pointer and that the buffer pointer is set after the annotation and
 556		 * the skb data.
 557		 *
 558		 * Barriers against rxrpc_recvmsg_data() and rxrpc_rotate_rx_window()
 559		 * and also rxrpc_fill_out_ack().
 560		 */
 561		if (!terminal)
 562			rxrpc_get_skb(skb, rxrpc_skb_got);
 563		call->rxtx_annotations[ix] = annotation;
 564		smp_wmb();
 565		call->rxtx_buffer[ix] = skb;
 566		if (after(seq, call->rx_top)) {
 567			smp_store_release(&call->rx_top, seq);
 568		} else if (before(seq, call->rx_top)) {
 569			/* Send an immediate ACK if we fill in a hole */
 570			if (!ack) {
 571				ack = RXRPC_ACK_DELAY;
 572				ack_serial = serial;
 573			}
 574			immediate_ack = true;
 575		}
 576
 577		if (terminal) {
 578			/* From this point on, we're not allowed to touch the
 579			 * packet any longer as its ref now belongs to the Rx
 580			 * ring.
 581			 */
 582			skb = NULL;
 583		}
 584
 585		if (last) {
 586			set_bit(RXRPC_CALL_RX_LAST, &call->flags);
 587			if (!ack) {
 588				ack = RXRPC_ACK_DELAY;
 589				ack_serial = serial;
 590			}
 591			trace_rxrpc_receive(call, rxrpc_receive_queue_last, serial, seq);
 592		} else {
 593			trace_rxrpc_receive(call, rxrpc_receive_queue, serial, seq);
 594		}
 595
 596		if (after_eq(seq, call->rx_expect_next)) {
 597			if (after(seq, call->rx_expect_next)) {
 598				_net("OOS %u > %u", seq, call->rx_expect_next);
 599				ack = RXRPC_ACK_OUT_OF_SEQUENCE;
 600				ack_serial = serial;
 601			}
 602			call->rx_expect_next = seq + 1;
 603		}
 604	}
 605
 606ack:
 607	if (ack)
 608		rxrpc_propose_ACK(call, ack, ack_serial,
 609				  immediate_ack, true,
 610				  rxrpc_propose_ack_input_data);
 611	else
 612		rxrpc_propose_ACK(call, RXRPC_ACK_DELAY, serial,
 613				  false, true,
 614				  rxrpc_propose_ack_input_data);
 615
 616	if (seq0 == READ_ONCE(call->rx_hard_ack) + 1) {
 617		trace_rxrpc_notify_socket(call->debug_id, serial);
 618		rxrpc_notify_socket(call);
 619	}
 620
 621unlock:
 622	spin_unlock(&call->input_lock);
 623	rxrpc_free_skb(skb, rxrpc_skb_freed);
 624	_leave(" [queued]");
 625}
 626
 627/*
 628 * Process a requested ACK.
 629 */
 630static void rxrpc_input_requested_ack(struct rxrpc_call *call,
 631				      ktime_t resp_time,
 632				      rxrpc_serial_t orig_serial,
 633				      rxrpc_serial_t ack_serial)
 634{
 635	struct rxrpc_skb_priv *sp;
 636	struct sk_buff *skb;
 637	ktime_t sent_at;
 638	int ix;
 639
 640	for (ix = 0; ix < RXRPC_RXTX_BUFF_SIZE; ix++) {
 641		skb = call->rxtx_buffer[ix];
 642		if (!skb)
 643			continue;
 644
 645		sent_at = skb->tstamp;
 646		smp_rmb(); /* Read timestamp before serial. */
 647		sp = rxrpc_skb(skb);
 648		if (sp->hdr.serial != orig_serial)
 649			continue;
 
 
 650		goto found;
 651	}
 652
 653	return;
 654
 655found:
 656	rxrpc_peer_add_rtt(call, rxrpc_rtt_rx_requested_ack,
 657			   orig_serial, ack_serial, sent_at, resp_time);
 658}
 659
 660/*
 661 * Process the response to a ping that we sent to find out if we lost an ACK.
 662 *
 663 * If we got back a ping response that indicates a lower tx_top than what we
 664 * had at the time of the ping transmission, we adjudge all the DATA packets
 665 * sent between the response tx_top and the ping-time tx_top to have been lost.
 666 */
 667static void rxrpc_input_check_for_lost_ack(struct rxrpc_call *call)
 668{
 669	rxrpc_seq_t top, bottom, seq;
 670	bool resend = false;
 671
 672	spin_lock_bh(&call->lock);
 673
 674	bottom = call->tx_hard_ack + 1;
 675	top = call->acks_lost_top;
 676	if (before(bottom, top)) {
 677		for (seq = bottom; before_eq(seq, top); seq++) {
 678			int ix = seq & RXRPC_RXTX_BUFF_MASK;
 679			u8 annotation = call->rxtx_annotations[ix];
 680			u8 anno_type = annotation & RXRPC_TX_ANNO_MASK;
 681
 682			if (anno_type != RXRPC_TX_ANNO_UNACK)
 683				continue;
 684			annotation &= ~RXRPC_TX_ANNO_MASK;
 685			annotation |= RXRPC_TX_ANNO_RETRANS;
 686			call->rxtx_annotations[ix] = annotation;
 687			resend = true;
 688		}
 689	}
 690
 691	spin_unlock_bh(&call->lock);
 692
 693	if (resend && !test_and_set_bit(RXRPC_CALL_EV_RESEND, &call->events))
 694		rxrpc_queue_call(call);
 695}
 696
 697/*
 698 * Process a ping response.
 699 */
 700static void rxrpc_input_ping_response(struct rxrpc_call *call,
 701				      ktime_t resp_time,
 702				      rxrpc_serial_t orig_serial,
 703				      rxrpc_serial_t ack_serial)
 704{
 705	rxrpc_serial_t ping_serial;
 706	ktime_t ping_time;
 707
 708	ping_time = call->ping_time;
 709	smp_rmb();
 710	ping_serial = READ_ONCE(call->ping_serial);
 711
 712	if (orig_serial == call->acks_lost_ping)
 713		rxrpc_input_check_for_lost_ack(call);
 714
 715	if (before(orig_serial, ping_serial) ||
 716	    !test_and_clear_bit(RXRPC_CALL_PINGING, &call->flags))
 717		return;
 
 718	if (after(orig_serial, ping_serial))
 719		return;
 720
 721	rxrpc_peer_add_rtt(call, rxrpc_rtt_rx_ping_response,
 722			   orig_serial, ack_serial, ping_time, resp_time);
 723}
 724
 725/*
 726 * Process the extra information that may be appended to an ACK packet
 727 */
 728static void rxrpc_input_ackinfo(struct rxrpc_call *call, struct sk_buff *skb,
 729				struct rxrpc_ackinfo *ackinfo)
 730{
 731	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 732	struct rxrpc_peer *peer;
 733	unsigned int mtu;
 734	bool wake = false;
 735	u32 rwind = ntohl(ackinfo->rwind);
 736
 737	_proto("Rx ACK %%%u Info { rx=%u max=%u rwin=%u jm=%u }",
 738	       sp->hdr.serial,
 739	       ntohl(ackinfo->rxMTU), ntohl(ackinfo->maxMTU),
 740	       rwind, ntohl(ackinfo->jumbo_max));
 741
 742	if (call->tx_winsize != rwind) {
 743		if (rwind > RXRPC_RXTX_BUFF_SIZE - 1)
 744			rwind = RXRPC_RXTX_BUFF_SIZE - 1;
 745		if (rwind > call->tx_winsize)
 746			wake = true;
 747		trace_rxrpc_rx_rwind_change(call, sp->hdr.serial,
 748					    ntohl(ackinfo->rwind), wake);
 749		call->tx_winsize = rwind;
 750	}
 751
 752	if (call->cong_ssthresh > rwind)
 753		call->cong_ssthresh = rwind;
 754
 755	mtu = min(ntohl(ackinfo->rxMTU), ntohl(ackinfo->maxMTU));
 756
 757	peer = call->peer;
 758	if (mtu < peer->maxdata) {
 759		spin_lock_bh(&peer->lock);
 760		peer->maxdata = mtu;
 761		peer->mtu = mtu + peer->hdrsize;
 762		spin_unlock_bh(&peer->lock);
 763		_net("Net MTU %u (maxdata %u)", peer->mtu, peer->maxdata);
 764	}
 765
 766	if (wake)
 767		wake_up(&call->waitq);
 768}
 769
 770/*
 771 * Process individual soft ACKs.
 772 *
 773 * Each ACK in the array corresponds to one packet and can be either an ACK or
 774 * a NAK.  If we get find an explicitly NAK'd packet we resend immediately;
 775 * packets that lie beyond the end of the ACK list are scheduled for resend by
 776 * the timer on the basis that the peer might just not have processed them at
 777 * the time the ACK was sent.
 778 */
 779static void rxrpc_input_soft_acks(struct rxrpc_call *call, u8 *acks,
 780				  rxrpc_seq_t seq, int nr_acks,
 781				  struct rxrpc_ack_summary *summary)
 782{
 783	int ix;
 784	u8 annotation, anno_type;
 785
 786	for (; nr_acks > 0; nr_acks--, seq++) {
 787		ix = seq & RXRPC_RXTX_BUFF_MASK;
 788		annotation = call->rxtx_annotations[ix];
 789		anno_type = annotation & RXRPC_TX_ANNO_MASK;
 790		annotation &= ~RXRPC_TX_ANNO_MASK;
 791		switch (*acks++) {
 792		case RXRPC_ACK_TYPE_ACK:
 793			summary->nr_acks++;
 794			if (anno_type == RXRPC_TX_ANNO_ACK)
 795				continue;
 796			summary->nr_new_acks++;
 797			call->rxtx_annotations[ix] =
 798				RXRPC_TX_ANNO_ACK | annotation;
 799			break;
 800		case RXRPC_ACK_TYPE_NACK:
 801			if (!summary->nr_nacks &&
 802			    call->acks_lowest_nak != seq) {
 803				call->acks_lowest_nak = seq;
 804				summary->new_low_nack = true;
 805			}
 806			summary->nr_nacks++;
 807			if (anno_type == RXRPC_TX_ANNO_NAK)
 808				continue;
 809			summary->nr_new_nacks++;
 810			if (anno_type == RXRPC_TX_ANNO_RETRANS)
 811				continue;
 812			call->rxtx_annotations[ix] =
 813				RXRPC_TX_ANNO_NAK | annotation;
 814			break;
 815		default:
 816			return rxrpc_proto_abort("SFT", call, 0);
 817		}
 818	}
 819}
 820
 821/*
 822 * Process an ACK packet.
 823 *
 824 * ack.firstPacket is the sequence number of the first soft-ACK'd/NAK'd packet
 825 * in the ACK array.  Anything before that is hard-ACK'd and may be discarded.
 826 *
 827 * A hard-ACK means that a packet has been processed and may be discarded; a
 828 * soft-ACK means that the packet may be discarded and retransmission
 829 * requested.  A phase is complete when all packets are hard-ACK'd.
 830 */
 831static void rxrpc_input_ack(struct rxrpc_call *call, struct sk_buff *skb)
 
 832{
 833	struct rxrpc_ack_summary summary = { 0 };
 834	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 835	union {
 836		struct rxrpc_ackpacket ack;
 837		struct rxrpc_ackinfo info;
 838		u8 acks[RXRPC_MAXACKS];
 839	} buf;
 840	rxrpc_serial_t acked_serial;
 841	rxrpc_seq_t first_soft_ack, hard_ack, prev_pkt;
 842	int nr_acks, offset, ioffset;
 843
 844	_enter("");
 845
 846	offset = sizeof(struct rxrpc_wire_header);
 847	if (skb_copy_bits(skb, offset, &buf.ack, sizeof(buf.ack)) < 0) {
 848		_debug("extraction failure");
 849		return rxrpc_proto_abort("XAK", call, 0);
 850	}
 851	offset += sizeof(buf.ack);
 852
 853	acked_serial = ntohl(buf.ack.serial);
 854	first_soft_ack = ntohl(buf.ack.firstPacket);
 855	prev_pkt = ntohl(buf.ack.previousPacket);
 856	hard_ack = first_soft_ack - 1;
 857	nr_acks = buf.ack.nAcks;
 858	summary.ack_reason = (buf.ack.reason < RXRPC_ACK__INVALID ?
 859			      buf.ack.reason : RXRPC_ACK__INVALID);
 860
 861	trace_rxrpc_rx_ack(call, sp->hdr.serial, acked_serial,
 862			   first_soft_ack, prev_pkt,
 863			   summary.ack_reason, nr_acks);
 864
 865	if (buf.ack.reason == RXRPC_ACK_PING_RESPONSE)
 866		rxrpc_input_ping_response(call, skb->tstamp, acked_serial,
 867					  sp->hdr.serial);
 868	if (buf.ack.reason == RXRPC_ACK_REQUESTED)
 869		rxrpc_input_requested_ack(call, skb->tstamp, acked_serial,
 870					  sp->hdr.serial);
 871
 872	if (buf.ack.reason == RXRPC_ACK_PING) {
 873		_proto("Rx ACK %%%u PING Request", sp->hdr.serial);
 874		rxrpc_propose_ACK(call, RXRPC_ACK_PING_RESPONSE,
 875				  sp->hdr.serial, true, true,
 876				  rxrpc_propose_ack_respond_to_ping);
 877	} else if (sp->hdr.flags & RXRPC_REQUEST_ACK) {
 878		rxrpc_propose_ACK(call, RXRPC_ACK_REQUESTED,
 879				  sp->hdr.serial, true, true,
 880				  rxrpc_propose_ack_respond_to_ack);
 881	}
 882
 883	/* Discard any out-of-order or duplicate ACKs (outside lock). */
 884	if (before(first_soft_ack, call->ackr_first_seq) ||
 885	    before(prev_pkt, call->ackr_prev_seq))
 886		return;
 887
 888	buf.info.rxMTU = 0;
 889	ioffset = offset + nr_acks + 3;
 890	if (skb->len >= ioffset + sizeof(buf.info) &&
 891	    skb_copy_bits(skb, ioffset, &buf.info, sizeof(buf.info)) < 0)
 892		return rxrpc_proto_abort("XAI", call, 0);
 893
 894	spin_lock(&call->input_lock);
 895
 896	/* Discard any out-of-order or duplicate ACKs (inside lock). */
 897	if (before(first_soft_ack, call->ackr_first_seq) ||
 898	    before(prev_pkt, call->ackr_prev_seq))
 899		goto out;
 900	call->acks_latest_ts = skb->tstamp;
 901	call->acks_latest = sp->hdr.serial;
 902
 903	call->ackr_first_seq = first_soft_ack;
 904	call->ackr_prev_seq = prev_pkt;
 905
 906	/* Parse rwind and mtu sizes if provided. */
 907	if (buf.info.rxMTU)
 908		rxrpc_input_ackinfo(call, skb, &buf.info);
 909
 910	if (first_soft_ack == 0) {
 911		rxrpc_proto_abort("AK0", call, 0);
 912		goto out;
 913	}
 914
 
 
 
 915	/* Ignore ACKs unless we are or have just been transmitting. */
 916	switch (READ_ONCE(call->state)) {
 917	case RXRPC_CALL_CLIENT_SEND_REQUEST:
 918	case RXRPC_CALL_CLIENT_AWAIT_REPLY:
 919	case RXRPC_CALL_SERVER_SEND_REPLY:
 920	case RXRPC_CALL_SERVER_AWAIT_ACK:
 921		break;
 922	default:
 923		goto out;
 924	}
 925
 926	if (before(hard_ack, call->tx_hard_ack) ||
 927	    after(hard_ack, call->tx_top)) {
 928		rxrpc_proto_abort("AKW", call, 0);
 929		goto out;
 930	}
 931	if (nr_acks > call->tx_top - hard_ack) {
 932		rxrpc_proto_abort("AKN", call, 0);
 933		goto out;
 934	}
 
 
 935
 936	if (after(hard_ack, call->tx_hard_ack)) {
 937		if (rxrpc_rotate_tx_window(call, hard_ack, &summary)) {
 938			rxrpc_end_tx_phase(call, false, "ETA");
 939			goto out;
 940		}
 941	}
 
 
 942
 943	if (nr_acks > 0) {
 944		if (skb_copy_bits(skb, offset, buf.acks, nr_acks) < 0) {
 945			rxrpc_proto_abort("XSA", call, 0);
 946			goto out;
 947		}
 948		rxrpc_input_soft_acks(call, buf.acks, first_soft_ack, nr_acks,
 949				      &summary);
 950	}
 951
 
 
 
 
 
 952	if (call->rxtx_annotations[call->tx_top & RXRPC_RXTX_BUFF_MASK] &
 953	    RXRPC_TX_ANNO_LAST &&
 954	    summary.nr_acks == call->tx_top - hard_ack &&
 955	    rxrpc_is_client_call(call))
 956		rxrpc_propose_ACK(call, RXRPC_ACK_PING, sp->hdr.serial,
 957				  false, true,
 958				  rxrpc_propose_ack_ping_for_lost_reply);
 959
 960	rxrpc_congestion_management(call, skb, &summary, acked_serial);
 961out:
 962	spin_unlock(&call->input_lock);
 963}
 964
 965/*
 966 * Process an ACKALL packet.
 967 */
 968static void rxrpc_input_ackall(struct rxrpc_call *call, struct sk_buff *skb)
 969{
 970	struct rxrpc_ack_summary summary = { 0 };
 971	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 972
 973	_proto("Rx ACKALL %%%u", sp->hdr.serial);
 974
 975	spin_lock(&call->input_lock);
 976
 977	if (rxrpc_rotate_tx_window(call, call->tx_top, &summary))
 978		rxrpc_end_tx_phase(call, false, "ETL");
 979
 980	spin_unlock(&call->input_lock);
 981}
 982
 983/*
 984 * Process an ABORT packet directed at a call.
 985 */
 986static void rxrpc_input_abort(struct rxrpc_call *call, struct sk_buff *skb)
 987{
 988	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 989	__be32 wtmp;
 990	u32 abort_code = RX_CALL_DEAD;
 991
 992	_enter("");
 993
 994	if (skb->len >= 4 &&
 995	    skb_copy_bits(skb, sizeof(struct rxrpc_wire_header),
 996			  &wtmp, sizeof(wtmp)) >= 0)
 997		abort_code = ntohl(wtmp);
 998
 999	trace_rxrpc_rx_abort(call, sp->hdr.serial, abort_code);
1000
1001	_proto("Rx ABORT %%%u { %x }", sp->hdr.serial, abort_code);
1002
1003	if (rxrpc_set_call_completion(call, RXRPC_CALL_REMOTELY_ABORTED,
1004				      abort_code, -ECONNABORTED))
1005		rxrpc_notify_socket(call);
1006}
1007
1008/*
1009 * Process an incoming call packet.
1010 */
1011static void rxrpc_input_call_packet(struct rxrpc_call *call,
1012				    struct sk_buff *skb)
1013{
1014	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
1015	unsigned long timo;
1016
1017	_enter("%p,%p", call, skb);
1018
1019	timo = READ_ONCE(call->next_rx_timo);
1020	if (timo) {
1021		unsigned long now = jiffies, expect_rx_by;
1022
1023		expect_rx_by = now + timo;
1024		WRITE_ONCE(call->expect_rx_by, expect_rx_by);
1025		rxrpc_reduce_call_timer(call, expect_rx_by, now,
1026					rxrpc_timer_set_for_normal);
1027	}
1028
1029	switch (sp->hdr.type) {
1030	case RXRPC_PACKET_TYPE_DATA:
1031		rxrpc_input_data(call, skb);
1032		goto no_free;
1033
1034	case RXRPC_PACKET_TYPE_ACK:
1035		rxrpc_input_ack(call, skb);
1036		break;
1037
1038	case RXRPC_PACKET_TYPE_BUSY:
1039		_proto("Rx BUSY %%%u", sp->hdr.serial);
1040
1041		/* Just ignore BUSY packets from the server; the retry and
1042		 * lifespan timers will take care of business.  BUSY packets
1043		 * from the client don't make sense.
1044		 */
1045		break;
1046
1047	case RXRPC_PACKET_TYPE_ABORT:
1048		rxrpc_input_abort(call, skb);
1049		break;
1050
1051	case RXRPC_PACKET_TYPE_ACKALL:
1052		rxrpc_input_ackall(call, skb);
1053		break;
1054
1055	default:
1056		break;
1057	}
1058
1059	rxrpc_free_skb(skb, rxrpc_skb_freed);
1060no_free:
1061	_leave("");
1062}
1063
1064/*
1065 * Handle a new service call on a channel implicitly completing the preceding
1066 * call on that channel.  This does not apply to client conns.
1067 *
1068 * TODO: If callNumber > call_id + 1, renegotiate security.
1069 */
1070static void rxrpc_input_implicit_end_call(struct rxrpc_sock *rx,
1071					  struct rxrpc_connection *conn,
1072					  struct rxrpc_call *call)
1073{
1074	switch (READ_ONCE(call->state)) {
1075	case RXRPC_CALL_SERVER_AWAIT_ACK:
1076		rxrpc_call_completed(call);
1077		/* Fall through */
1078	case RXRPC_CALL_COMPLETE:
1079		break;
1080	default:
1081		if (rxrpc_abort_call("IMP", call, 0, RX_CALL_DEAD, -ESHUTDOWN)) {
1082			set_bit(RXRPC_CALL_EV_ABORT, &call->events);
1083			rxrpc_queue_call(call);
1084		}
1085		trace_rxrpc_improper_term(call);
1086		break;
1087	}
1088
1089	spin_lock(&rx->incoming_lock);
1090	__rxrpc_disconnect_call(conn, call);
1091	spin_unlock(&rx->incoming_lock);
1092	rxrpc_notify_socket(call);
1093}
1094
1095/*
1096 * post connection-level events to the connection
1097 * - this includes challenges, responses, some aborts and call terminal packet
1098 *   retransmission.
1099 */
1100static void rxrpc_post_packet_to_conn(struct rxrpc_connection *conn,
1101				      struct sk_buff *skb)
1102{
1103	_enter("%p,%p", conn, skb);
1104
1105	skb_queue_tail(&conn->rx_queue, skb);
1106	rxrpc_queue_conn(conn);
1107}
1108
1109/*
1110 * post endpoint-level events to the local endpoint
1111 * - this includes debug and version messages
1112 */
1113static void rxrpc_post_packet_to_local(struct rxrpc_local *local,
1114				       struct sk_buff *skb)
1115{
1116	_enter("%p,%p", local, skb);
1117
1118	if (rxrpc_get_local_maybe(local)) {
1119		skb_queue_tail(&local->event_queue, skb);
1120		rxrpc_queue_local(local);
1121	} else {
1122		rxrpc_free_skb(skb, rxrpc_skb_freed);
1123	}
1124}
1125
1126/*
1127 * put a packet up for transport-level abort
1128 */
1129static void rxrpc_reject_packet(struct rxrpc_local *local, struct sk_buff *skb)
1130{
1131	CHECK_SLAB_OKAY(&local->usage);
1132
1133	if (rxrpc_get_local_maybe(local)) {
1134		skb_queue_tail(&local->reject_queue, skb);
1135		rxrpc_queue_local(local);
1136	} else {
1137		rxrpc_free_skb(skb, rxrpc_skb_freed);
1138	}
1139}
1140
1141/*
1142 * Extract the wire header from a packet and translate the byte order.
1143 */
1144static noinline
1145int rxrpc_extract_header(struct rxrpc_skb_priv *sp, struct sk_buff *skb)
1146{
1147	struct rxrpc_wire_header whdr;
1148
1149	/* dig out the RxRPC connection details */
1150	if (skb_copy_bits(skb, 0, &whdr, sizeof(whdr)) < 0) {
1151		trace_rxrpc_rx_eproto(NULL, sp->hdr.serial,
1152				      tracepoint_string("bad_hdr"));
1153		return -EBADMSG;
1154	}
1155
1156	memset(sp, 0, sizeof(*sp));
1157	sp->hdr.epoch		= ntohl(whdr.epoch);
1158	sp->hdr.cid		= ntohl(whdr.cid);
1159	sp->hdr.callNumber	= ntohl(whdr.callNumber);
1160	sp->hdr.seq		= ntohl(whdr.seq);
1161	sp->hdr.serial		= ntohl(whdr.serial);
1162	sp->hdr.flags		= whdr.flags;
1163	sp->hdr.type		= whdr.type;
1164	sp->hdr.userStatus	= whdr.userStatus;
1165	sp->hdr.securityIndex	= whdr.securityIndex;
1166	sp->hdr._rsvd		= ntohs(whdr._rsvd);
1167	sp->hdr.serviceId	= ntohs(whdr.serviceId);
1168	return 0;
1169}
1170
1171/*
1172 * handle data received on the local endpoint
1173 * - may be called in interrupt context
1174 *
1175 * [!] Note that as this is called from the encap_rcv hook, the socket is not
1176 * held locked by the caller and nothing prevents sk_user_data on the UDP from
1177 * being cleared in the middle of processing this function.
1178 *
1179 * Called with the RCU read lock held from the IP layer via UDP.
1180 */
1181int rxrpc_input_packet(struct sock *udp_sk, struct sk_buff *skb)
1182{
1183	struct rxrpc_local *local = rcu_dereference_sk_user_data(udp_sk);
1184	struct rxrpc_connection *conn;
1185	struct rxrpc_channel *chan;
1186	struct rxrpc_call *call = NULL;
1187	struct rxrpc_skb_priv *sp;
1188	struct rxrpc_peer *peer = NULL;
1189	struct rxrpc_sock *rx = NULL;
1190	unsigned int channel;
 
1191
1192	_enter("%p", udp_sk);
1193
1194	if (unlikely(!local)) {
1195		kfree_skb(skb);
1196		return 0;
 
 
 
 
 
1197	}
1198	if (skb->tstamp == 0)
1199		skb->tstamp = ktime_get_real();
1200
1201	rxrpc_new_skb(skb, rxrpc_skb_received);
 
 
 
 
 
 
 
 
 
 
1202
1203	skb_pull(skb, sizeof(struct udphdr));
1204
1205	/* The UDP protocol already released all skb resources;
1206	 * we are free to add our own data there.
1207	 */
1208	sp = rxrpc_skb(skb);
1209
1210	/* dig out the RxRPC connection details */
1211	if (rxrpc_extract_header(sp, skb) < 0)
1212		goto bad_message;
1213
1214	if (IS_ENABLED(CONFIG_AF_RXRPC_INJECT_LOSS)) {
1215		static int lose;
1216		if ((lose++ & 7) == 7) {
1217			trace_rxrpc_rx_lose(sp);
1218			rxrpc_free_skb(skb, rxrpc_skb_lost);
1219			return 0;
1220		}
1221	}
1222
1223	if (skb->tstamp == 0)
1224		skb->tstamp = ktime_get_real();
1225	trace_rxrpc_rx_packet(sp);
1226
 
 
 
 
 
 
 
 
 
 
1227	switch (sp->hdr.type) {
1228	case RXRPC_PACKET_TYPE_VERSION:
1229		if (rxrpc_to_client(sp))
1230			goto discard;
1231		rxrpc_post_packet_to_local(local, skb);
1232		goto out;
1233
1234	case RXRPC_PACKET_TYPE_BUSY:
1235		if (rxrpc_to_server(sp))
1236			goto discard;
1237		/* Fall through */
1238	case RXRPC_PACKET_TYPE_ACK:
1239	case RXRPC_PACKET_TYPE_ACKALL:
1240		if (sp->hdr.callNumber == 0)
1241			goto bad_message;
1242		/* Fall through */
1243	case RXRPC_PACKET_TYPE_ABORT:
1244		break;
1245
1246	case RXRPC_PACKET_TYPE_DATA:
1247		if (sp->hdr.callNumber == 0 ||
1248		    sp->hdr.seq == 0)
1249			goto bad_message;
1250		if (!rxrpc_validate_data(skb))
 
1251			goto bad_message;
1252
1253		/* Unshare the packet so that it can be modified for in-place
1254		 * decryption.
1255		 */
1256		if (sp->hdr.securityIndex != 0) {
1257			struct sk_buff *nskb = skb_unshare(skb, GFP_ATOMIC);
1258			if (!nskb) {
1259				rxrpc_eaten_skb(skb, rxrpc_skb_unshared_nomem);
1260				goto out;
1261			}
1262
1263			if (nskb != skb) {
1264				rxrpc_eaten_skb(skb, rxrpc_skb_received);
1265				skb = nskb;
1266				rxrpc_new_skb(skb, rxrpc_skb_unshared);
1267				sp = rxrpc_skb(skb);
1268			}
1269		}
1270		break;
1271
1272	case RXRPC_PACKET_TYPE_CHALLENGE:
1273		if (rxrpc_to_server(sp))
1274			goto discard;
1275		break;
1276	case RXRPC_PACKET_TYPE_RESPONSE:
1277		if (rxrpc_to_client(sp))
1278			goto discard;
1279		break;
1280
1281		/* Packet types 9-11 should just be ignored. */
1282	case RXRPC_PACKET_TYPE_PARAMS:
1283	case RXRPC_PACKET_TYPE_10:
1284	case RXRPC_PACKET_TYPE_11:
1285		goto discard;
1286
1287	default:
1288		_proto("Rx Bad Packet Type %u", sp->hdr.type);
1289		goto bad_message;
1290	}
1291
1292	if (sp->hdr.serviceId == 0)
1293		goto bad_message;
1294
1295	if (rxrpc_to_server(sp)) {
1296		/* Weed out packets to services we're not offering.  Packets
1297		 * that would begin a call are explicitly rejected and the rest
1298		 * are just discarded.
1299		 */
1300		rx = rcu_dereference(local->service);
1301		if (!rx || (sp->hdr.serviceId != rx->srx.srx_service &&
1302			    sp->hdr.serviceId != rx->second_service)) {
1303			if (sp->hdr.type == RXRPC_PACKET_TYPE_DATA &&
1304			    sp->hdr.seq == 1)
1305				goto unsupported_service;
1306			goto discard;
1307		}
1308	}
1309
1310	conn = rxrpc_find_connection_rcu(local, skb, &peer);
1311	if (conn) {
1312		if (sp->hdr.securityIndex != conn->security_ix)
1313			goto wrong_security;
1314
1315		if (sp->hdr.serviceId != conn->service_id) {
1316			int old_id;
1317
1318			if (!test_bit(RXRPC_CONN_PROBING_FOR_UPGRADE, &conn->flags))
1319				goto reupgrade;
1320			old_id = cmpxchg(&conn->service_id, conn->params.service_id,
1321					 sp->hdr.serviceId);
1322
1323			if (old_id != conn->params.service_id &&
1324			    old_id != sp->hdr.serviceId)
1325				goto reupgrade;
 
1326		}
1327
1328		if (sp->hdr.callNumber == 0) {
1329			/* Connection-level packet */
1330			_debug("CONN %p {%d}", conn, conn->debug_id);
1331			rxrpc_post_packet_to_conn(conn, skb);
1332			goto out;
1333		}
1334
1335		if ((int)sp->hdr.serial - (int)conn->hi_serial > 0)
1336			conn->hi_serial = sp->hdr.serial;
 
 
 
 
 
 
 
1337
1338		/* Call-bound packets are routed by connection channel. */
1339		channel = sp->hdr.cid & RXRPC_CHANNELMASK;
1340		chan = &conn->channels[channel];
1341
1342		/* Ignore really old calls */
1343		if (sp->hdr.callNumber < chan->last_call)
1344			goto discard;
1345
1346		if (sp->hdr.callNumber == chan->last_call) {
1347			if (chan->call ||
1348			    sp->hdr.type == RXRPC_PACKET_TYPE_ABORT)
1349				goto discard;
1350
1351			/* For the previous service call, if completed
1352			 * successfully, we discard all further packets.
1353			 */
1354			if (rxrpc_conn_is_service(conn) &&
1355			    chan->last_type == RXRPC_PACKET_TYPE_ACK)
1356				goto discard;
1357
1358			/* But otherwise we need to retransmit the final packet
1359			 * from data cached in the connection record.
1360			 */
1361			if (sp->hdr.type == RXRPC_PACKET_TYPE_DATA)
1362				trace_rxrpc_rx_data(chan->call_debug_id,
1363						    sp->hdr.seq,
1364						    sp->hdr.serial,
1365						    sp->hdr.flags, 0);
1366			rxrpc_post_packet_to_conn(conn, skb);
1367			goto out;
1368		}
1369
1370		call = rcu_dereference(chan->call);
1371
1372		if (sp->hdr.callNumber > chan->call_id) {
1373			if (rxrpc_to_client(sp))
 
1374				goto reject_packet;
 
1375			if (call)
1376				rxrpc_input_implicit_end_call(rx, conn, call);
1377			call = NULL;
1378		}
1379
1380		if (call) {
1381			if (sp->hdr.serviceId != call->service_id)
1382				call->service_id = sp->hdr.serviceId;
1383			if ((int)sp->hdr.serial - (int)call->rx_serial > 0)
1384				call->rx_serial = sp->hdr.serial;
1385			if (!test_bit(RXRPC_CALL_RX_HEARD, &call->flags))
1386				set_bit(RXRPC_CALL_RX_HEARD, &call->flags);
1387		}
1388	}
1389
1390	if (!call || atomic_read(&call->usage) == 0) {
1391		if (rxrpc_to_client(sp) ||
 
1392		    sp->hdr.type != RXRPC_PACKET_TYPE_DATA)
1393			goto bad_message;
1394		if (sp->hdr.seq != 1)
1395			goto discard;
1396		call = rxrpc_new_incoming_call(local, rx, skb);
1397		if (!call)
 
1398			goto reject_packet;
1399		rxrpc_send_ping(call, skb);
 
1400		mutex_unlock(&call->user_mutex);
1401	}
1402
1403	/* Process a call packet; this either discards or passes on the ref
1404	 * elsewhere.
1405	 */
1406	rxrpc_input_call_packet(call, skb);
1407	goto out;
1408
 
 
1409discard:
1410	rxrpc_free_skb(skb, rxrpc_skb_freed);
1411out:
1412	trace_rxrpc_rx_done(0, 0);
1413	return 0;
 
 
 
 
1414
1415wrong_security:
 
1416	trace_rxrpc_abort(0, "SEC", sp->hdr.cid, sp->hdr.callNumber, sp->hdr.seq,
1417			  RXKADINCONSISTENCY, EBADMSG);
1418	skb->priority = RXKADINCONSISTENCY;
1419	goto post_abort;
1420
1421unsupported_service:
1422	trace_rxrpc_abort(0, "INV", sp->hdr.cid, sp->hdr.callNumber, sp->hdr.seq,
1423			  RX_INVALID_OPERATION, EOPNOTSUPP);
1424	skb->priority = RX_INVALID_OPERATION;
1425	goto post_abort;
1426
1427reupgrade:
 
1428	trace_rxrpc_abort(0, "UPG", sp->hdr.cid, sp->hdr.callNumber, sp->hdr.seq,
1429			  RX_PROTOCOL_ERROR, EBADMSG);
1430	goto protocol_error;
1431
 
 
1432bad_message:
1433	trace_rxrpc_abort(0, "BAD", sp->hdr.cid, sp->hdr.callNumber, sp->hdr.seq,
1434			  RX_PROTOCOL_ERROR, EBADMSG);
1435protocol_error:
1436	skb->priority = RX_PROTOCOL_ERROR;
1437post_abort:
1438	skb->mark = RXRPC_SKB_MARK_REJECT_ABORT;
1439reject_packet:
1440	trace_rxrpc_rx_done(skb->mark, skb->priority);
1441	rxrpc_reject_packet(local, skb);
1442	_leave(" [badmsg]");
1443	return 0;
1444}
v4.17
 
   1/* RxRPC packet reception
   2 *
   3 * Copyright (C) 2007, 2016 Red Hat, Inc. All Rights Reserved.
   4 * Written by David Howells (dhowells@redhat.com)
   5 *
   6 * This program is free software; you can redistribute it and/or
   7 * modify it under the terms of the GNU General Public License
   8 * as published by the Free Software Foundation; either version
   9 * 2 of the License, or (at your option) any later version.
  10 */
  11
  12#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  13
  14#include <linux/module.h>
  15#include <linux/net.h>
  16#include <linux/skbuff.h>
  17#include <linux/errqueue.h>
  18#include <linux/udp.h>
  19#include <linux/in.h>
  20#include <linux/in6.h>
  21#include <linux/icmp.h>
  22#include <linux/gfp.h>
  23#include <net/sock.h>
  24#include <net/af_rxrpc.h>
  25#include <net/ip.h>
  26#include <net/udp.h>
  27#include <net/net_namespace.h>
  28#include "ar-internal.h"
  29
  30static void rxrpc_proto_abort(const char *why,
  31			      struct rxrpc_call *call, rxrpc_seq_t seq)
  32{
  33	if (rxrpc_abort_call(why, call, seq, RX_PROTOCOL_ERROR, -EBADMSG)) {
  34		set_bit(RXRPC_CALL_EV_ABORT, &call->events);
  35		rxrpc_queue_call(call);
  36	}
  37}
  38
  39/*
  40 * Do TCP-style congestion management [RFC 5681].
  41 */
  42static void rxrpc_congestion_management(struct rxrpc_call *call,
  43					struct sk_buff *skb,
  44					struct rxrpc_ack_summary *summary,
  45					rxrpc_serial_t acked_serial)
  46{
  47	enum rxrpc_congest_change change = rxrpc_cong_no_change;
  48	unsigned int cumulative_acks = call->cong_cumul_acks;
  49	unsigned int cwnd = call->cong_cwnd;
  50	bool resend = false;
  51
  52	summary->flight_size =
  53		(call->tx_top - call->tx_hard_ack) - summary->nr_acks;
  54
  55	if (test_and_clear_bit(RXRPC_CALL_RETRANS_TIMEOUT, &call->flags)) {
  56		summary->retrans_timeo = true;
  57		call->cong_ssthresh = max_t(unsigned int,
  58					    summary->flight_size / 2, 2);
  59		cwnd = 1;
  60		if (cwnd >= call->cong_ssthresh &&
  61		    call->cong_mode == RXRPC_CALL_SLOW_START) {
  62			call->cong_mode = RXRPC_CALL_CONGEST_AVOIDANCE;
  63			call->cong_tstamp = skb->tstamp;
  64			cumulative_acks = 0;
  65		}
  66	}
  67
  68	cumulative_acks += summary->nr_new_acks;
  69	cumulative_acks += summary->nr_rot_new_acks;
  70	if (cumulative_acks > 255)
  71		cumulative_acks = 255;
  72
  73	summary->mode = call->cong_mode;
  74	summary->cwnd = call->cong_cwnd;
  75	summary->ssthresh = call->cong_ssthresh;
  76	summary->cumulative_acks = cumulative_acks;
  77	summary->dup_acks = call->cong_dup_acks;
  78
  79	switch (call->cong_mode) {
  80	case RXRPC_CALL_SLOW_START:
  81		if (summary->nr_nacks > 0)
  82			goto packet_loss_detected;
  83		if (summary->cumulative_acks > 0)
  84			cwnd += 1;
  85		if (cwnd >= call->cong_ssthresh) {
  86			call->cong_mode = RXRPC_CALL_CONGEST_AVOIDANCE;
  87			call->cong_tstamp = skb->tstamp;
  88		}
  89		goto out;
  90
  91	case RXRPC_CALL_CONGEST_AVOIDANCE:
  92		if (summary->nr_nacks > 0)
  93			goto packet_loss_detected;
  94
  95		/* We analyse the number of packets that get ACK'd per RTT
  96		 * period and increase the window if we managed to fill it.
  97		 */
  98		if (call->peer->rtt_usage == 0)
  99			goto out;
 100		if (ktime_before(skb->tstamp,
 101				 ktime_add_ns(call->cong_tstamp,
 102					      call->peer->rtt)))
 103			goto out_no_clear_ca;
 104		change = rxrpc_cong_rtt_window_end;
 105		call->cong_tstamp = skb->tstamp;
 106		if (cumulative_acks >= cwnd)
 107			cwnd++;
 108		goto out;
 109
 110	case RXRPC_CALL_PACKET_LOSS:
 111		if (summary->nr_nacks == 0)
 112			goto resume_normality;
 113
 114		if (summary->new_low_nack) {
 115			change = rxrpc_cong_new_low_nack;
 116			call->cong_dup_acks = 1;
 117			if (call->cong_extra > 1)
 118				call->cong_extra = 1;
 119			goto send_extra_data;
 120		}
 121
 122		call->cong_dup_acks++;
 123		if (call->cong_dup_acks < 3)
 124			goto send_extra_data;
 125
 126		change = rxrpc_cong_begin_retransmission;
 127		call->cong_mode = RXRPC_CALL_FAST_RETRANSMIT;
 128		call->cong_ssthresh = max_t(unsigned int,
 129					    summary->flight_size / 2, 2);
 130		cwnd = call->cong_ssthresh + 3;
 131		call->cong_extra = 0;
 132		call->cong_dup_acks = 0;
 133		resend = true;
 134		goto out;
 135
 136	case RXRPC_CALL_FAST_RETRANSMIT:
 137		if (!summary->new_low_nack) {
 138			if (summary->nr_new_acks == 0)
 139				cwnd += 1;
 140			call->cong_dup_acks++;
 141			if (call->cong_dup_acks == 2) {
 142				change = rxrpc_cong_retransmit_again;
 143				call->cong_dup_acks = 0;
 144				resend = true;
 145			}
 146		} else {
 147			change = rxrpc_cong_progress;
 148			cwnd = call->cong_ssthresh;
 149			if (summary->nr_nacks == 0)
 150				goto resume_normality;
 151		}
 152		goto out;
 153
 154	default:
 155		BUG();
 156		goto out;
 157	}
 158
 159resume_normality:
 160	change = rxrpc_cong_cleared_nacks;
 161	call->cong_dup_acks = 0;
 162	call->cong_extra = 0;
 163	call->cong_tstamp = skb->tstamp;
 164	if (cwnd < call->cong_ssthresh)
 165		call->cong_mode = RXRPC_CALL_SLOW_START;
 166	else
 167		call->cong_mode = RXRPC_CALL_CONGEST_AVOIDANCE;
 168out:
 169	cumulative_acks = 0;
 170out_no_clear_ca:
 171	if (cwnd >= RXRPC_RXTX_BUFF_SIZE - 1)
 172		cwnd = RXRPC_RXTX_BUFF_SIZE - 1;
 173	call->cong_cwnd = cwnd;
 174	call->cong_cumul_acks = cumulative_acks;
 175	trace_rxrpc_congest(call, summary, acked_serial, change);
 176	if (resend && !test_and_set_bit(RXRPC_CALL_EV_RESEND, &call->events))
 177		rxrpc_queue_call(call);
 178	return;
 179
 180packet_loss_detected:
 181	change = rxrpc_cong_saw_nack;
 182	call->cong_mode = RXRPC_CALL_PACKET_LOSS;
 183	call->cong_dup_acks = 0;
 184	goto send_extra_data;
 185
 186send_extra_data:
 187	/* Send some previously unsent DATA if we have some to advance the ACK
 188	 * state.
 189	 */
 190	if (call->rxtx_annotations[call->tx_top & RXRPC_RXTX_BUFF_MASK] &
 191	    RXRPC_TX_ANNO_LAST ||
 192	    summary->nr_acks != call->tx_top - call->tx_hard_ack) {
 193		call->cong_extra++;
 194		wake_up(&call->waitq);
 195	}
 196	goto out_no_clear_ca;
 197}
 198
 199/*
 200 * Ping the other end to fill our RTT cache and to retrieve the rwind
 201 * and MTU parameters.
 202 */
 203static void rxrpc_send_ping(struct rxrpc_call *call, struct sk_buff *skb,
 204			    int skew)
 205{
 206	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 207	ktime_t now = skb->tstamp;
 208
 209	if (call->peer->rtt_usage < 3 ||
 210	    ktime_before(ktime_add_ms(call->peer->rtt_last_req, 1000), now))
 211		rxrpc_propose_ACK(call, RXRPC_ACK_PING, skew, sp->hdr.serial,
 212				  true, true,
 213				  rxrpc_propose_ack_ping_for_params);
 214}
 215
 216/*
 217 * Apply a hard ACK by advancing the Tx window.
 218 */
 219static void rxrpc_rotate_tx_window(struct rxrpc_call *call, rxrpc_seq_t to,
 220				   struct rxrpc_ack_summary *summary)
 221{
 222	struct sk_buff *skb, *list = NULL;
 
 223	int ix;
 224	u8 annotation;
 225
 226	if (call->acks_lowest_nak == call->tx_hard_ack) {
 227		call->acks_lowest_nak = to;
 228	} else if (before_eq(call->acks_lowest_nak, to)) {
 229		summary->new_low_nack = true;
 230		call->acks_lowest_nak = to;
 231	}
 232
 233	spin_lock(&call->lock);
 234
 235	while (before(call->tx_hard_ack, to)) {
 236		call->tx_hard_ack++;
 237		ix = call->tx_hard_ack & RXRPC_RXTX_BUFF_MASK;
 238		skb = call->rxtx_buffer[ix];
 239		annotation = call->rxtx_annotations[ix];
 240		rxrpc_see_skb(skb, rxrpc_skb_tx_rotated);
 241		call->rxtx_buffer[ix] = NULL;
 242		call->rxtx_annotations[ix] = 0;
 243		skb->next = list;
 244		list = skb;
 245
 246		if (annotation & RXRPC_TX_ANNO_LAST)
 247			set_bit(RXRPC_CALL_TX_LAST, &call->flags);
 
 
 248		if ((annotation & RXRPC_TX_ANNO_MASK) != RXRPC_TX_ANNO_ACK)
 249			summary->nr_rot_new_acks++;
 250	}
 251
 252	spin_unlock(&call->lock);
 253
 254	trace_rxrpc_transmit(call, (test_bit(RXRPC_CALL_TX_LAST, &call->flags) ?
 255				    rxrpc_transmit_rotate_last :
 256				    rxrpc_transmit_rotate));
 257	wake_up(&call->waitq);
 258
 259	while (list) {
 260		skb = list;
 261		list = skb->next;
 262		skb->next = NULL;
 263		rxrpc_free_skb(skb, rxrpc_skb_tx_freed);
 264	}
 
 
 265}
 266
 267/*
 268 * End the transmission phase of a call.
 269 *
 270 * This occurs when we get an ACKALL packet, the first DATA packet of a reply,
 271 * or a final ACK packet.
 272 */
 273static bool rxrpc_end_tx_phase(struct rxrpc_call *call, bool reply_begun,
 274			       const char *abort_why)
 275{
 
 276
 277	ASSERT(test_bit(RXRPC_CALL_TX_LAST, &call->flags));
 278
 279	write_lock(&call->state_lock);
 280
 281	switch (call->state) {
 
 282	case RXRPC_CALL_CLIENT_SEND_REQUEST:
 283	case RXRPC_CALL_CLIENT_AWAIT_REPLY:
 284		if (reply_begun)
 285			call->state = RXRPC_CALL_CLIENT_RECV_REPLY;
 286		else
 287			call->state = RXRPC_CALL_CLIENT_AWAIT_REPLY;
 288		break;
 289
 290	case RXRPC_CALL_SERVER_AWAIT_ACK:
 291		__rxrpc_call_completed(call);
 292		rxrpc_notify_socket(call);
 
 293		break;
 294
 295	default:
 296		goto bad_state;
 297	}
 298
 299	write_unlock(&call->state_lock);
 300	if (call->state == RXRPC_CALL_CLIENT_AWAIT_REPLY) {
 301		trace_rxrpc_transmit(call, rxrpc_transmit_await_reply);
 302	} else {
 303		trace_rxrpc_transmit(call, rxrpc_transmit_end);
 304	}
 305	_leave(" = ok");
 306	return true;
 307
 308bad_state:
 309	write_unlock(&call->state_lock);
 310	kdebug("end_tx %s", rxrpc_call_states[call->state]);
 311	rxrpc_proto_abort(abort_why, call, call->tx_top);
 312	return false;
 313}
 314
 315/*
 316 * Begin the reply reception phase of a call.
 317 */
 318static bool rxrpc_receiving_reply(struct rxrpc_call *call)
 319{
 320	struct rxrpc_ack_summary summary = { 0 };
 321	unsigned long now, timo;
 322	rxrpc_seq_t top = READ_ONCE(call->tx_top);
 323
 324	if (call->ackr_reason) {
 325		spin_lock_bh(&call->lock);
 326		call->ackr_reason = 0;
 327		spin_unlock_bh(&call->lock);
 328		now = jiffies;
 329		timo = now + MAX_JIFFY_OFFSET;
 330		WRITE_ONCE(call->resend_at, timo);
 331		WRITE_ONCE(call->ack_at, timo);
 332		trace_rxrpc_timer(call, rxrpc_timer_init_for_reply, now);
 333	}
 334
 335	if (!test_bit(RXRPC_CALL_TX_LAST, &call->flags))
 336		rxrpc_rotate_tx_window(call, top, &summary);
 337	if (!test_bit(RXRPC_CALL_TX_LAST, &call->flags)) {
 338		rxrpc_proto_abort("TXL", call, top);
 339		return false;
 
 
 340	}
 341	if (!rxrpc_end_tx_phase(call, true, "ETD"))
 342		return false;
 343	call->tx_phase = false;
 344	return true;
 345}
 346
 347/*
 348 * Scan a jumbo packet to validate its structure and to work out how many
 349 * subpackets it contains.
 350 *
 351 * A jumbo packet is a collection of consecutive packets glued together with
 352 * little headers between that indicate how to change the initial header for
 353 * each subpacket.
 354 *
 355 * RXRPC_JUMBO_PACKET must be set on all but the last subpacket - and all but
 356 * the last are RXRPC_JUMBO_DATALEN in size.  The last subpacket may be of any
 357 * size.
 358 */
 359static bool rxrpc_validate_jumbo(struct sk_buff *skb)
 360{
 361	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 362	unsigned int offset = sizeof(struct rxrpc_wire_header);
 363	unsigned int len = skb->len;
 364	int nr_jumbo = 1;
 365	u8 flags = sp->hdr.flags;
 366
 367	do {
 368		nr_jumbo++;
 
 
 
 
 
 
 369		if (len - offset < RXRPC_JUMBO_SUBPKTLEN)
 370			goto protocol_error;
 371		if (flags & RXRPC_LAST_PACKET)
 372			goto protocol_error;
 373		offset += RXRPC_JUMBO_DATALEN;
 374		if (skb_copy_bits(skb, offset, &flags, 1) < 0)
 375			goto protocol_error;
 376		offset += sizeof(struct rxrpc_jumbo_header);
 377	} while (flags & RXRPC_JUMBO_PACKET);
 378
 379	sp->nr_jumbo = nr_jumbo;
 
 380	return true;
 381
 382protocol_error:
 383	return false;
 384}
 385
 386/*
 387 * Handle reception of a duplicate packet.
 388 *
 389 * We have to take care to avoid an attack here whereby we're given a series of
 390 * jumbograms, each with a sequence number one before the preceding one and
 391 * filled up to maximum UDP size.  If they never send us the first packet in
 392 * the sequence, they can cause us to have to hold on to around 2MiB of kernel
 393 * space until the call times out.
 394 *
 395 * We limit the space usage by only accepting three duplicate jumbo packets per
 396 * call.  After that, we tell the other side we're no longer accepting jumbos
 397 * (that information is encoded in the ACK packet).
 398 */
 399static void rxrpc_input_dup_data(struct rxrpc_call *call, rxrpc_seq_t seq,
 400				 u8 annotation, bool *_jumbo_bad)
 401{
 402	/* Discard normal packets that are duplicates. */
 403	if (annotation == 0)
 404		return;
 405
 406	/* Skip jumbo subpackets that are duplicates.  When we've had three or
 407	 * more partially duplicate jumbo packets, we refuse to take any more
 408	 * jumbos for this call.
 409	 */
 410	if (!*_jumbo_bad) {
 411		call->nr_jumbo_bad++;
 412		*_jumbo_bad = true;
 413	}
 414}
 415
 416/*
 417 * Process a DATA packet, adding the packet to the Rx ring.
 
 418 */
 419static void rxrpc_input_data(struct rxrpc_call *call, struct sk_buff *skb,
 420			     u16 skew)
 421{
 422	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 423	enum rxrpc_call_state state;
 424	unsigned int offset = sizeof(struct rxrpc_wire_header);
 425	unsigned int ix;
 426	rxrpc_serial_t serial = sp->hdr.serial, ack_serial = 0;
 427	rxrpc_seq_t seq = sp->hdr.seq, hard_ack;
 428	bool immediate_ack = false, jumbo_bad = false, queued;
 429	u16 len;
 430	u8 ack = 0, flags, annotation = 0;
 431
 432	_enter("{%u,%u},{%u,%u}",
 433	       call->rx_hard_ack, call->rx_top, skb->len, seq);
 434
 435	_proto("Rx DATA %%%u { #%u f=%02x }",
 436	       sp->hdr.serial, seq, sp->hdr.flags);
 437
 438	state = READ_ONCE(call->state);
 439	if (state >= RXRPC_CALL_COMPLETE)
 
 440		return;
 
 441
 442	if (call->state == RXRPC_CALL_SERVER_RECV_REQUEST) {
 443		unsigned long timo = READ_ONCE(call->next_req_timo);
 444		unsigned long now, expect_req_by;
 445
 446		if (timo) {
 447			now = jiffies;
 448			expect_req_by = now + timo;
 449			WRITE_ONCE(call->expect_req_by, expect_req_by);
 450			rxrpc_reduce_call_timer(call, expect_req_by, now,
 451						rxrpc_timer_set_for_idle);
 452		}
 453	}
 454
 
 
 455	/* Received data implicitly ACKs all of the request packets we sent
 456	 * when we're acting as a client.
 457	 */
 458	if ((state == RXRPC_CALL_CLIENT_SEND_REQUEST ||
 459	     state == RXRPC_CALL_CLIENT_AWAIT_REPLY) &&
 460	    !rxrpc_receiving_reply(call))
 461		return;
 462
 463	call->ackr_prev_seq = seq;
 464
 
 465	hard_ack = READ_ONCE(call->rx_hard_ack);
 466	if (after(seq, hard_ack + call->rx_winsize)) {
 467		ack = RXRPC_ACK_EXCEEDS_WINDOW;
 468		ack_serial = serial;
 469		goto ack;
 470	}
 471
 472	flags = sp->hdr.flags;
 473	if (flags & RXRPC_JUMBO_PACKET) {
 474		if (call->nr_jumbo_bad > 3) {
 475			ack = RXRPC_ACK_NOSPACE;
 476			ack_serial = serial;
 477			goto ack;
 478		}
 479		annotation = 1;
 480	}
 481
 482next_subpacket:
 483	queued = false;
 484	ix = seq & RXRPC_RXTX_BUFF_MASK;
 485	len = skb->len;
 486	if (flags & RXRPC_JUMBO_PACKET)
 487		len = RXRPC_JUMBO_DATALEN;
 488
 489	if (flags & RXRPC_LAST_PACKET) {
 490		if (test_bit(RXRPC_CALL_RX_LAST, &call->flags) &&
 491		    seq != call->rx_top)
 492			return rxrpc_proto_abort("LSN", call, seq);
 493	} else {
 494		if (test_bit(RXRPC_CALL_RX_LAST, &call->flags) &&
 495		    after_eq(seq, call->rx_top))
 496			return rxrpc_proto_abort("LSA", call, seq);
 497	}
 498
 499	trace_rxrpc_rx_data(call, seq, serial, flags, annotation);
 500	if (before_eq(seq, hard_ack)) {
 501		ack = RXRPC_ACK_DUPLICATE;
 502		ack_serial = serial;
 503		goto skip;
 504	}
 
 505
 506	if (flags & RXRPC_REQUEST_ACK && !ack) {
 507		ack = RXRPC_ACK_REQUESTED;
 508		ack_serial = serial;
 509	}
 
 
 
 
 510
 511	if (call->rxtx_buffer[ix]) {
 512		rxrpc_input_dup_data(call, seq, annotation, &jumbo_bad);
 513		if (ack != RXRPC_ACK_DUPLICATE) {
 514			ack = RXRPC_ACK_DUPLICATE;
 515			ack_serial = serial;
 
 
 
 
 
 
 
 
 
 
 
 
 516		}
 517		immediate_ack = true;
 518		goto skip;
 519	}
 520
 521	/* Queue the packet.  We use a couple of memory barriers here as need
 522	 * to make sure that rx_top is perceived to be set after the buffer
 523	 * pointer and that the buffer pointer is set after the annotation and
 524	 * the skb data.
 525	 *
 526	 * Barriers against rxrpc_recvmsg_data() and rxrpc_rotate_rx_window()
 527	 * and also rxrpc_fill_out_ack().
 528	 */
 529	rxrpc_get_skb(skb, rxrpc_skb_rx_got);
 530	call->rxtx_annotations[ix] = annotation;
 531	smp_wmb();
 532	call->rxtx_buffer[ix] = skb;
 533	if (after(seq, call->rx_top)) {
 534		smp_store_release(&call->rx_top, seq);
 535	} else if (before(seq, call->rx_top)) {
 536		/* Send an immediate ACK if we fill in a hole */
 537		if (!ack) {
 538			ack = RXRPC_ACK_DELAY;
 539			ack_serial = serial;
 
 
 
 
 
 
 
 
 540		}
 541		immediate_ack = true;
 542	}
 543	if (flags & RXRPC_LAST_PACKET) {
 544		set_bit(RXRPC_CALL_RX_LAST, &call->flags);
 545		trace_rxrpc_receive(call, rxrpc_receive_queue_last, serial, seq);
 546	} else {
 547		trace_rxrpc_receive(call, rxrpc_receive_queue, serial, seq);
 548	}
 549	queued = true;
 550
 551	if (after_eq(seq, call->rx_expect_next)) {
 552		if (after(seq, call->rx_expect_next)) {
 553			_net("OOS %u > %u", seq, call->rx_expect_next);
 554			ack = RXRPC_ACK_OUT_OF_SEQUENCE;
 555			ack_serial = serial;
 556		}
 557		call->rx_expect_next = seq + 1;
 558	}
 559
 560skip:
 561	offset += len;
 562	if (flags & RXRPC_JUMBO_PACKET) {
 563		if (skb_copy_bits(skb, offset, &flags, 1) < 0)
 564			return rxrpc_proto_abort("XJF", call, seq);
 565		offset += sizeof(struct rxrpc_jumbo_header);
 566		seq++;
 567		serial++;
 568		annotation++;
 569		if (flags & RXRPC_JUMBO_PACKET)
 570			annotation |= RXRPC_RX_ANNO_JLAST;
 571		if (after(seq, hard_ack + call->rx_winsize)) {
 572			ack = RXRPC_ACK_EXCEEDS_WINDOW;
 573			ack_serial = serial;
 574			if (!jumbo_bad) {
 575				call->nr_jumbo_bad++;
 576				jumbo_bad = true;
 
 
 
 577			}
 578			goto ack;
 
 
 
 
 
 
 
 
 579		}
 580
 581		_proto("Rx DATA Jumbo %%%u", serial);
 582		goto next_subpacket;
 583	}
 
 
 
 
 
 
 
 584
 585	if (queued && flags & RXRPC_LAST_PACKET && !ack) {
 586		ack = RXRPC_ACK_DELAY;
 587		ack_serial = serial;
 
 
 
 
 
 588	}
 589
 590ack:
 591	if (ack)
 592		rxrpc_propose_ACK(call, ack, skew, ack_serial,
 593				  immediate_ack, true,
 594				  rxrpc_propose_ack_input_data);
 
 
 
 
 595
 596	if (sp->hdr.seq == READ_ONCE(call->rx_hard_ack) + 1)
 
 597		rxrpc_notify_socket(call);
 
 
 
 
 
 598	_leave(" [queued]");
 599}
 600
 601/*
 602 * Process a requested ACK.
 603 */
 604static void rxrpc_input_requested_ack(struct rxrpc_call *call,
 605				      ktime_t resp_time,
 606				      rxrpc_serial_t orig_serial,
 607				      rxrpc_serial_t ack_serial)
 608{
 609	struct rxrpc_skb_priv *sp;
 610	struct sk_buff *skb;
 611	ktime_t sent_at;
 612	int ix;
 613
 614	for (ix = 0; ix < RXRPC_RXTX_BUFF_SIZE; ix++) {
 615		skb = call->rxtx_buffer[ix];
 616		if (!skb)
 617			continue;
 618
 
 
 619		sp = rxrpc_skb(skb);
 620		if (sp->hdr.serial != orig_serial)
 621			continue;
 622		smp_rmb();
 623		sent_at = skb->tstamp;
 624		goto found;
 625	}
 
 626	return;
 627
 628found:
 629	rxrpc_peer_add_rtt(call, rxrpc_rtt_rx_requested_ack,
 630			   orig_serial, ack_serial, sent_at, resp_time);
 631}
 632
 633/*
 634 * Process the response to a ping that we sent to find out if we lost an ACK.
 635 *
 636 * If we got back a ping response that indicates a lower tx_top than what we
 637 * had at the time of the ping transmission, we adjudge all the DATA packets
 638 * sent between the response tx_top and the ping-time tx_top to have been lost.
 639 */
 640static void rxrpc_input_check_for_lost_ack(struct rxrpc_call *call)
 641{
 642	rxrpc_seq_t top, bottom, seq;
 643	bool resend = false;
 644
 645	spin_lock_bh(&call->lock);
 646
 647	bottom = call->tx_hard_ack + 1;
 648	top = call->acks_lost_top;
 649	if (before(bottom, top)) {
 650		for (seq = bottom; before_eq(seq, top); seq++) {
 651			int ix = seq & RXRPC_RXTX_BUFF_MASK;
 652			u8 annotation = call->rxtx_annotations[ix];
 653			u8 anno_type = annotation & RXRPC_TX_ANNO_MASK;
 654
 655			if (anno_type != RXRPC_TX_ANNO_UNACK)
 656				continue;
 657			annotation &= ~RXRPC_TX_ANNO_MASK;
 658			annotation |= RXRPC_TX_ANNO_RETRANS;
 659			call->rxtx_annotations[ix] = annotation;
 660			resend = true;
 661		}
 662	}
 663
 664	spin_unlock_bh(&call->lock);
 665
 666	if (resend && !test_and_set_bit(RXRPC_CALL_EV_RESEND, &call->events))
 667		rxrpc_queue_call(call);
 668}
 669
 670/*
 671 * Process a ping response.
 672 */
 673static void rxrpc_input_ping_response(struct rxrpc_call *call,
 674				      ktime_t resp_time,
 675				      rxrpc_serial_t orig_serial,
 676				      rxrpc_serial_t ack_serial)
 677{
 678	rxrpc_serial_t ping_serial;
 679	ktime_t ping_time;
 680
 681	ping_time = call->ping_time;
 682	smp_rmb();
 683	ping_serial = call->ping_serial;
 684
 685	if (orig_serial == call->acks_lost_ping)
 686		rxrpc_input_check_for_lost_ack(call);
 687
 688	if (!test_bit(RXRPC_CALL_PINGING, &call->flags) ||
 689	    before(orig_serial, ping_serial))
 690		return;
 691	clear_bit(RXRPC_CALL_PINGING, &call->flags);
 692	if (after(orig_serial, ping_serial))
 693		return;
 694
 695	rxrpc_peer_add_rtt(call, rxrpc_rtt_rx_ping_response,
 696			   orig_serial, ack_serial, ping_time, resp_time);
 697}
 698
 699/*
 700 * Process the extra information that may be appended to an ACK packet
 701 */
 702static void rxrpc_input_ackinfo(struct rxrpc_call *call, struct sk_buff *skb,
 703				struct rxrpc_ackinfo *ackinfo)
 704{
 705	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 706	struct rxrpc_peer *peer;
 707	unsigned int mtu;
 708	bool wake = false;
 709	u32 rwind = ntohl(ackinfo->rwind);
 710
 711	_proto("Rx ACK %%%u Info { rx=%u max=%u rwin=%u jm=%u }",
 712	       sp->hdr.serial,
 713	       ntohl(ackinfo->rxMTU), ntohl(ackinfo->maxMTU),
 714	       rwind, ntohl(ackinfo->jumbo_max));
 715
 716	if (call->tx_winsize != rwind) {
 717		if (rwind > RXRPC_RXTX_BUFF_SIZE - 1)
 718			rwind = RXRPC_RXTX_BUFF_SIZE - 1;
 719		if (rwind > call->tx_winsize)
 720			wake = true;
 721		trace_rxrpc_rx_rwind_change(call, sp->hdr.serial,
 722					    ntohl(ackinfo->rwind), wake);
 723		call->tx_winsize = rwind;
 724	}
 725
 726	if (call->cong_ssthresh > rwind)
 727		call->cong_ssthresh = rwind;
 728
 729	mtu = min(ntohl(ackinfo->rxMTU), ntohl(ackinfo->maxMTU));
 730
 731	peer = call->peer;
 732	if (mtu < peer->maxdata) {
 733		spin_lock_bh(&peer->lock);
 734		peer->maxdata = mtu;
 735		peer->mtu = mtu + peer->hdrsize;
 736		spin_unlock_bh(&peer->lock);
 737		_net("Net MTU %u (maxdata %u)", peer->mtu, peer->maxdata);
 738	}
 739
 740	if (wake)
 741		wake_up(&call->waitq);
 742}
 743
 744/*
 745 * Process individual soft ACKs.
 746 *
 747 * Each ACK in the array corresponds to one packet and can be either an ACK or
 748 * a NAK.  If we get find an explicitly NAK'd packet we resend immediately;
 749 * packets that lie beyond the end of the ACK list are scheduled for resend by
 750 * the timer on the basis that the peer might just not have processed them at
 751 * the time the ACK was sent.
 752 */
 753static void rxrpc_input_soft_acks(struct rxrpc_call *call, u8 *acks,
 754				  rxrpc_seq_t seq, int nr_acks,
 755				  struct rxrpc_ack_summary *summary)
 756{
 757	int ix;
 758	u8 annotation, anno_type;
 759
 760	for (; nr_acks > 0; nr_acks--, seq++) {
 761		ix = seq & RXRPC_RXTX_BUFF_MASK;
 762		annotation = call->rxtx_annotations[ix];
 763		anno_type = annotation & RXRPC_TX_ANNO_MASK;
 764		annotation &= ~RXRPC_TX_ANNO_MASK;
 765		switch (*acks++) {
 766		case RXRPC_ACK_TYPE_ACK:
 767			summary->nr_acks++;
 768			if (anno_type == RXRPC_TX_ANNO_ACK)
 769				continue;
 770			summary->nr_new_acks++;
 771			call->rxtx_annotations[ix] =
 772				RXRPC_TX_ANNO_ACK | annotation;
 773			break;
 774		case RXRPC_ACK_TYPE_NACK:
 775			if (!summary->nr_nacks &&
 776			    call->acks_lowest_nak != seq) {
 777				call->acks_lowest_nak = seq;
 778				summary->new_low_nack = true;
 779			}
 780			summary->nr_nacks++;
 781			if (anno_type == RXRPC_TX_ANNO_NAK)
 782				continue;
 783			summary->nr_new_nacks++;
 784			if (anno_type == RXRPC_TX_ANNO_RETRANS)
 785				continue;
 786			call->rxtx_annotations[ix] =
 787				RXRPC_TX_ANNO_NAK | annotation;
 788			break;
 789		default:
 790			return rxrpc_proto_abort("SFT", call, 0);
 791		}
 792	}
 793}
 794
 795/*
 796 * Process an ACK packet.
 797 *
 798 * ack.firstPacket is the sequence number of the first soft-ACK'd/NAK'd packet
 799 * in the ACK array.  Anything before that is hard-ACK'd and may be discarded.
 800 *
 801 * A hard-ACK means that a packet has been processed and may be discarded; a
 802 * soft-ACK means that the packet may be discarded and retransmission
 803 * requested.  A phase is complete when all packets are hard-ACK'd.
 804 */
 805static void rxrpc_input_ack(struct rxrpc_call *call, struct sk_buff *skb,
 806			    u16 skew)
 807{
 808	struct rxrpc_ack_summary summary = { 0 };
 809	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 810	union {
 811		struct rxrpc_ackpacket ack;
 812		struct rxrpc_ackinfo info;
 813		u8 acks[RXRPC_MAXACKS];
 814	} buf;
 815	rxrpc_serial_t acked_serial;
 816	rxrpc_seq_t first_soft_ack, hard_ack;
 817	int nr_acks, offset, ioffset;
 818
 819	_enter("");
 820
 821	offset = sizeof(struct rxrpc_wire_header);
 822	if (skb_copy_bits(skb, offset, &buf.ack, sizeof(buf.ack)) < 0) {
 823		_debug("extraction failure");
 824		return rxrpc_proto_abort("XAK", call, 0);
 825	}
 826	offset += sizeof(buf.ack);
 827
 828	acked_serial = ntohl(buf.ack.serial);
 829	first_soft_ack = ntohl(buf.ack.firstPacket);
 
 830	hard_ack = first_soft_ack - 1;
 831	nr_acks = buf.ack.nAcks;
 832	summary.ack_reason = (buf.ack.reason < RXRPC_ACK__INVALID ?
 833			      buf.ack.reason : RXRPC_ACK__INVALID);
 834
 835	trace_rxrpc_rx_ack(call, sp->hdr.serial, acked_serial,
 836			   first_soft_ack, ntohl(buf.ack.previousPacket),
 837			   summary.ack_reason, nr_acks);
 838
 839	if (buf.ack.reason == RXRPC_ACK_PING_RESPONSE)
 840		rxrpc_input_ping_response(call, skb->tstamp, acked_serial,
 841					  sp->hdr.serial);
 842	if (buf.ack.reason == RXRPC_ACK_REQUESTED)
 843		rxrpc_input_requested_ack(call, skb->tstamp, acked_serial,
 844					  sp->hdr.serial);
 845
 846	if (buf.ack.reason == RXRPC_ACK_PING) {
 847		_proto("Rx ACK %%%u PING Request", sp->hdr.serial);
 848		rxrpc_propose_ACK(call, RXRPC_ACK_PING_RESPONSE,
 849				  skew, sp->hdr.serial, true, true,
 850				  rxrpc_propose_ack_respond_to_ping);
 851	} else if (sp->hdr.flags & RXRPC_REQUEST_ACK) {
 852		rxrpc_propose_ACK(call, RXRPC_ACK_REQUESTED,
 853				  skew, sp->hdr.serial, true, true,
 854				  rxrpc_propose_ack_respond_to_ack);
 855	}
 856
 
 
 
 
 
 
 857	ioffset = offset + nr_acks + 3;
 858	if (skb->len >= ioffset + sizeof(buf.info)) {
 859		if (skb_copy_bits(skb, ioffset, &buf.info, sizeof(buf.info)) < 0)
 860			return rxrpc_proto_abort("XAI", call, 0);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 861		rxrpc_input_ackinfo(call, skb, &buf.info);
 
 
 
 
 862	}
 863
 864	if (first_soft_ack == 0)
 865		return rxrpc_proto_abort("AK0", call, 0);
 866
 867	/* Ignore ACKs unless we are or have just been transmitting. */
 868	switch (READ_ONCE(call->state)) {
 869	case RXRPC_CALL_CLIENT_SEND_REQUEST:
 870	case RXRPC_CALL_CLIENT_AWAIT_REPLY:
 871	case RXRPC_CALL_SERVER_SEND_REPLY:
 872	case RXRPC_CALL_SERVER_AWAIT_ACK:
 873		break;
 874	default:
 875		return;
 876	}
 877
 878	/* Discard any out-of-order or duplicate ACKs. */
 879	if (before_eq(sp->hdr.serial, call->acks_latest)) {
 880		_debug("discard ACK %d <= %d",
 881		       sp->hdr.serial, call->acks_latest);
 882		return;
 
 
 
 883	}
 884	call->acks_latest_ts = skb->tstamp;
 885	call->acks_latest = sp->hdr.serial;
 886
 887	if (before(hard_ack, call->tx_hard_ack) ||
 888	    after(hard_ack, call->tx_top))
 889		return rxrpc_proto_abort("AKW", call, 0);
 890	if (nr_acks > call->tx_top - hard_ack)
 891		return rxrpc_proto_abort("AKN", call, 0);
 892
 893	if (after(hard_ack, call->tx_hard_ack))
 894		rxrpc_rotate_tx_window(call, hard_ack, &summary);
 895
 896	if (nr_acks > 0) {
 897		if (skb_copy_bits(skb, offset, buf.acks, nr_acks) < 0)
 898			return rxrpc_proto_abort("XSA", call, 0);
 
 
 899		rxrpc_input_soft_acks(call, buf.acks, first_soft_ack, nr_acks,
 900				      &summary);
 901	}
 902
 903	if (test_bit(RXRPC_CALL_TX_LAST, &call->flags)) {
 904		rxrpc_end_tx_phase(call, false, "ETA");
 905		return;
 906	}
 907
 908	if (call->rxtx_annotations[call->tx_top & RXRPC_RXTX_BUFF_MASK] &
 909	    RXRPC_TX_ANNO_LAST &&
 910	    summary.nr_acks == call->tx_top - hard_ack &&
 911	    rxrpc_is_client_call(call))
 912		rxrpc_propose_ACK(call, RXRPC_ACK_PING, skew, sp->hdr.serial,
 913				  false, true,
 914				  rxrpc_propose_ack_ping_for_lost_reply);
 915
 916	return rxrpc_congestion_management(call, skb, &summary, acked_serial);
 
 
 917}
 918
 919/*
 920 * Process an ACKALL packet.
 921 */
 922static void rxrpc_input_ackall(struct rxrpc_call *call, struct sk_buff *skb)
 923{
 924	struct rxrpc_ack_summary summary = { 0 };
 925	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 926
 927	_proto("Rx ACKALL %%%u", sp->hdr.serial);
 928
 929	rxrpc_rotate_tx_window(call, call->tx_top, &summary);
 930	if (test_bit(RXRPC_CALL_TX_LAST, &call->flags))
 
 931		rxrpc_end_tx_phase(call, false, "ETL");
 
 
 932}
 933
 934/*
 935 * Process an ABORT packet directed at a call.
 936 */
 937static void rxrpc_input_abort(struct rxrpc_call *call, struct sk_buff *skb)
 938{
 939	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 940	__be32 wtmp;
 941	u32 abort_code = RX_CALL_DEAD;
 942
 943	_enter("");
 944
 945	if (skb->len >= 4 &&
 946	    skb_copy_bits(skb, sizeof(struct rxrpc_wire_header),
 947			  &wtmp, sizeof(wtmp)) >= 0)
 948		abort_code = ntohl(wtmp);
 949
 950	trace_rxrpc_rx_abort(call, sp->hdr.serial, abort_code);
 951
 952	_proto("Rx ABORT %%%u { %x }", sp->hdr.serial, abort_code);
 953
 954	if (rxrpc_set_call_completion(call, RXRPC_CALL_REMOTELY_ABORTED,
 955				      abort_code, -ECONNABORTED))
 956		rxrpc_notify_socket(call);
 957}
 958
 959/*
 960 * Process an incoming call packet.
 961 */
 962static void rxrpc_input_call_packet(struct rxrpc_call *call,
 963				    struct sk_buff *skb, u16 skew)
 964{
 965	struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
 966	unsigned long timo;
 967
 968	_enter("%p,%p", call, skb);
 969
 970	timo = READ_ONCE(call->next_rx_timo);
 971	if (timo) {
 972		unsigned long now = jiffies, expect_rx_by;
 973
 974		expect_rx_by = now + timo;
 975		WRITE_ONCE(call->expect_rx_by, expect_rx_by);
 976		rxrpc_reduce_call_timer(call, expect_rx_by, now,
 977					rxrpc_timer_set_for_normal);
 978	}
 979
 980	switch (sp->hdr.type) {
 981	case RXRPC_PACKET_TYPE_DATA:
 982		rxrpc_input_data(call, skb, skew);
 983		break;
 984
 985	case RXRPC_PACKET_TYPE_ACK:
 986		rxrpc_input_ack(call, skb, skew);
 987		break;
 988
 989	case RXRPC_PACKET_TYPE_BUSY:
 990		_proto("Rx BUSY %%%u", sp->hdr.serial);
 991
 992		/* Just ignore BUSY packets from the server; the retry and
 993		 * lifespan timers will take care of business.  BUSY packets
 994		 * from the client don't make sense.
 995		 */
 996		break;
 997
 998	case RXRPC_PACKET_TYPE_ABORT:
 999		rxrpc_input_abort(call, skb);
1000		break;
1001
1002	case RXRPC_PACKET_TYPE_ACKALL:
1003		rxrpc_input_ackall(call, skb);
1004		break;
1005
1006	default:
1007		break;
1008	}
1009
 
 
1010	_leave("");
1011}
1012
1013/*
1014 * Handle a new call on a channel implicitly completing the preceding call on
1015 * that channel.
1016 *
1017 * TODO: If callNumber > call_id + 1, renegotiate security.
1018 */
1019static void rxrpc_input_implicit_end_call(struct rxrpc_connection *conn,
 
1020					  struct rxrpc_call *call)
1021{
1022	switch (READ_ONCE(call->state)) {
1023	case RXRPC_CALL_SERVER_AWAIT_ACK:
1024		rxrpc_call_completed(call);
1025		break;
1026	case RXRPC_CALL_COMPLETE:
1027		break;
1028	default:
1029		if (rxrpc_abort_call("IMP", call, 0, RX_CALL_DEAD, -ESHUTDOWN)) {
1030			set_bit(RXRPC_CALL_EV_ABORT, &call->events);
1031			rxrpc_queue_call(call);
1032		}
 
1033		break;
1034	}
1035
1036	trace_rxrpc_improper_term(call);
1037	__rxrpc_disconnect_call(conn, call);
 
1038	rxrpc_notify_socket(call);
1039}
1040
1041/*
1042 * post connection-level events to the connection
1043 * - this includes challenges, responses, some aborts and call terminal packet
1044 *   retransmission.
1045 */
1046static void rxrpc_post_packet_to_conn(struct rxrpc_connection *conn,
1047				      struct sk_buff *skb)
1048{
1049	_enter("%p,%p", conn, skb);
1050
1051	skb_queue_tail(&conn->rx_queue, skb);
1052	rxrpc_queue_conn(conn);
1053}
1054
1055/*
1056 * post endpoint-level events to the local endpoint
1057 * - this includes debug and version messages
1058 */
1059static void rxrpc_post_packet_to_local(struct rxrpc_local *local,
1060				       struct sk_buff *skb)
1061{
1062	_enter("%p,%p", local, skb);
1063
1064	skb_queue_tail(&local->event_queue, skb);
1065	rxrpc_queue_local(local);
 
 
 
 
1066}
1067
1068/*
1069 * put a packet up for transport-level abort
1070 */
1071static void rxrpc_reject_packet(struct rxrpc_local *local, struct sk_buff *skb)
1072{
1073	CHECK_SLAB_OKAY(&local->usage);
1074
1075	skb_queue_tail(&local->reject_queue, skb);
1076	rxrpc_queue_local(local);
 
 
 
 
1077}
1078
1079/*
1080 * Extract the wire header from a packet and translate the byte order.
1081 */
1082static noinline
1083int rxrpc_extract_header(struct rxrpc_skb_priv *sp, struct sk_buff *skb)
1084{
1085	struct rxrpc_wire_header whdr;
1086
1087	/* dig out the RxRPC connection details */
1088	if (skb_copy_bits(skb, 0, &whdr, sizeof(whdr)) < 0) {
1089		trace_rxrpc_rx_eproto(NULL, sp->hdr.serial,
1090				      tracepoint_string("bad_hdr"));
1091		return -EBADMSG;
1092	}
1093
1094	memset(sp, 0, sizeof(*sp));
1095	sp->hdr.epoch		= ntohl(whdr.epoch);
1096	sp->hdr.cid		= ntohl(whdr.cid);
1097	sp->hdr.callNumber	= ntohl(whdr.callNumber);
1098	sp->hdr.seq		= ntohl(whdr.seq);
1099	sp->hdr.serial		= ntohl(whdr.serial);
1100	sp->hdr.flags		= whdr.flags;
1101	sp->hdr.type		= whdr.type;
1102	sp->hdr.userStatus	= whdr.userStatus;
1103	sp->hdr.securityIndex	= whdr.securityIndex;
1104	sp->hdr._rsvd		= ntohs(whdr._rsvd);
1105	sp->hdr.serviceId	= ntohs(whdr.serviceId);
1106	return 0;
1107}
1108
1109/*
1110 * handle data received on the local endpoint
1111 * - may be called in interrupt context
1112 *
1113 * The socket is locked by the caller and this prevents the socket from being
1114 * shut down and the local endpoint from going away, thus sk_user_data will not
1115 * be cleared until this function returns.
 
 
1116 */
1117void rxrpc_data_ready(struct sock *udp_sk)
1118{
 
1119	struct rxrpc_connection *conn;
1120	struct rxrpc_channel *chan;
1121	struct rxrpc_call *call;
1122	struct rxrpc_skb_priv *sp;
1123	struct rxrpc_local *local = udp_sk->sk_user_data;
1124	struct sk_buff *skb;
1125	unsigned int channel;
1126	int ret, skew;
1127
1128	_enter("%p", udp_sk);
1129
1130	ASSERT(!irqs_disabled());
1131
1132	skb = skb_recv_udp(udp_sk, 0, 1, &ret);
1133	if (!skb) {
1134		if (ret == -EAGAIN)
1135			return;
1136		_debug("UDP socket error %d", ret);
1137		return;
1138	}
 
 
1139
1140	rxrpc_new_skb(skb, rxrpc_skb_rx_received);
1141
1142	_net("recv skb %p", skb);
1143
1144	/* we'll probably need to checksum it (didn't call sock_recvmsg) */
1145	if (skb_checksum_complete(skb)) {
1146		rxrpc_free_skb(skb, rxrpc_skb_rx_freed);
1147		__UDP_INC_STATS(&init_net, UDP_MIB_INERRORS, 0);
1148		_leave(" [CSUM failed]");
1149		return;
1150	}
1151
1152	__UDP_INC_STATS(&init_net, UDP_MIB_INDATAGRAMS, 0);
1153
1154	/* The UDP protocol already released all skb resources;
1155	 * we are free to add our own data there.
1156	 */
1157	sp = rxrpc_skb(skb);
1158
1159	/* dig out the RxRPC connection details */
1160	if (rxrpc_extract_header(sp, skb) < 0)
1161		goto bad_message;
1162
1163	if (IS_ENABLED(CONFIG_AF_RXRPC_INJECT_LOSS)) {
1164		static int lose;
1165		if ((lose++ & 7) == 7) {
1166			trace_rxrpc_rx_lose(sp);
1167			rxrpc_lose_skb(skb, rxrpc_skb_rx_lost);
1168			return;
1169		}
1170	}
1171
 
 
1172	trace_rxrpc_rx_packet(sp);
1173
1174	_net("Rx RxRPC %s ep=%x call=%x:%x",
1175	     sp->hdr.flags & RXRPC_CLIENT_INITIATED ? "ToServer" : "ToClient",
1176	     sp->hdr.epoch, sp->hdr.cid, sp->hdr.callNumber);
1177
1178	if (sp->hdr.type >= RXRPC_N_PACKET_TYPES ||
1179	    !((RXRPC_SUPPORTED_PACKET_TYPES >> sp->hdr.type) & 1)) {
1180		_proto("Rx Bad Packet Type %u", sp->hdr.type);
1181		goto bad_message;
1182	}
1183
1184	switch (sp->hdr.type) {
1185	case RXRPC_PACKET_TYPE_VERSION:
1186		if (!(sp->hdr.flags & RXRPC_CLIENT_INITIATED))
1187			goto discard;
1188		rxrpc_post_packet_to_local(local, skb);
1189		goto out;
1190
1191	case RXRPC_PACKET_TYPE_BUSY:
1192		if (sp->hdr.flags & RXRPC_CLIENT_INITIATED)
1193			goto discard;
1194		/* Fall through */
 
 
 
 
 
 
 
1195
1196	case RXRPC_PACKET_TYPE_DATA:
1197		if (sp->hdr.callNumber == 0)
 
1198			goto bad_message;
1199		if (sp->hdr.flags & RXRPC_JUMBO_PACKET &&
1200		    !rxrpc_validate_jumbo(skb))
1201			goto bad_message;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1202		break;
1203
1204		/* Packet types 9-11 should just be ignored. */
1205	case RXRPC_PACKET_TYPE_PARAMS:
1206	case RXRPC_PACKET_TYPE_10:
1207	case RXRPC_PACKET_TYPE_11:
1208		goto discard;
 
 
 
 
1209	}
1210
1211	rcu_read_lock();
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1212
1213	conn = rxrpc_find_connection_rcu(local, skb);
1214	if (conn) {
1215		if (sp->hdr.securityIndex != conn->security_ix)
1216			goto wrong_security;
1217
1218		if (sp->hdr.serviceId != conn->service_id) {
1219			if (!test_bit(RXRPC_CONN_PROBING_FOR_UPGRADE, &conn->flags) ||
1220			    conn->service_id != conn->params.service_id)
 
 
 
 
 
 
 
1221				goto reupgrade;
1222			conn->service_id = sp->hdr.serviceId;
1223		}
1224
1225		if (sp->hdr.callNumber == 0) {
1226			/* Connection-level packet */
1227			_debug("CONN %p {%d}", conn, conn->debug_id);
1228			rxrpc_post_packet_to_conn(conn, skb);
1229			goto out_unlock;
1230		}
1231
1232		/* Note the serial number skew here */
1233		skew = (int)sp->hdr.serial - (int)conn->hi_serial;
1234		if (skew >= 0) {
1235			if (skew > 0)
1236				conn->hi_serial = sp->hdr.serial;
1237		} else {
1238			skew = -skew;
1239			skew = min(skew, 65535);
1240		}
1241
1242		/* Call-bound packets are routed by connection channel. */
1243		channel = sp->hdr.cid & RXRPC_CHANNELMASK;
1244		chan = &conn->channels[channel];
1245
1246		/* Ignore really old calls */
1247		if (sp->hdr.callNumber < chan->last_call)
1248			goto discard_unlock;
1249
1250		if (sp->hdr.callNumber == chan->last_call) {
1251			if (chan->call ||
1252			    sp->hdr.type == RXRPC_PACKET_TYPE_ABORT)
1253				goto discard_unlock;
1254
1255			/* For the previous service call, if completed
1256			 * successfully, we discard all further packets.
1257			 */
1258			if (rxrpc_conn_is_service(conn) &&
1259			    chan->last_type == RXRPC_PACKET_TYPE_ACK)
1260				goto discard_unlock;
1261
1262			/* But otherwise we need to retransmit the final packet
1263			 * from data cached in the connection record.
1264			 */
 
 
 
 
 
1265			rxrpc_post_packet_to_conn(conn, skb);
1266			goto out_unlock;
1267		}
1268
1269		call = rcu_dereference(chan->call);
1270
1271		if (sp->hdr.callNumber > chan->call_id) {
1272			if (!(sp->hdr.flags & RXRPC_CLIENT_INITIATED)) {
1273				rcu_read_unlock();
1274				goto reject_packet;
1275			}
1276			if (call)
1277				rxrpc_input_implicit_end_call(conn, call);
1278			call = NULL;
1279		}
1280
1281		if (call && sp->hdr.serviceId != call->service_id)
1282			call->service_id = sp->hdr.serviceId;
1283	} else {
1284		skew = 0;
1285		call = NULL;
 
 
 
1286	}
1287
1288	if (!call || atomic_read(&call->usage) == 0) {
1289		if (!(sp->hdr.type & RXRPC_CLIENT_INITIATED) ||
1290		    sp->hdr.callNumber == 0 ||
1291		    sp->hdr.type != RXRPC_PACKET_TYPE_DATA)
1292			goto bad_message_unlock;
1293		if (sp->hdr.seq != 1)
1294			goto discard_unlock;
1295		call = rxrpc_new_incoming_call(local, conn, skb);
1296		if (!call) {
1297			rcu_read_unlock();
1298			goto reject_packet;
1299		}
1300		rxrpc_send_ping(call, skb, skew);
1301		mutex_unlock(&call->user_mutex);
1302	}
1303
1304	rxrpc_input_call_packet(call, skb, skew);
1305	goto discard_unlock;
 
 
 
1306
1307discard_unlock:
1308	rcu_read_unlock();
1309discard:
1310	rxrpc_free_skb(skb, rxrpc_skb_rx_freed);
1311out:
1312	trace_rxrpc_rx_done(0, 0);
1313	return;
1314
1315out_unlock:
1316	rcu_read_unlock();
1317	goto out;
1318
1319wrong_security:
1320	rcu_read_unlock();
1321	trace_rxrpc_abort(0, "SEC", sp->hdr.cid, sp->hdr.callNumber, sp->hdr.seq,
1322			  RXKADINCONSISTENCY, EBADMSG);
1323	skb->priority = RXKADINCONSISTENCY;
1324	goto post_abort;
1325
 
 
 
 
 
 
1326reupgrade:
1327	rcu_read_unlock();
1328	trace_rxrpc_abort(0, "UPG", sp->hdr.cid, sp->hdr.callNumber, sp->hdr.seq,
1329			  RX_PROTOCOL_ERROR, EBADMSG);
1330	goto protocol_error;
1331
1332bad_message_unlock:
1333	rcu_read_unlock();
1334bad_message:
1335	trace_rxrpc_abort(0, "BAD", sp->hdr.cid, sp->hdr.callNumber, sp->hdr.seq,
1336			  RX_PROTOCOL_ERROR, EBADMSG);
1337protocol_error:
1338	skb->priority = RX_PROTOCOL_ERROR;
1339post_abort:
1340	skb->mark = RXRPC_SKB_MARK_LOCAL_ABORT;
1341reject_packet:
1342	trace_rxrpc_rx_done(skb->mark, skb->priority);
1343	rxrpc_reject_packet(local, skb);
1344	_leave(" [badmsg]");
 
1345}