ccid3.c 36.3 KB
Newer Older
1 2 3 4
/*
 *  net/dccp/ccids/ccid3.c
 *
 *  Copyright (c) 2005 The University of Waikato, Hamilton, New Zealand.
5
 *  Copyright (c) 2005-6 Ian McDonald <ian.mcdonald@jandi.co.nz>
6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38
 *
 *  An implementation of the DCCP protocol
 *
 *  This code has been developed by the University of Waikato WAND
 *  research group. For further information please see http://www.wand.net.nz/
 *
 *  This code also uses code from Lulea University, rereleased as GPL by its
 *  authors:
 *  Copyright (c) 2003 Nils-Erik Mattsson, Joacim Haggmark, Magnus Erixzon
 *
 *  Changes to meet Linux coding standards, to make it meet latest ccid3 draft
 *  and to make it work as a loadable module in the DCCP stack written by
 *  Arnaldo Carvalho de Melo <acme@conectiva.com.br>.
 *
 *  Copyright (c) 2005 Arnaldo Carvalho de Melo <acme@conectiva.com.br>
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; either version 2 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to the Free Software
 *  Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */

#include "../ccid.h"
#include "../dccp.h"
39
#include "lib/packet_history.h"
40
#include "lib/loss_interval.h"
41
#include "lib/tfrc.h"
42 43
#include "ccid3.h"

44
/*
45 46
 * Reason for maths here is to avoid 32 bit overflow when a is big.
 * With this we get close to the limit.
47
 */
48
static u32 usecs_div(const u32 a, const u32 b)
49
{
50 51 52 53 54 55 56 57 58 59 60
	const u32 div = a < (UINT_MAX / (USEC_PER_SEC /    10)) ?    10 :
			a < (UINT_MAX / (USEC_PER_SEC /    50)) ?    50 :
			a < (UINT_MAX / (USEC_PER_SEC /   100)) ?   100 :
			a < (UINT_MAX / (USEC_PER_SEC /   500)) ?   500 :
			a < (UINT_MAX / (USEC_PER_SEC /  1000)) ?  1000 :
			a < (UINT_MAX / (USEC_PER_SEC /  5000)) ?  5000 :
			a < (UINT_MAX / (USEC_PER_SEC / 10000)) ? 10000 :
			a < (UINT_MAX / (USEC_PER_SEC / 50000)) ? 50000 :
								 100000;
	const u32 tmp = a * (USEC_PER_SEC / div);
	return (b >= 2 * div) ? tmp / (b / div) : tmp;
61 62
}

63

64 65 66 67

#ifdef CONFIG_IP_DCCP_CCID3_DEBUG
static int ccid3_debug;
#define ccid3_pr_debug(format, a...)	DCCP_PR_DEBUG(ccid3_debug, format, ##a)
68 69 70 71
#else
#define ccid3_pr_debug(format, a...)
#endif

72 73
static struct dccp_tx_hist *ccid3_tx_hist;
static struct dccp_rx_hist *ccid3_rx_hist;
74
static struct dccp_li_hist *ccid3_li_hist;
75

76
#ifdef CONFIG_IP_DCCP_CCID3_DEBUG
77 78 79 80 81 82 83 84 85 86 87 88 89
static const char *ccid3_tx_state_name(enum ccid3_hc_tx_states state)
{
	static char *ccid3_state_names[] = {
	[TFRC_SSTATE_NO_SENT]  = "NO_SENT",
	[TFRC_SSTATE_NO_FBACK] = "NO_FBACK",
	[TFRC_SSTATE_FBACK]    = "FBACK",
	[TFRC_SSTATE_TERM]     = "TERM",
	};

	return ccid3_state_names[state];
}
#endif

90 91
static void ccid3_hc_tx_set_state(struct sock *sk,
				  enum ccid3_hc_tx_states state)
92
{
93
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
94 95 96
	enum ccid3_hc_tx_states oldstate = hctx->ccid3hctx_state;

	ccid3_pr_debug("%s(%p) %-8.8s -> %s\n",
97 98
		       dccp_role(sk), sk, ccid3_tx_state_name(oldstate),
		       ccid3_tx_state_name(state));
99 100 101 102
	WARN_ON(state == oldstate);
	hctx->ccid3hctx_state = state;
}

103 104 105 106 107
/*
 * Recalculate scheduled nominal send time t_nom, inter-packet interval
 * t_ipi, and delta value. Should be called after each change to X.
 */
static inline void ccid3_update_send_time(struct ccid3_hc_tx_sock *hctx)
108
{
109 110 111
	timeval_sub_usecs(&hctx->ccid3hctx_t_nom, hctx->ccid3hctx_t_ipi);

	/* Calculate new t_ipi (inter packet interval) by t_ipi = s / X_inst */
112
	hctx->ccid3hctx_t_ipi = usecs_div(hctx->ccid3hctx_s, hctx->ccid3hctx_x);
113

114 115 116 117
	/* Update nominal send time with regard to the new t_ipi */
	timeval_add_usecs(&hctx->ccid3hctx_t_nom, hctx->ccid3hctx_t_ipi);

	/* Calculate new delta by delta = min(t_ipi / 2, t_gran / 2) */
118 119
	hctx->ccid3hctx_delta = min_t(u32, hctx->ccid3hctx_t_ipi / 2,
					   TFRC_OPSYS_HALF_TIME_GRAN);
120 121 122 123 124 125 126 127 128 129 130
}
/*
 * Update X by
 *    If (p > 0)
 *       x_calc = calcX(s, R, p);
 *       X = max(min(X_calc, 2 * X_recv), s / t_mbi);
 *    Else
 *       If (now - tld >= R)
 *          X = max(min(2 * X, 2 * X_recv), s / R);
 *          tld = now;
 */ 
131 132
static void ccid3_hc_tx_update_x(struct sock *sk, struct timeval *now)

133
{
134
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
135
	const __u32 old_x = hctx->ccid3hctx_x;
136

137 138
	/* To avoid large error in calcX */
	if (hctx->ccid3hctx_p >= TFRC_SMALLEST_P) {
139 140 141
		hctx->ccid3hctx_x_calc = tfrc_calc_x(hctx->ccid3hctx_s,
						     hctx->ccid3hctx_rtt,
						     hctx->ccid3hctx_p);
142 143 144 145 146 147 148 149 150 151 152 153 154
		hctx->ccid3hctx_x = max_t(u32, min(hctx->ccid3hctx_x_calc,
						   hctx->ccid3hctx_x_recv * 2),
					       hctx->ccid3hctx_s / TFRC_T_MBI);

	} else if (timeval_delta(now, &hctx->ccid3hctx_t_ld) >=
							  hctx->ccid3hctx_rtt) {
		hctx->ccid3hctx_x = max(min(hctx->ccid3hctx_x_recv,
					    hctx->ccid3hctx_x      ) * 2,
					usecs_div(hctx->ccid3hctx_s,
					       	  hctx->ccid3hctx_rtt)   );
		hctx->ccid3hctx_t_ld = *now;
	} else
		ccid3_pr_debug("Not changing X\n");
155

156 157
	if (hctx->ccid3hctx_x != old_x)
		ccid3_update_send_time(hctx);
158 159
}

160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178
/*
 * 	Track the mean packet size `s' (cf. RFC 4342, 5.3 and  RFC 3448, 4.1)
 * 	@len: DCCP packet payload size in bytes
 */
static inline void ccid3_hc_tx_update_s(struct ccid3_hc_tx_sock *hctx, int len)
{
	if (unlikely(len == 0))
		ccid3_pr_debug("Packet payload length is 0 - not updating\n");
	else
		hctx->ccid3hctx_s = hctx->ccid3hctx_s == 0 ? len :
				    (9 * hctx->ccid3hctx_s + len) / 10;
	/*
	 * Note: We could do a potential optimisation here - when `s' changes,
	 *	 recalculate sending rate and consequently t_ipi, t_delta, and
	 *	 t_now. This is however non-standard, and the benefits are not
	 *	 clear, so it is currently left out.
	 */
}

179 180 181
static void ccid3_hc_tx_no_feedback_timer(unsigned long data)
{
	struct sock *sk = (struct sock *)data;
182
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
183
	unsigned long t_nfb = USEC_PER_SEC / 5;
184 185 186 187 188

	bh_lock_sock(sk);
	if (sock_owned_by_user(sk)) {
		/* Try again later. */
		/* XXX: set some sensible MIB */
189
		goto restart_timer;
190 191 192 193 194 195 196
	}

	ccid3_pr_debug("%s, sk=%p, state=%s\n", dccp_role(sk), sk,
		       ccid3_tx_state_name(hctx->ccid3hctx_state));
	
	switch (hctx->ccid3hctx_state) {
	case TFRC_SSTATE_NO_FBACK:
197 198 199
		/* RFC 3448, 4.4: Halve send rate directly */
		hctx->ccid3hctx_x = min_t(u32, hctx->ccid3hctx_x / 2,
					       hctx->ccid3hctx_s / TFRC_T_MBI);
200

201 202 203 204
		ccid3_pr_debug("%s, sk=%p, state=%s, updated tx rate to %d "
			       "bytes/s\n",
			       dccp_role(sk), sk,
			       ccid3_tx_state_name(hctx->ccid3hctx_state),
205
			       hctx->ccid3hctx_x);
206 207
		/* The value of R is still undefined and so we can not recompute
		 * the timout value. Keep initial value as per [RFC 4342, 5]. */
208
		t_nfb = TFRC_INITIAL_TIMEOUT;
209
		ccid3_update_send_time(hctx);
210 211
		break;
	case TFRC_SSTATE_FBACK:
212 213 214 215 216
		/*
		 * Check if IDLE since last timeout and recv rate is less than
		 * 4 packets per RTT
		 */
		if (!hctx->ccid3hctx_idle ||
217 218
		    (hctx->ccid3hctx_x_recv >=
		     4 * usecs_div(hctx->ccid3hctx_s, hctx->ccid3hctx_rtt))) {
219 220
			struct timeval now;

221 222
			ccid3_pr_debug("%s, sk=%p, state=%s, not idle\n",
				       dccp_role(sk), sk,
223 224 225 226 227 228 229 230
				       ccid3_tx_state_name(hctx->ccid3hctx_state));
			/* Halve sending rate */

			/*  If (X_calc > 2 * X_recv)
			 *    X_recv = max(X_recv / 2, s / (2 * t_mbi));
			 *  Else
			 *    X_recv = X_calc / 4;
			 */
231 232
			BUG_ON(hctx->ccid3hctx_p >= TFRC_SMALLEST_P &&
			       hctx->ccid3hctx_x_calc == 0);
233 234 235 236 237

			/* check also if p is zero -> x_calc is infinity? */
			if (hctx->ccid3hctx_p < TFRC_SMALLEST_P ||
			    hctx->ccid3hctx_x_calc > 2 * hctx->ccid3hctx_x_recv)
				hctx->ccid3hctx_x_recv = max_t(u32, hctx->ccid3hctx_x_recv / 2,
238
								    hctx->ccid3hctx_s / (2 * TFRC_T_MBI));
239 240 241 242
			else
				hctx->ccid3hctx_x_recv = hctx->ccid3hctx_x_calc / 4;

			/* Update sending rate */
243 244
			dccp_timestamp(sk, &now);
			ccid3_hc_tx_update_x(sk, &now);
245
		}
246 247
		/*
		 * Schedule no feedback timer to expire in
248
		 * max(4 * R, 2 * s/X)  =  max(4 * R, 2 * t_ipi)
249
		 */
250
		t_nfb = max(4 * hctx->ccid3hctx_rtt, 2 * hctx->ccid3hctx_t_ipi);
251
		break;
252 253 254 255
	case TFRC_SSTATE_NO_SENT:
		DCCP_BUG("Illegal %s state NO_SENT, sk=%p", dccp_role(sk), sk);
		/* fall through */
	case TFRC_SSTATE_TERM:
256 257 258 259
		goto out;
	}

	hctx->ccid3hctx_idle = 1;
260 261 262

restart_timer:
	sk_reset_timer(sk, &hctx->ccid3hctx_no_feedback_timer,
263
		           jiffies + usecs_to_jiffies(t_nfb));
264 265 266 267 268
out:
	bh_unlock_sock(sk);
	sock_put(sk);
}

269 270 271 272 273 274
/*
 * returns
 *   > 0: delay (in msecs) that should pass before actually sending
 *   = 0: can send immediately
 *   < 0: error condition; do not send packet
 */
275 276
static int ccid3_hc_tx_send_packet(struct sock *sk,
				   struct sk_buff *skb, int len)
277 278
{
	struct dccp_sock *dp = dccp_sk(sk);
279
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
280
	struct dccp_tx_hist_entry *new_packet;
281
	struct timeval now;
282
	long delay;
283

284
	BUG_ON(hctx == NULL);
285

286
	/*
287 288 289
	 * This function is called only for Data and DataAck packets. Sending
	 * zero-sized Data(Ack)s is theoretically possible, but for congestion
	 * control this case is pathological - ignore it.
290
	 */
291
	if (unlikely(len == 0))
292
		return -EBADMSG;
293 294

	/* See if last packet allocated was not sent */
295 296
	new_packet = dccp_tx_hist_head(&hctx->ccid3hctx_hist);
	if (new_packet == NULL || new_packet->dccphtx_sent) {
297 298
		new_packet = dccp_tx_hist_entry_new(ccid3_tx_hist,
						    SLAB_ATOMIC);
299

300
		if (unlikely(new_packet == NULL)) {
301 302
			DCCP_WARN("%s, sk=%p, not enough mem to add to history,"
				  "send refused\n", dccp_role(sk), sk);
303
			return -ENOBUFS;
304 305
		}

306
		dccp_tx_hist_add_entry(&hctx->ccid3hctx_hist, new_packet);
307 308
	}

309
	dccp_timestamp(sk, &now);
310 311 312

	switch (hctx->ccid3hctx_state) {
	case TFRC_SSTATE_NO_SENT:
313 314
		sk_reset_timer(sk, &hctx->ccid3hctx_no_feedback_timer,
			       jiffies + usecs_to_jiffies(TFRC_INITIAL_TIMEOUT));
315 316 317 318
		hctx->ccid3hctx_last_win_count	 = 0;
		hctx->ccid3hctx_t_last_win_count = now;
		ccid3_hc_tx_set_state(sk, TFRC_SSTATE_NO_FBACK);

319 320 321 322
		/* Set initial sending rate to 1 packet per second */
		ccid3_hc_tx_update_s(hctx, len);
		hctx->ccid3hctx_x     = hctx->ccid3hctx_s;

323 324 325 326 327 328
		/* First timeout, according to [RFC 3448, 4.2], is 1 second */
		hctx->ccid3hctx_t_ipi = USEC_PER_SEC;
		/* Initial delta: minimum of 0.5 sec and t_gran/2 */
		hctx->ccid3hctx_delta = TFRC_OPSYS_HALF_TIME_GRAN;

		/* Set t_0 for initial packet */
329 330 331 332
		hctx->ccid3hctx_t_nom = now;
		break;
	case TFRC_SSTATE_NO_FBACK:
	case TFRC_SSTATE_FBACK:
333 334 335 336 337 338 339 340 341
		delay = timeval_delta(&hctx->ccid3hctx_t_nom, &now);
		/*
		 * 	Scheduling of packet transmissions [RFC 3448, 4.6]
		 *
		 * if (t_now > t_nom - delta)
		 *       // send the packet now
		 * else
		 *       // send the packet in (t_nom - t_now) milliseconds.
		 */
342 343
		if (delay >= hctx->ccid3hctx_delta)
			return delay / 1000L;
344
		break;
345 346
	case TFRC_SSTATE_TERM:
		DCCP_BUG("Illegal %s state TERM, sk=%p", dccp_role(sk), sk);
347
		return -EINVAL;
348 349
	}

350 351 352 353 354 355 356
	/* prepare to send now (add options etc.) */
	dp->dccps_hc_tx_insert_options = 1;
	new_packet->dccphtx_ccval = DCCP_SKB_CB(skb)->dccpd_ccval =
				    hctx->ccid3hctx_last_win_count;
	timeval_add_usecs(&hctx->ccid3hctx_t_nom, hctx->ccid3hctx_t_ipi);

	return 0;
357 358 359 360
}

static void ccid3_hc_tx_packet_sent(struct sock *sk, int more, int len)
{
361 362
	const struct dccp_sock *dp = dccp_sk(sk);
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
363 364
	struct timeval now;

365
	BUG_ON(hctx == NULL);
366

367
	dccp_timestamp(sk, &now);
368 369 370 371

	/* check if we have sent a data packet */
	if (len > 0) {
		unsigned long quarter_rtt;
372
		struct dccp_tx_hist_entry *packet;
373

374 375
		ccid3_hc_tx_update_s(hctx, len);

376
		packet = dccp_tx_hist_head(&hctx->ccid3hctx_hist);
377
		if (unlikely(packet == NULL)) {
378
			DCCP_WARN("packet doesn't exist in history!\n");
379 380
			return;
		}
381
		if (unlikely(packet->dccphtx_sent)) {
382
			DCCP_WARN("no unsent packet in history!\n");
383 384
			return;
		}
385 386
		packet->dccphtx_tstamp = now;
		packet->dccphtx_seqno  = dp->dccps_gss;
387
		/*
388
		 * Check if win_count have changed
389
		 * Algorithm in "8.1. Window Counter Value" in RFC 4342.
390
		 */
391 392 393 394
		quarter_rtt = timeval_delta(&now, &hctx->ccid3hctx_t_last_win_count);
		if (likely(hctx->ccid3hctx_rtt > 8))
			quarter_rtt /= hctx->ccid3hctx_rtt / 4;

395 396 397 398
		if (quarter_rtt > 0) {
			hctx->ccid3hctx_t_last_win_count = now;
			hctx->ccid3hctx_last_win_count	 = (hctx->ccid3hctx_last_win_count +
							    min_t(unsigned long, quarter_rtt, 5)) % 16;
399 400
			ccid3_pr_debug("%s, sk=%p, window changed from "
				       "%u to %u!\n",
401
				       dccp_role(sk), sk,
402
				       packet->dccphtx_ccval,
403 404
				       hctx->ccid3hctx_last_win_count);
		}
405

406
		hctx->ccid3hctx_idle = 0;
407
		packet->dccphtx_rtt  = hctx->ccid3hctx_rtt;
408
		packet->dccphtx_sent = 1;
409 410 411 412 413 414 415
	} else
		ccid3_pr_debug("%s, sk=%p, seqno=%llu NOT inserted!\n",
			       dccp_role(sk), sk, dp->dccps_gss);
}

static void ccid3_hc_tx_packet_recv(struct sock *sk, struct sk_buff *skb)
{
416 417
	const struct dccp_sock *dp = dccp_sk(sk);
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
418
	struct ccid3_options_received *opt_recv;
419
	struct dccp_tx_hist_entry *packet;
420
	struct timeval now;
421
	unsigned long t_nfb;
I
Ian McDonald 已提交
422
	u32 t_elapsed;
423 424 425
	u32 pinv;
	u32 x_recv;
	u32 r_sample;
426

427
	BUG_ON(hctx == NULL);
428 429 430 431 432 433 434 435

	/* we are only interested in ACKs */
	if (!(DCCP_SKB_CB(skb)->dccpd_type == DCCP_PKT_ACK ||
	      DCCP_SKB_CB(skb)->dccpd_type == DCCP_PKT_DATAACK))
		return;

	opt_recv = &hctx->ccid3hctx_options_received;

436
	t_elapsed = dp->dccps_options_received.dccpor_elapsed_time * 10;
437 438 439 440 441 442 443 444 445
	x_recv = opt_recv->ccid3or_receive_rate;
	pinv = opt_recv->ccid3or_loss_event_rate;

	switch (hctx->ccid3hctx_state) {
	case TFRC_SSTATE_NO_FBACK:
	case TFRC_SSTATE_FBACK:
		/* Calculate new round trip sample by
		 * R_sample = (now - t_recvdata) - t_delay */
		/* get t_recvdata from history */
446 447
		packet = dccp_tx_hist_find_entry(&hctx->ccid3hctx_hist,
						 DCCP_SKB_CB(skb)->dccpd_ack_seq);
448
		if (unlikely(packet == NULL)) {
449 450
			DCCP_WARN("%s, sk=%p, seqno %llu(%s) does't exist "
				  "in history!\n",  dccp_role(sk), sk,
451
			    (unsigned long long)DCCP_SKB_CB(skb)->dccpd_ack_seq,
452
				  dccp_packet_name(DCCP_SKB_CB(skb)->dccpd_type));
453 454 455 456
			return;
		}

		/* Update RTT */
457 458
		dccp_timestamp(sk, &now);
		r_sample = timeval_delta(&now, &packet->dccphtx_tstamp);
459
		if (unlikely(r_sample <= t_elapsed))
460 461
			DCCP_WARN("r_sample=%uus,t_elapsed=%uus\n",
				  r_sample, t_elapsed);
462 463
		else
			r_sample -= t_elapsed;
464 465 466 467 468 469 470 471 472 473

		/* Update RTT estimate by 
		 * If (No feedback recv)
		 *    R = R_sample;
		 * Else
		 *    R = q * R + (1 - q) * R_sample;
		 *
		 * q is a constant, RFC 3448 recomments 0.9
		 */
		if (hctx->ccid3hctx_state == TFRC_SSTATE_NO_FBACK) {
474 475 476 477 478 479 480 481 482
			/* Use Larger Initial Windows [RFC 4342, sec. 5]
			 * We deviate in that we use `s' instead of `MSS'. */
			u16 w_init = max(    4 * hctx->ccid3hctx_s,
					 max(2 * hctx->ccid3hctx_s, 4380));
			hctx->ccid3hctx_rtt  = r_sample;
			hctx->ccid3hctx_x    = usecs_div(w_init, r_sample);
			hctx->ccid3hctx_t_ld = now;

			ccid3_update_send_time(hctx);
483
			ccid3_hc_tx_set_state(sk, TFRC_SSTATE_FBACK);
484
		} else {
485 486
			hctx->ccid3hctx_rtt = (hctx->ccid3hctx_rtt * 9) / 10 +
					      r_sample / 10;
487 488
			ccid3_hc_tx_update_x(sk, &now);
		}
489

490 491 492
		ccid3_pr_debug("%s, sk=%p, New RTT estimate=%uus, "
			       "r_sample=%us\n", dccp_role(sk), sk,
			       hctx->ccid3hctx_rtt, r_sample);
493 494

		/* Update receive rate */
495
		hctx->ccid3hctx_x_recv = x_recv;/* X_recv in bytes per sec */
496 497 498 499 500 501 502 503 504

		/* Update loss event rate */
		if (pinv == ~0 || pinv == 0)
			hctx->ccid3hctx_p = 0;
		else {
			hctx->ccid3hctx_p = 1000000 / pinv;

			if (hctx->ccid3hctx_p < TFRC_SMALLEST_P) {
				hctx->ccid3hctx_p = TFRC_SMALLEST_P;
505 506
				ccid3_pr_debug("%s, sk=%p, Smallest p used!\n",
					       dccp_role(sk), sk);
507 508 509 510 511 512 513
			}
		}

		/* unschedule no feedback timer */
		sk_stop_timer(sk, &hctx->ccid3hctx_no_feedback_timer);

		/* remove all packets older than the one acked from history */
514 515
		dccp_tx_hist_purge_older(ccid3_tx_hist,
					 &hctx->ccid3hctx_hist, packet);
516 517
		/*
		 * As we have calculated new ipi, delta, t_nom it is possible that
518
		 * we now can send a packet, so wake up dccp_wait_for_ccid
519 520
		 */
		sk->sk_write_space(sk);
521

522 523 524 525 526
		/* Update timeout interval. We use the alternative variant of
		 * [RFC 3448, 3.1] which sets the upper bound of t_rto to one
		 * second, as it is suggested for TCP (see RFC 2988, 2.4). */
		hctx->ccid3hctx_t_rto = max_t(u32, 4 * hctx->ccid3hctx_rtt,
					      	   USEC_PER_SEC            );
527 528
		/*
		 * Schedule no feedback timer to expire in
529
		 * max(4 * R, 2 * s/X)  =  max(4 * R, 2 * t_ipi)
530
		 */
531
		t_nfb = max(4 * hctx->ccid3hctx_rtt, 2 * hctx->ccid3hctx_t_ipi);
532
			
533 534 535
		ccid3_pr_debug("%s, sk=%p, Scheduled no feedback timer to "
			       "expire in %lu jiffies (%luus)\n",
			       dccp_role(sk), sk,
536
			       usecs_to_jiffies(t_nfb), t_nfb);
537 538

		sk_reset_timer(sk, &hctx->ccid3hctx_no_feedback_timer, 
539
				   jiffies + usecs_to_jiffies(t_nfb));
540 541 542 543

		/* set idle flag */
		hctx->ccid3hctx_idle = 1;   
		break;
G
Gerrit Renker 已提交
544 545 546 547
	case TFRC_SSTATE_NO_SENT:
		DCCP_WARN("Illegal ACK received - no packet has been sent\n");
		/* fall through */
	case TFRC_SSTATE_TERM:		/* ignore feedback when closing */
548 549 550 551
		break;
	}
}

552
static int ccid3_hc_tx_insert_options(struct sock *sk, struct sk_buff *skb)
553
{
554
	const struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
555

556 557
	BUG_ON(hctx == NULL);

558 559 560
	if (sk->sk_state == DCCP_OPEN || sk->sk_state == DCCP_PARTOPEN)
		DCCP_SKB_CB(skb)->dccpd_ccval = hctx->ccid3hctx_last_win_count;
	return 0;
561 562 563
}

static int ccid3_hc_tx_parse_options(struct sock *sk, unsigned char option,
564 565
				     unsigned char len, u16 idx,
				     unsigned char *value)
566 567
{
	int rc = 0;
568 569
	const struct dccp_sock *dp = dccp_sk(sk);
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
570 571
	struct ccid3_options_received *opt_recv;

572
	BUG_ON(hctx == NULL);
573 574 575 576 577 578 579 580 581 582 583 584 585

	opt_recv = &hctx->ccid3hctx_options_received;

	if (opt_recv->ccid3or_seqno != dp->dccps_gsr) {
		opt_recv->ccid3or_seqno		     = dp->dccps_gsr;
		opt_recv->ccid3or_loss_event_rate    = ~0;
		opt_recv->ccid3or_loss_intervals_idx = 0;
		opt_recv->ccid3or_loss_intervals_len = 0;
		opt_recv->ccid3or_receive_rate	     = 0;
	}

	switch (option) {
	case TFRC_OPT_LOSS_EVENT_RATE:
586
		if (unlikely(len != 4)) {
587 588 589
			DCCP_WARN("%s, sk=%p, invalid len %d "
				  "for TFRC_OPT_LOSS_EVENT_RATE\n",
				  dccp_role(sk), sk, len);
590 591
			rc = -EINVAL;
		} else {
592
			opt_recv->ccid3or_loss_event_rate = ntohl(*(__be32 *)value);
593 594 595 596 597 598 599 600 601 602 603 604 605 606
			ccid3_pr_debug("%s, sk=%p, LOSS_EVENT_RATE=%u\n",
				       dccp_role(sk), sk,
				       opt_recv->ccid3or_loss_event_rate);
		}
		break;
	case TFRC_OPT_LOSS_INTERVALS:
		opt_recv->ccid3or_loss_intervals_idx = idx;
		opt_recv->ccid3or_loss_intervals_len = len;
		ccid3_pr_debug("%s, sk=%p, LOSS_INTERVALS=(%u, %u)\n",
			       dccp_role(sk), sk,
			       opt_recv->ccid3or_loss_intervals_idx,
			       opt_recv->ccid3or_loss_intervals_len);
		break;
	case TFRC_OPT_RECEIVE_RATE:
607
		if (unlikely(len != 4)) {
608 609 610
			DCCP_WARN("%s, sk=%p, invalid len %d "
				  "for TFRC_OPT_RECEIVE_RATE\n",
				  dccp_role(sk), sk, len);
611 612
			rc = -EINVAL;
		} else {
613
			opt_recv->ccid3or_receive_rate = ntohl(*(__be32 *)value);
614 615 616 617 618 619 620 621 622 623
			ccid3_pr_debug("%s, sk=%p, RECEIVE_RATE=%u\n",
				       dccp_role(sk), sk,
				       opt_recv->ccid3or_receive_rate);
		}
		break;
	}

	return rc;
}

624
static int ccid3_hc_tx_init(struct ccid *ccid, struct sock *sk)
625
{
626
	struct ccid3_hc_tx_sock *hctx = ccid_priv(ccid);
627

628
	hctx->ccid3hctx_s     = 0;
629 630
	hctx->ccid3hctx_state = TFRC_SSTATE_NO_SENT;
	INIT_LIST_HEAD(&hctx->ccid3hctx_hist);
631 632 633

	hctx->ccid3hctx_no_feedback_timer.function = ccid3_hc_tx_no_feedback_timer;
	hctx->ccid3hctx_no_feedback_timer.data     = (unsigned long)sk;
634 635 636 637 638 639 640
	init_timer(&hctx->ccid3hctx_no_feedback_timer);

	return 0;
}

static void ccid3_hc_tx_exit(struct sock *sk)
{
641
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
642 643 644 645 646 647 648

	BUG_ON(hctx == NULL);

	ccid3_hc_tx_set_state(sk, TFRC_SSTATE_TERM);
	sk_stop_timer(sk, &hctx->ccid3hctx_no_feedback_timer);

	/* Empty packet history */
649
	dccp_tx_hist_purge(ccid3_tx_hist, &hctx->ccid3hctx_hist);
650 651 652 653 654 655
}

/*
 * RX Half Connection methods
 */

656
#ifdef CONFIG_IP_DCCP_CCID3_DEBUG
657 658 659 660 661 662 663 664 665 666 667 668
static const char *ccid3_rx_state_name(enum ccid3_hc_rx_states state)
{
	static char *ccid3_rx_state_names[] = {
	[TFRC_RSTATE_NO_DATA] = "NO_DATA",
	[TFRC_RSTATE_DATA]    = "DATA",
	[TFRC_RSTATE_TERM]    = "TERM",
	};

	return ccid3_rx_state_names[state];
}
#endif

669 670
static void ccid3_hc_rx_set_state(struct sock *sk,
				  enum ccid3_hc_rx_states state)
671
{
672
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
673 674 675
	enum ccid3_hc_rx_states oldstate = hcrx->ccid3hcrx_state;

	ccid3_pr_debug("%s(%p) %-8.8s -> %s\n",
676 677
		       dccp_role(sk), sk, ccid3_rx_state_name(oldstate),
		       ccid3_rx_state_name(state));
678 679 680 681
	WARN_ON(state == oldstate);
	hcrx->ccid3hcrx_state = state;
}

682 683 684 685 686 687 688 689 690
static inline void ccid3_hc_rx_update_s(struct ccid3_hc_rx_sock *hcrx, int len)
{
	if (unlikely(len == 0))	/* don't update on empty packets (e.g. ACKs) */
		ccid3_pr_debug("Packet payload length is 0 - not updating\n");
	else
		hcrx->ccid3hcrx_s = hcrx->ccid3hcrx_s == 0 ? len :
				    (9 * hcrx->ccid3hcrx_s + len) / 10;
}

691 692
static void ccid3_hc_rx_send_feedback(struct sock *sk)
{
693
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
694
	struct dccp_sock *dp = dccp_sk(sk);
695
	struct dccp_rx_hist_entry *packet;
696
	struct timeval now;
697 698 699

	ccid3_pr_debug("%s, sk=%p\n", dccp_role(sk), sk);

700
	dccp_timestamp(sk, &now);
701

702 703 704 705 706
	switch (hcrx->ccid3hcrx_state) {
	case TFRC_RSTATE_NO_DATA:
		hcrx->ccid3hcrx_x_recv = 0;
		break;
	case TFRC_RSTATE_DATA: {
707 708
		const u32 delta = timeval_delta(&now,
					&hcrx->ccid3hcrx_tstamp_last_feedback);
709 710
		hcrx->ccid3hcrx_x_recv = usecs_div(hcrx->ccid3hcrx_bytes_recv,
						   delta);
711 712
	}
		break;
713 714
	case TFRC_RSTATE_TERM:
		DCCP_BUG("Illegal %s state TERM, sk=%p", dccp_role(sk), sk);
715 716 717
		return;
	}

718
	packet = dccp_rx_hist_find_data_packet(&hcrx->ccid3hcrx_hist);
719
	if (unlikely(packet == NULL)) {
720 721
		DCCP_WARN("%s, sk=%p, no data packet in history!\n",
			  dccp_role(sk), sk);
722 723 724
		return;
	}

725
	hcrx->ccid3hcrx_tstamp_last_feedback = now;
I
Ian McDonald 已提交
726
	hcrx->ccid3hcrx_ccval_last_counter   = packet->dccphrx_ccval;
727 728 729
	hcrx->ccid3hcrx_bytes_recv	     = 0;

	/* Convert to multiples of 10us */
730 731
	hcrx->ccid3hcrx_elapsed_time =
			timeval_delta(&now, &packet->dccphrx_tstamp) / 10;
732 733 734 735
	if (hcrx->ccid3hcrx_p == 0)
		hcrx->ccid3hcrx_pinv = ~0;
	else
		hcrx->ccid3hcrx_pinv = 1000000 / hcrx->ccid3hcrx_p;
736
	dp->dccps_hc_rx_insert_options = 1;
737 738 739
	dccp_send_ack(sk);
}

740
static int ccid3_hc_rx_insert_options(struct sock *sk, struct sk_buff *skb)
741
{
742
	const struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
743
	__be32 x_recv, pinv;
744

745 746 747
	BUG_ON(hcrx == NULL);

	if (!(sk->sk_state == DCCP_OPEN || sk->sk_state == DCCP_PARTOPEN))
748
		return 0;
749

I
Ian McDonald 已提交
750
	DCCP_SKB_CB(skb)->dccpd_ccval = hcrx->ccid3hcrx_ccval_last_counter;
751 752

	if (dccp_packet_without_ack(skb))
753 754
		return 0;

755 756
	x_recv = htonl(hcrx->ccid3hcrx_x_recv);
	pinv   = htonl(hcrx->ccid3hcrx_pinv);
757 758 759 760 761 762 763 764 765 766 767 768

	if ((hcrx->ccid3hcrx_elapsed_time != 0 &&
	     dccp_insert_option_elapsed_time(sk, skb,
					     hcrx->ccid3hcrx_elapsed_time)) ||
	    dccp_insert_option_timestamp(sk, skb) ||
	    dccp_insert_option(sk, skb, TFRC_OPT_LOSS_EVENT_RATE,
		    	       &pinv, sizeof(pinv)) ||
	    dccp_insert_option(sk, skb, TFRC_OPT_RECEIVE_RATE,
		    	       &x_recv, sizeof(x_recv)))
		return -1;

	return 0;
769 770 771 772 773 774 775 776
}

/* calculate first loss interval
 *
 * returns estimated loss interval in usecs */

static u32 ccid3_hc_rx_calc_first_li(struct sock *sk)
{
777
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
778
	struct dccp_rx_hist_entry *entry, *next, *tail = NULL;
779
	u32 rtt, delta, x_recv, fval, p, tmp2;
780
	struct timeval tstamp = { 0, };
781 782 783 784 785
	int interval = 0;
	int win_count = 0;
	int step = 0;
	u64 tmp1;

786 787 788
	list_for_each_entry_safe(entry, next, &hcrx->ccid3hcrx_hist,
				 dccphrx_node) {
		if (dccp_rx_hist_entry_data_packet(entry)) {
789 790 791 792
			tail = entry;

			switch (step) {
			case 0:
793
				tstamp	  = entry->dccphrx_tstamp;
794
				win_count = entry->dccphrx_ccval;
795 796 797
				step = 1;
				break;
			case 1:
798
				interval = win_count - entry->dccphrx_ccval;
799 800 801 802 803 804 805 806 807
				if (interval < 0)
					interval += TFRC_WIN_COUNT_LIMIT;
				if (interval > 4)
					goto found;
				break;
			}
		}
	}

808
	if (unlikely(step == 0)) {
809 810
		DCCP_WARN("%s, sk=%p, packet history has no data packets!\n",
			  dccp_role(sk), sk);
811 812 813
		return ~0;
	}

814
	if (unlikely(interval == 0)) {
815 816
		DCCP_WARN("%s, sk=%p, Could not find a win_count interval > 0."
			  "Defaulting to 1\n", dccp_role(sk), sk);
817 818 819
		interval = 1;
	}
found:
I
Ian McDonald 已提交
820
	if (!tail) {
821
		DCCP_CRIT("tail is null\n");
I
Ian McDonald 已提交
822 823
		return ~0;
	}
824
	rtt = timeval_delta(&tstamp, &tail->dccphrx_tstamp) * 4 / interval;
825 826
	ccid3_pr_debug("%s, sk=%p, approximated RTT to %uus\n",
		       dccp_role(sk), sk, rtt);
827 828 829 830 831

	if (rtt == 0) {
		DCCP_WARN("RTT==0, setting to 1\n");
 		rtt = 1;
	}
832

833 834 835
	dccp_timestamp(sk, &tstamp);
	delta = timeval_delta(&tstamp, &hcrx->ccid3hcrx_tstamp_last_feedback);
	x_recv = usecs_div(hcrx->ccid3hcrx_bytes_recv, delta);
836

I
Ian McDonald 已提交
837 838 839
	if (x_recv == 0)
		x_recv = hcrx->ccid3hcrx_x_recv;

840 841 842
	tmp1 = (u64)x_recv * (u64)rtt;
	do_div(tmp1,10000000);
	tmp2 = (u32)tmp1;
I
Ian McDonald 已提交
843 844

	if (!tmp2) {
845
		DCCP_CRIT("tmp2 = 0, x_recv = %u, rtt =%u\n", x_recv, rtt);
I
Ian McDonald 已提交
846 847 848
		return ~0;
	}

849 850
	fval = (hcrx->ccid3hcrx_s * 100000) / tmp2;
	/* do not alter order above or you will get overflow on 32 bit */
851
	p = tfrc_calc_x_reverse_lookup(fval);
852 853
	ccid3_pr_debug("%s, sk=%p, receive rate=%u bytes/s, implied "
		       "loss rate=%u\n", dccp_role(sk), sk, x_recv, p);
854 855 856 857 858 859 860 861 862

	if (p == 0)
		return ~0;
	else
		return 1000000 / p; 
}

static void ccid3_hc_rx_update_li(struct sock *sk, u64 seq_loss, u8 win_loss)
{
863
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
864
	struct dccp_li_hist_entry *head;
I
Ian McDonald 已提交
865
	u64 seq_temp;
866

I
Ian McDonald 已提交
867 868 869 870
	if (list_empty(&hcrx->ccid3hcrx_li_hist)) {
		if (!dccp_li_hist_interval_new(ccid3_li_hist,
		   &hcrx->ccid3hcrx_li_hist, seq_loss, win_loss))
			return;
871

872 873 874
		head = list_entry(hcrx->ccid3hcrx_li_hist.next,
		   struct dccp_li_hist_entry, dccplih_node);
		head->dccplih_interval = ccid3_hc_rx_calc_first_li(sk);
I
Ian McDonald 已提交
875 876 877 878
	} else {
		struct dccp_li_hist_entry *entry;
		struct list_head *tail;

879 880
		head = list_entry(hcrx->ccid3hcrx_li_hist.next,
		   struct dccp_li_hist_entry, dccplih_node);
I
Ian McDonald 已提交
881 882 883 884 885 886 887 888 889 890
		/* FIXME win count check removed as was wrong */
		/* should make this check with receive history */
		/* and compare there as per section 10.2 of RFC4342 */

		/* new loss event detected */
		/* calculate last interval length */
		seq_temp = dccp_delta_seqno(head->dccplih_seqno, seq_loss);
		entry = dccp_li_hist_entry_new(ccid3_li_hist, SLAB_ATOMIC);

		if (entry == NULL) {
891
			DCCP_BUG("out of memory - can not allocate entry");
892
			return;
I
Ian McDonald 已提交
893 894 895 896 897 898 899 900 901 902 903 904 905
		}

		list_add(&entry->dccplih_node, &hcrx->ccid3hcrx_li_hist);

		tail = hcrx->ccid3hcrx_li_hist.prev;
		list_del(tail);
		kmem_cache_free(ccid3_li_hist->dccplih_slab, tail);

		/* Create the newest interval */
		entry->dccplih_seqno = seq_loss;
		entry->dccplih_interval = seq_temp;
		entry->dccplih_win_count = win_loss;
	}
906 907
}

I
Ian McDonald 已提交
908 909
static int ccid3_hc_rx_detect_loss(struct sock *sk,
                                    struct dccp_rx_hist_entry *packet)
910
{
911
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
I
Ian McDonald 已提交
912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927
	struct dccp_rx_hist_entry *rx_hist = dccp_rx_hist_head(&hcrx->ccid3hcrx_hist);
	u64 seqno = packet->dccphrx_seqno;
	u64 tmp_seqno;
	int loss = 0;
	u8 ccval;


	tmp_seqno = hcrx->ccid3hcrx_seqno_nonloss;

	if (!rx_hist ||
	   follows48(packet->dccphrx_seqno, hcrx->ccid3hcrx_seqno_nonloss)) {
		hcrx->ccid3hcrx_seqno_nonloss = seqno;
		hcrx->ccid3hcrx_ccval_nonloss = packet->dccphrx_ccval;
		goto detect_out;
	}

928

I
Ian McDonald 已提交
929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957
	while (dccp_delta_seqno(hcrx->ccid3hcrx_seqno_nonloss, seqno)
	   > TFRC_RECV_NUM_LATE_LOSS) {
		loss = 1;
		ccid3_hc_rx_update_li(sk, hcrx->ccid3hcrx_seqno_nonloss,
		   hcrx->ccid3hcrx_ccval_nonloss);
		tmp_seqno = hcrx->ccid3hcrx_seqno_nonloss;
		dccp_inc_seqno(&tmp_seqno);
		hcrx->ccid3hcrx_seqno_nonloss = tmp_seqno;
		dccp_inc_seqno(&tmp_seqno);
		while (dccp_rx_hist_find_entry(&hcrx->ccid3hcrx_hist,
		   tmp_seqno, &ccval)) {
		   	hcrx->ccid3hcrx_seqno_nonloss = tmp_seqno;
			hcrx->ccid3hcrx_ccval_nonloss = ccval;
			dccp_inc_seqno(&tmp_seqno);
		}
	}

	/* FIXME - this code could be simplified with above while */
	/* but works at moment */
	if (follows48(packet->dccphrx_seqno, hcrx->ccid3hcrx_seqno_nonloss)) {
		hcrx->ccid3hcrx_seqno_nonloss = seqno;
		hcrx->ccid3hcrx_ccval_nonloss = packet->dccphrx_ccval;
	}

detect_out:
	dccp_rx_hist_add_packet(ccid3_rx_hist, &hcrx->ccid3hcrx_hist,
		   &hcrx->ccid3hcrx_li_hist, packet,
		   hcrx->ccid3hcrx_seqno_nonloss);
	return loss;
958 959 960 961
}

static void ccid3_hc_rx_packet_recv(struct sock *sk, struct sk_buff *skb)
{
962
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
963
	const struct dccp_options_received *opt_recv;
964
	struct dccp_rx_hist_entry *packet;
965
	struct timeval now;
I
Ian McDonald 已提交
966
	u32 p_prev, rtt_prev, r_sample, t_elapsed;
967
	int loss, payload_size;
968

969
	BUG_ON(hcrx == NULL);
970

971
	opt_recv = &dccp_sk(sk)->dccps_options_received;
972

973 974 975 976 977
	switch (DCCP_SKB_CB(skb)->dccpd_type) {
	case DCCP_PKT_ACK:
		if (hcrx->ccid3hcrx_state == TFRC_RSTATE_NO_DATA)
			return;
	case DCCP_PKT_DATAACK:
978
		if (opt_recv->dccpor_timestamp_echo == 0)
979
			break;
I
Ian McDonald 已提交
980
		rtt_prev = hcrx->ccid3hcrx_rtt;
981
		dccp_timestamp(sk, &now);
982 983 984 985 986
		timeval_sub_usecs(&now, opt_recv->dccpor_timestamp_echo * 10);
		r_sample = timeval_usecs(&now);
		t_elapsed = opt_recv->dccpor_elapsed_time * 10;

		if (unlikely(r_sample <= t_elapsed))
987 988
			DCCP_WARN("r_sample=%uus, t_elapsed=%uus\n",
				  r_sample, t_elapsed);
989 990 991 992 993 994 995 996 997
		else
			r_sample -= t_elapsed;

		if (hcrx->ccid3hcrx_state == TFRC_RSTATE_NO_DATA)
			hcrx->ccid3hcrx_rtt = r_sample;
		else
			hcrx->ccid3hcrx_rtt = (hcrx->ccid3hcrx_rtt * 9) / 10 +
					      r_sample / 10;

I
Ian McDonald 已提交
998 999
		if (rtt_prev != hcrx->ccid3hcrx_rtt)
			ccid3_pr_debug("%s, New RTT=%uus, elapsed time=%u\n",
1000 1001
				       dccp_role(sk), hcrx->ccid3hcrx_rtt,
				       opt_recv->dccpor_elapsed_time);
1002 1003 1004
		break;
	case DCCP_PKT_DATA:
		break;
1005
	default: /* We're not interested in other packet types, move along */
1006 1007 1008
		return;
	}

1009
	packet = dccp_rx_hist_entry_new(ccid3_rx_hist, sk, opt_recv->dccpor_ndp,
1010
					skb, SLAB_ATOMIC);
1011
	if (unlikely(packet == NULL)) {
1012 1013
		DCCP_WARN("%s, sk=%p, Not enough mem to add rx packet "
			  "to history, consider it lost!\n", dccp_role(sk), sk);
1014 1015 1016
		return;
	}

I
Ian McDonald 已提交
1017
	loss = ccid3_hc_rx_detect_loss(sk, packet);
1018 1019 1020 1021

	if (DCCP_SKB_CB(skb)->dccpd_type == DCCP_PKT_ACK)
		return;

1022 1023 1024
	payload_size = skb->len - dccp_hdr(skb)->dccph_doff * 4;
	ccid3_hc_rx_update_s(hcrx, payload_size);

1025 1026
	switch (hcrx->ccid3hcrx_state) {
	case TFRC_RSTATE_NO_DATA:
1027 1028 1029 1030
		ccid3_pr_debug("%s, sk=%p(%s), skb=%p, sending initial "
			       "feedback\n",
			       dccp_role(sk), sk,
			       dccp_state_name(sk->sk_state), skb);
1031 1032 1033 1034
		ccid3_hc_rx_send_feedback(sk);
		ccid3_hc_rx_set_state(sk, TFRC_RSTATE_DATA);
		return;
	case TFRC_RSTATE_DATA:
1035
		hcrx->ccid3hcrx_bytes_recv += payload_size;
I
Ian McDonald 已提交
1036
		if (loss)
1037 1038
			break;

1039
		dccp_timestamp(sk, &now);
1040 1041 1042 1043
		if (timeval_delta(&now, &hcrx->ccid3hcrx_tstamp_last_ack) >=
		    hcrx->ccid3hcrx_rtt) {
			hcrx->ccid3hcrx_tstamp_last_ack = now;
			ccid3_hc_rx_send_feedback(sk);
1044
		}
1045
		return;
1046 1047
	case TFRC_RSTATE_TERM:
		DCCP_BUG("Illegal %s state TERM, sk=%p", dccp_role(sk), sk);
1048 1049 1050 1051
		return;
	}

	/* Dealing with packet loss */
1052 1053
	ccid3_pr_debug("%s, sk=%p(%s), data loss! Reacting...\n",
		       dccp_role(sk), sk, dccp_state_name(sk->sk_state));
1054 1055 1056 1057

	p_prev = hcrx->ccid3hcrx_p;
	
	/* Calculate loss event rate */
I
Ian McDonald 已提交
1058 1059 1060
	if (!list_empty(&hcrx->ccid3hcrx_li_hist)) {
		u32 i_mean = dccp_li_hist_calc_i_mean(&hcrx->ccid3hcrx_li_hist);

1061
		/* Scaling up by 1000000 as fixed decimal */
I
Ian McDonald 已提交
1062 1063
		if (i_mean != 0)
			hcrx->ccid3hcrx_p = 1000000 / i_mean;
1064 1065
	} else
		DCCP_BUG("empty loss history");
1066 1067 1068 1069 1070 1071 1072

	if (hcrx->ccid3hcrx_p > p_prev) {
		ccid3_hc_rx_send_feedback(sk);
		return;
	}
}

1073
static int ccid3_hc_rx_init(struct ccid *ccid, struct sock *sk)
1074
{
1075
	struct ccid3_hc_rx_sock *hcrx = ccid_priv(ccid);
1076 1077 1078 1079 1080

	ccid3_pr_debug("%s, sk=%p\n", dccp_role(sk), sk);

	hcrx->ccid3hcrx_state = TFRC_RSTATE_NO_DATA;
	INIT_LIST_HEAD(&hcrx->ccid3hcrx_hist);
1081
	INIT_LIST_HEAD(&hcrx->ccid3hcrx_li_hist);
1082
	dccp_timestamp(sk, &hcrx->ccid3hcrx_tstamp_last_ack);
1083
	hcrx->ccid3hcrx_tstamp_last_feedback = hcrx->ccid3hcrx_tstamp_last_ack;
1084
	hcrx->ccid3hcrx_s   = 0;
1085
	hcrx->ccid3hcrx_rtt = 5000; /* XXX 5ms for now... */
1086 1087 1088 1089 1090
	return 0;
}

static void ccid3_hc_rx_exit(struct sock *sk)
{
1091
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
1092

1093
	BUG_ON(hcrx == NULL);
1094 1095 1096 1097

	ccid3_hc_rx_set_state(sk, TFRC_RSTATE_TERM);

	/* Empty packet history */
1098
	dccp_rx_hist_purge(ccid3_rx_hist, &hcrx->ccid3hcrx_hist);
1099 1100

	/* Empty loss interval history */
1101
	dccp_li_hist_purge(ccid3_li_hist, &hcrx->ccid3hcrx_li_hist);
1102 1103
}

1104 1105
static void ccid3_hc_rx_get_info(struct sock *sk, struct tcp_info *info)
{
1106
	const struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
1107

1108 1109 1110 1111
	/* Listen socks doesn't have a private CCID block */
	if (sk->sk_state == DCCP_LISTEN)
		return;

1112
	BUG_ON(hcrx == NULL);
1113 1114 1115 1116 1117 1118 1119 1120

	info->tcpi_ca_state	= hcrx->ccid3hcrx_state;
	info->tcpi_options	|= TCPI_OPT_TIMESTAMPS;
	info->tcpi_rcv_rtt	= hcrx->ccid3hcrx_rtt;
}

static void ccid3_hc_tx_get_info(struct sock *sk, struct tcp_info *info)
{
1121
	const struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
1122

1123 1124 1125 1126
	/* Listen socks doesn't have a private CCID block */
	if (sk->sk_state == DCCP_LISTEN)
		return;

1127
	BUG_ON(hctx == NULL);
1128 1129 1130 1131 1132

	info->tcpi_rto = hctx->ccid3hctx_t_rto;
	info->tcpi_rtt = hctx->ccid3hctx_rtt;
}

1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186
static int ccid3_hc_rx_getsockopt(struct sock *sk, const int optname, int len,
				  u32 __user *optval, int __user *optlen)
{
	const struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
	const void *val;
	
	/* Listen socks doesn't have a private CCID block */
	if (sk->sk_state == DCCP_LISTEN)
		return -EINVAL;

	switch (optname) {
	case DCCP_SOCKOPT_CCID_RX_INFO:
		if (len < sizeof(hcrx->ccid3hcrx_tfrc))
			return -EINVAL;
		len = sizeof(hcrx->ccid3hcrx_tfrc);
		val = &hcrx->ccid3hcrx_tfrc;
		break;
	default:
		return -ENOPROTOOPT;
	}

	if (put_user(len, optlen) || copy_to_user(optval, val, len))
		return -EFAULT;

	return 0;
}

static int ccid3_hc_tx_getsockopt(struct sock *sk, const int optname, int len,
				  u32 __user *optval, int __user *optlen)
{
	const struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
	const void *val;
	
	/* Listen socks doesn't have a private CCID block */
	if (sk->sk_state == DCCP_LISTEN)
		return -EINVAL;

	switch (optname) {
	case DCCP_SOCKOPT_CCID_TX_INFO:
		if (len < sizeof(hctx->ccid3hctx_tfrc))
			return -EINVAL;
		len = sizeof(hctx->ccid3hctx_tfrc);
		val = &hctx->ccid3hctx_tfrc;
		break;
	default:
		return -ENOPROTOOPT;
	}

	if (put_user(len, optlen) || copy_to_user(optval, val, len))
		return -EFAULT;

	return 0;
}

1187
static struct ccid_operations ccid3 = {
I
Ian McDonald 已提交
1188
	.ccid_id		   = DCCPC_CCID3,
1189 1190
	.ccid_name		   = "ccid3",
	.ccid_owner		   = THIS_MODULE,
1191
	.ccid_hc_tx_obj_size	   = sizeof(struct ccid3_hc_tx_sock),
1192 1193 1194 1195 1196 1197 1198
	.ccid_hc_tx_init	   = ccid3_hc_tx_init,
	.ccid_hc_tx_exit	   = ccid3_hc_tx_exit,
	.ccid_hc_tx_send_packet	   = ccid3_hc_tx_send_packet,
	.ccid_hc_tx_packet_sent	   = ccid3_hc_tx_packet_sent,
	.ccid_hc_tx_packet_recv	   = ccid3_hc_tx_packet_recv,
	.ccid_hc_tx_insert_options = ccid3_hc_tx_insert_options,
	.ccid_hc_tx_parse_options  = ccid3_hc_tx_parse_options,
1199
	.ccid_hc_rx_obj_size	   = sizeof(struct ccid3_hc_rx_sock),
1200 1201 1202 1203
	.ccid_hc_rx_init	   = ccid3_hc_rx_init,
	.ccid_hc_rx_exit	   = ccid3_hc_rx_exit,
	.ccid_hc_rx_insert_options = ccid3_hc_rx_insert_options,
	.ccid_hc_rx_packet_recv	   = ccid3_hc_rx_packet_recv,
1204 1205
	.ccid_hc_rx_get_info	   = ccid3_hc_rx_get_info,
	.ccid_hc_tx_get_info	   = ccid3_hc_tx_get_info,
1206 1207
	.ccid_hc_rx_getsockopt	   = ccid3_hc_rx_getsockopt,
	.ccid_hc_tx_getsockopt	   = ccid3_hc_tx_getsockopt,
1208 1209
};
 
1210
#ifdef CONFIG_IP_DCCP_CCID3_DEBUG
1211 1212
module_param(ccid3_debug, int, 0444);
MODULE_PARM_DESC(ccid3_debug, "Enable debug messages");
1213
#endif
1214 1215 1216

static __init int ccid3_module_init(void)
{
1217
	int rc = -ENOBUFS;
1218

1219 1220
	ccid3_rx_hist = dccp_rx_hist_new("ccid3");
	if (ccid3_rx_hist == NULL)
1221 1222
		goto out;

1223 1224 1225
	ccid3_tx_hist = dccp_tx_hist_new("ccid3");
	if (ccid3_tx_hist == NULL)
		goto out_free_rx;
1226

1227 1228
	ccid3_li_hist = dccp_li_hist_new("ccid3");
	if (ccid3_li_hist == NULL)
1229
		goto out_free_tx;
1230 1231 1232 1233 1234 1235

	rc = ccid_register(&ccid3);
	if (rc != 0) 
		goto out_free_loss_interval_history;
out:
	return rc;
1236

1237
out_free_loss_interval_history:
1238 1239
	dccp_li_hist_delete(ccid3_li_hist);
	ccid3_li_hist = NULL;
1240 1241 1242 1243 1244 1245
out_free_tx:
	dccp_tx_hist_delete(ccid3_tx_hist);
	ccid3_tx_hist = NULL;
out_free_rx:
	dccp_rx_hist_delete(ccid3_rx_hist);
	ccid3_rx_hist = NULL;
1246 1247 1248 1249 1250 1251 1252 1253
	goto out;
}
module_init(ccid3_module_init);

static __exit void ccid3_module_exit(void)
{
	ccid_unregister(&ccid3);

1254 1255 1256
	if (ccid3_tx_hist != NULL) {
		dccp_tx_hist_delete(ccid3_tx_hist);
		ccid3_tx_hist = NULL;
1257
	}
1258 1259 1260
	if (ccid3_rx_hist != NULL) {
		dccp_rx_hist_delete(ccid3_rx_hist);
		ccid3_rx_hist = NULL;
1261
	}
1262 1263 1264
	if (ccid3_li_hist != NULL) {
		dccp_li_hist_delete(ccid3_li_hist);
		ccid3_li_hist = NULL;
1265 1266 1267 1268
	}
}
module_exit(ccid3_module_exit);

1269
MODULE_AUTHOR("Ian McDonald <ian.mcdonald@jandi.co.nz>, "
1270
	      "Arnaldo Carvalho de Melo <acme@ghostprotocols.net>");
1271 1272 1273
MODULE_DESCRIPTION("DCCP TFRC CCID3 CCID");
MODULE_LICENSE("GPL");
MODULE_ALIAS("net-dccp-ccid-3");